diff --git "a/wandb/run-20220301_221232-283qa50u/files/wandb-summary.json" "b/wandb/run-20220301_221232-283qa50u/files/wandb-summary.json" --- "a/wandb/run-20220301_221232-283qa50u/files/wandb-summary.json" +++ "b/wandb/run-20220301_221232-283qa50u/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.1867, "train/learning_rate": 8.88e-05, "train/epoch": 1.0, "train/global_step": 446, "_runtime": 6494, "_timestamp": 1646179246, "_step": 447, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 33.0, 233.0, 533.0, 191.0, 23.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.007577896118164, -19.918153762817383, -16.828731536865234, -13.739307403564453, -10.649883270263672, -7.560459136962891, -4.471036911010742, -1.381612777709961, 1.7078113555908203, 4.797235012054443, 7.886658668518066, 10.976081848144531, 14.065505981445312, 17.154930114746094, 20.244352340698242, 23.333776473999023, 26.423200607299805, 29.512624740600586, 32.602046966552734, 35.691471099853516, 38.7808952331543, 41.87031936645508, 44.959739685058594, 48.049163818359375, 51.138587951660156, 54.22801208496094, 57.31743621826172, 60.4068603515625, 63.49628448486328, 66.58570861816406, 69.67512512207031, 72.76455688476562, 75.85397338867188, 78.94339752197266, 82.03282165527344, 85.12224578857422, 88.211669921875, 91.30109405517578, 94.39051818847656, 97.47993469238281, 100.56936645507812, 103.6587905883789, 106.74821472167969, 109.83763885498047, 112.92706298828125, 116.01648712158203, 119.10591125488281, 122.19532775878906, 125.28475189208984, 128.37417602539062, 131.46359252929688, 134.5530242919922, 137.64244079589844, 140.73187255859375, 143.8212890625, 146.9107208251953, 150.00013732910156, 153.0895538330078, 156.17898559570312, 159.26840209960938, 162.3578338623047, 165.44725036621094, 168.53668212890625, 171.6260986328125, 174.7155303955078]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 1.0, 7.0, 7.0, 6.0, 5.0, 9.0, 12.0, 13.0, 9.0, 11.0, 29.0, 28.0, 28.0, 23.0, 25.0, 31.0, 32.0, 39.0, 41.0, 36.0, 49.0, 50.0, 49.0, 33.0, 39.0, 37.0, 42.0, 40.0, 34.0, 35.0, 17.0, 40.0, 22.0, 24.0, 15.0, 14.0, 14.0, 12.0, 14.0, 11.0, 8.0, 8.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.05972671508789, -29.033992767333984, -28.00826072692871, -26.982526779174805, -25.9567928314209, -24.931060791015625, -23.90532684326172, -22.879592895507812, -21.853858947753906, -20.828125, -19.802392959594727, -18.77665901184082, -17.750925064086914, -16.72519302368164, -15.699459075927734, -14.673725128173828, -13.647993087768555, -12.622260093688965, -11.596526145935059, -10.570793151855469, -9.545059204101562, -8.519326210021973, -7.493593215942383, -6.467859745025635, -5.442126274108887, -4.416392803192139, -3.3906595706939697, -2.364926338195801, -1.3391928672790527, -0.3134593963623047, 0.7122735977172852, 1.7380070686340332, 2.7637405395507812, 3.7894740104675293, 4.815207481384277, 5.840940475463867, 6.866673946380615, 7.892407417297363, 8.918140411376953, 9.94387435913086, 10.96960735321045, 11.995340347290039, 13.021074295043945, 14.046807289123535, 15.072540283203125, 16.09827423095703, 17.124008178710938, 18.14974021911621, 19.175474166870117, 20.201208114624023, 21.226940155029297, 22.252674102783203, 23.27840805053711, 24.304141998291016, 25.32987403869629, 26.355607986450195, 27.38134002685547, 28.407073974609375, 29.43280601501465, 30.458539962768555, 31.48427391052246, 32.510005950927734, 33.53573989868164, 34.56147384643555, 35.58720779418945]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 11.0, 4.0, 6.0, 4.0, 15.0, 12.0, 17.0, 11.0, 23.0, 31.0, 27.0, 27.0, 18.0, 38.0, 39.0, 34.0, 30.0, 42.0, 37.0, 47.0, 56.0, 40.0, 34.0, 43.0, 30.0, 38.0, 51.0, 29.0, 26.0, 28.0, 28.0, 22.0, 20.0, 12.0, 10.0, 15.0, 15.0, 9.0, 11.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3164215087890625, -1.271514892578125, -1.2266082763671875, -1.18170166015625, -1.1367950439453125, -1.091888427734375, -1.0469818115234375, -1.0020751953125, -0.9571685791015625, -0.912261962890625, -0.8673553466796875, -0.82244873046875, -0.7775421142578125, -0.732635498046875, -0.6877288818359375, -0.642822265625, -0.5979156494140625, -0.553009033203125, -0.5081024169921875, -0.46319580078125, -0.4182891845703125, -0.373382568359375, -0.3284759521484375, -0.2835693359375, -0.2386627197265625, -0.193756103515625, -0.1488494873046875, -0.10394287109375, -0.0590362548828125, -0.014129638671875, 0.0307769775390625, 0.07568359375, 0.1205902099609375, 0.165496826171875, 0.2104034423828125, 0.25531005859375, 0.3002166748046875, 0.345123291015625, 0.3900299072265625, 0.4349365234375, 0.4798431396484375, 0.524749755859375, 0.5696563720703125, 0.61456298828125, 0.6594696044921875, 0.704376220703125, 0.7492828369140625, 0.794189453125, 0.8390960693359375, 0.884002685546875, 0.9289093017578125, 0.97381591796875, 1.0187225341796875, 1.063629150390625, 1.1085357666015625, 1.1534423828125, 1.1983489990234375, 1.243255615234375, 1.2881622314453125, 1.33306884765625, 1.3779754638671875, 1.422882080078125, 1.4677886962890625, 1.5126953125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 10.0, 9.0, 13.0, 16.0, 17.0, 23.0, 27.0, 44.0, 60.0, 73.0, 99.0, 120.0, 208.0, 281.0, 446.0, 643.0, 1085.0, 1817.0, 3753.0, 9070.0, 28623.0, 141013.0, 1479029.0, 2245036.0, 222844.0, 38747.0, 11184.0, 4406.0, 2179.0, 1165.0, 751.0, 445.0, 298.0, 193.0, 142.0, 107.0, 84.0, 55.0, 45.0, 35.0, 25.0, 20.0, 11.0, 11.0, 5.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.1875, -5.020751953125, -4.85400390625, -4.687255859375, -4.5205078125, -4.353759765625, -4.18701171875, -4.020263671875, -3.853515625, -3.686767578125, -3.52001953125, -3.353271484375, -3.1865234375, -3.019775390625, -2.85302734375, -2.686279296875, -2.51953125, -2.352783203125, -2.18603515625, -2.019287109375, -1.8525390625, -1.685791015625, -1.51904296875, -1.352294921875, -1.185546875, -1.018798828125, -0.85205078125, -0.685302734375, -0.5185546875, -0.351806640625, -0.18505859375, -0.018310546875, 0.1484375, 0.315185546875, 0.48193359375, 0.648681640625, 0.8154296875, 0.982177734375, 1.14892578125, 1.315673828125, 1.482421875, 1.649169921875, 1.81591796875, 1.982666015625, 2.1494140625, 2.316162109375, 2.48291015625, 2.649658203125, 2.81640625, 2.983154296875, 3.14990234375, 3.316650390625, 3.4833984375, 3.650146484375, 3.81689453125, 3.983642578125, 4.150390625, 4.317138671875, 4.48388671875, 4.650634765625, 4.8173828125, 4.984130859375, 5.15087890625, 5.317626953125, 5.484375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 16.0, 30.0, 66.0, 173.0, 441.0, 1089.0, 1279.0, 557.0, 238.0, 87.0, 49.0, 17.0, 11.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3359375, -12.8775634765625, -12.419189453125, -11.9608154296875, -11.50244140625, -11.0440673828125, -10.585693359375, -10.1273193359375, -9.6689453125, -9.2105712890625, -8.752197265625, -8.2938232421875, -7.83544921875, -7.3770751953125, -6.918701171875, -6.4603271484375, -6.001953125, -5.5435791015625, -5.085205078125, -4.6268310546875, -4.16845703125, -3.7100830078125, -3.251708984375, -2.7933349609375, -2.3349609375, -1.8765869140625, -1.418212890625, -0.9598388671875, -0.50146484375, -0.0430908203125, 0.415283203125, 0.8736572265625, 1.33203125, 1.7904052734375, 2.248779296875, 2.7071533203125, 3.16552734375, 3.6239013671875, 4.082275390625, 4.5406494140625, 4.9990234375, 5.4573974609375, 5.915771484375, 6.3741455078125, 6.83251953125, 7.2908935546875, 7.749267578125, 8.2076416015625, 8.666015625, 9.1243896484375, 9.582763671875, 10.0411376953125, 10.49951171875, 10.9578857421875, 11.416259765625, 11.8746337890625, 12.3330078125, 12.7913818359375, 13.249755859375, 13.7081298828125, 14.16650390625, 14.6248779296875, 15.083251953125, 15.5416259765625, 16.0]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 5.0, 3.0, 11.0, 10.0, 12.0, 40.0, 71.0, 194.0, 502.0, 2078.0, 27085.0, 4147883.0, 13883.0, 1694.0, 479.0, 175.0, 71.0, 36.0, 11.0, 13.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.8125, -41.40576171875, -39.9990234375, -38.59228515625, -37.185546875, -35.77880859375, -34.3720703125, -32.96533203125, -31.55859375, -30.15185546875, -28.7451171875, -27.33837890625, -25.931640625, -24.52490234375, -23.1181640625, -21.71142578125, -20.3046875, -18.89794921875, -17.4912109375, -16.08447265625, -14.677734375, -13.27099609375, -11.8642578125, -10.45751953125, -9.05078125, -7.64404296875, -6.2373046875, -4.83056640625, -3.423828125, -2.01708984375, -0.6103515625, 0.79638671875, 2.203125, 3.60986328125, 5.0166015625, 6.42333984375, 7.830078125, 9.23681640625, 10.6435546875, 12.05029296875, 13.45703125, 14.86376953125, 16.2705078125, 17.67724609375, 19.083984375, 20.49072265625, 21.8974609375, 23.30419921875, 24.7109375, 26.11767578125, 27.5244140625, 28.93115234375, 30.337890625, 31.74462890625, 33.1513671875, 34.55810546875, 35.96484375, 37.37158203125, 38.7783203125, 40.18505859375, 41.591796875, 42.99853515625, 44.4052734375, 45.81201171875, 47.21875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 61.0, 348.0, 424.0, 158.0, 14.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.08546447753906, -98.74624633789062, -96.40702056884766, -94.06779479980469, -91.72857666015625, -89.38935852050781, -87.05013275146484, -84.71090698242188, -82.37168884277344, -80.032470703125, -77.69324493408203, -75.35401916503906, -73.01480102539062, -70.67558288574219, -68.33635711669922, -65.99713134765625, -63.65791320800781, -61.31869125366211, -58.979469299316406, -56.6402473449707, -54.301025390625, -51.9618034362793, -49.622581481933594, -47.28335952758789, -44.94413757324219, -42.604915618896484, -40.26569366455078, -37.92647171020508, -35.587249755859375, -33.24802780151367, -30.90880584716797, -28.569583892822266, -26.230358123779297, -23.891136169433594, -21.55191421508789, -19.212692260742188, -16.873470306396484, -14.534248352050781, -12.195026397705078, -9.855804443359375, -7.516582489013672, -5.177360534667969, -2.8381385803222656, -0.4989166259765625, 1.8403053283691406, 4.179527282714844, 6.518749237060547, 8.85797119140625, 11.197193145751953, 13.536415100097656, 15.87563705444336, 18.214859008789062, 20.554080963134766, 22.89330291748047, 25.232524871826172, 27.571746826171875, 29.910968780517578, 32.25019073486328, 34.589412689208984, 36.92863464355469, 39.26785659790039, 41.607078552246094, 43.9463005065918, 46.2855224609375, 48.6247444152832]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 10.0, 14.0, 14.0, 13.0, 17.0, 27.0, 28.0, 26.0, 32.0, 35.0, 41.0, 36.0, 45.0, 42.0, 49.0, 39.0, 46.0, 34.0, 29.0, 42.0, 39.0, 35.0, 38.0, 35.0, 37.0, 29.0, 25.0, 19.0, 18.0, 13.0, 16.0, 18.0, 8.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.333791732788086, -19.734371185302734, -19.134950637817383, -18.53553009033203, -17.93610954284668, -17.336688995361328, -16.737268447875977, -16.137847900390625, -15.53842830657959, -14.939007759094238, -14.339587211608887, -13.740166664123535, -13.1407470703125, -12.541326522827148, -11.941905975341797, -11.342485427856445, -10.743064880371094, -10.143644332885742, -9.54422378540039, -8.944803237915039, -8.345382690429688, -7.745962619781494, -7.146542549133301, -6.547122001647949, -5.947701454162598, -5.348280906677246, -4.7488603591918945, -4.149440288543701, -3.5500197410583496, -2.950599193572998, -2.3511788845062256, -1.7517585754394531, -1.1523361206054688, -0.5529156923294067, 0.04650473594665527, 0.6459251642227173, 1.2453455924987793, 1.8447661399841309, 2.4441864490509033, 3.043606758117676, 3.6430273056030273, 4.242447853088379, 4.8418684005737305, 5.441288471221924, 6.040709018707275, 6.640129566192627, 7.23954963684082, 7.838970184326172, 8.438390731811523, 9.037811279296875, 9.637231826782227, 10.236652374267578, 10.83607292175293, 11.435493469238281, 12.034913063049316, 12.634333610534668, 13.23375415802002, 13.833174705505371, 14.432595252990723, 15.032015800476074, 15.63143539428711, 16.23085594177246, 16.830276489257812, 17.429697036743164, 18.029117584228516]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 3.0, 4.0, 7.0, 4.0, 13.0, 15.0, 7.0, 13.0, 23.0, 24.0, 27.0, 24.0, 32.0, 37.0, 46.0, 30.0, 27.0, 30.0, 42.0, 28.0, 50.0, 31.0, 50.0, 59.0, 36.0, 36.0, 41.0, 23.0, 34.0, 25.0, 25.0, 24.0, 26.0, 17.0, 21.0, 12.0, 11.0, 12.0, 13.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2374725341796875, -1.194671630859375, -1.1518707275390625, -1.10906982421875, -1.0662689208984375, -1.023468017578125, -0.9806671142578125, -0.9378662109375, -0.8950653076171875, -0.852264404296875, -0.8094635009765625, -0.76666259765625, -0.7238616943359375, -0.681060791015625, -0.6382598876953125, -0.595458984375, -0.5526580810546875, -0.509857177734375, -0.4670562744140625, -0.42425537109375, -0.3814544677734375, -0.338653564453125, -0.2958526611328125, -0.2530517578125, -0.2102508544921875, -0.167449951171875, -0.1246490478515625, -0.08184814453125, -0.0390472412109375, 0.003753662109375, 0.0465545654296875, 0.08935546875, 0.1321563720703125, 0.174957275390625, 0.2177581787109375, 0.26055908203125, 0.3033599853515625, 0.346160888671875, 0.3889617919921875, 0.4317626953125, 0.4745635986328125, 0.517364501953125, 0.5601654052734375, 0.60296630859375, 0.6457672119140625, 0.688568115234375, 0.7313690185546875, 0.774169921875, 0.8169708251953125, 0.859771728515625, 0.9025726318359375, 0.94537353515625, 0.9881744384765625, 1.030975341796875, 1.0737762451171875, 1.1165771484375, 1.1593780517578125, 1.202178955078125, 1.2449798583984375, 1.28778076171875, 1.3305816650390625, 1.373382568359375, 1.4161834716796875, 1.458984375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 5.0, 4.0, 7.0, 16.0, 23.0, 34.0, 35.0, 44.0, 76.0, 116.0, 159.0, 205.0, 313.0, 456.0, 657.0, 903.0, 1365.0, 2004.0, 2786.0, 4326.0, 6342.0, 9706.0, 15099.0, 24082.0, 38808.0, 62878.0, 102220.0, 160843.0, 201921.0, 154341.0, 96196.0, 59854.0, 36798.0, 22723.0, 14654.0, 9423.0, 6188.0, 4123.0, 2645.0, 1901.0, 1255.0, 939.0, 618.0, 463.0, 295.0, 210.0, 164.0, 99.0, 72.0, 47.0, 36.0, 35.0, 22.0, 14.0, 5.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0], "bins": [-0.1319580078125, -0.1277618408203125, -0.123565673828125, -0.1193695068359375, -0.11517333984375, -0.1109771728515625, -0.106781005859375, -0.1025848388671875, -0.098388671875, -0.0941925048828125, -0.089996337890625, -0.0858001708984375, -0.08160400390625, -0.0774078369140625, -0.073211669921875, -0.0690155029296875, -0.0648193359375, -0.0606231689453125, -0.056427001953125, -0.0522308349609375, -0.04803466796875, -0.0438385009765625, -0.039642333984375, -0.0354461669921875, -0.03125, -0.0270538330078125, -0.022857666015625, -0.0186614990234375, -0.01446533203125, -0.0102691650390625, -0.006072998046875, -0.0018768310546875, 0.0023193359375, 0.0065155029296875, 0.010711669921875, 0.0149078369140625, 0.01910400390625, 0.0233001708984375, 0.027496337890625, 0.0316925048828125, 0.035888671875, 0.0400848388671875, 0.044281005859375, 0.0484771728515625, 0.05267333984375, 0.0568695068359375, 0.061065673828125, 0.0652618408203125, 0.0694580078125, 0.0736541748046875, 0.077850341796875, 0.0820465087890625, 0.08624267578125, 0.0904388427734375, 0.094635009765625, 0.0988311767578125, 0.10302734375, 0.1072235107421875, 0.111419677734375, 0.1156158447265625, 0.11981201171875, 0.1240081787109375, 0.128204345703125, 0.1324005126953125, 0.1365966796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 10.0, 4.0, 7.0, 18.0, 19.0, 14.0, 28.0, 19.0, 19.0, 27.0, 33.0, 35.0, 35.0, 34.0, 46.0, 41.0, 38.0, 38.0, 36.0, 1067.0, 34.0, 42.0, 37.0, 32.0, 39.0, 35.0, 31.0, 19.0, 27.0, 27.0, 21.0, 17.0, 15.0, 14.0, 9.0, 11.0, 11.0, 4.0, 8.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.853515625, -0.8255844116210938, -0.7976531982421875, -0.7697219848632812, -0.741790771484375, -0.7138595581054688, -0.6859283447265625, -0.6579971313476562, -0.63006591796875, -0.6021347045898438, -0.5742034912109375, -0.5462722778320312, -0.518341064453125, -0.49040985107421875, -0.4624786376953125, -0.43454742431640625, -0.4066162109375, -0.37868499755859375, -0.3507537841796875, -0.32282257080078125, -0.294891357421875, -0.26696014404296875, -0.2390289306640625, -0.21109771728515625, -0.18316650390625, -0.15523529052734375, -0.1273040771484375, -0.09937286376953125, -0.071441650390625, -0.04351043701171875, -0.0155792236328125, 0.01235198974609375, 0.040283203125, 0.06821441650390625, 0.0961456298828125, 0.12407684326171875, 0.152008056640625, 0.17993927001953125, 0.2078704833984375, 0.23580169677734375, 0.26373291015625, 0.29166412353515625, 0.3195953369140625, 0.34752655029296875, 0.375457763671875, 0.40338897705078125, 0.4313201904296875, 0.45925140380859375, 0.4871826171875, 0.5151138305664062, 0.5430450439453125, 0.5709762573242188, 0.598907470703125, 0.6268386840820312, 0.6547698974609375, 0.6827011108398438, 0.71063232421875, 0.7385635375976562, 0.7664947509765625, 0.7944259643554688, 0.822357177734375, 0.8502883911132812, 0.8782196044921875, 0.9061508178710938, 0.93408203125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 12.0, 7.0, 11.0, 18.0, 23.0, 57.0, 86.0, 115.0, 192.0, 275.0, 425.0, 592.0, 915.0, 1328.0, 1945.0, 2987.0, 4519.0, 6730.0, 10386.0, 15985.0, 24496.0, 37138.0, 55596.0, 83013.0, 117803.0, 384885.0, 967776.0, 122802.0, 85998.0, 58316.0, 38728.0, 25601.0, 16326.0, 11024.0, 7007.0, 4668.0, 3155.0, 2079.0, 1359.0, 893.0, 631.0, 431.0, 268.0, 190.0, 112.0, 74.0, 49.0, 40.0, 20.0, 15.0, 15.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-0.08612060546875, -0.0834341049194336, -0.08074760437011719, -0.07806110382080078, -0.07537460327148438, -0.07268810272216797, -0.07000160217285156, -0.06731510162353516, -0.06462860107421875, -0.061942100524902344, -0.05925559997558594, -0.05656909942626953, -0.053882598876953125, -0.05119609832763672, -0.04850959777832031, -0.045823097229003906, -0.0431365966796875, -0.040450096130371094, -0.03776359558105469, -0.03507709503173828, -0.032390594482421875, -0.02970409393310547, -0.027017593383789062, -0.024331092834472656, -0.02164459228515625, -0.018958091735839844, -0.016271591186523438, -0.013585090637207031, -0.010898590087890625, -0.008212089538574219, -0.0055255889892578125, -0.0028390884399414062, -0.000152587890625, 0.0025339126586914062, 0.0052204132080078125, 0.007906913757324219, 0.010593414306640625, 0.013279914855957031, 0.015966415405273438, 0.018652915954589844, 0.02133941650390625, 0.024025917053222656, 0.026712417602539062, 0.02939891815185547, 0.032085418701171875, 0.03477191925048828, 0.03745841979980469, 0.040144920349121094, 0.0428314208984375, 0.045517921447753906, 0.04820442199707031, 0.05089092254638672, 0.053577423095703125, 0.05626392364501953, 0.05895042419433594, 0.061636924743652344, 0.06432342529296875, 0.06700992584228516, 0.06969642639160156, 0.07238292694091797, 0.07506942749023438, 0.07775592803955078, 0.08044242858886719, 0.0831289291381836, 0.0858154296875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 2.0, 2.0, 8.0, 4.0, 3.0, 10.0, 9.0, 6.0, 16.0, 9.0, 9.0, 14.0, 10.0, 24.0, 23.0, 30.0, 39.0, 46.0, 39.0, 71.0, 44.0, 78.0, 70.0, 75.0, 56.0, 43.0, 37.0, 30.0, 18.0, 16.0, 22.0, 19.0, 16.0, 9.0, 11.0, 12.0, 14.0, 5.0, 6.0, 5.0, 5.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0017910003662109375, -0.0017289519309997559, -0.0016669034957885742, -0.0016048550605773926, -0.001542806625366211, -0.0014807581901550293, -0.0014187097549438477, -0.001356661319732666, -0.0012946128845214844, -0.0012325644493103027, -0.001170516014099121, -0.0011084675788879395, -0.0010464191436767578, -0.0009843707084655762, -0.0009223222732543945, -0.0008602738380432129, -0.0007982254028320312, -0.0007361769676208496, -0.000674128532409668, -0.0006120800971984863, -0.0005500316619873047, -0.00048798322677612305, -0.0004259347915649414, -0.00036388635635375977, -0.0003018379211425781, -0.00023978948593139648, -0.00017774105072021484, -0.0001156926155090332, -5.364418029785156e-05, 8.404254913330078e-06, 7.045269012451172e-05, 0.00013250112533569336, 0.000194549560546875, 0.00025659799575805664, 0.0003186464309692383, 0.0003806948661804199, 0.00044274330139160156, 0.0005047917366027832, 0.0005668401718139648, 0.0006288886070251465, 0.0006909370422363281, 0.0007529854774475098, 0.0008150339126586914, 0.000877082347869873, 0.0009391307830810547, 0.0010011792182922363, 0.001063227653503418, 0.0011252760887145996, 0.0011873245239257812, 0.0012493729591369629, 0.0013114213943481445, 0.0013734698295593262, 0.0014355182647705078, 0.0014975666999816895, 0.001559615135192871, 0.0016216635704040527, 0.0016837120056152344, 0.001745760440826416, 0.0018078088760375977, 0.0018698573112487793, 0.001931905746459961, 0.0019939541816711426, 0.0020560026168823242, 0.002118051052093506, 0.0021800994873046875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 10.0, 4.0, 6.0, 15.0, 12.0, 16.0, 21.0, 13.0, 15.0, 23.0, 24.0, 35.0, 40.0, 39.0, 39.0, 58.0, 74.0, 84.0, 113.0, 154.0, 220.0, 269.0, 639.0, 8303.0, 1029566.0, 6862.0, 621.0, 305.0, 187.0, 140.0, 95.0, 93.0, 65.0, 59.0, 56.0, 37.0, 50.0, 42.0, 17.0, 16.0, 11.0, 21.0, 25.0, 14.0, 10.0, 7.0, 4.0, 12.0, 8.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0], "bins": [-0.03857421875, -0.03742218017578125, -0.0362701416015625, -0.03511810302734375, -0.033966064453125, -0.03281402587890625, -0.0316619873046875, -0.03050994873046875, -0.02935791015625, -0.02820587158203125, -0.0270538330078125, -0.02590179443359375, -0.024749755859375, -0.02359771728515625, -0.0224456787109375, -0.02129364013671875, -0.0201416015625, -0.01898956298828125, -0.0178375244140625, -0.01668548583984375, -0.015533447265625, -0.01438140869140625, -0.0132293701171875, -0.01207733154296875, -0.01092529296875, -0.00977325439453125, -0.0086212158203125, -0.00746917724609375, -0.006317138671875, -0.00516510009765625, -0.0040130615234375, -0.00286102294921875, -0.001708984375, -0.00055694580078125, 0.0005950927734375, 0.00174713134765625, 0.002899169921875, 0.00405120849609375, 0.0052032470703125, 0.00635528564453125, 0.00750732421875, 0.00865936279296875, 0.0098114013671875, 0.01096343994140625, 0.012115478515625, 0.01326751708984375, 0.0144195556640625, 0.01557159423828125, 0.0167236328125, 0.01787567138671875, 0.0190277099609375, 0.02017974853515625, 0.021331787109375, 0.02248382568359375, 0.0236358642578125, 0.02478790283203125, 0.02593994140625, 0.02709197998046875, 0.0282440185546875, 0.02939605712890625, 0.030548095703125, 0.03170013427734375, 0.0328521728515625, 0.03400421142578125, 0.03515625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 975.0, 39.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035568419843912125, -0.03475503996014595, -0.033941660076379776, -0.0331282801926136, -0.03231490030884743, -0.03150152042508125, -0.03068814054131508, -0.029874760657548904, -0.02906138077378273, -0.028248000890016556, -0.02743462100625038, -0.026621241122484207, -0.025807861238718033, -0.02499448135495186, -0.024181101471185684, -0.02336772158741951, -0.022554343566298485, -0.02174096368253231, -0.020927583798766136, -0.020114203914999962, -0.019300824031233788, -0.018487444147467613, -0.017674066126346588, -0.016860686242580414, -0.01604730635881424, -0.015233926475048065, -0.014420546591281891, -0.013607166707515717, -0.012793786823749542, -0.011980406939983368, -0.011167027987539768, -0.010353648103773594, -0.009540269151329994, -0.00872688926756382, -0.007913509383797646, -0.0071001299656927586, -0.006286750081926584, -0.00547337019816041, -0.004659990780055523, -0.0038466108962893486, -0.0030332310125231743, -0.002219851128757, -0.0014064714778214693, -0.0005930918268859386, 0.00022028805688023567, 0.00103366794064641, 0.001847047358751297, 0.0026604272425174713, 0.0034738071262836456, 0.00428718701004982, 0.005100566893815994, 0.005913946311920881, 0.006727326195687056, 0.00754070607945323, 0.008354085497558117, 0.009167465381324291, 0.009980845265090466, 0.01079422514885664, 0.011607605032622814, 0.012420983985066414, 0.013234363868832588, 0.014047743752598763, 0.014861123636364937, 0.01567450352013111, 0.016487883403897285]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 10.0, 6.0, 19.0, 18.0, 25.0, 33.0, 39.0, 55.0, 47.0, 69.0, 66.0, 63.0, 73.0, 68.0, 70.0, 66.0, 40.0, 50.0, 46.0, 29.0, 37.0, 28.0, 16.0, 11.0, 9.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0030336976051330566, -0.002960260957479477, -0.002886824309825897, -0.0028133876621723175, -0.002739951014518738, -0.002666514366865158, -0.0025930777192115784, -0.0025196410715579987, -0.002446204423904419, -0.0023727677762508392, -0.0022993311285972595, -0.00222589448094368, -0.0021524578332901, -0.0020790211856365204, -0.0020055845379829407, -0.001932147890329361, -0.0018587112426757812, -0.0017852745950222015, -0.0017118379473686218, -0.0016384012997150421, -0.0015649646520614624, -0.0014915280044078827, -0.001418091356754303, -0.0013446547091007233, -0.0012712180614471436, -0.0011977814137935638, -0.0011243447661399841, -0.0010509081184864044, -0.0009774714708328247, -0.000904034823179245, -0.0008305981755256653, -0.0007571615278720856, -0.0006837248802185059, -0.0006102882325649261, -0.0005368515849113464, -0.0004634149372577667, -0.000389978289604187, -0.0003165416419506073, -0.0002431049942970276, -0.00016966834664344788, -9.623169898986816e-05, -2.2795051336288452e-05, 5.064159631729126e-05, 0.00012407824397087097, 0.00019751489162445068, 0.0002709515392780304, 0.0003443881869316101, 0.0004178248345851898, 0.0004912614822387695, 0.0005646981298923492, 0.000638134777545929, 0.0007115714251995087, 0.0007850080728530884, 0.0008584447205066681, 0.0009318813681602478, 0.0010053180158138275, 0.0010787546634674072, 0.001152191311120987, 0.0012256279587745667, 0.0012990646064281464, 0.001372501254081726, 0.0014459379017353058, 0.0015193745493888855, 0.0015928111970424652, 0.001666247844696045]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 3.0, 4.0, 7.0, 4.0, 13.0, 15.0, 7.0, 13.0, 23.0, 24.0, 27.0, 24.0, 32.0, 38.0, 45.0, 30.0, 27.0, 30.0, 42.0, 28.0, 50.0, 31.0, 50.0, 59.0, 36.0, 36.0, 41.0, 23.0, 34.0, 25.0, 25.0, 24.0, 25.0, 18.0, 21.0, 12.0, 11.0, 12.0, 13.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2374725341796875, -1.194671630859375, -1.1518707275390625, -1.10906982421875, -1.0662689208984375, -1.023468017578125, -0.9806671142578125, -0.9378662109375, -0.8950653076171875, -0.852264404296875, -0.8094635009765625, -0.76666259765625, -0.7238616943359375, -0.681060791015625, -0.6382598876953125, -0.595458984375, -0.5526580810546875, -0.509857177734375, -0.4670562744140625, -0.42425537109375, -0.3814544677734375, -0.338653564453125, -0.2958526611328125, -0.2530517578125, -0.2102508544921875, -0.167449951171875, -0.1246490478515625, -0.08184814453125, -0.0390472412109375, 0.003753662109375, 0.0465545654296875, 0.08935546875, 0.1321563720703125, 0.174957275390625, 0.2177581787109375, 0.26055908203125, 0.3033599853515625, 0.346160888671875, 0.3889617919921875, 0.4317626953125, 0.4745635986328125, 0.517364501953125, 0.5601654052734375, 0.60296630859375, 0.6457672119140625, 0.688568115234375, 0.7313690185546875, 0.774169921875, 0.8169708251953125, 0.859771728515625, 0.9025726318359375, 0.94537353515625, 0.9881744384765625, 1.030975341796875, 1.0737762451171875, 1.1165771484375, 1.1593780517578125, 1.202178955078125, 1.2449798583984375, 1.28778076171875, 1.3305816650390625, 1.373382568359375, 1.4161834716796875, 1.458984375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 10.0, 7.0, 12.0, 24.0, 27.0, 30.0, 50.0, 67.0, 88.0, 122.0, 178.0, 252.0, 394.0, 512.0, 732.0, 1014.0, 1403.0, 2021.0, 3081.0, 4473.0, 7115.0, 12091.0, 23005.0, 56048.0, 176401.0, 415922.0, 214602.0, 66111.0, 26219.0, 13281.0, 7815.0, 4876.0, 3190.0, 2130.0, 1538.0, 1099.0, 725.0, 567.0, 398.0, 250.0, 194.0, 132.0, 122.0, 86.0, 48.0, 38.0, 28.0, 15.0, 8.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.20806884765625, -3.0958251953125, -2.98358154296875, -2.871337890625, -2.75909423828125, -2.6468505859375, -2.53460693359375, -2.42236328125, -2.31011962890625, -2.1978759765625, -2.08563232421875, -1.973388671875, -1.86114501953125, -1.7489013671875, -1.63665771484375, -1.5244140625, -1.41217041015625, -1.2999267578125, -1.18768310546875, -1.075439453125, -0.96319580078125, -0.8509521484375, -0.73870849609375, -0.62646484375, -0.51422119140625, -0.4019775390625, -0.28973388671875, -0.177490234375, -0.06524658203125, 0.0469970703125, 0.15924072265625, 0.271484375, 0.38372802734375, 0.4959716796875, 0.60821533203125, 0.720458984375, 0.83270263671875, 0.9449462890625, 1.05718994140625, 1.16943359375, 1.28167724609375, 1.3939208984375, 1.50616455078125, 1.618408203125, 1.73065185546875, 1.8428955078125, 1.95513916015625, 2.0673828125, 2.17962646484375, 2.2918701171875, 2.40411376953125, 2.516357421875, 2.62860107421875, 2.7408447265625, 2.85308837890625, 2.96533203125, 3.07757568359375, 3.1898193359375, 3.30206298828125, 3.414306640625, 3.52655029296875, 3.6387939453125, 3.75103759765625, 3.86328125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 5.0, 10.0, 8.0, 6.0, 16.0, 16.0, 18.0, 28.0, 35.0, 34.0, 32.0, 39.0, 52.0, 60.0, 54.0, 90.0, 130.0, 188.0, 1297.0, 214.0, 137.0, 107.0, 68.0, 59.0, 51.0, 42.0, 28.0, 27.0, 29.0, 26.0, 23.0, 19.0, 10.0, 23.0, 10.0, 9.0, 2.0, 7.0, 5.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.6846923828125, -3.560791015625, -3.4368896484375, -3.31298828125, -3.1890869140625, -3.065185546875, -2.9412841796875, -2.8173828125, -2.6934814453125, -2.569580078125, -2.4456787109375, -2.32177734375, -2.1978759765625, -2.073974609375, -1.9500732421875, -1.826171875, -1.7022705078125, -1.578369140625, -1.4544677734375, -1.33056640625, -1.2066650390625, -1.082763671875, -0.9588623046875, -0.8349609375, -0.7110595703125, -0.587158203125, -0.4632568359375, -0.33935546875, -0.2154541015625, -0.091552734375, 0.0323486328125, 0.15625, 0.2801513671875, 0.404052734375, 0.5279541015625, 0.65185546875, 0.7757568359375, 0.899658203125, 1.0235595703125, 1.1474609375, 1.2713623046875, 1.395263671875, 1.5191650390625, 1.64306640625, 1.7669677734375, 1.890869140625, 2.0147705078125, 2.138671875, 2.2625732421875, 2.386474609375, 2.5103759765625, 2.63427734375, 2.7581787109375, 2.882080078125, 3.0059814453125, 3.1298828125, 3.2537841796875, 3.377685546875, 3.5015869140625, 3.62548828125, 3.7493896484375, 3.873291015625, 3.9971923828125, 4.12109375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 6.0, 9.0, 8.0, 10.0, 19.0, 14.0, 19.0, 23.0, 25.0, 32.0, 27.0, 48.0, 69.0, 111.0, 269.0, 692.0, 2343.0, 55197.0, 3047795.0, 35702.0, 1959.0, 612.0, 242.0, 121.0, 67.0, 52.0, 40.0, 28.0, 24.0, 25.0, 20.0, 21.0, 10.0, 10.0, 9.0, 6.0, 11.0, 2.0, 5.0, 1.0, 0.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-17.53125, -17.036865234375, -16.54248046875, -16.048095703125, -15.5537109375, -15.059326171875, -14.56494140625, -14.070556640625, -13.576171875, -13.081787109375, -12.58740234375, -12.093017578125, -11.5986328125, -11.104248046875, -10.60986328125, -10.115478515625, -9.62109375, -9.126708984375, -8.63232421875, -8.137939453125, -7.6435546875, -7.149169921875, -6.65478515625, -6.160400390625, -5.666015625, -5.171630859375, -4.67724609375, -4.182861328125, -3.6884765625, -3.194091796875, -2.69970703125, -2.205322265625, -1.7109375, -1.216552734375, -0.72216796875, -0.227783203125, 0.2666015625, 0.760986328125, 1.25537109375, 1.749755859375, 2.244140625, 2.738525390625, 3.23291015625, 3.727294921875, 4.2216796875, 4.716064453125, 5.21044921875, 5.704833984375, 6.19921875, 6.693603515625, 7.18798828125, 7.682373046875, 8.1767578125, 8.671142578125, 9.16552734375, 9.659912109375, 10.154296875, 10.648681640625, 11.14306640625, 11.637451171875, 12.1318359375, 12.626220703125, 13.12060546875, 13.614990234375, 14.109375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 31.0, 564.0, 406.0, 9.0, 0.0, 1.0], "bins": [-97.55330657958984, -95.92345428466797, -94.29360961914062, -92.66375732421875, -91.03390502929688, -89.404052734375, -87.77420806884766, -86.14435577392578, -84.5145034790039, -82.88465118408203, -81.25480651855469, -79.62495422363281, -77.99510192871094, -76.36524963378906, -74.73540496826172, -73.10555267333984, -71.4757080078125, -69.84585571289062, -68.21601104736328, -66.5861587524414, -64.95630645751953, -63.32645797729492, -61.69660949707031, -60.06675720214844, -58.43690490722656, -56.80705642700195, -55.17720413208008, -53.54735565185547, -51.917503356933594, -50.287654876708984, -48.657806396484375, -47.0279541015625, -45.39810562133789, -43.76825714111328, -42.138404846191406, -40.5085563659668, -38.87870407104492, -37.24885559082031, -35.61900329589844, -33.98915481567383, -32.35930633544922, -30.729455947875977, -29.099605560302734, -27.469757080078125, -25.839906692504883, -24.21005630493164, -22.5802059173584, -20.950355529785156, -19.32050323486328, -17.69065284729004, -16.060802459716797, -14.430953025817871, -12.801103591918945, -11.171253204345703, -9.541402816772461, -7.911553382873535, -6.281703948974609, -4.651854038238525, -3.0220038890838623, -1.3921537399291992, 0.23769617080688477, 1.8675460815429688, 3.497396469116211, 5.127245903015137, 6.757096290588379]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 14.0, 9.0, 5.0, 8.0, 9.0, 12.0, 11.0, 12.0, 18.0, 12.0, 27.0, 35.0, 24.0, 28.0, 33.0, 44.0, 40.0, 37.0, 39.0, 32.0, 55.0, 41.0, 36.0, 41.0, 31.0, 40.0, 29.0, 29.0, 36.0, 26.0, 21.0, 32.0, 22.0, 25.0, 19.0, 9.0, 11.0, 9.0, 10.0, 3.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.687631607055664, -12.281689643859863, -11.875746726989746, -11.469804763793945, -11.063861846923828, -10.657919883728027, -10.251977920532227, -9.84603500366211, -9.440092086791992, -9.034150123596191, -8.628207206726074, -8.222265243530273, -7.816322326660156, -7.4103803634643555, -7.0044379234313965, -6.5984954833984375, -6.192553520202637, -5.786611080169678, -5.380668640136719, -4.974726676940918, -4.568783760070801, -4.162841796875, -3.756899356842041, -3.350956916809082, -2.945014476776123, -2.539072036743164, -2.133129596710205, -1.7271873950958252, -1.3212449550628662, -0.9153025150299072, -0.5093603134155273, -0.10341787338256836, 0.3025245666503906, 0.7084669470787048, 1.114409327507019, 1.5203516483306885, 1.9262940883636475, 2.3322365283966064, 2.7381787300109863, 3.1441211700439453, 3.5500636100769043, 3.9560060501098633, 4.361948490142822, 4.767890930175781, 5.173832893371582, 5.579775810241699, 5.9857177734375, 6.391660213470459, 6.797602653503418, 7.203545093536377, 7.609487533569336, 8.015429496765137, 8.421372413635254, 8.827314376831055, 9.233257293701172, 9.639199256896973, 10.045141220092773, 10.451083183288574, 10.857026100158691, 11.262968063354492, 11.66891098022461, 12.07485294342041, 12.480794906616211, 12.886737823486328, 13.292680740356445]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 6.0, 5.0, 8.0, 13.0, 10.0, 15.0, 9.0, 12.0, 22.0, 28.0, 23.0, 26.0, 30.0, 37.0, 36.0, 24.0, 33.0, 40.0, 23.0, 41.0, 30.0, 46.0, 42.0, 48.0, 47.0, 27.0, 36.0, 30.0, 29.0, 26.0, 21.0, 27.0, 24.0, 21.0, 19.0, 9.0, 13.0, 12.0, 13.0, 8.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.281524658203125, -1.23883056640625, -1.196136474609375, -1.1534423828125, -1.110748291015625, -1.06805419921875, -1.025360107421875, -0.982666015625, -0.939971923828125, -0.89727783203125, -0.854583740234375, -0.8118896484375, -0.769195556640625, -0.72650146484375, -0.683807373046875, -0.64111328125, -0.598419189453125, -0.55572509765625, -0.513031005859375, -0.4703369140625, -0.427642822265625, -0.38494873046875, -0.342254638671875, -0.299560546875, -0.256866455078125, -0.21417236328125, -0.171478271484375, -0.1287841796875, -0.086090087890625, -0.04339599609375, -0.000701904296875, 0.0419921875, 0.084686279296875, 0.12738037109375, 0.170074462890625, 0.2127685546875, 0.255462646484375, 0.29815673828125, 0.340850830078125, 0.383544921875, 0.426239013671875, 0.46893310546875, 0.511627197265625, 0.5543212890625, 0.597015380859375, 0.63970947265625, 0.682403564453125, 0.72509765625, 0.767791748046875, 0.81048583984375, 0.853179931640625, 0.8958740234375, 0.938568115234375, 0.98126220703125, 1.023956298828125, 1.066650390625, 1.109344482421875, 1.15203857421875, 1.194732666015625, 1.2374267578125, 1.280120849609375, 1.32281494140625, 1.365509033203125, 1.408203125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 13.0, 8.0, 11.0, 20.0, 25.0, 38.0, 36.0, 63.0, 75.0, 111.0, 148.0, 219.0, 353.0, 518.0, 949.0, 2206.0, 6326.0, 24251.0, 130270.0, 1386823.0, 2361295.0, 230112.0, 36187.0, 8553.0, 2788.0, 1133.0, 590.0, 347.0, 218.0, 161.0, 123.0, 76.0, 67.0, 40.0, 23.0, 23.0, 24.0, 14.0, 8.0, 9.0, 10.0, 3.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2734375, -6.08966064453125, -5.9058837890625, -5.72210693359375, -5.538330078125, -5.35455322265625, -5.1707763671875, -4.98699951171875, -4.80322265625, -4.61944580078125, -4.4356689453125, -4.25189208984375, -4.068115234375, -3.88433837890625, -3.7005615234375, -3.51678466796875, -3.3330078125, -3.14923095703125, -2.9654541015625, -2.78167724609375, -2.597900390625, -2.41412353515625, -2.2303466796875, -2.04656982421875, -1.86279296875, -1.67901611328125, -1.4952392578125, -1.31146240234375, -1.127685546875, -0.94390869140625, -0.7601318359375, -0.57635498046875, -0.392578125, -0.20880126953125, -0.0250244140625, 0.15875244140625, 0.342529296875, 0.52630615234375, 0.7100830078125, 0.89385986328125, 1.07763671875, 1.26141357421875, 1.4451904296875, 1.62896728515625, 1.812744140625, 1.99652099609375, 2.1802978515625, 2.36407470703125, 2.5478515625, 2.73162841796875, 2.9154052734375, 3.09918212890625, 3.282958984375, 3.46673583984375, 3.6505126953125, 3.83428955078125, 4.01806640625, 4.20184326171875, 4.3856201171875, 4.56939697265625, 4.753173828125, 4.93695068359375, 5.1207275390625, 5.30450439453125, 5.48828125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 17.0, 26.0, 46.0, 73.0, 103.0, 208.0, 328.0, 599.0, 808.0, 717.0, 473.0, 259.0, 162.0, 94.0, 61.0, 40.0, 21.0, 16.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.6328125, -11.3543701171875, -11.075927734375, -10.7974853515625, -10.51904296875, -10.2406005859375, -9.962158203125, -9.6837158203125, -9.4052734375, -9.1268310546875, -8.848388671875, -8.5699462890625, -8.29150390625, -8.0130615234375, -7.734619140625, -7.4561767578125, -7.177734375, -6.8992919921875, -6.620849609375, -6.3424072265625, -6.06396484375, -5.7855224609375, -5.507080078125, -5.2286376953125, -4.9501953125, -4.6717529296875, -4.393310546875, -4.1148681640625, -3.83642578125, -3.5579833984375, -3.279541015625, -3.0010986328125, -2.72265625, -2.4442138671875, -2.165771484375, -1.8873291015625, -1.60888671875, -1.3304443359375, -1.052001953125, -0.7735595703125, -0.4951171875, -0.2166748046875, 0.061767578125, 0.3402099609375, 0.61865234375, 0.8970947265625, 1.175537109375, 1.4539794921875, 1.732421875, 2.0108642578125, 2.289306640625, 2.5677490234375, 2.84619140625, 3.1246337890625, 3.403076171875, 3.6815185546875, 3.9599609375, 4.2384033203125, 4.516845703125, 4.7952880859375, 5.07373046875, 5.3521728515625, 5.630615234375, 5.9090576171875, 6.1875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 10.0, 21.0, 20.0, 19.0, 41.0, 52.0, 72.0, 148.0, 208.0, 397.0, 724.0, 1564.0, 5098.0, 43986.0, 1423298.0, 2628709.0, 79317.0, 6811.0, 1908.0, 755.0, 457.0, 224.0, 142.0, 91.0, 67.0, 45.0, 33.0, 18.0, 14.0, 9.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.8671875, -13.4212646484375, -12.975341796875, -12.5294189453125, -12.08349609375, -11.6375732421875, -11.191650390625, -10.7457275390625, -10.2998046875, -9.8538818359375, -9.407958984375, -8.9620361328125, -8.51611328125, -8.0701904296875, -7.624267578125, -7.1783447265625, -6.732421875, -6.2864990234375, -5.840576171875, -5.3946533203125, -4.94873046875, -4.5028076171875, -4.056884765625, -3.6109619140625, -3.1650390625, -2.7191162109375, -2.273193359375, -1.8272705078125, -1.38134765625, -0.9354248046875, -0.489501953125, -0.0435791015625, 0.40234375, 0.8482666015625, 1.294189453125, 1.7401123046875, 2.18603515625, 2.6319580078125, 3.077880859375, 3.5238037109375, 3.9697265625, 4.4156494140625, 4.861572265625, 5.3074951171875, 5.75341796875, 6.1993408203125, 6.645263671875, 7.0911865234375, 7.537109375, 7.9830322265625, 8.428955078125, 8.8748779296875, 9.32080078125, 9.7667236328125, 10.212646484375, 10.6585693359375, 11.1044921875, 11.5504150390625, 11.996337890625, 12.4422607421875, 12.88818359375, 13.3341064453125, 13.780029296875, 14.2259521484375, 14.671875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 12.0, 52.0, 146.0, 293.0, 260.0, 169.0, 66.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.969112396240234, -52.470314025878906, -50.971519470214844, -49.472721099853516, -47.97392654418945, -46.475128173828125, -44.97633361816406, -43.477535247802734, -41.978736877441406, -40.47993850708008, -38.981143951416016, -37.48234558105469, -35.983551025390625, -34.4847526550293, -32.98595428466797, -31.487159729003906, -29.98836326599121, -28.489566802978516, -26.99077033996582, -25.491973876953125, -23.993175506591797, -22.4943790435791, -20.995582580566406, -19.496784210205078, -17.997989654541016, -16.49919319152832, -15.000395774841309, -13.501599311828613, -12.002801895141602, -10.504005432128906, -9.005208969116211, -7.506411552429199, -6.0076141357421875, -4.508817195892334, -3.0100204944610596, -1.5112237930297852, -0.01242685317993164, 1.4863700866699219, 2.985166549682617, 4.483963966369629, 5.982760429382324, 7.481557369232178, 8.980354309082031, 10.479150772094727, 11.977947235107422, 13.476744651794434, 14.975541114807129, 16.47433853149414, 17.973134994506836, 19.47193145751953, 20.970727920532227, 22.469524383544922, 23.96832275390625, 25.467119216918945, 26.96591567993164, 28.46471405029297, 29.96350860595703, 31.462305068969727, 32.96110153198242, 34.45989990234375, 35.95869445800781, 37.45749282836914, 38.95629119873047, 40.45508575439453, 41.95388412475586]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 9.0, 13.0, 13.0, 12.0, 17.0, 25.0, 13.0, 19.0, 31.0, 21.0, 34.0, 24.0, 29.0, 30.0, 32.0, 41.0, 38.0, 51.0, 23.0, 45.0, 36.0, 46.0, 32.0, 46.0, 32.0, 29.0, 41.0, 29.0, 20.0, 24.0, 17.0, 20.0, 16.0, 16.0, 7.0, 12.0, 10.0, 6.0, 6.0, 8.0, 4.0, 1.0, 5.0, 6.0, 1.0, 2.0, 1.0], "bins": [-17.54867935180664, -17.057861328125, -16.56704330444336, -16.07622528076172, -15.585408210754395, -15.09459114074707, -14.60377311706543, -14.112955093383789, -13.622137069702148, -13.131319046020508, -12.640501976013184, -12.149683952331543, -11.658865928649902, -11.168048858642578, -10.677230834960938, -10.186412811279297, -9.695595741271973, -9.204777717590332, -8.713960647583008, -8.223142623901367, -7.732324600219727, -7.241507053375244, -6.750689506530762, -6.259871482849121, -5.769053936004639, -5.278236389160156, -4.787418365478516, -4.296600818634033, -3.8057830333709717, -3.31496524810791, -2.8241477012634277, -2.333329916000366, -1.8425121307373047, -1.3516943454742432, -0.8608766794204712, -0.3700590133666992, 0.1207587718963623, 0.6115765571594238, 1.1023941040039062, 1.5932118892669678, 2.0840296745300293, 2.574847459793091, 3.0656652450561523, 3.5564827919006348, 4.047300338745117, 4.538118362426758, 5.02893590927124, 5.519753456115723, 6.010571479797363, 6.501389026641846, 6.992207050323486, 7.483024597167969, 7.973842620849609, 8.46466064453125, 8.955477714538574, 9.446295738220215, 9.937112808227539, 10.42793083190918, 10.918747901916504, 11.409565925598145, 11.900383949279785, 12.39120101928711, 12.88201904296875, 13.37283706665039, 13.863655090332031]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 10.0, 7.0, 12.0, 10.0, 16.0, 21.0, 20.0, 24.0, 28.0, 24.0, 27.0, 43.0, 27.0, 36.0, 36.0, 31.0, 48.0, 34.0, 52.0, 44.0, 41.0, 37.0, 43.0, 35.0, 33.0, 30.0, 25.0, 18.0, 18.0, 24.0, 22.0, 23.0, 13.0, 17.0, 9.0, 8.0, 11.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.24969482421875, -1.2054443359375, -1.16119384765625, -1.116943359375, -1.07269287109375, -1.0284423828125, -0.98419189453125, -0.93994140625, -0.89569091796875, -0.8514404296875, -0.80718994140625, -0.762939453125, -0.71868896484375, -0.6744384765625, -0.63018798828125, -0.5859375, -0.54168701171875, -0.4974365234375, -0.45318603515625, -0.408935546875, -0.36468505859375, -0.3204345703125, -0.27618408203125, -0.23193359375, -0.18768310546875, -0.1434326171875, -0.09918212890625, -0.054931640625, -0.01068115234375, 0.0335693359375, 0.07781982421875, 0.1220703125, 0.16632080078125, 0.2105712890625, 0.25482177734375, 0.299072265625, 0.34332275390625, 0.3875732421875, 0.43182373046875, 0.47607421875, 0.52032470703125, 0.5645751953125, 0.60882568359375, 0.653076171875, 0.69732666015625, 0.7415771484375, 0.78582763671875, 0.830078125, 0.87432861328125, 0.9185791015625, 0.96282958984375, 1.007080078125, 1.05133056640625, 1.0955810546875, 1.13983154296875, 1.18408203125, 1.22833251953125, 1.2725830078125, 1.31683349609375, 1.361083984375, 1.40533447265625, 1.4495849609375, 1.49383544921875, 1.5380859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 1.0, 2.0, 7.0, 9.0, 13.0, 27.0, 27.0, 40.0, 47.0, 68.0, 143.0, 146.0, 207.0, 374.0, 504.0, 716.0, 1049.0, 1474.0, 2217.0, 3233.0, 4704.0, 6934.0, 10458.0, 15503.0, 24281.0, 37826.0, 60425.0, 95854.0, 143698.0, 188373.0, 156106.0, 105713.0, 66819.0, 42024.0, 26817.0, 17351.0, 11506.0, 7581.0, 5109.0, 3415.0, 2406.0, 1661.0, 1151.0, 790.0, 529.0, 345.0, 272.0, 196.0, 137.0, 78.0, 56.0, 48.0, 28.0, 26.0, 10.0, 12.0, 6.0, 6.0, 2.0, 4.0, 4.0], "bins": [-0.1363525390625, -0.132171630859375, -0.12799072265625, -0.123809814453125, -0.11962890625, -0.115447998046875, -0.11126708984375, -0.107086181640625, -0.1029052734375, -0.098724365234375, -0.09454345703125, -0.090362548828125, -0.086181640625, -0.082000732421875, -0.07781982421875, -0.073638916015625, -0.0694580078125, -0.065277099609375, -0.06109619140625, -0.056915283203125, -0.052734375, -0.048553466796875, -0.04437255859375, -0.040191650390625, -0.0360107421875, -0.031829833984375, -0.02764892578125, -0.023468017578125, -0.019287109375, -0.015106201171875, -0.01092529296875, -0.006744384765625, -0.0025634765625, 0.001617431640625, 0.00579833984375, 0.009979248046875, 0.01416015625, 0.018341064453125, 0.02252197265625, 0.026702880859375, 0.0308837890625, 0.035064697265625, 0.03924560546875, 0.043426513671875, 0.047607421875, 0.051788330078125, 0.05596923828125, 0.060150146484375, 0.0643310546875, 0.068511962890625, 0.07269287109375, 0.076873779296875, 0.0810546875, 0.085235595703125, 0.08941650390625, 0.093597412109375, 0.0977783203125, 0.101959228515625, 0.10614013671875, 0.110321044921875, 0.114501953125, 0.118682861328125, 0.12286376953125, 0.127044677734375, 0.1312255859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 5.0, 8.0, 8.0, 8.0, 5.0, 14.0, 16.0, 8.0, 20.0, 20.0, 22.0, 21.0, 35.0, 35.0, 34.0, 49.0, 27.0, 32.0, 30.0, 36.0, 34.0, 1060.0, 36.0, 39.0, 44.0, 35.0, 20.0, 38.0, 34.0, 24.0, 25.0, 24.0, 24.0, 22.0, 23.0, 14.0, 15.0, 12.0, 9.0, 11.0, 14.0, 5.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.87060546875, -0.8441162109375, -0.817626953125, -0.7911376953125, -0.7646484375, -0.7381591796875, -0.711669921875, -0.6851806640625, -0.65869140625, -0.6322021484375, -0.605712890625, -0.5792236328125, -0.552734375, -0.5262451171875, -0.499755859375, -0.4732666015625, -0.44677734375, -0.4202880859375, -0.393798828125, -0.3673095703125, -0.3408203125, -0.3143310546875, -0.287841796875, -0.2613525390625, -0.23486328125, -0.2083740234375, -0.181884765625, -0.1553955078125, -0.12890625, -0.1024169921875, -0.075927734375, -0.0494384765625, -0.02294921875, 0.0035400390625, 0.030029296875, 0.0565185546875, 0.0830078125, 0.1094970703125, 0.135986328125, 0.1624755859375, 0.18896484375, 0.2154541015625, 0.241943359375, 0.2684326171875, 0.294921875, 0.3214111328125, 0.347900390625, 0.3743896484375, 0.40087890625, 0.4273681640625, 0.453857421875, 0.4803466796875, 0.5068359375, 0.5333251953125, 0.559814453125, 0.5863037109375, 0.61279296875, 0.6392822265625, 0.665771484375, 0.6922607421875, 0.71875, 0.7452392578125, 0.771728515625, 0.7982177734375, 0.82470703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 5.0, 14.0, 12.0, 16.0, 30.0, 45.0, 69.0, 109.0, 140.0, 238.0, 333.0, 491.0, 700.0, 1079.0, 1672.0, 2328.0, 3594.0, 5436.0, 8056.0, 12188.0, 18467.0, 27712.0, 41645.0, 62317.0, 91831.0, 127587.0, 1164733.0, 179094.0, 111715.0, 77961.0, 52939.0, 34688.0, 23624.0, 15489.0, 10287.0, 6712.0, 4539.0, 3035.0, 2013.0, 1343.0, 927.0, 614.0, 436.0, 298.0, 195.0, 138.0, 82.0, 59.0, 29.0, 20.0, 28.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08331298828125, -0.08060646057128906, -0.07789993286132812, -0.07519340515136719, -0.07248687744140625, -0.06978034973144531, -0.06707382202148438, -0.06436729431152344, -0.0616607666015625, -0.05895423889160156, -0.056247711181640625, -0.05354118347167969, -0.05083465576171875, -0.04812812805175781, -0.045421600341796875, -0.04271507263183594, -0.040008544921875, -0.03730201721191406, -0.034595489501953125, -0.03188896179199219, -0.02918243408203125, -0.026475906372070312, -0.023769378662109375, -0.021062850952148438, -0.0183563232421875, -0.015649795532226562, -0.012943267822265625, -0.010236740112304688, -0.00753021240234375, -0.0048236846923828125, -0.002117156982421875, 0.0005893707275390625, 0.0032958984375, 0.0060024261474609375, 0.008708953857421875, 0.011415481567382812, 0.01412200927734375, 0.016828536987304688, 0.019535064697265625, 0.022241592407226562, 0.0249481201171875, 0.027654647827148438, 0.030361175537109375, 0.03306770324707031, 0.03577423095703125, 0.03848075866699219, 0.041187286376953125, 0.04389381408691406, 0.046600341796875, 0.04930686950683594, 0.052013397216796875, 0.05471992492675781, 0.05742645263671875, 0.06013298034667969, 0.06283950805664062, 0.06554603576660156, 0.0682525634765625, 0.07095909118652344, 0.07366561889648438, 0.07637214660644531, 0.07907867431640625, 0.08178520202636719, 0.08449172973632812, 0.08719825744628906, 0.08990478515625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 3.0, 6.0, 2.0, 14.0, 10.0, 13.0, 17.0, 21.0, 19.0, 47.0, 53.0, 70.0, 55.0, 71.0, 100.0, 82.0, 82.0, 48.0, 61.0, 42.0, 40.0, 35.0, 20.0, 9.0, 14.0, 11.0, 13.0, 9.0, 8.0, 8.0, 9.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0033817291259765625, -0.0032904446125030518, -0.003199160099029541, -0.0031078755855560303, -0.0030165910720825195, -0.002925306558609009, -0.002834022045135498, -0.0027427375316619873, -0.0026514530181884766, -0.002560168504714966, -0.002468883991241455, -0.0023775994777679443, -0.0022863149642944336, -0.002195030450820923, -0.002103745937347412, -0.0020124614238739014, -0.0019211769104003906, -0.0018298923969268799, -0.0017386078834533691, -0.0016473233699798584, -0.0015560388565063477, -0.001464754343032837, -0.0013734698295593262, -0.0012821853160858154, -0.0011909008026123047, -0.001099616289138794, -0.0010083317756652832, -0.0009170472621917725, -0.0008257627487182617, -0.000734478235244751, -0.0006431937217712402, -0.0005519092082977295, -0.00046062469482421875, -0.000369340181350708, -0.00027805566787719727, -0.00018677115440368652, -9.548664093017578e-05, -4.202127456665039e-06, 8.70823860168457e-05, 0.00017836689949035645, 0.0002696514129638672, 0.00036093592643737793, 0.00045222043991088867, 0.0005435049533843994, 0.0006347894668579102, 0.0007260739803314209, 0.0008173584938049316, 0.0009086430072784424, 0.0009999275207519531, 0.0010912120342254639, 0.0011824965476989746, 0.0012737810611724854, 0.001365065574645996, 0.0014563500881195068, 0.0015476346015930176, 0.0016389191150665283, 0.001730203628540039, 0.0018214881420135498, 0.0019127726554870605, 0.0020040571689605713, 0.002095341682434082, 0.0021866261959075928, 0.0022779107093811035, 0.0023691952228546143, 0.002460479736328125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 8.0, 23.0, 18.0, 20.0, 28.0, 39.0, 54.0, 62.0, 98.0, 160.0, 217.0, 354.0, 639.0, 14074.0, 1025454.0, 5693.0, 548.0, 294.0, 220.0, 148.0, 85.0, 69.0, 43.0, 38.0, 24.0, 41.0, 19.0, 27.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05126953125, -0.049637794494628906, -0.04800605773925781, -0.04637432098388672, -0.044742584228515625, -0.04311084747314453, -0.04147911071777344, -0.039847373962402344, -0.03821563720703125, -0.036583900451660156, -0.03495216369628906, -0.03332042694091797, -0.031688690185546875, -0.03005695343017578, -0.028425216674804688, -0.026793479919433594, -0.0251617431640625, -0.023530006408691406, -0.021898269653320312, -0.02026653289794922, -0.018634796142578125, -0.01700305938720703, -0.015371322631835938, -0.013739585876464844, -0.01210784912109375, -0.010476112365722656, -0.008844375610351562, -0.007212638854980469, -0.005580902099609375, -0.003949165344238281, -0.0023174285888671875, -0.0006856918334960938, 0.000946044921875, 0.0025777816772460938, 0.0042095184326171875, 0.005841255187988281, 0.007472991943359375, 0.009104728698730469, 0.010736465454101562, 0.012368202209472656, 0.01399993896484375, 0.015631675720214844, 0.017263412475585938, 0.01889514923095703, 0.020526885986328125, 0.02215862274169922, 0.023790359497070312, 0.025422096252441406, 0.0270538330078125, 0.028685569763183594, 0.030317306518554688, 0.03194904327392578, 0.033580780029296875, 0.03521251678466797, 0.03684425354003906, 0.038475990295410156, 0.04010772705078125, 0.041739463806152344, 0.04337120056152344, 0.04500293731689453, 0.046634674072265625, 0.04826641082763672, 0.04989814758300781, 0.051529884338378906, 0.05316162109375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 748.0, 266.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05945118889212608, -0.05809766799211502, -0.05674414709210396, -0.055390626192092896, -0.05403710529208183, -0.05268358439207077, -0.051330067217350006, -0.049976546317338943, -0.04862302541732788, -0.04726950451731682, -0.045915983617305756, -0.04456246271729469, -0.04320894181728363, -0.041855424642562866, -0.040501900017261505, -0.03914838284254074, -0.03779485821723938, -0.03644133731722832, -0.035087816417217255, -0.03373429551720619, -0.03238077461719513, -0.031027255579829216, -0.029673734679818153, -0.02832021564245224, -0.026966694742441177, -0.025613173842430115, -0.024259652942419052, -0.02290613204240799, -0.021552613005042076, -0.020199092105031013, -0.01884557120501995, -0.017492052167654037, -0.016138533130288124, -0.014785012230277061, -0.013431492261588573, -0.01207797136157751, -0.010724451392889023, -0.00937093049287796, -0.008017409592866898, -0.00666388962417841, -0.005310368724167347, -0.003956848289817572, -0.0026033276226371527, -0.0012498069554567337, 0.00010371347889304161, 0.001457233913242817, 0.0028107548132538795, 0.0041642747819423676, 0.00551779568195343, 0.0068713161163032055, 0.00822483655065298, 0.009578357450664043, 0.010931877419352531, 0.012285398319363594, 0.013638919219374657, 0.014992439188063145, 0.016345959156751633, 0.017699480056762695, 0.019053000956773758, 0.02040652185678482, 0.021760040894150734, 0.023113561794161797, 0.02446708269417286, 0.025820601731538773, 0.027174124494194984]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 13.0, 22.0, 27.0, 47.0, 38.0, 77.0, 68.0, 77.0, 90.0, 99.0, 91.0, 65.0, 71.0, 50.0, 51.0, 37.0, 29.0, 22.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004184544086456299, -0.004071698524057865, -0.0039588529616594315, -0.0038460073992609978, -0.003733161836862564, -0.0036203162744641304, -0.0035074707120656967, -0.003394625149667263, -0.0032817795872688293, -0.0031689340248703957, -0.003056088462471962, -0.0029432429000735283, -0.0028303973376750946, -0.002717551775276661, -0.0026047062128782272, -0.0024918606504797935, -0.00237901508808136, -0.002266169525682926, -0.0021533239632844925, -0.002040478400886059, -0.0019276328384876251, -0.0018147872760891914, -0.0017019417136907578, -0.001589096151292324, -0.0014762505888938904, -0.0013634050264954567, -0.001250559464097023, -0.0011377139016985893, -0.0010248683393001556, -0.000912022776901722, -0.0007991772145032883, -0.0006863316521048546, -0.0005734860897064209, -0.0004606405273079872, -0.00034779496490955353, -0.00023494940251111984, -0.00012210384011268616, -9.258277714252472e-06, 0.00010358728468418121, 0.0002164328470826149, 0.0003292784094810486, 0.00044212397187948227, 0.000554969534277916, 0.0006678150966763496, 0.0007806606590747833, 0.000893506221473217, 0.0010063517838716507, 0.0011191973462700844, 0.001232042908668518, 0.0013448884710669518, 0.0014577340334653854, 0.0015705795958638191, 0.0016834251582622528, 0.0017962707206606865, 0.0019091162830591202, 0.002021961845457554, 0.0021348074078559875, 0.0022476529702544212, 0.002360498532652855, 0.0024733440950512886, 0.0025861896574497223, 0.002699035219848156, 0.0028118807822465897, 0.0029247263446450233, 0.003037571907043457]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 10.0, 7.0, 12.0, 10.0, 16.0, 21.0, 20.0, 24.0, 28.0, 24.0, 27.0, 43.0, 27.0, 36.0, 36.0, 31.0, 48.0, 34.0, 52.0, 44.0, 41.0, 37.0, 43.0, 34.0, 34.0, 30.0, 25.0, 18.0, 18.0, 24.0, 22.0, 23.0, 13.0, 17.0, 9.0, 8.0, 11.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.24969482421875, -1.2054443359375, -1.16119384765625, -1.116943359375, -1.07269287109375, -1.0284423828125, -0.98419189453125, -0.93994140625, -0.89569091796875, -0.8514404296875, -0.80718994140625, -0.762939453125, -0.71868896484375, -0.6744384765625, -0.63018798828125, -0.5859375, -0.54168701171875, -0.4974365234375, -0.45318603515625, -0.408935546875, -0.36468505859375, -0.3204345703125, -0.27618408203125, -0.23193359375, -0.18768310546875, -0.1434326171875, -0.09918212890625, -0.054931640625, -0.01068115234375, 0.0335693359375, 0.07781982421875, 0.1220703125, 0.16632080078125, 0.2105712890625, 0.25482177734375, 0.299072265625, 0.34332275390625, 0.3875732421875, 0.43182373046875, 0.47607421875, 0.52032470703125, 0.5645751953125, 0.60882568359375, 0.653076171875, 0.69732666015625, 0.7415771484375, 0.78582763671875, 0.830078125, 0.87432861328125, 0.9185791015625, 0.96282958984375, 1.007080078125, 1.05133056640625, 1.0955810546875, 1.13983154296875, 1.18408203125, 1.22833251953125, 1.2725830078125, 1.31683349609375, 1.361083984375, 1.40533447265625, 1.4495849609375, 1.49383544921875, 1.5380859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 1.0, 5.0, 13.0, 14.0, 22.0, 24.0, 43.0, 62.0, 90.0, 149.0, 220.0, 320.0, 591.0, 983.0, 1945.0, 4007.0, 9508.0, 25588.0, 71569.0, 193299.0, 359060.0, 236210.0, 91118.0, 31986.0, 11819.0, 4791.0, 2220.0, 1161.0, 647.0, 386.0, 250.0, 166.0, 91.0, 63.0, 47.0, 32.0, 20.0, 18.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8876953125, -1.8260345458984375, -1.764373779296875, -1.7027130126953125, -1.64105224609375, -1.5793914794921875, -1.517730712890625, -1.4560699462890625, -1.3944091796875, -1.3327484130859375, -1.271087646484375, -1.2094268798828125, -1.14776611328125, -1.0861053466796875, -1.024444580078125, -0.9627838134765625, -0.901123046875, -0.8394622802734375, -0.777801513671875, -0.7161407470703125, -0.65447998046875, -0.5928192138671875, -0.531158447265625, -0.4694976806640625, -0.4078369140625, -0.3461761474609375, -0.284515380859375, -0.2228546142578125, -0.16119384765625, -0.0995330810546875, -0.037872314453125, 0.0237884521484375, 0.08544921875, 0.1471099853515625, 0.208770751953125, 0.2704315185546875, 0.33209228515625, 0.3937530517578125, 0.455413818359375, 0.5170745849609375, 0.5787353515625, 0.6403961181640625, 0.702056884765625, 0.7637176513671875, 0.82537841796875, 0.8870391845703125, 0.948699951171875, 1.0103607177734375, 1.072021484375, 1.1336822509765625, 1.195343017578125, 1.2570037841796875, 1.31866455078125, 1.3803253173828125, 1.441986083984375, 1.5036468505859375, 1.5653076171875, 1.6269683837890625, 1.688629150390625, 1.7502899169921875, 1.81195068359375, 1.8736114501953125, 1.935272216796875, 1.9969329833984375, 2.05859375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 11.0, 9.0, 18.0, 14.0, 20.0, 13.0, 35.0, 23.0, 26.0, 35.0, 51.0, 44.0, 42.0, 53.0, 80.0, 155.0, 360.0, 1396.0, 149.0, 96.0, 50.0, 53.0, 46.0, 40.0, 31.0, 29.0, 24.0, 22.0, 18.0, 14.0, 9.0, 14.0, 18.0, 7.0, 3.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.28515625, -5.12506103515625, -4.9649658203125, -4.80487060546875, -4.644775390625, -4.48468017578125, -4.3245849609375, -4.16448974609375, -4.00439453125, -3.84429931640625, -3.6842041015625, -3.52410888671875, -3.364013671875, -3.20391845703125, -3.0438232421875, -2.88372802734375, -2.7236328125, -2.56353759765625, -2.4034423828125, -2.24334716796875, -2.083251953125, -1.92315673828125, -1.7630615234375, -1.60296630859375, -1.44287109375, -1.28277587890625, -1.1226806640625, -0.96258544921875, -0.802490234375, -0.64239501953125, -0.4822998046875, -0.32220458984375, -0.162109375, -0.00201416015625, 0.1580810546875, 0.31817626953125, 0.478271484375, 0.63836669921875, 0.7984619140625, 0.95855712890625, 1.11865234375, 1.27874755859375, 1.4388427734375, 1.59893798828125, 1.759033203125, 1.91912841796875, 2.0792236328125, 2.23931884765625, 2.3994140625, 2.55950927734375, 2.7196044921875, 2.87969970703125, 3.039794921875, 3.19989013671875, 3.3599853515625, 3.52008056640625, 3.68017578125, 3.84027099609375, 4.0003662109375, 4.16046142578125, 4.320556640625, 4.48065185546875, 4.6407470703125, 4.80084228515625, 4.9609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 16.0, 7.0, 16.0, 13.0, 12.0, 13.0, 21.0, 20.0, 30.0, 46.0, 57.0, 67.0, 107.0, 230.0, 506.0, 1474.0, 15366.0, 2257505.0, 859310.0, 8627.0, 1216.0, 393.0, 187.0, 114.0, 63.0, 55.0, 33.0, 35.0, 27.0, 23.0, 20.0, 13.0, 22.0, 11.0, 8.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0625, -9.7369384765625, -9.411376953125, -9.0858154296875, -8.76025390625, -8.4346923828125, -8.109130859375, -7.7835693359375, -7.4580078125, -7.1324462890625, -6.806884765625, -6.4813232421875, -6.15576171875, -5.8302001953125, -5.504638671875, -5.1790771484375, -4.853515625, -4.5279541015625, -4.202392578125, -3.8768310546875, -3.55126953125, -3.2257080078125, -2.900146484375, -2.5745849609375, -2.2490234375, -1.9234619140625, -1.597900390625, -1.2723388671875, -0.94677734375, -0.6212158203125, -0.295654296875, 0.0299072265625, 0.35546875, 0.6810302734375, 1.006591796875, 1.3321533203125, 1.65771484375, 1.9832763671875, 2.308837890625, 2.6343994140625, 2.9599609375, 3.2855224609375, 3.611083984375, 3.9366455078125, 4.26220703125, 4.5877685546875, 4.913330078125, 5.2388916015625, 5.564453125, 5.8900146484375, 6.215576171875, 6.5411376953125, 6.86669921875, 7.1922607421875, 7.517822265625, 7.8433837890625, 8.1689453125, 8.4945068359375, 8.820068359375, 9.1456298828125, 9.47119140625, 9.7967529296875, 10.122314453125, 10.4478759765625, 10.7734375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 9.0, 38.0, 242.0, 463.0, 225.0, 32.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.20339584350586, -45.353675842285156, -44.50395202636719, -43.654232025146484, -42.80451202392578, -41.95479202270508, -41.105072021484375, -40.255348205566406, -39.4056282043457, -38.555908203125, -37.70618438720703, -36.85646438598633, -36.006744384765625, -35.15702438354492, -34.30730438232422, -33.45758056640625, -32.60786056518555, -31.758140563964844, -30.908418655395508, -30.058696746826172, -29.20897674560547, -28.359256744384766, -27.50953483581543, -26.659812927246094, -25.81009292602539, -24.960372924804688, -24.11065101623535, -23.260929107666016, -22.411209106445312, -21.56148910522461, -20.711767196655273, -19.862045288085938, -19.012327194213867, -18.16260528564453, -17.312885284423828, -16.463165283203125, -15.613443374633789, -14.76372241973877, -13.91400146484375, -13.06428050994873, -12.214559555053711, -11.364838600158691, -10.515117645263672, -9.665396690368652, -8.815675735473633, -7.965954780578613, -7.116233825683594, -6.266512870788574, -5.416791915893555, -4.567070960998535, -3.7173500061035156, -2.867629051208496, -2.0179080963134766, -1.168187141418457, -0.3184661865234375, 0.531254768371582, 1.3809757232666016, 2.230696678161621, 3.0804176330566406, 3.93013858795166, 4.77985954284668, 5.629580497741699, 6.479301452636719, 7.329022407531738, 8.178743362426758]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 14.0, 12.0, 13.0, 11.0, 15.0, 20.0, 27.0, 25.0, 23.0, 25.0, 26.0, 30.0, 26.0, 35.0, 39.0, 41.0, 45.0, 31.0, 39.0, 43.0, 38.0, 34.0, 34.0, 40.0, 23.0, 28.0, 23.0, 30.0, 34.0, 24.0, 19.0, 23.0, 16.0, 7.0, 10.0, 15.0, 8.0, 3.0, 6.0, 7.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 4.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.750160217285156, -13.298480987548828, -12.846802711486816, -12.395123481750488, -11.943445205688477, -11.491765975952148, -11.04008674621582, -10.588407516479492, -10.13672924041748, -9.685050010681152, -9.23337173461914, -8.781692504882812, -8.330013275146484, -7.878334999084473, -7.4266557693481445, -6.974977016448975, -6.523298263549805, -6.071619510650635, -5.619940757751465, -5.168261528015137, -4.716582775115967, -4.264904022216797, -3.813225030899048, -3.361546039581299, -2.909867286682129, -2.458188533782959, -2.00650954246521, -1.5548306703567505, -1.103151798248291, -0.6514730453491211, -0.19979405403137207, 0.25188493728637695, 0.7035636901855469, 1.1552425622940063, 1.6069214344024658, 2.058600425720215, 2.5102791786193848, 2.9619579315185547, 3.4136369228363037, 3.8653159141540527, 4.316994667053223, 4.768673419952393, 5.2203521728515625, 5.672031402587891, 6.1237101554870605, 6.5753889083862305, 7.027068138122559, 7.4787468910217285, 7.930425643920898, 8.382104873657227, 8.833783149719238, 9.285462379455566, 9.737140655517578, 10.188819885253906, 10.640499114990234, 11.092178344726562, 11.543856620788574, 11.995535850524902, 12.447214126586914, 12.898893356323242, 13.35057258605957, 13.802250862121582, 14.25393009185791, 14.705608367919922, 15.15728759765625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 10.0, 6.0, 3.0, 8.0, 11.0, 13.0, 18.0, 9.0, 31.0, 25.0, 19.0, 26.0, 24.0, 42.0, 24.0, 36.0, 37.0, 42.0, 36.0, 54.0, 31.0, 55.0, 30.0, 48.0, 37.0, 27.0, 39.0, 29.0, 29.0, 19.0, 24.0, 23.0, 20.0, 19.0, 20.0, 14.0, 11.0, 10.0, 8.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3076171875, -1.2619171142578125, -1.216217041015625, -1.1705169677734375, -1.12481689453125, -1.0791168212890625, -1.033416748046875, -0.9877166748046875, -0.9420166015625, -0.8963165283203125, -0.850616455078125, -0.8049163818359375, -0.75921630859375, -0.7135162353515625, -0.667816162109375, -0.6221160888671875, -0.576416015625, -0.5307159423828125, -0.485015869140625, -0.4393157958984375, -0.39361572265625, -0.3479156494140625, -0.302215576171875, -0.2565155029296875, -0.2108154296875, -0.1651153564453125, -0.119415283203125, -0.0737152099609375, -0.02801513671875, 0.0176849365234375, 0.063385009765625, 0.1090850830078125, 0.15478515625, 0.2004852294921875, 0.246185302734375, 0.2918853759765625, 0.33758544921875, 0.3832855224609375, 0.428985595703125, 0.4746856689453125, 0.5203857421875, 0.5660858154296875, 0.611785888671875, 0.6574859619140625, 0.70318603515625, 0.7488861083984375, 0.794586181640625, 0.8402862548828125, 0.885986328125, 0.9316864013671875, 0.977386474609375, 1.0230865478515625, 1.06878662109375, 1.1144866943359375, 1.160186767578125, 1.2058868408203125, 1.2515869140625, 1.2972869873046875, 1.342987060546875, 1.3886871337890625, 1.43438720703125, 1.4800872802734375, 1.525787353515625, 1.5714874267578125, 1.6171875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 5.0, 13.0, 8.0, 12.0, 32.0, 21.0, 26.0, 35.0, 45.0, 52.0, 91.0, 122.0, 197.0, 365.0, 783.0, 1912.0, 5794.0, 21884.0, 111629.0, 898405.0, 2619273.0, 447425.0, 65387.0, 14003.0, 3978.0, 1323.0, 538.0, 333.0, 175.0, 107.0, 60.0, 50.0, 34.0, 43.0, 26.0, 16.0, 14.0, 21.0, 9.0, 8.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.078125, -4.92584228515625, -4.7735595703125, -4.62127685546875, -4.468994140625, -4.31671142578125, -4.1644287109375, -4.01214599609375, -3.85986328125, -3.70758056640625, -3.5552978515625, -3.40301513671875, -3.250732421875, -3.09844970703125, -2.9461669921875, -2.79388427734375, -2.6416015625, -2.48931884765625, -2.3370361328125, -2.18475341796875, -2.032470703125, -1.88018798828125, -1.7279052734375, -1.57562255859375, -1.42333984375, -1.27105712890625, -1.1187744140625, -0.96649169921875, -0.814208984375, -0.66192626953125, -0.5096435546875, -0.35736083984375, -0.205078125, -0.05279541015625, 0.0994873046875, 0.25177001953125, 0.404052734375, 0.55633544921875, 0.7086181640625, 0.86090087890625, 1.01318359375, 1.16546630859375, 1.3177490234375, 1.47003173828125, 1.622314453125, 1.77459716796875, 1.9268798828125, 2.07916259765625, 2.2314453125, 2.38372802734375, 2.5360107421875, 2.68829345703125, 2.840576171875, 2.99285888671875, 3.1451416015625, 3.29742431640625, 3.44970703125, 3.60198974609375, 3.7542724609375, 3.90655517578125, 4.058837890625, 4.21112060546875, 4.3634033203125, 4.51568603515625, 4.66796875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 8.0, 14.0, 13.0, 19.0, 23.0, 29.0, 52.0, 67.0, 87.0, 103.0, 190.0, 251.0, 362.0, 432.0, 483.0, 569.0, 354.0, 310.0, 192.0, 131.0, 100.0, 88.0, 58.0, 35.0, 34.0, 17.0, 18.0, 7.0, 11.0, 12.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.44140625, -6.26611328125, -6.0908203125, -5.91552734375, -5.740234375, -5.56494140625, -5.3896484375, -5.21435546875, -5.0390625, -4.86376953125, -4.6884765625, -4.51318359375, -4.337890625, -4.16259765625, -3.9873046875, -3.81201171875, -3.63671875, -3.46142578125, -3.2861328125, -3.11083984375, -2.935546875, -2.76025390625, -2.5849609375, -2.40966796875, -2.234375, -2.05908203125, -1.8837890625, -1.70849609375, -1.533203125, -1.35791015625, -1.1826171875, -1.00732421875, -0.83203125, -0.65673828125, -0.4814453125, -0.30615234375, -0.130859375, 0.04443359375, 0.2197265625, 0.39501953125, 0.5703125, 0.74560546875, 0.9208984375, 1.09619140625, 1.271484375, 1.44677734375, 1.6220703125, 1.79736328125, 1.97265625, 2.14794921875, 2.3232421875, 2.49853515625, 2.673828125, 2.84912109375, 3.0244140625, 3.19970703125, 3.375, 3.55029296875, 3.7255859375, 3.90087890625, 4.076171875, 4.25146484375, 4.4267578125, 4.60205078125, 4.77734375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 12.0, 7.0, 13.0, 22.0, 23.0, 38.0, 68.0, 85.0, 155.0, 233.0, 403.0, 671.0, 1463.0, 3540.0, 12252.0, 60184.0, 388282.0, 2429711.0, 1107988.0, 151855.0, 26409.0, 6319.0, 2177.0, 944.0, 536.0, 323.0, 199.0, 112.0, 84.0, 52.0, 37.0, 26.0, 19.0, 8.0, 5.0, 10.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.369873046875, -6.12255859375, -5.875244140625, -5.6279296875, -5.380615234375, -5.13330078125, -4.885986328125, -4.638671875, -4.391357421875, -4.14404296875, -3.896728515625, -3.6494140625, -3.402099609375, -3.15478515625, -2.907470703125, -2.66015625, -2.412841796875, -2.16552734375, -1.918212890625, -1.6708984375, -1.423583984375, -1.17626953125, -0.928955078125, -0.681640625, -0.434326171875, -0.18701171875, 0.060302734375, 0.3076171875, 0.554931640625, 0.80224609375, 1.049560546875, 1.296875, 1.544189453125, 1.79150390625, 2.038818359375, 2.2861328125, 2.533447265625, 2.78076171875, 3.028076171875, 3.275390625, 3.522705078125, 3.77001953125, 4.017333984375, 4.2646484375, 4.511962890625, 4.75927734375, 5.006591796875, 5.25390625, 5.501220703125, 5.74853515625, 5.995849609375, 6.2431640625, 6.490478515625, 6.73779296875, 6.985107421875, 7.232421875, 7.479736328125, 7.72705078125, 7.974365234375, 8.2216796875, 8.468994140625, 8.71630859375, 8.963623046875, 9.2109375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 20.0, 36.0, 78.0, 156.0, 168.0, 209.0, 163.0, 100.0, 47.0, 18.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.31755828857422, -49.15058517456055, -47.983612060546875, -46.81663513183594, -45.649662017822266, -44.482688903808594, -43.315711975097656, -42.148738861083984, -40.98176574707031, -39.81479263305664, -38.64781951904297, -37.48084259033203, -36.31386947631836, -35.14689636230469, -33.97991943359375, -32.81294631958008, -31.645973205566406, -30.479000091552734, -29.31202507019043, -28.145050048828125, -26.978076934814453, -25.81110382080078, -24.644128799438477, -23.477153778076172, -22.3101806640625, -21.143207550048828, -19.976232528686523, -18.80925750732422, -17.642284393310547, -16.475311279296875, -15.30833625793457, -14.141362190246582, -12.97439193725586, -11.807417869567871, -10.640443801879883, -9.473469734191895, -8.306495666503906, -7.139521598815918, -5.97254753112793, -4.805573463439941, -3.638599395751953, -2.471625328063965, -1.3046512603759766, -0.13767719268798828, 1.029296875, 2.1962709426879883, 3.3632450103759766, 4.530219078063965, 5.697193145751953, 6.864167213439941, 8.03114128112793, 9.198115348815918, 10.365089416503906, 11.532063484191895, 12.699037551879883, 13.866011619567871, 15.03298568725586, 16.19995880126953, 17.366933822631836, 18.53390884399414, 19.700881958007812, 20.867855072021484, 22.03483009338379, 23.201805114746094, 24.368778228759766]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 7.0, 10.0, 22.0, 22.0, 19.0, 17.0, 19.0, 18.0, 27.0, 40.0, 42.0, 31.0, 44.0, 38.0, 39.0, 47.0, 42.0, 45.0, 44.0, 37.0, 42.0, 35.0, 36.0, 42.0, 32.0, 24.0, 25.0, 20.0, 16.0, 20.0, 9.0, 28.0, 11.0, 10.0, 9.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.64270782470703, -16.109790802001953, -15.576874732971191, -15.043957710266113, -14.511041641235352, -13.978124618530273, -13.445207595825195, -12.912291526794434, -12.379375457763672, -11.846458435058594, -11.313542366027832, -10.780625343322754, -10.247709274291992, -9.714792251586914, -9.181875228881836, -8.648959159851074, -8.116042137145996, -7.583125591278076, -7.050209045410156, -6.517292022705078, -5.984375953674316, -5.451458930969238, -4.918542385101318, -4.385625839233398, -3.8527092933654785, -3.3197927474975586, -2.7868762016296387, -2.2539594173431396, -1.7210428714752197, -1.1881263256072998, -0.6552095413208008, -0.12229299545288086, 0.41062355041503906, 0.9435401558876038, 1.4764567613601685, 2.009373426437378, 2.542289972305298, 3.0752065181732178, 3.608123302459717, 4.141039848327637, 4.673956394195557, 5.206872940063477, 5.7397894859313965, 6.272706031799316, 6.8056230545043945, 7.338539123535156, 7.871456146240234, 8.404373168945312, 8.937289237976074, 9.470206260681152, 10.003122329711914, 10.536039352416992, 11.068955421447754, 11.601872444152832, 12.134788513183594, 12.667705535888672, 13.20062255859375, 13.733539581298828, 14.26645565032959, 14.799372673034668, 15.33228874206543, 15.865205764770508, 16.398122787475586, 16.93103790283203, 17.46395492553711]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 5.0, 5.0, 5.0, 5.0, 7.0, 12.0, 14.0, 16.0, 24.0, 22.0, 14.0, 21.0, 26.0, 26.0, 24.0, 34.0, 28.0, 34.0, 31.0, 49.0, 39.0, 55.0, 44.0, 36.0, 36.0, 38.0, 24.0, 42.0, 34.0, 32.0, 28.0, 31.0, 28.0, 17.0, 14.0, 10.0, 12.0, 21.0, 11.0, 15.0, 4.0, 8.0, 6.0, 11.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.3777618408203125, -1.330718994140625, -1.2836761474609375, -1.23663330078125, -1.1895904541015625, -1.142547607421875, -1.0955047607421875, -1.0484619140625, -1.0014190673828125, -0.954376220703125, -0.9073333740234375, -0.86029052734375, -0.8132476806640625, -0.766204833984375, -0.7191619873046875, -0.672119140625, -0.6250762939453125, -0.578033447265625, -0.5309906005859375, -0.48394775390625, -0.4369049072265625, -0.389862060546875, -0.3428192138671875, -0.2957763671875, -0.2487335205078125, -0.201690673828125, -0.1546478271484375, -0.10760498046875, -0.0605621337890625, -0.013519287109375, 0.0335235595703125, 0.08056640625, 0.1276092529296875, 0.174652099609375, 0.2216949462890625, 0.26873779296875, 0.3157806396484375, 0.362823486328125, 0.4098663330078125, 0.4569091796875, 0.5039520263671875, 0.550994873046875, 0.5980377197265625, 0.64508056640625, 0.6921234130859375, 0.739166259765625, 0.7862091064453125, 0.833251953125, 0.8802947998046875, 0.927337646484375, 0.9743804931640625, 1.02142333984375, 1.0684661865234375, 1.115509033203125, 1.1625518798828125, 1.2095947265625, 1.2566375732421875, 1.303680419921875, 1.3507232666015625, 1.39776611328125, 1.4448089599609375, 1.491851806640625, 1.5388946533203125, 1.5859375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 8.0, 7.0, 13.0, 16.0, 42.0, 37.0, 61.0, 91.0, 123.0, 196.0, 280.0, 353.0, 560.0, 743.0, 991.0, 1435.0, 2051.0, 2979.0, 4150.0, 5890.0, 8596.0, 12222.0, 18308.0, 26642.0, 40241.0, 60836.0, 92807.0, 139895.0, 181206.0, 148258.0, 99341.0, 65721.0, 43090.0, 28613.0, 19327.0, 13192.0, 9143.0, 6346.0, 4265.0, 3126.0, 2112.0, 1509.0, 1084.0, 809.0, 548.0, 383.0, 261.0, 226.0, 138.0, 105.0, 56.0, 53.0, 27.0, 26.0, 10.0, 8.0, 5.0, 5.0, 1.0, 3.0], "bins": [-0.1434326171875, -0.13903045654296875, -0.1346282958984375, -0.13022613525390625, -0.125823974609375, -0.12142181396484375, -0.1170196533203125, -0.11261749267578125, -0.10821533203125, -0.10381317138671875, -0.0994110107421875, -0.09500885009765625, -0.090606689453125, -0.08620452880859375, -0.0818023681640625, -0.07740020751953125, -0.072998046875, -0.06859588623046875, -0.0641937255859375, -0.05979156494140625, -0.055389404296875, -0.05098724365234375, -0.0465850830078125, -0.04218292236328125, -0.03778076171875, -0.03337860107421875, -0.0289764404296875, -0.02457427978515625, -0.020172119140625, -0.01576995849609375, -0.0113677978515625, -0.00696563720703125, -0.0025634765625, 0.00183868408203125, 0.0062408447265625, 0.01064300537109375, 0.015045166015625, 0.01944732666015625, 0.0238494873046875, 0.02825164794921875, 0.03265380859375, 0.03705596923828125, 0.0414581298828125, 0.04586029052734375, 0.050262451171875, 0.05466461181640625, 0.0590667724609375, 0.06346893310546875, 0.06787109375, 0.07227325439453125, 0.0766754150390625, 0.08107757568359375, 0.085479736328125, 0.08988189697265625, 0.0942840576171875, 0.09868621826171875, 0.10308837890625, 0.10749053955078125, 0.1118927001953125, 0.11629486083984375, 0.120697021484375, 0.12509918212890625, 0.1295013427734375, 0.13390350341796875, 0.1383056640625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 4.0, 2.0, 5.0, 9.0, 2.0, 6.0, 9.0, 13.0, 8.0, 8.0, 8.0, 21.0, 21.0, 16.0, 20.0, 29.0, 19.0, 31.0, 44.0, 29.0, 36.0, 38.0, 29.0, 29.0, 43.0, 1060.0, 37.0, 32.0, 33.0, 38.0, 40.0, 35.0, 26.0, 35.0, 22.0, 27.0, 29.0, 24.0, 26.0, 21.0, 9.0, 10.0, 13.0, 8.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.93896484375, -0.9089736938476562, -0.8789825439453125, -0.8489913940429688, -0.819000244140625, -0.7890090942382812, -0.7590179443359375, -0.7290267944335938, -0.69903564453125, -0.6690444946289062, -0.6390533447265625, -0.6090621948242188, -0.579071044921875, -0.5490798950195312, -0.5190887451171875, -0.48909759521484375, -0.4591064453125, -0.42911529541015625, -0.3991241455078125, -0.36913299560546875, -0.339141845703125, -0.30915069580078125, -0.2791595458984375, -0.24916839599609375, -0.21917724609375, -0.18918609619140625, -0.1591949462890625, -0.12920379638671875, -0.099212646484375, -0.06922149658203125, -0.0392303466796875, -0.00923919677734375, 0.020751953125, 0.05074310302734375, 0.0807342529296875, 0.11072540283203125, 0.140716552734375, 0.17070770263671875, 0.2006988525390625, 0.23069000244140625, 0.26068115234375, 0.29067230224609375, 0.3206634521484375, 0.35065460205078125, 0.380645751953125, 0.41063690185546875, 0.4406280517578125, 0.47061920166015625, 0.5006103515625, 0.5306015014648438, 0.5605926513671875, 0.5905838012695312, 0.620574951171875, 0.6505661010742188, 0.6805572509765625, 0.7105484008789062, 0.74053955078125, 0.7705307006835938, 0.8005218505859375, 0.8305130004882812, 0.860504150390625, 0.8904953002929688, 0.9204864501953125, 0.9504776000976562, 0.98046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 9.0, 13.0, 13.0, 14.0, 27.0, 32.0, 50.0, 82.0, 93.0, 171.0, 243.0, 342.0, 507.0, 716.0, 1052.0, 1567.0, 2227.0, 3355.0, 4675.0, 6818.0, 10218.0, 14783.0, 22013.0, 32023.0, 46690.0, 67936.0, 96290.0, 132028.0, 1181904.0, 142236.0, 101067.0, 71899.0, 49483.0, 33867.0, 23021.0, 15485.0, 10769.0, 7244.0, 5092.0, 3521.0, 2401.0, 1632.0, 1090.0, 754.0, 528.0, 353.0, 247.0, 166.0, 117.0, 68.0, 69.0, 47.0, 30.0, 16.0, 21.0, 10.0, 7.0, 3.0, 5.0, 0.0, 3.0], "bins": [-0.0882568359375, -0.08546161651611328, -0.08266639709472656, -0.07987117767333984, -0.07707595825195312, -0.0742807388305664, -0.07148551940917969, -0.06869029998779297, -0.06589508056640625, -0.06309986114501953, -0.06030464172363281, -0.057509422302246094, -0.054714202880859375, -0.051918983459472656, -0.04912376403808594, -0.04632854461669922, -0.0435333251953125, -0.04073810577392578, -0.03794288635253906, -0.035147666931152344, -0.032352447509765625, -0.029557228088378906, -0.026762008666992188, -0.02396678924560547, -0.02117156982421875, -0.01837635040283203, -0.015581130981445312, -0.012785911560058594, -0.009990692138671875, -0.007195472717285156, -0.0044002532958984375, -0.0016050338745117188, 0.001190185546875, 0.003985404968261719, 0.0067806243896484375, 0.009575843811035156, 0.012371063232421875, 0.015166282653808594, 0.017961502075195312, 0.02075672149658203, 0.02355194091796875, 0.02634716033935547, 0.029142379760742188, 0.031937599182128906, 0.034732818603515625, 0.037528038024902344, 0.04032325744628906, 0.04311847686767578, 0.0459136962890625, 0.04870891571044922, 0.05150413513183594, 0.054299354553222656, 0.057094573974609375, 0.059889793395996094, 0.06268501281738281, 0.06548023223876953, 0.06827545166015625, 0.07107067108154297, 0.07386589050292969, 0.0766611099243164, 0.07945632934570312, 0.08225154876708984, 0.08504676818847656, 0.08784198760986328, 0.09063720703125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 7.0, 6.0, 10.0, 15.0, 16.0, 12.0, 20.0, 28.0, 27.0, 32.0, 40.0, 45.0, 33.0, 43.0, 56.0, 31.0, 63.0, 57.0, 59.0, 55.0, 39.0, 43.0, 36.0, 35.0, 38.0, 28.0, 24.0, 18.0, 16.0, 20.0, 8.0, 9.0, 4.0, 4.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.002971649169921875, -0.0028788745403289795, -0.002786099910736084, -0.0026933252811431885, -0.002600550651550293, -0.0025077760219573975, -0.002415001392364502, -0.0023222267627716064, -0.002229452133178711, -0.0021366775035858154, -0.00204390287399292, -0.0019511282444000244, -0.001858353614807129, -0.0017655789852142334, -0.0016728043556213379, -0.0015800297260284424, -0.0014872550964355469, -0.0013944804668426514, -0.0013017058372497559, -0.0012089312076568604, -0.0011161565780639648, -0.0010233819484710693, -0.0009306073188781738, -0.0008378326892852783, -0.0007450580596923828, -0.0006522834300994873, -0.0005595088005065918, -0.0004667341709136963, -0.0003739595413208008, -0.0002811849117279053, -0.00018841028213500977, -9.563565254211426e-05, -2.86102294921875e-06, 8.991360664367676e-05, 0.00018268823623657227, 0.0002754628658294678, 0.0003682374954223633, 0.0004610121250152588, 0.0005537867546081543, 0.0006465613842010498, 0.0007393360137939453, 0.0008321106433868408, 0.0009248852729797363, 0.0010176599025726318, 0.0011104345321655273, 0.0012032091617584229, 0.0012959837913513184, 0.0013887584209442139, 0.0014815330505371094, 0.0015743076801300049, 0.0016670823097229004, 0.001759856939315796, 0.0018526315689086914, 0.001945406198501587, 0.0020381808280944824, 0.002130955457687378, 0.0022237300872802734, 0.002316504716873169, 0.0024092793464660645, 0.00250205397605896, 0.0025948286056518555, 0.002687603235244751, 0.0027803778648376465, 0.002873152494430542, 0.0029659271240234375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 4.0, 13.0, 12.0, 20.0, 30.0, 26.0, 34.0, 55.0, 67.0, 78.0, 103.0, 127.0, 156.0, 228.0, 343.0, 850.0, 16819.0, 1006927.0, 20412.0, 864.0, 373.0, 248.0, 189.0, 117.0, 97.0, 82.0, 69.0, 46.0, 39.0, 27.0, 25.0, 19.0, 13.0, 4.0, 10.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0496826171875, -0.04805469512939453, -0.04642677307128906, -0.044798851013183594, -0.043170928955078125, -0.041543006896972656, -0.03991508483886719, -0.03828716278076172, -0.03665924072265625, -0.03503131866455078, -0.03340339660644531, -0.031775474548339844, -0.030147552490234375, -0.028519630432128906, -0.026891708374023438, -0.02526378631591797, -0.0236358642578125, -0.02200794219970703, -0.020380020141601562, -0.018752098083496094, -0.017124176025390625, -0.015496253967285156, -0.013868331909179688, -0.012240409851074219, -0.01061248779296875, -0.008984565734863281, -0.0073566436767578125, -0.005728721618652344, -0.004100799560546875, -0.0024728775024414062, -0.0008449554443359375, 0.0007829666137695312, 0.002410888671875, 0.004038810729980469, 0.0056667327880859375, 0.007294654846191406, 0.008922576904296875, 0.010550498962402344, 0.012178421020507812, 0.013806343078613281, 0.01543426513671875, 0.01706218719482422, 0.018690109252929688, 0.020318031311035156, 0.021945953369140625, 0.023573875427246094, 0.025201797485351562, 0.02682971954345703, 0.0284576416015625, 0.03008556365966797, 0.03171348571777344, 0.033341407775878906, 0.034969329833984375, 0.036597251892089844, 0.03822517395019531, 0.03985309600830078, 0.04148101806640625, 0.04310894012451172, 0.04473686218261719, 0.046364784240722656, 0.047992706298828125, 0.049620628356933594, 0.05124855041503906, 0.05287647247314453, 0.05450439453125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 993.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04610783979296684, -0.044237278401851654, -0.04236671328544617, -0.04049615189433098, -0.03862559050321579, -0.0367550291121006, -0.03488446772098541, -0.033013902604579926, -0.031143341213464737, -0.02927277982234955, -0.02740221656858921, -0.025531653314828873, -0.023661091923713684, -0.021790530532598495, -0.019919967278838158, -0.01804940402507782, -0.01617884263396263, -0.014308280311524868, -0.012437717989087105, -0.010567155666649342, -0.008696593344211578, -0.006826031021773815, -0.004955468699336052, -0.0030849063768982887, -0.0012143440544605255, 0.0006562182679772377, 0.002526780590415001, 0.004397342912852764, 0.006267905235290527, 0.00813846755772829, 0.010009029880166054, 0.011879592202603817, 0.013750158250331879, 0.015620720572769642, 0.017491282895207405, 0.019361846148967743, 0.02123240754008293, 0.02310296893119812, 0.024973532184958458, 0.026844095438718796, 0.028714656829833984, 0.030585218220949173, 0.03245577961206436, 0.03432634472846985, 0.03619690611958504, 0.038067467510700226, 0.03993803262710571, 0.0418085940182209, 0.04367915540933609, 0.04554971680045128, 0.04742027819156647, 0.049290843307971954, 0.05116140469908714, 0.05303196609020233, 0.05490253120660782, 0.05677309259772301, 0.058643653988838196, 0.060514215379953384, 0.06238477677106857, 0.06425534188747406, 0.06612589955329895, 0.06799646466970444, 0.06986702978610992, 0.07173758745193481, 0.0736081525683403]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 7.0, 12.0, 23.0, 30.0, 27.0, 47.0, 38.0, 44.0, 59.0, 59.0, 58.0, 72.0, 87.0, 68.0, 62.0, 56.0, 63.0, 37.0, 37.0, 35.0, 21.0, 21.0, 16.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004634082317352295, -0.004500299692153931, -0.004366517066955566, -0.004232734441757202, -0.004098951816558838, -0.003965169191360474, -0.0038313865661621094, -0.003697603940963745, -0.003563821315765381, -0.0034300386905670166, -0.0032962560653686523, -0.003162473440170288, -0.003028690814971924, -0.0028949081897735596, -0.0027611255645751953, -0.002627342939376831, -0.002493560314178467, -0.0023597776889801025, -0.0022259950637817383, -0.002092212438583374, -0.0019584298133850098, -0.0018246471881866455, -0.0016908645629882812, -0.001557081937789917, -0.0014232993125915527, -0.0012895166873931885, -0.0011557340621948242, -0.00102195143699646, -0.0008881688117980957, -0.0007543861865997314, -0.0006206035614013672, -0.00048682093620300293, -0.00035303831100463867, -0.00021925568580627441, -8.547306060791016e-05, 4.83095645904541e-05, 0.00018209218978881836, 0.0003158748149871826, 0.0004496574401855469, 0.0005834400653839111, 0.0007172226905822754, 0.0008510053157806396, 0.000984787940979004, 0.0011185705661773682, 0.0012523531913757324, 0.0013861358165740967, 0.001519918441772461, 0.0016537010669708252, 0.0017874836921691895, 0.0019212663173675537, 0.002055048942565918, 0.0021888315677642822, 0.0023226141929626465, 0.0024563968181610107, 0.002590179443359375, 0.0027239620685577393, 0.0028577446937561035, 0.0029915273189544678, 0.003125309944152832, 0.0032590925693511963, 0.0033928751945495605, 0.003526657819747925, 0.003660440444946289, 0.0037942230701446533, 0.003928005695343018]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 5.0, 5.0, 5.0, 5.0, 7.0, 12.0, 14.0, 16.0, 24.0, 22.0, 14.0, 21.0, 26.0, 26.0, 24.0, 34.0, 28.0, 34.0, 31.0, 49.0, 39.0, 55.0, 44.0, 36.0, 36.0, 38.0, 24.0, 42.0, 34.0, 32.0, 28.0, 31.0, 28.0, 17.0, 14.0, 10.0, 12.0, 21.0, 11.0, 15.0, 4.0, 8.0, 6.0, 11.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.3777618408203125, -1.330718994140625, -1.2836761474609375, -1.23663330078125, -1.1895904541015625, -1.142547607421875, -1.0955047607421875, -1.0484619140625, -1.0014190673828125, -0.954376220703125, -0.9073333740234375, -0.86029052734375, -0.8132476806640625, -0.766204833984375, -0.7191619873046875, -0.672119140625, -0.6250762939453125, -0.578033447265625, -0.5309906005859375, -0.48394775390625, -0.4369049072265625, -0.389862060546875, -0.3428192138671875, -0.2957763671875, -0.2487335205078125, -0.201690673828125, -0.1546478271484375, -0.10760498046875, -0.0605621337890625, -0.013519287109375, 0.0335235595703125, 0.08056640625, 0.1276092529296875, 0.174652099609375, 0.2216949462890625, 0.26873779296875, 0.3157806396484375, 0.362823486328125, 0.4098663330078125, 0.4569091796875, 0.5039520263671875, 0.550994873046875, 0.5980377197265625, 0.64508056640625, 0.6921234130859375, 0.739166259765625, 0.7862091064453125, 0.833251953125, 0.8802947998046875, 0.927337646484375, 0.9743804931640625, 1.02142333984375, 1.0684661865234375, 1.115509033203125, 1.1625518798828125, 1.2095947265625, 1.2566375732421875, 1.303680419921875, 1.3507232666015625, 1.39776611328125, 1.4448089599609375, 1.491851806640625, 1.5388946533203125, 1.5859375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 9.0, 15.0, 24.0, 35.0, 41.0, 70.0, 99.0, 122.0, 184.0, 258.0, 364.0, 559.0, 839.0, 1330.0, 2037.0, 3436.0, 5957.0, 10727.0, 20590.0, 45167.0, 118016.0, 329459.0, 310801.0, 110705.0, 42935.0, 19582.0, 10178.0, 5697.0, 3376.0, 2018.0, 1316.0, 812.0, 543.0, 391.0, 254.0, 188.0, 122.0, 96.0, 48.0, 43.0, 27.0, 24.0, 14.0, 14.0, 9.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.9267578125, -1.8716583251953125, -1.816558837890625, -1.7614593505859375, -1.70635986328125, -1.6512603759765625, -1.596160888671875, -1.5410614013671875, -1.4859619140625, -1.4308624267578125, -1.375762939453125, -1.3206634521484375, -1.26556396484375, -1.2104644775390625, -1.155364990234375, -1.1002655029296875, -1.045166015625, -0.9900665283203125, -0.934967041015625, -0.8798675537109375, -0.82476806640625, -0.7696685791015625, -0.714569091796875, -0.6594696044921875, -0.6043701171875, -0.5492706298828125, -0.494171142578125, -0.4390716552734375, -0.38397216796875, -0.3288726806640625, -0.273773193359375, -0.2186737060546875, -0.16357421875, -0.1084747314453125, -0.053375244140625, 0.0017242431640625, 0.05682373046875, 0.1119232177734375, 0.167022705078125, 0.2221221923828125, 0.2772216796875, 0.3323211669921875, 0.387420654296875, 0.4425201416015625, 0.49761962890625, 0.5527191162109375, 0.607818603515625, 0.6629180908203125, 0.718017578125, 0.7731170654296875, 0.828216552734375, 0.8833160400390625, 0.93841552734375, 0.9935150146484375, 1.048614501953125, 1.1037139892578125, 1.1588134765625, 1.2139129638671875, 1.269012451171875, 1.3241119384765625, 1.37921142578125, 1.4343109130859375, 1.489410400390625, 1.5445098876953125, 1.599609375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 3.0, 4.0, 7.0, 9.0, 13.0, 10.0, 13.0, 16.0, 26.0, 20.0, 38.0, 30.0, 34.0, 36.0, 49.0, 52.0, 67.0, 129.0, 324.0, 1511.0, 173.0, 68.0, 48.0, 58.0, 43.0, 52.0, 43.0, 21.0, 16.0, 23.0, 21.0, 14.0, 17.0, 13.0, 13.0, 8.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.70703125, -5.52392578125, -5.3408203125, -5.15771484375, -4.974609375, -4.79150390625, -4.6083984375, -4.42529296875, -4.2421875, -4.05908203125, -3.8759765625, -3.69287109375, -3.509765625, -3.32666015625, -3.1435546875, -2.96044921875, -2.77734375, -2.59423828125, -2.4111328125, -2.22802734375, -2.044921875, -1.86181640625, -1.6787109375, -1.49560546875, -1.3125, -1.12939453125, -0.9462890625, -0.76318359375, -0.580078125, -0.39697265625, -0.2138671875, -0.03076171875, 0.15234375, 0.33544921875, 0.5185546875, 0.70166015625, 0.884765625, 1.06787109375, 1.2509765625, 1.43408203125, 1.6171875, 1.80029296875, 1.9833984375, 2.16650390625, 2.349609375, 2.53271484375, 2.7158203125, 2.89892578125, 3.08203125, 3.26513671875, 3.4482421875, 3.63134765625, 3.814453125, 3.99755859375, 4.1806640625, 4.36376953125, 4.546875, 4.72998046875, 4.9130859375, 5.09619140625, 5.279296875, 5.46240234375, 5.6455078125, 5.82861328125, 6.01171875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 10.0, 9.0, 13.0, 27.0, 25.0, 30.0, 33.0, 44.0, 56.0, 77.0, 132.0, 209.0, 412.0, 1115.0, 7168.0, 133711.0, 2918552.0, 77087.0, 5026.0, 983.0, 343.0, 214.0, 108.0, 71.0, 59.0, 44.0, 22.0, 19.0, 18.0, 15.0, 16.0, 11.0, 7.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.767333984375, -9.45654296875, -9.145751953125, -8.8349609375, -8.524169921875, -8.21337890625, -7.902587890625, -7.591796875, -7.281005859375, -6.97021484375, -6.659423828125, -6.3486328125, -6.037841796875, -5.72705078125, -5.416259765625, -5.10546875, -4.794677734375, -4.48388671875, -4.173095703125, -3.8623046875, -3.551513671875, -3.24072265625, -2.929931640625, -2.619140625, -2.308349609375, -1.99755859375, -1.686767578125, -1.3759765625, -1.065185546875, -0.75439453125, -0.443603515625, -0.1328125, 0.177978515625, 0.48876953125, 0.799560546875, 1.1103515625, 1.421142578125, 1.73193359375, 2.042724609375, 2.353515625, 2.664306640625, 2.97509765625, 3.285888671875, 3.5966796875, 3.907470703125, 4.21826171875, 4.529052734375, 4.83984375, 5.150634765625, 5.46142578125, 5.772216796875, 6.0830078125, 6.393798828125, 6.70458984375, 7.015380859375, 7.326171875, 7.636962890625, 7.94775390625, 8.258544921875, 8.5693359375, 8.880126953125, 9.19091796875, 9.501708984375, 9.8125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 36.0, 512.0, 446.0, 22.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.72103118896484, -82.98821258544922, -81.25540161132812, -79.5225830078125, -77.78976440429688, -76.05694580078125, -74.32413482666016, -72.59131622314453, -70.85850524902344, -69.12568664550781, -67.39287567138672, -65.6600570678711, -63.92723846435547, -62.19442367553711, -60.46160888671875, -58.728790283203125, -56.9959716796875, -55.26315689086914, -53.530338287353516, -51.797523498535156, -50.06470489501953, -48.33189010620117, -46.59907531738281, -44.86625671386719, -43.13344192504883, -41.40062713623047, -39.667808532714844, -37.934993743896484, -36.202178955078125, -34.4693603515625, -32.73654556274414, -31.00372886657715, -29.27090835571289, -27.5380916595459, -25.805274963378906, -24.072460174560547, -22.339643478393555, -20.606826782226562, -18.874011993408203, -17.14119529724121, -15.408378601074219, -13.675561904907227, -11.94274616241455, -10.209930419921875, -8.477113723754883, -6.744297027587891, -5.011481285095215, -3.278665542602539, -1.5458488464355469, 0.1869673728942871, 1.919783592224121, 3.652599811553955, 5.385416030883789, 7.118232727050781, 8.851048469543457, 10.583864212036133, 12.316680908203125, 14.049497604370117, 15.782313346862793, 17.51512908935547, 19.24794578552246, 20.980762481689453, 22.713577270507812, 24.446393966674805, 26.179210662841797]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 4.0, 4.0, 5.0, 8.0, 6.0, 5.0, 12.0, 12.0, 11.0, 12.0, 13.0, 24.0, 23.0, 22.0, 26.0, 38.0, 34.0, 44.0, 34.0, 26.0, 46.0, 37.0, 39.0, 40.0, 42.0, 32.0, 35.0, 33.0, 41.0, 25.0, 26.0, 24.0, 22.0, 29.0, 30.0, 15.0, 15.0, 22.0, 12.0, 13.0, 16.0, 9.0, 10.0, 3.0, 6.0, 8.0, 7.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-16.52822494506836, -16.022205352783203, -15.516183853149414, -15.010163307189941, -14.504142761230469, -13.998122215270996, -13.492101669311523, -12.98608112335205, -12.480060577392578, -11.974040031433105, -11.468019485473633, -10.96199893951416, -10.455978393554688, -9.949957847595215, -9.443937301635742, -8.93791675567627, -8.431896209716797, -7.925875663757324, -7.419855117797852, -6.913834571838379, -6.407814025878906, -5.901793479919434, -5.395772933959961, -4.889752388000488, -4.383731842041016, -3.877711296081543, -3.3716907501220703, -2.8656702041625977, -2.359649658203125, -1.8536291122436523, -1.3476085662841797, -0.841588020324707, -0.33556556701660156, 0.1704549789428711, 0.6764755249023438, 1.1824960708618164, 1.688516616821289, 2.1945371627807617, 2.7005577087402344, 3.206578254699707, 3.7125988006591797, 4.218619346618652, 4.724639892578125, 5.230660438537598, 5.73668098449707, 6.242701530456543, 6.748722076416016, 7.254742622375488, 7.760763168334961, 8.266783714294434, 8.772804260253906, 9.278824806213379, 9.784845352172852, 10.290865898132324, 10.796886444091797, 11.30290699005127, 11.808927536010742, 12.314948081970215, 12.820968627929688, 13.32698917388916, 13.833009719848633, 14.339030265808105, 14.845050811767578, 15.35107135772705, 15.857091903686523]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 12.0, 7.0, 18.0, 20.0, 16.0, 24.0, 18.0, 21.0, 25.0, 23.0, 34.0, 31.0, 28.0, 35.0, 34.0, 47.0, 51.0, 51.0, 42.0, 36.0, 32.0, 33.0, 26.0, 32.0, 39.0, 27.0, 27.0, 32.0, 24.0, 12.0, 18.0, 8.0, 20.0, 14.0, 12.0, 18.0, 5.0, 4.0, 8.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4541015625, -1.4054107666015625, -1.356719970703125, -1.3080291748046875, -1.25933837890625, -1.2106475830078125, -1.161956787109375, -1.1132659912109375, -1.0645751953125, -1.0158843994140625, -0.967193603515625, -0.9185028076171875, -0.86981201171875, -0.8211212158203125, -0.772430419921875, -0.7237396240234375, -0.675048828125, -0.6263580322265625, -0.577667236328125, -0.5289764404296875, -0.48028564453125, -0.4315948486328125, -0.382904052734375, -0.3342132568359375, -0.2855224609375, -0.2368316650390625, -0.188140869140625, -0.1394500732421875, -0.09075927734375, -0.0420684814453125, 0.006622314453125, 0.0553131103515625, 0.10400390625, 0.1526947021484375, 0.201385498046875, 0.2500762939453125, 0.29876708984375, 0.3474578857421875, 0.396148681640625, 0.4448394775390625, 0.4935302734375, 0.5422210693359375, 0.590911865234375, 0.6396026611328125, 0.68829345703125, 0.7369842529296875, 0.785675048828125, 0.8343658447265625, 0.883056640625, 0.9317474365234375, 0.980438232421875, 1.0291290283203125, 1.07781982421875, 1.1265106201171875, 1.175201416015625, 1.2238922119140625, 1.2725830078125, 1.3212738037109375, 1.369964599609375, 1.4186553955078125, 1.46734619140625, 1.5160369873046875, 1.564727783203125, 1.6134185791015625, 1.662109375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 1.0, 4.0, 5.0, 9.0, 9.0, 8.0, 9.0, 19.0, 24.0, 25.0, 23.0, 32.0, 35.0, 59.0, 70.0, 125.0, 249.0, 614.0, 1748.0, 7267.0, 45179.0, 456328.0, 2999825.0, 614261.0, 56342.0, 8637.0, 2004.0, 628.0, 248.0, 141.0, 87.0, 53.0, 53.0, 29.0, 23.0, 19.0, 13.0, 17.0, 15.0, 5.0, 6.0, 11.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.08203125, -5.8892822265625, -5.696533203125, -5.5037841796875, -5.31103515625, -5.1182861328125, -4.925537109375, -4.7327880859375, -4.5400390625, -4.3472900390625, -4.154541015625, -3.9617919921875, -3.76904296875, -3.5762939453125, -3.383544921875, -3.1907958984375, -2.998046875, -2.8052978515625, -2.612548828125, -2.4197998046875, -2.22705078125, -2.0343017578125, -1.841552734375, -1.6488037109375, -1.4560546875, -1.2633056640625, -1.070556640625, -0.8778076171875, -0.68505859375, -0.4923095703125, -0.299560546875, -0.1068115234375, 0.0859375, 0.2786865234375, 0.471435546875, 0.6641845703125, 0.85693359375, 1.0496826171875, 1.242431640625, 1.4351806640625, 1.6279296875, 1.8206787109375, 2.013427734375, 2.2061767578125, 2.39892578125, 2.5916748046875, 2.784423828125, 2.9771728515625, 3.169921875, 3.3626708984375, 3.555419921875, 3.7481689453125, 3.94091796875, 4.1336669921875, 4.326416015625, 4.5191650390625, 4.7119140625, 4.9046630859375, 5.097412109375, 5.2901611328125, 5.48291015625, 5.6756591796875, 5.868408203125, 6.0611572265625, 6.25390625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 10.0, 12.0, 6.0, 10.0, 13.0, 20.0, 31.0, 45.0, 51.0, 65.0, 76.0, 98.0, 131.0, 165.0, 222.0, 287.0, 366.0, 394.0, 434.0, 383.0, 271.0, 246.0, 195.0, 132.0, 105.0, 73.0, 41.0, 49.0, 33.0, 26.0, 16.0, 13.0, 12.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.19140625, -4.0518798828125, -3.912353515625, -3.7728271484375, -3.63330078125, -3.4937744140625, -3.354248046875, -3.2147216796875, -3.0751953125, -2.9356689453125, -2.796142578125, -2.6566162109375, -2.51708984375, -2.3775634765625, -2.238037109375, -2.0985107421875, -1.958984375, -1.8194580078125, -1.679931640625, -1.5404052734375, -1.40087890625, -1.2613525390625, -1.121826171875, -0.9822998046875, -0.8427734375, -0.7032470703125, -0.563720703125, -0.4241943359375, -0.28466796875, -0.1451416015625, -0.005615234375, 0.1339111328125, 0.2734375, 0.4129638671875, 0.552490234375, 0.6920166015625, 0.83154296875, 0.9710693359375, 1.110595703125, 1.2501220703125, 1.3896484375, 1.5291748046875, 1.668701171875, 1.8082275390625, 1.94775390625, 2.0872802734375, 2.226806640625, 2.3663330078125, 2.505859375, 2.6453857421875, 2.784912109375, 2.9244384765625, 3.06396484375, 3.2034912109375, 3.343017578125, 3.4825439453125, 3.6220703125, 3.7615966796875, 3.901123046875, 4.0406494140625, 4.18017578125, 4.3197021484375, 4.459228515625, 4.5987548828125, 4.73828125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 7.0, 6.0, 9.0, 18.0, 17.0, 32.0, 37.0, 57.0, 97.0, 145.0, 183.0, 395.0, 871.0, 2225.0, 8003.0, 43844.0, 374338.0, 2710307.0, 935685.0, 97555.0, 14470.0, 3484.0, 1160.0, 500.0, 279.0, 176.0, 117.0, 66.0, 45.0, 34.0, 29.0, 20.0, 16.0, 13.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.052978515625, -7.76220703125, -7.471435546875, -7.1806640625, -6.889892578125, -6.59912109375, -6.308349609375, -6.017578125, -5.726806640625, -5.43603515625, -5.145263671875, -4.8544921875, -4.563720703125, -4.27294921875, -3.982177734375, -3.69140625, -3.400634765625, -3.10986328125, -2.819091796875, -2.5283203125, -2.237548828125, -1.94677734375, -1.656005859375, -1.365234375, -1.074462890625, -0.78369140625, -0.492919921875, -0.2021484375, 0.088623046875, 0.37939453125, 0.670166015625, 0.9609375, 1.251708984375, 1.54248046875, 1.833251953125, 2.1240234375, 2.414794921875, 2.70556640625, 2.996337890625, 3.287109375, 3.577880859375, 3.86865234375, 4.159423828125, 4.4501953125, 4.740966796875, 5.03173828125, 5.322509765625, 5.61328125, 5.904052734375, 6.19482421875, 6.485595703125, 6.7763671875, 7.067138671875, 7.35791015625, 7.648681640625, 7.939453125, 8.230224609375, 8.52099609375, 8.811767578125, 9.1025390625, 9.393310546875, 9.68408203125, 9.974853515625, 10.265625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 14.0, 20.0, 24.0, 29.0, 49.0, 74.0, 104.0, 109.0, 112.0, 104.0, 109.0, 81.0, 52.0, 37.0, 31.0, 23.0, 18.0, 9.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.6882381439209, -18.952835083007812, -18.21743392944336, -17.482030868530273, -16.746627807617188, -16.011226654052734, -15.275823593139648, -14.540421485900879, -13.80501937866211, -13.06961727142334, -12.33421516418457, -11.598812103271484, -10.863409996032715, -10.128007888793945, -9.39260482788086, -8.65720272064209, -7.92180061340332, -7.186398506164551, -6.450995922088623, -5.715593338012695, -4.980191230773926, -4.244789123535156, -3.5093865394592285, -2.773983955383301, -2.0385818481445312, -1.3031795024871826, -0.567777156829834, 0.16762518882751465, 0.9030275344848633, 1.638429880142212, 2.3738322257995605, 3.1092348098754883, 3.844635009765625, 4.5800371170043945, 5.315439701080322, 6.05084228515625, 6.7862443923950195, 7.521646499633789, 8.257049560546875, 8.992451667785645, 9.727853775024414, 10.463255882263184, 11.198657989501953, 11.934061050415039, 12.669463157653809, 13.404865264892578, 14.140268325805664, 14.875670433044434, 15.611072540283203, 16.34647560119629, 17.081876754760742, 17.817279815673828, 18.55268096923828, 19.288084030151367, 20.023487091064453, 20.758888244628906, 21.494291305541992, 22.229694366455078, 22.96509552001953, 23.700498580932617, 24.435901641845703, 25.171302795410156, 25.906705856323242, 26.642108917236328, 27.37751007080078]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 4.0, 9.0, 6.0, 6.0, 4.0, 7.0, 13.0, 8.0, 10.0, 17.0, 18.0, 15.0, 15.0, 23.0, 25.0, 23.0, 29.0, 28.0, 31.0, 35.0, 33.0, 39.0, 28.0, 42.0, 31.0, 35.0, 40.0, 40.0, 32.0, 26.0, 42.0, 43.0, 26.0, 35.0, 19.0, 28.0, 21.0, 19.0, 13.0, 16.0, 7.0, 18.0, 9.0, 11.0, 7.0, 6.0, 3.0, 5.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.579944610595703, -13.124553680419922, -12.669161796569824, -12.213770866394043, -11.758379936218262, -11.302988052368164, -10.847597122192383, -10.392206192016602, -9.936814308166504, -9.481423377990723, -9.026031494140625, -8.570640563964844, -8.115249633789062, -7.659857749938965, -7.204466819763184, -6.749075412750244, -6.293684482574463, -5.838293075561523, -5.382902145385742, -4.927510738372803, -4.472119331359863, -4.016728401184082, -3.5613369941711426, -3.105945587158203, -2.6505544185638428, -2.1951632499694824, -1.739771842956543, -1.2843806743621826, -0.8289893865585327, -0.3735980987548828, 0.08179306983947754, 0.537184476852417, 0.9925756454467773, 1.4479669332504272, 1.9033582210540771, 2.3587493896484375, 2.814140796661377, 3.2695319652557373, 3.7249231338500977, 4.180314540863037, 4.635705947875977, 5.091097354888916, 5.546488285064697, 6.001879692077637, 6.457271099090576, 6.912662506103516, 7.368053436279297, 7.823444843292236, 8.27883529663086, 8.73422622680664, 9.189618110656738, 9.64500904083252, 10.1003999710083, 10.555791854858398, 11.01118278503418, 11.466573715209961, 11.921965599060059, 12.37735652923584, 12.832748413085938, 13.288139343261719, 13.7435302734375, 14.198922157287598, 14.654313087463379, 15.109704971313477, 15.565095901489258]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 11.0, 1.0, 10.0, 9.0, 7.0, 8.0, 11.0, 14.0, 16.0, 23.0, 18.0, 23.0, 22.0, 23.0, 33.0, 33.0, 34.0, 34.0, 50.0, 41.0, 27.0, 44.0, 45.0, 40.0, 25.0, 32.0, 28.0, 36.0, 37.0, 19.0, 26.0, 25.0, 23.0, 24.0, 18.0, 20.0, 14.0, 17.0, 7.0, 15.0, 9.0, 9.0, 5.0, 9.0, 7.0, 5.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.509765625, -1.463134765625, -1.41650390625, -1.369873046875, -1.3232421875, -1.276611328125, -1.22998046875, -1.183349609375, -1.13671875, -1.090087890625, -1.04345703125, -0.996826171875, -0.9501953125, -0.903564453125, -0.85693359375, -0.810302734375, -0.763671875, -0.717041015625, -0.67041015625, -0.623779296875, -0.5771484375, -0.530517578125, -0.48388671875, -0.437255859375, -0.390625, -0.343994140625, -0.29736328125, -0.250732421875, -0.2041015625, -0.157470703125, -0.11083984375, -0.064208984375, -0.017578125, 0.029052734375, 0.07568359375, 0.122314453125, 0.1689453125, 0.215576171875, 0.26220703125, 0.308837890625, 0.35546875, 0.402099609375, 0.44873046875, 0.495361328125, 0.5419921875, 0.588623046875, 0.63525390625, 0.681884765625, 0.728515625, 0.775146484375, 0.82177734375, 0.868408203125, 0.9150390625, 0.961669921875, 1.00830078125, 1.054931640625, 1.1015625, 1.148193359375, 1.19482421875, 1.241455078125, 1.2880859375, 1.334716796875, 1.38134765625, 1.427978515625, 1.474609375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 5.0, 4.0, 4.0, 9.0, 17.0, 13.0, 21.0, 37.0, 36.0, 58.0, 77.0, 106.0, 163.0, 246.0, 335.0, 486.0, 725.0, 1045.0, 1560.0, 2322.0, 3359.0, 5089.0, 7542.0, 11598.0, 17925.0, 28348.0, 44976.0, 73098.0, 117032.0, 171461.0, 186180.0, 136682.0, 88167.0, 53771.0, 33723.0, 21182.0, 13805.0, 9049.0, 5935.0, 3978.0, 2656.0, 1813.0, 1232.0, 783.0, 579.0, 409.0, 266.0, 200.0, 132.0, 80.0, 68.0, 59.0, 41.0, 25.0, 16.0, 15.0, 3.0, 5.0, 6.0, 4.0, 5.0, 2.0, 2.0], "bins": [-0.159912109375, -0.15478515625, -0.149658203125, -0.14453125, -0.139404296875, -0.13427734375, -0.129150390625, -0.1240234375, -0.118896484375, -0.11376953125, -0.108642578125, -0.103515625, -0.098388671875, -0.09326171875, -0.088134765625, -0.0830078125, -0.077880859375, -0.07275390625, -0.067626953125, -0.0625, -0.057373046875, -0.05224609375, -0.047119140625, -0.0419921875, -0.036865234375, -0.03173828125, -0.026611328125, -0.021484375, -0.016357421875, -0.01123046875, -0.006103515625, -0.0009765625, 0.004150390625, 0.00927734375, 0.014404296875, 0.01953125, 0.024658203125, 0.02978515625, 0.034912109375, 0.0400390625, 0.045166015625, 0.05029296875, 0.055419921875, 0.060546875, 0.065673828125, 0.07080078125, 0.075927734375, 0.0810546875, 0.086181640625, 0.09130859375, 0.096435546875, 0.1015625, 0.106689453125, 0.11181640625, 0.116943359375, 0.1220703125, 0.127197265625, 0.13232421875, 0.137451171875, 0.142578125, 0.147705078125, 0.15283203125, 0.157958984375, 0.1630859375, 0.168212890625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 11.0, 7.0, 7.0, 12.0, 17.0, 21.0, 20.0, 17.0, 22.0, 33.0, 36.0, 35.0, 29.0, 40.0, 46.0, 30.0, 32.0, 42.0, 40.0, 1062.0, 40.0, 39.0, 45.0, 33.0, 33.0, 33.0, 31.0, 30.0, 21.0, 17.0, 20.0, 16.0, 13.0, 16.0, 17.0, 12.0, 9.0, 8.0, 3.0, 1.0, 3.0, 7.0, 4.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.99560546875, -0.9640121459960938, -0.9324188232421875, -0.9008255004882812, -0.869232177734375, -0.8376388549804688, -0.8060455322265625, -0.7744522094726562, -0.74285888671875, -0.7112655639648438, -0.6796722412109375, -0.6480789184570312, -0.616485595703125, -0.5848922729492188, -0.5532989501953125, -0.5217056274414062, -0.4901123046875, -0.45851898193359375, -0.4269256591796875, -0.39533233642578125, -0.363739013671875, -0.33214569091796875, -0.3005523681640625, -0.26895904541015625, -0.23736572265625, -0.20577239990234375, -0.1741790771484375, -0.14258575439453125, -0.110992431640625, -0.07939910888671875, -0.0478057861328125, -0.01621246337890625, 0.015380859375, 0.04697418212890625, 0.0785675048828125, 0.11016082763671875, 0.141754150390625, 0.17334747314453125, 0.2049407958984375, 0.23653411865234375, 0.26812744140625, 0.29972076416015625, 0.3313140869140625, 0.36290740966796875, 0.394500732421875, 0.42609405517578125, 0.4576873779296875, 0.48928070068359375, 0.5208740234375, 0.5524673461914062, 0.5840606689453125, 0.6156539916992188, 0.647247314453125, 0.6788406372070312, 0.7104339599609375, 0.7420272827148438, 0.77362060546875, 0.8052139282226562, 0.8368072509765625, 0.8684005737304688, 0.899993896484375, 0.9315872192382812, 0.9631805419921875, 0.9947738647460938, 1.0263671875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 4.0, 14.0, 17.0, 24.0, 60.0, 76.0, 118.0, 172.0, 255.0, 395.0, 613.0, 932.0, 1466.0, 2232.0, 3379.0, 5308.0, 8297.0, 12762.0, 20416.0, 31888.0, 49070.0, 74900.0, 112699.0, 167548.0, 1206192.0, 135046.0, 92339.0, 60707.0, 39714.0, 25641.0, 16001.0, 10371.0, 6550.0, 4152.0, 2648.0, 1734.0, 1204.0, 762.0, 485.0, 300.0, 232.0, 150.0, 107.0, 49.0, 39.0, 26.0, 11.0, 5.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.11090087890625, -0.10746192932128906, -0.10402297973632812, -0.10058403015136719, -0.09714508056640625, -0.09370613098144531, -0.09026718139648438, -0.08682823181152344, -0.0833892822265625, -0.07995033264160156, -0.07651138305664062, -0.07307243347167969, -0.06963348388671875, -0.06619453430175781, -0.06275558471679688, -0.05931663513183594, -0.055877685546875, -0.05243873596191406, -0.048999786376953125, -0.04556083679199219, -0.04212188720703125, -0.03868293762207031, -0.035243988037109375, -0.03180503845214844, -0.0283660888671875, -0.024927139282226562, -0.021488189697265625, -0.018049240112304688, -0.01461029052734375, -0.011171340942382812, -0.007732391357421875, -0.0042934417724609375, -0.0008544921875, 0.0025844573974609375, 0.006023406982421875, 0.009462356567382812, 0.01290130615234375, 0.016340255737304688, 0.019779205322265625, 0.023218154907226562, 0.0266571044921875, 0.030096054077148438, 0.033535003662109375, 0.03697395324707031, 0.04041290283203125, 0.04385185241699219, 0.047290802001953125, 0.05072975158691406, 0.054168701171875, 0.05760765075683594, 0.061046600341796875, 0.06448554992675781, 0.06792449951171875, 0.07136344909667969, 0.07480239868164062, 0.07824134826660156, 0.0816802978515625, 0.08511924743652344, 0.08855819702148438, 0.09199714660644531, 0.09543609619140625, 0.09887504577636719, 0.10231399536132812, 0.10575294494628906, 0.10919189453125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 0.0, 4.0, 5.0, 7.0, 11.0, 20.0, 37.0, 38.0, 61.0, 81.0, 107.0, 134.0, 132.0, 106.0, 75.0, 57.0, 35.0, 15.0, 14.0, 14.0, 9.0, 8.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003635406494140625, -0.003517657518386841, -0.0033999085426330566, -0.0032821595668792725, -0.0031644105911254883, -0.003046661615371704, -0.00292891263961792, -0.0028111636638641357, -0.0026934146881103516, -0.0025756657123565674, -0.002457916736602783, -0.002340167760848999, -0.002222418785095215, -0.0021046698093414307, -0.0019869208335876465, -0.0018691718578338623, -0.0017514228820800781, -0.001633673906326294, -0.0015159249305725098, -0.0013981759548187256, -0.0012804269790649414, -0.0011626780033111572, -0.001044929027557373, -0.0009271800518035889, -0.0008094310760498047, -0.0006916821002960205, -0.0005739331245422363, -0.00045618414878845215, -0.00033843517303466797, -0.0002206861972808838, -0.00010293722152709961, 1.481175422668457e-05, 0.00013256072998046875, 0.00025030970573425293, 0.0003680586814880371, 0.0004858076572418213, 0.0006035566329956055, 0.0007213056087493896, 0.0008390545845031738, 0.000956803560256958, 0.0010745525360107422, 0.0011923015117645264, 0.0013100504875183105, 0.0014277994632720947, 0.001545548439025879, 0.001663297414779663, 0.0017810463905334473, 0.0018987953662872314, 0.0020165443420410156, 0.0021342933177948, 0.002252042293548584, 0.002369791269302368, 0.0024875402450561523, 0.0026052892208099365, 0.0027230381965637207, 0.002840787172317505, 0.002958536148071289, 0.0030762851238250732, 0.0031940340995788574, 0.0033117830753326416, 0.0034295320510864258, 0.00354728102684021, 0.003665030002593994, 0.0037827789783477783, 0.0039005279541015625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 10.0, 12.0, 26.0, 18.0, 34.0, 22.0, 35.0, 74.0, 152.0, 298.0, 971.0, 198370.0, 846218.0, 1554.0, 318.0, 153.0, 98.0, 49.0, 43.0, 21.0, 17.0, 5.0, 9.0, 11.0, 2.0, 5.0, 3.0, 7.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07318115234375, -0.0709695816040039, -0.06875801086425781, -0.06654644012451172, -0.06433486938476562, -0.06212329864501953, -0.05991172790527344, -0.057700157165527344, -0.05548858642578125, -0.053277015686035156, -0.05106544494628906, -0.04885387420654297, -0.046642303466796875, -0.04443073272705078, -0.04221916198730469, -0.040007591247558594, -0.0377960205078125, -0.035584449768066406, -0.03337287902832031, -0.03116130828857422, -0.028949737548828125, -0.02673816680908203, -0.024526596069335938, -0.022315025329589844, -0.02010345458984375, -0.017891883850097656, -0.015680313110351562, -0.013468742370605469, -0.011257171630859375, -0.009045600891113281, -0.0068340301513671875, -0.004622459411621094, -0.002410888671875, -0.00019931793212890625, 0.0020122528076171875, 0.004223823547363281, 0.006435394287109375, 0.008646965026855469, 0.010858535766601562, 0.013070106506347656, 0.01528167724609375, 0.017493247985839844, 0.019704818725585938, 0.02191638946533203, 0.024127960205078125, 0.02633953094482422, 0.028551101684570312, 0.030762672424316406, 0.0329742431640625, 0.035185813903808594, 0.03739738464355469, 0.03960895538330078, 0.041820526123046875, 0.04403209686279297, 0.04624366760253906, 0.048455238342285156, 0.05066680908203125, 0.052878379821777344, 0.05508995056152344, 0.05730152130126953, 0.059513092041015625, 0.06172466278076172, 0.06393623352050781, 0.0661478042602539, 0.068359375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 11.0, 640.0, 358.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02134220488369465, -0.020367683842778206, -0.019393162801861763, -0.01841864176094532, -0.017444120720028877, -0.016469599679112434, -0.015495077706873417, -0.014520556665956974, -0.013546035625040531, -0.012571514584124088, -0.011596993543207645, -0.010622471570968628, -0.009647950530052185, -0.008673429489135742, -0.007698908448219299, -0.0067243874073028564, -0.005749866366386414, -0.004775345325469971, -0.003800824051722884, -0.0028263027779757977, -0.0018517817370593548, -0.0008772606961429119, 9.726081043481827e-05, 0.0010717818513512611, 0.002046302892267704, 0.003020823933184147, 0.00399534497410059, 0.00496986648067832, 0.005944387521594763, 0.006918908562511206, 0.007893430069088936, 0.008867951110005379, 0.00984247401356697, 0.010816995054483414, 0.011791516095399857, 0.0127660371363163, 0.013740558177232742, 0.014715079218149185, 0.015689600259065628, 0.01666412129998207, 0.017638642340898514, 0.018613163381814957, 0.0195876844227314, 0.020562205463647842, 0.021536726504564285, 0.022511247545480728, 0.02348576858639717, 0.024460289627313614, 0.025434812530875206, 0.02640933357179165, 0.027383854612708092, 0.028358375653624535, 0.029332896694540977, 0.03030741773545742, 0.03128194063901901, 0.032256461679935455, 0.0332309827208519, 0.03420550376176834, 0.035180024802684784, 0.03615454584360123, 0.03712906688451767, 0.03810358792543411, 0.039078108966350555, 0.040052630007267, 0.04102715104818344]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 13.0, 13.0, 16.0, 18.0, 22.0, 26.0, 45.0, 39.0, 44.0, 54.0, 61.0, 58.0, 50.0, 63.0, 60.0, 64.0, 43.0, 55.0, 47.0, 36.0, 42.0, 26.0, 23.0, 20.0, 11.0, 18.0, 10.0, 4.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025127530097961426, -0.0024291574954986572, -0.002345561981201172, -0.0022619664669036865, -0.002178370952606201, -0.002094775438308716, -0.0020111799240112305, -0.0019275844097137451, -0.0018439888954162598, -0.0017603933811187744, -0.001676797866821289, -0.0015932023525238037, -0.0015096068382263184, -0.001426011323928833, -0.0013424158096313477, -0.0012588202953338623, -0.001175224781036377, -0.0010916292667388916, -0.0010080337524414062, -0.0009244382381439209, -0.0008408427238464355, -0.0007572472095489502, -0.0006736516952514648, -0.0005900561809539795, -0.0005064606666564941, -0.0004228651523590088, -0.00033926963806152344, -0.0002556741237640381, -0.00017207860946655273, -8.848309516906738e-05, -4.887580871582031e-06, 7.870793342590332e-05, 0.00016230344772338867, 0.000245898962020874, 0.0003294944763183594, 0.0004130899906158447, 0.0004966855049133301, 0.0005802810192108154, 0.0006638765335083008, 0.0007474720478057861, 0.0008310675621032715, 0.0009146630764007568, 0.0009982585906982422, 0.0010818541049957275, 0.0011654496192932129, 0.0012490451335906982, 0.0013326406478881836, 0.001416236162185669, 0.0014998316764831543, 0.0015834271907806396, 0.001667022705078125, 0.0017506182193756104, 0.0018342137336730957, 0.001917809247970581, 0.0020014047622680664, 0.0020850002765655518, 0.002168595790863037, 0.0022521913051605225, 0.002335786819458008, 0.002419382333755493, 0.0025029778480529785, 0.002586573362350464, 0.0026701688766479492, 0.0027537643909454346, 0.00283735990524292]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 11.0, 1.0, 10.0, 9.0, 7.0, 8.0, 11.0, 14.0, 16.0, 23.0, 18.0, 23.0, 22.0, 23.0, 33.0, 33.0, 34.0, 34.0, 50.0, 41.0, 27.0, 44.0, 45.0, 40.0, 25.0, 32.0, 28.0, 36.0, 37.0, 19.0, 26.0, 25.0, 23.0, 24.0, 18.0, 20.0, 14.0, 17.0, 7.0, 15.0, 9.0, 9.0, 5.0, 9.0, 7.0, 5.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.509765625, -1.463134765625, -1.41650390625, -1.369873046875, -1.3232421875, -1.276611328125, -1.22998046875, -1.183349609375, -1.13671875, -1.090087890625, -1.04345703125, -0.996826171875, -0.9501953125, -0.903564453125, -0.85693359375, -0.810302734375, -0.763671875, -0.717041015625, -0.67041015625, -0.623779296875, -0.5771484375, -0.530517578125, -0.48388671875, -0.437255859375, -0.390625, -0.343994140625, -0.29736328125, -0.250732421875, -0.2041015625, -0.157470703125, -0.11083984375, -0.064208984375, -0.017578125, 0.029052734375, 0.07568359375, 0.122314453125, 0.1689453125, 0.215576171875, 0.26220703125, 0.308837890625, 0.35546875, 0.402099609375, 0.44873046875, 0.495361328125, 0.5419921875, 0.588623046875, 0.63525390625, 0.681884765625, 0.728515625, 0.775146484375, 0.82177734375, 0.868408203125, 0.9150390625, 0.961669921875, 1.00830078125, 1.054931640625, 1.1015625, 1.148193359375, 1.19482421875, 1.241455078125, 1.2880859375, 1.334716796875, 1.38134765625, 1.427978515625, 1.474609375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 6.0, 12.0, 8.0, 10.0, 12.0, 21.0, 34.0, 48.0, 50.0, 72.0, 100.0, 127.0, 226.0, 340.0, 607.0, 1019.0, 1950.0, 3767.0, 8012.0, 17865.0, 43735.0, 133217.0, 383114.0, 299616.0, 94176.0, 33214.0, 13806.0, 6462.0, 3018.0, 1587.0, 818.0, 539.0, 308.0, 182.0, 119.0, 86.0, 69.0, 53.0, 32.0, 34.0, 15.0, 14.0, 16.0, 10.0, 9.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8935546875, -1.8279266357421875, -1.762298583984375, -1.6966705322265625, -1.63104248046875, -1.5654144287109375, -1.499786376953125, -1.4341583251953125, -1.3685302734375, -1.3029022216796875, -1.237274169921875, -1.1716461181640625, -1.10601806640625, -1.0403900146484375, -0.974761962890625, -0.9091339111328125, -0.843505859375, -0.7778778076171875, -0.712249755859375, -0.6466217041015625, -0.58099365234375, -0.5153656005859375, -0.449737548828125, -0.3841094970703125, -0.3184814453125, -0.2528533935546875, -0.187225341796875, -0.1215972900390625, -0.05596923828125, 0.0096588134765625, 0.075286865234375, 0.1409149169921875, 0.20654296875, 0.2721710205078125, 0.337799072265625, 0.4034271240234375, 0.46905517578125, 0.5346832275390625, 0.600311279296875, 0.6659393310546875, 0.7315673828125, 0.7971954345703125, 0.862823486328125, 0.9284515380859375, 0.99407958984375, 1.0597076416015625, 1.125335693359375, 1.1909637451171875, 1.256591796875, 1.3222198486328125, 1.387847900390625, 1.4534759521484375, 1.51910400390625, 1.5847320556640625, 1.650360107421875, 1.7159881591796875, 1.7816162109375, 1.8472442626953125, 1.912872314453125, 1.9785003662109375, 2.04412841796875, 2.1097564697265625, 2.175384521484375, 2.2410125732421875, 2.306640625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 6.0, 11.0, 14.0, 13.0, 18.0, 24.0, 30.0, 23.0, 40.0, 43.0, 44.0, 49.0, 61.0, 99.0, 222.0, 1541.0, 219.0, 100.0, 65.0, 57.0, 60.0, 36.0, 38.0, 39.0, 24.0, 16.0, 20.0, 21.0, 13.0, 14.0, 13.0, 14.0, 5.0, 11.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.42578125, -6.2342529296875, -6.042724609375, -5.8511962890625, -5.65966796875, -5.4681396484375, -5.276611328125, -5.0850830078125, -4.8935546875, -4.7020263671875, -4.510498046875, -4.3189697265625, -4.12744140625, -3.9359130859375, -3.744384765625, -3.5528564453125, -3.361328125, -3.1697998046875, -2.978271484375, -2.7867431640625, -2.59521484375, -2.4036865234375, -2.212158203125, -2.0206298828125, -1.8291015625, -1.6375732421875, -1.446044921875, -1.2545166015625, -1.06298828125, -0.8714599609375, -0.679931640625, -0.4884033203125, -0.296875, -0.1053466796875, 0.086181640625, 0.2777099609375, 0.46923828125, 0.6607666015625, 0.852294921875, 1.0438232421875, 1.2353515625, 1.4268798828125, 1.618408203125, 1.8099365234375, 2.00146484375, 2.1929931640625, 2.384521484375, 2.5760498046875, 2.767578125, 2.9591064453125, 3.150634765625, 3.3421630859375, 3.53369140625, 3.7252197265625, 3.916748046875, 4.1082763671875, 4.2998046875, 4.4913330078125, 4.682861328125, 4.8743896484375, 5.06591796875, 5.2574462890625, 5.448974609375, 5.6405029296875, 5.83203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 10.0, 13.0, 16.0, 23.0, 23.0, 29.0, 28.0, 43.0, 62.0, 65.0, 90.0, 137.0, 238.0, 532.0, 1522.0, 8599.0, 126543.0, 2885167.0, 111647.0, 8127.0, 1449.0, 515.0, 244.0, 142.0, 101.0, 73.0, 45.0, 40.0, 24.0, 25.0, 19.0, 18.0, 14.0, 6.0, 7.0, 7.0, 7.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-8.796875, -8.5174560546875, -8.238037109375, -7.9586181640625, -7.67919921875, -7.3997802734375, -7.120361328125, -6.8409423828125, -6.5615234375, -6.2821044921875, -6.002685546875, -5.7232666015625, -5.44384765625, -5.1644287109375, -4.885009765625, -4.6055908203125, -4.326171875, -4.0467529296875, -3.767333984375, -3.4879150390625, -3.20849609375, -2.9290771484375, -2.649658203125, -2.3702392578125, -2.0908203125, -1.8114013671875, -1.531982421875, -1.2525634765625, -0.97314453125, -0.6937255859375, -0.414306640625, -0.1348876953125, 0.14453125, 0.4239501953125, 0.703369140625, 0.9827880859375, 1.26220703125, 1.5416259765625, 1.821044921875, 2.1004638671875, 2.3798828125, 2.6593017578125, 2.938720703125, 3.2181396484375, 3.49755859375, 3.7769775390625, 4.056396484375, 4.3358154296875, 4.615234375, 4.8946533203125, 5.174072265625, 5.4534912109375, 5.73291015625, 6.0123291015625, 6.291748046875, 6.5711669921875, 6.8505859375, 7.1300048828125, 7.409423828125, 7.6888427734375, 7.96826171875, 8.2476806640625, 8.527099609375, 8.8065185546875, 9.0859375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [6.0, 885.0, 125.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.826216220855713, -3.380767822265625, 1.064680576324463, 5.510129451751709, 9.955577850341797, 14.401025772094727, 18.84647560119629, 23.29192352294922, 27.73737144470215, 32.18281936645508, 36.62826919555664, 41.07371520996094, 45.5191650390625, 49.96461486816406, 54.410064697265625, 58.85551071166992, 63.30095672607422, 67.74640655517578, 72.19185638427734, 76.63729858398438, 81.08274841308594, 85.5281982421875, 89.97364807128906, 94.41909790039062, 98.86454772949219, 103.30999755859375, 107.75544738769531, 112.20089721679688, 116.6463394165039, 121.09178924560547, 125.53723907470703, 129.98268127441406, 134.4281463623047, 138.87359619140625, 143.3190460205078, 147.76449584960938, 152.20994567871094, 156.6553955078125, 161.100830078125, 165.54627990722656, 169.99172973632812, 174.4371795654297, 178.88262939453125, 183.3280792236328, 187.77352905273438, 192.21896362304688, 196.6644287109375, 201.10986328125, 205.55532836914062, 210.0007781982422, 214.44622802734375, 218.8916778564453, 223.33712768554688, 227.78256225585938, 232.22802734375, 236.6734619140625, 241.11891174316406, 245.56436157226562, 250.0098114013672, 254.45526123046875, 258.90069580078125, 263.3461608886719, 267.7915954589844, 272.237060546875, 276.6824951171875]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 1.0, 7.0, 13.0, 12.0, 12.0, 15.0, 15.0, 28.0, 23.0, 26.0, 18.0, 27.0, 25.0, 29.0, 32.0, 44.0, 32.0, 41.0, 36.0, 33.0, 29.0, 38.0, 43.0, 46.0, 41.0, 42.0, 34.0, 40.0, 21.0, 30.0, 24.0, 18.0, 15.0, 16.0, 16.0, 14.0, 13.0, 9.0, 6.0, 12.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.103717803955078, -18.5260066986084, -17.94829750061035, -17.370586395263672, -16.792877197265625, -16.215166091918945, -15.637455940246582, -15.059745788574219, -14.482034683227539, -13.904324531555176, -13.326614379882812, -12.748903274536133, -12.17119312286377, -11.593482971191406, -11.015772819519043, -10.43806266784668, -9.860352516174316, -9.282642364501953, -8.70493221282959, -8.127222061157227, -7.549510955810547, -6.971800804138184, -6.39409065246582, -5.816380023956299, -5.2386698722839355, -4.660959720611572, -4.083249092102051, -3.5055389404296875, -2.927828550338745, -2.3501181602478027, -1.7724080085754395, -1.194697380065918, -0.6169872283935547, -0.03927689790725708, 0.5384334325790405, 1.1161437034606934, 1.6938540935516357, 2.271564483642578, 2.8492746353149414, 3.426985263824463, 4.004695415496826, 4.5824055671691895, 5.160116195678711, 5.737826347351074, 6.3155364990234375, 6.893247127532959, 7.470957279205322, 8.048667907714844, 8.626378059387207, 9.20408821105957, 9.781798362731934, 10.359508514404297, 10.937219619750977, 11.51492977142334, 12.092639923095703, 12.670351028442383, 13.24806022644043, 13.825770378112793, 14.403480529785156, 14.981191635131836, 15.5589017868042, 16.136611938476562, 16.71432113647461, 17.29203224182129, 17.86974334716797]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 4.0, 11.0, 11.0, 9.0, 9.0, 10.0, 22.0, 18.0, 19.0, 20.0, 31.0, 38.0, 39.0, 35.0, 27.0, 39.0, 53.0, 37.0, 43.0, 53.0, 43.0, 29.0, 34.0, 37.0, 32.0, 32.0, 24.0, 28.0, 26.0, 29.0, 21.0, 18.0, 15.0, 14.0, 20.0, 10.0, 4.0, 7.0, 8.0, 12.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6748046875, -1.62152099609375, -1.5682373046875, -1.51495361328125, -1.461669921875, -1.40838623046875, -1.3551025390625, -1.30181884765625, -1.24853515625, -1.19525146484375, -1.1419677734375, -1.08868408203125, -1.035400390625, -0.98211669921875, -0.9288330078125, -0.87554931640625, -0.822265625, -0.76898193359375, -0.7156982421875, -0.66241455078125, -0.609130859375, -0.55584716796875, -0.5025634765625, -0.44927978515625, -0.39599609375, -0.34271240234375, -0.2894287109375, -0.23614501953125, -0.182861328125, -0.12957763671875, -0.0762939453125, -0.02301025390625, 0.0302734375, 0.08355712890625, 0.1368408203125, 0.19012451171875, 0.243408203125, 0.29669189453125, 0.3499755859375, 0.40325927734375, 0.45654296875, 0.50982666015625, 0.5631103515625, 0.61639404296875, 0.669677734375, 0.72296142578125, 0.7762451171875, 0.82952880859375, 0.8828125, 0.93609619140625, 0.9893798828125, 1.04266357421875, 1.095947265625, 1.14923095703125, 1.2025146484375, 1.25579833984375, 1.30908203125, 1.36236572265625, 1.4156494140625, 1.46893310546875, 1.522216796875, 1.57550048828125, 1.6287841796875, 1.68206787109375, 1.7353515625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 11.0, 9.0, 11.0, 22.0, 18.0, 35.0, 31.0, 49.0, 59.0, 96.0, 167.0, 240.0, 499.0, 1134.0, 2633.0, 7033.0, 19853.0, 63388.0, 247680.0, 1133952.0, 1944931.0, 585013.0, 130007.0, 37168.0, 12076.0, 4572.0, 1820.0, 802.0, 339.0, 186.0, 132.0, 76.0, 64.0, 35.0, 23.0, 23.0, 17.0, 11.0, 16.0, 16.0, 9.0, 5.0, 7.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.423828125, -3.314361572265625, -3.20489501953125, -3.095428466796875, -2.9859619140625, -2.876495361328125, -2.76702880859375, -2.657562255859375, -2.548095703125, -2.438629150390625, -2.32916259765625, -2.219696044921875, -2.1102294921875, -2.000762939453125, -1.89129638671875, -1.781829833984375, -1.67236328125, -1.562896728515625, -1.45343017578125, -1.343963623046875, -1.2344970703125, -1.125030517578125, -1.01556396484375, -0.906097412109375, -0.796630859375, -0.687164306640625, -0.57769775390625, -0.468231201171875, -0.3587646484375, -0.249298095703125, -0.13983154296875, -0.030364990234375, 0.0791015625, 0.188568115234375, 0.29803466796875, 0.407501220703125, 0.5169677734375, 0.626434326171875, 0.73590087890625, 0.845367431640625, 0.954833984375, 1.064300537109375, 1.17376708984375, 1.283233642578125, 1.3927001953125, 1.502166748046875, 1.61163330078125, 1.721099853515625, 1.83056640625, 1.940032958984375, 2.04949951171875, 2.158966064453125, 2.2684326171875, 2.377899169921875, 2.48736572265625, 2.596832275390625, 2.706298828125, 2.815765380859375, 2.92523193359375, 3.034698486328125, 3.1441650390625, 3.253631591796875, 3.36309814453125, 3.472564697265625, 3.58203125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 18.0, 29.0, 38.0, 45.0, 65.0, 77.0, 141.0, 181.0, 253.0, 324.0, 416.0, 511.0, 470.0, 429.0, 256.0, 200.0, 162.0, 122.0, 79.0, 60.0, 40.0, 36.0, 24.0, 17.0, 11.0, 14.0, 9.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-6.65234375, -6.48492431640625, -6.3175048828125, -6.15008544921875, -5.982666015625, -5.81524658203125, -5.6478271484375, -5.48040771484375, -5.31298828125, -5.14556884765625, -4.9781494140625, -4.81072998046875, -4.643310546875, -4.47589111328125, -4.3084716796875, -4.14105224609375, -3.9736328125, -3.80621337890625, -3.6387939453125, -3.47137451171875, -3.303955078125, -3.13653564453125, -2.9691162109375, -2.80169677734375, -2.63427734375, -2.46685791015625, -2.2994384765625, -2.13201904296875, -1.964599609375, -1.79718017578125, -1.6297607421875, -1.46234130859375, -1.294921875, -1.12750244140625, -0.9600830078125, -0.79266357421875, -0.625244140625, -0.45782470703125, -0.2904052734375, -0.12298583984375, 0.04443359375, 0.21185302734375, 0.3792724609375, 0.54669189453125, 0.714111328125, 0.88153076171875, 1.0489501953125, 1.21636962890625, 1.3837890625, 1.55120849609375, 1.7186279296875, 1.88604736328125, 2.053466796875, 2.22088623046875, 2.3883056640625, 2.55572509765625, 2.72314453125, 2.89056396484375, 3.0579833984375, 3.22540283203125, 3.392822265625, 3.56024169921875, 3.7276611328125, 3.89508056640625, 4.0625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 10.0, 4.0, 8.0, 8.0, 7.0, 25.0, 23.0, 49.0, 64.0, 115.0, 207.0, 395.0, 839.0, 2137.0, 7411.0, 42477.0, 380073.0, 2781556.0, 872970.0, 88034.0, 12460.0, 3186.0, 1033.0, 535.0, 275.0, 146.0, 65.0, 58.0, 37.0, 21.0, 15.0, 12.0, 10.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.6624755859375, -7.364013671875, -7.0655517578125, -6.76708984375, -6.4686279296875, -6.170166015625, -5.8717041015625, -5.5732421875, -5.2747802734375, -4.976318359375, -4.6778564453125, -4.37939453125, -4.0809326171875, -3.782470703125, -3.4840087890625, -3.185546875, -2.8870849609375, -2.588623046875, -2.2901611328125, -1.99169921875, -1.6932373046875, -1.394775390625, -1.0963134765625, -0.7978515625, -0.4993896484375, -0.200927734375, 0.0975341796875, 0.39599609375, 0.6944580078125, 0.992919921875, 1.2913818359375, 1.58984375, 1.8883056640625, 2.186767578125, 2.4852294921875, 2.78369140625, 3.0821533203125, 3.380615234375, 3.6790771484375, 3.9775390625, 4.2760009765625, 4.574462890625, 4.8729248046875, 5.17138671875, 5.4698486328125, 5.768310546875, 6.0667724609375, 6.365234375, 6.6636962890625, 6.962158203125, 7.2606201171875, 7.55908203125, 7.8575439453125, 8.156005859375, 8.4544677734375, 8.7529296875, 9.0513916015625, 9.349853515625, 9.6483154296875, 9.94677734375, 10.2452392578125, 10.543701171875, 10.8421630859375, 11.140625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 15.0, 71.0, 164.0, 242.0, 253.0, 170.0, 58.0, 23.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.94883728027344, -73.07416534423828, -71.19949340820312, -69.3248291015625, -67.45015716552734, -65.57548522949219, -63.70081329345703, -61.82614517211914, -59.95147705078125, -58.076805114746094, -56.2021369934082, -54.32746505737305, -52.452796936035156, -50.578125, -48.703453063964844, -46.82878494262695, -44.9541130065918, -43.07944107055664, -41.20477294921875, -39.330101013183594, -37.4554328918457, -35.58076095581055, -33.706092834472656, -31.8314208984375, -29.956750869750977, -28.082080841064453, -26.20741081237793, -24.332740783691406, -22.45806884765625, -20.58340072631836, -18.708728790283203, -16.83405876159668, -14.959388732910156, -13.084718704223633, -11.21004867553711, -9.33537769317627, -7.460707664489746, -5.586037635803223, -3.711366653442383, -1.8366966247558594, 0.03797340393066406, 1.9126436710357666, 3.787313938140869, 5.661984443664551, 7.536654472351074, 9.411324501037598, 11.285995483398438, 13.160665512084961, 15.035335540771484, 16.910005569458008, 18.78467559814453, 20.659347534179688, 22.534015655517578, 24.408687591552734, 26.283357620239258, 28.15802764892578, 30.032697677612305, 31.907367706298828, 33.782039642333984, 35.656707763671875, 37.53137969970703, 39.40604782104492, 41.28071975708008, 43.15538787841797, 45.030059814453125]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 6.0, 10.0, 11.0, 13.0, 12.0, 17.0, 21.0, 20.0, 22.0, 17.0, 24.0, 26.0, 23.0, 30.0, 32.0, 38.0, 34.0, 35.0, 43.0, 33.0, 39.0, 26.0, 38.0, 48.0, 39.0, 34.0, 34.0, 18.0, 29.0, 20.0, 25.0, 23.0, 20.0, 18.0, 17.0, 16.0, 11.0, 9.0, 7.0, 9.0, 6.0, 9.0, 5.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-15.537351608276367, -15.064696311950684, -14.592041015625, -14.119385719299316, -13.646730422973633, -13.17407512664795, -12.701419830322266, -12.228764533996582, -11.756109237670898, -11.283453941345215, -10.810798645019531, -10.338143348693848, -9.865488052368164, -9.39283275604248, -8.920177459716797, -8.447522163391113, -7.9748663902282715, -7.502211093902588, -7.029555797576904, -6.556900501251221, -6.084245204925537, -5.611589431762695, -5.138934135437012, -4.666278839111328, -4.1936235427856445, -3.720968246459961, -3.2483129501342773, -2.7756576538085938, -2.30300235748291, -1.8303468227386475, -1.3576915264129639, -0.8850362300872803, -0.4123811721801758, 0.0602741539478302, 0.5329294800758362, 1.0055848360061646, 1.4782401323318481, 1.9508955478668213, 2.423550844192505, 2.8962061405181885, 3.368861436843872, 3.8415167331695557, 4.314172267913818, 4.786827564239502, 5.2594828605651855, 5.732138156890869, 6.204793453216553, 6.677448749542236, 7.15010404586792, 7.6227593421936035, 8.095415115356445, 8.568070411682129, 9.040725708007812, 9.513381004333496, 9.98603630065918, 10.458691596984863, 10.931346893310547, 11.40400218963623, 11.876657485961914, 12.349312782287598, 12.821968078613281, 13.294623374938965, 13.767278671264648, 14.239933967590332, 14.712589263916016]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 4.0, 11.0, 11.0, 14.0, 11.0, 13.0, 34.0, 21.0, 30.0, 26.0, 41.0, 42.0, 43.0, 28.0, 43.0, 37.0, 38.0, 36.0, 51.0, 36.0, 39.0, 41.0, 35.0, 33.0, 45.0, 30.0, 17.0, 23.0, 33.0, 17.0, 13.0, 17.0, 18.0, 12.0, 11.0, 6.0, 9.0, 6.0, 2.0, 8.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.755859375, -1.6979217529296875, -1.639984130859375, -1.5820465087890625, -1.52410888671875, -1.4661712646484375, -1.408233642578125, -1.3502960205078125, -1.2923583984375, -1.2344207763671875, -1.176483154296875, -1.1185455322265625, -1.06060791015625, -1.0026702880859375, -0.944732666015625, -0.8867950439453125, -0.828857421875, -0.7709197998046875, -0.712982177734375, -0.6550445556640625, -0.59710693359375, -0.5391693115234375, -0.481231689453125, -0.4232940673828125, -0.3653564453125, -0.3074188232421875, -0.249481201171875, -0.1915435791015625, -0.13360595703125, -0.0756683349609375, -0.017730712890625, 0.0402069091796875, 0.09814453125, 0.1560821533203125, 0.214019775390625, 0.2719573974609375, 0.32989501953125, 0.3878326416015625, 0.445770263671875, 0.5037078857421875, 0.5616455078125, 0.6195831298828125, 0.677520751953125, 0.7354583740234375, 0.79339599609375, 0.8513336181640625, 0.909271240234375, 0.9672088623046875, 1.025146484375, 1.0830841064453125, 1.141021728515625, 1.1989593505859375, 1.25689697265625, 1.3148345947265625, 1.372772216796875, 1.4307098388671875, 1.4886474609375, 1.5465850830078125, 1.604522705078125, 1.6624603271484375, 1.72039794921875, 1.7783355712890625, 1.836273193359375, 1.8942108154296875, 1.9521484375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 16.0, 23.0, 35.0, 58.0, 86.0, 102.0, 164.0, 268.0, 366.0, 553.0, 882.0, 1249.0, 2089.0, 3179.0, 4917.0, 7525.0, 12432.0, 19607.0, 32348.0, 54282.0, 89995.0, 148683.0, 210646.0, 176947.0, 110856.0, 66407.0, 39858.0, 24087.0, 14707.0, 9323.0, 5882.0, 3774.0, 2435.0, 1603.0, 1022.0, 702.0, 449.0, 296.0, 235.0, 159.0, 108.0, 61.0, 43.0, 21.0, 17.0, 13.0, 5.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.2025146484375, -0.19612693786621094, -0.18973922729492188, -0.1833515167236328, -0.17696380615234375, -0.1705760955810547, -0.16418838500976562, -0.15780067443847656, -0.1514129638671875, -0.14502525329589844, -0.13863754272460938, -0.1322498321533203, -0.12586212158203125, -0.11947441101074219, -0.11308670043945312, -0.10669898986816406, -0.100311279296875, -0.09392356872558594, -0.08753585815429688, -0.08114814758300781, -0.07476043701171875, -0.06837272644042969, -0.061985015869140625, -0.05559730529785156, -0.0492095947265625, -0.04282188415527344, -0.036434173583984375, -0.030046463012695312, -0.02365875244140625, -0.017271041870117188, -0.010883331298828125, -0.0044956207275390625, 0.00189208984375, 0.008279800415039062, 0.014667510986328125, 0.021055221557617188, 0.02744293212890625, 0.03383064270019531, 0.040218353271484375, 0.04660606384277344, 0.0529937744140625, 0.05938148498535156, 0.06576919555664062, 0.07215690612792969, 0.07854461669921875, 0.08493232727050781, 0.09132003784179688, 0.09770774841308594, 0.104095458984375, 0.11048316955566406, 0.11687088012695312, 0.12325859069824219, 0.12964630126953125, 0.1360340118408203, 0.14242172241210938, 0.14880943298339844, 0.1551971435546875, 0.16158485412597656, 0.16797256469726562, 0.1743602752685547, 0.18074798583984375, 0.1871356964111328, 0.19352340698242188, 0.19991111755371094, 0.206298828125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 8.0, 14.0, 16.0, 12.0, 11.0, 14.0, 13.0, 20.0, 27.0, 42.0, 30.0, 31.0, 33.0, 31.0, 42.0, 44.0, 53.0, 40.0, 1069.0, 47.0, 36.0, 40.0, 35.0, 38.0, 33.0, 38.0, 27.0, 31.0, 24.0, 15.0, 15.0, 13.0, 17.0, 10.0, 6.0, 12.0, 11.0, 2.0, 6.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.1416168212890625, -1.102569580078125, -1.0635223388671875, -1.02447509765625, -0.9854278564453125, -0.946380615234375, -0.9073333740234375, -0.8682861328125, -0.8292388916015625, -0.790191650390625, -0.7511444091796875, -0.71209716796875, -0.6730499267578125, -0.634002685546875, -0.5949554443359375, -0.555908203125, -0.5168609619140625, -0.477813720703125, -0.4387664794921875, -0.39971923828125, -0.3606719970703125, -0.321624755859375, -0.2825775146484375, -0.2435302734375, -0.2044830322265625, -0.165435791015625, -0.1263885498046875, -0.08734130859375, -0.0482940673828125, -0.009246826171875, 0.0298004150390625, 0.06884765625, 0.1078948974609375, 0.146942138671875, 0.1859893798828125, 0.22503662109375, 0.2640838623046875, 0.303131103515625, 0.3421783447265625, 0.3812255859375, 0.4202728271484375, 0.459320068359375, 0.4983673095703125, 0.53741455078125, 0.5764617919921875, 0.615509033203125, 0.6545562744140625, 0.693603515625, 0.7326507568359375, 0.771697998046875, 0.8107452392578125, 0.84979248046875, 0.8888397216796875, 0.927886962890625, 0.9669342041015625, 1.0059814453125, 1.0450286865234375, 1.084075927734375, 1.1231231689453125, 1.16217041015625, 1.2012176513671875, 1.240264892578125, 1.2793121337890625, 1.318359375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 11.0, 17.0, 28.0, 43.0, 57.0, 83.0, 119.0, 184.0, 272.0, 398.0, 607.0, 920.0, 1265.0, 1869.0, 2821.0, 4241.0, 6363.0, 9747.0, 15049.0, 22926.0, 35009.0, 52963.0, 79526.0, 116782.0, 254557.0, 1109481.0, 125632.0, 86726.0, 58078.0, 38105.0, 25320.0, 16298.0, 10636.0, 6959.0, 4691.0, 3010.0, 2050.0, 1349.0, 924.0, 617.0, 426.0, 312.0, 242.0, 136.0, 95.0, 63.0, 40.0, 24.0, 22.0, 10.0, 5.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.1190185546875, -0.11519241333007812, -0.11136627197265625, -0.10754013061523438, -0.1037139892578125, -0.09988784790039062, -0.09606170654296875, -0.09223556518554688, -0.088409423828125, -0.08458328247070312, -0.08075714111328125, -0.07693099975585938, -0.0731048583984375, -0.06927871704101562, -0.06545257568359375, -0.061626434326171875, -0.05780029296875, -0.053974151611328125, -0.05014801025390625, -0.046321868896484375, -0.0424957275390625, -0.038669586181640625, -0.03484344482421875, -0.031017303466796875, -0.027191162109375, -0.023365020751953125, -0.01953887939453125, -0.015712738037109375, -0.0118865966796875, -0.008060455322265625, -0.00423431396484375, -0.000408172607421875, 0.00341796875, 0.007244110107421875, 0.01107025146484375, 0.014896392822265625, 0.0187225341796875, 0.022548675537109375, 0.02637481689453125, 0.030200958251953125, 0.034027099609375, 0.037853240966796875, 0.04167938232421875, 0.045505523681640625, 0.0493316650390625, 0.053157806396484375, 0.05698394775390625, 0.060810089111328125, 0.06463623046875, 0.06846237182617188, 0.07228851318359375, 0.07611465454101562, 0.0799407958984375, 0.08376693725585938, 0.08759307861328125, 0.09141921997070312, 0.095245361328125, 0.09907150268554688, 0.10289764404296875, 0.10672378540039062, 0.1105499267578125, 0.11437606811523438, 0.11820220947265625, 0.12202835083007812, 0.1258544921875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 7.0, 9.0, 6.0, 7.0, 20.0, 14.0, 21.0, 30.0, 30.0, 64.0, 114.0, 184.0, 163.0, 109.0, 48.0, 36.0, 34.0, 25.0, 20.0, 12.0, 12.0, 8.0, 11.0, 3.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0039215087890625, -0.0037575960159301758, -0.0035936832427978516, -0.0034297704696655273, -0.003265857696533203, -0.003101944923400879, -0.0029380321502685547, -0.0027741193771362305, -0.0026102066040039062, -0.002446293830871582, -0.002282381057739258, -0.0021184682846069336, -0.0019545555114746094, -0.0017906427383422852, -0.001626729965209961, -0.0014628171920776367, -0.0012989044189453125, -0.0011349916458129883, -0.0009710788726806641, -0.0008071660995483398, -0.0006432533264160156, -0.0004793405532836914, -0.0003154277801513672, -0.00015151500701904297, 1.239776611328125e-05, 0.00017631053924560547, 0.0003402233123779297, 0.0005041360855102539, 0.0006680488586425781, 0.0008319616317749023, 0.0009958744049072266, 0.0011597871780395508, 0.001323699951171875, 0.0014876127243041992, 0.0016515254974365234, 0.0018154382705688477, 0.001979351043701172, 0.002143263816833496, 0.0023071765899658203, 0.0024710893630981445, 0.0026350021362304688, 0.002798914909362793, 0.002962827682495117, 0.0031267404556274414, 0.0032906532287597656, 0.00345456600189209, 0.003618478775024414, 0.0037823915481567383, 0.0039463043212890625, 0.004110217094421387, 0.004274129867553711, 0.004438042640686035, 0.004601955413818359, 0.004765868186950684, 0.004929780960083008, 0.005093693733215332, 0.005257606506347656, 0.0054215192794799805, 0.005585432052612305, 0.005749344825744629, 0.005913257598876953, 0.006077170372009277, 0.0062410831451416016, 0.006404995918273926, 0.00656890869140625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 7.0, 7.0, 14.0, 17.0, 30.0, 33.0, 53.0, 63.0, 107.0, 128.0, 375.0, 2933.0, 889838.0, 152725.0, 1542.0, 260.0, 133.0, 83.0, 50.0, 36.0, 38.0, 21.0, 15.0, 13.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.1016845703125, -0.0989999771118164, -0.09631538391113281, -0.09363079071044922, -0.09094619750976562, -0.08826160430908203, -0.08557701110839844, -0.08289241790771484, -0.08020782470703125, -0.07752323150634766, -0.07483863830566406, -0.07215404510498047, -0.06946945190429688, -0.06678485870361328, -0.06410026550292969, -0.061415672302246094, -0.0587310791015625, -0.056046485900878906, -0.05336189270019531, -0.05067729949951172, -0.047992706298828125, -0.04530811309814453, -0.04262351989746094, -0.039938926696777344, -0.03725433349609375, -0.034569740295410156, -0.03188514709472656, -0.02920055389404297, -0.026515960693359375, -0.02383136749267578, -0.021146774291992188, -0.018462181091308594, -0.015777587890625, -0.013092994689941406, -0.010408401489257812, -0.007723808288574219, -0.005039215087890625, -0.0023546218872070312, 0.0003299713134765625, 0.0030145645141601562, 0.00569915771484375, 0.008383750915527344, 0.011068344116210938, 0.013752937316894531, 0.016437530517578125, 0.01912212371826172, 0.021806716918945312, 0.024491310119628906, 0.0271759033203125, 0.029860496520996094, 0.03254508972167969, 0.03522968292236328, 0.037914276123046875, 0.04059886932373047, 0.04328346252441406, 0.045968055725097656, 0.04865264892578125, 0.051337242126464844, 0.05402183532714844, 0.05670642852783203, 0.059391021728515625, 0.06207561492919922, 0.06476020812988281, 0.0674448013305664, 0.07012939453125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 16.0, 107.0, 571.0, 253.0, 54.0, 18.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004443892743438482, -0.0038606177549809217, -0.003277342766523361, -0.0026940680108964443, -0.0021107930224388838, -0.0015275180339813232, -0.0009442432783544064, -0.00036096805706620216, 0.00022230669856071472, 0.0008055816288106143, 0.001388856559060514, 0.0019721314311027527, 0.0025554064195603132, 0.0031386814080178738, 0.0037219561636447906, 0.004305231384932995, 0.004888506140559912, 0.005471780896186829, 0.006055056117475033, 0.00663833087310195, 0.007221605628728867, 0.007804880850017071, 0.008388156071305275, 0.008971430361270905, 0.009554705582559109, 0.010137980803847313, 0.010721255093812943, 0.011304530315101147, 0.011887805536389351, 0.01247107982635498, 0.013054355047643185, 0.013637630268931389, 0.014220906421542168, 0.014804181642830372, 0.015387455932796001, 0.015970731154084206, 0.016554005444049835, 0.017137281596660614, 0.017720555886626244, 0.018303830176591873, 0.018887106329202652, 0.01947038061916828, 0.02005365677177906, 0.02063693106174469, 0.02122020535171032, 0.0218034815043211, 0.022386755794286728, 0.022970031946897507, 0.023553304374217987, 0.024136578664183617, 0.024719854816794395, 0.025303129106760025, 0.025886403396725655, 0.026469679549336433, 0.027052953839302063, 0.027636229991912842, 0.02821950428187847, 0.0288027785718441, 0.02938605472445488, 0.02996932901442051, 0.03055260330438614, 0.031135879456996918, 0.0317191556096077, 0.03230242803692818, 0.032885704189538956]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 3.0, 6.0, 8.0, 6.0, 12.0, 13.0, 13.0, 18.0, 20.0, 24.0, 25.0, 37.0, 50.0, 39.0, 32.0, 32.0, 40.0, 36.0, 41.0, 41.0, 32.0, 49.0, 35.0, 43.0, 32.0, 38.0, 32.0, 34.0, 25.0, 26.0, 20.0, 21.0, 20.0, 11.0, 9.0, 11.0, 9.0, 9.0, 3.0, 8.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0018526911735534668, -0.0017955005168914795, -0.0017383098602294922, -0.0016811192035675049, -0.0016239285469055176, -0.0015667378902435303, -0.001509547233581543, -0.0014523565769195557, -0.0013951659202575684, -0.001337975263595581, -0.0012807846069335938, -0.0012235939502716064, -0.0011664032936096191, -0.0011092126369476318, -0.0010520219802856445, -0.0009948313236236572, -0.0009376406669616699, -0.0008804500102996826, -0.0008232593536376953, -0.000766068696975708, -0.0007088780403137207, -0.0006516873836517334, -0.0005944967269897461, -0.0005373060703277588, -0.0004801154136657715, -0.0004229247570037842, -0.0003657341003417969, -0.00030854344367980957, -0.00025135278701782227, -0.00019416213035583496, -0.00013697147369384766, -7.978081703186035e-05, -2.2590160369873047e-05, 3.460049629211426e-05, 9.179115295410156e-05, 0.00014898180961608887, 0.00020617246627807617, 0.0002633631229400635, 0.0003205537796020508, 0.0003777444362640381, 0.0004349350929260254, 0.0004921257495880127, 0.00054931640625, 0.0006065070629119873, 0.0006636977195739746, 0.0007208883762359619, 0.0007780790328979492, 0.0008352696895599365, 0.0008924603462219238, 0.0009496510028839111, 0.0010068416595458984, 0.0010640323162078857, 0.001121222972869873, 0.0011784136295318604, 0.0012356042861938477, 0.001292794942855835, 0.0013499855995178223, 0.0014071762561798096, 0.0014643669128417969, 0.0015215575695037842, 0.0015787482261657715, 0.0016359388828277588, 0.001693129539489746, 0.0017503201961517334, 0.0018075108528137207]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 4.0, 11.0, 11.0, 14.0, 11.0, 13.0, 34.0, 21.0, 30.0, 27.0, 40.0, 42.0, 43.0, 28.0, 43.0, 37.0, 38.0, 36.0, 51.0, 36.0, 39.0, 41.0, 35.0, 33.0, 45.0, 30.0, 17.0, 23.0, 33.0, 17.0, 13.0, 17.0, 18.0, 12.0, 11.0, 6.0, 9.0, 6.0, 2.0, 8.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.755859375, -1.6979217529296875, -1.639984130859375, -1.5820465087890625, -1.52410888671875, -1.4661712646484375, -1.408233642578125, -1.3502960205078125, -1.2923583984375, -1.2344207763671875, -1.176483154296875, -1.1185455322265625, -1.06060791015625, -1.0026702880859375, -0.944732666015625, -0.8867950439453125, -0.828857421875, -0.7709197998046875, -0.712982177734375, -0.6550445556640625, -0.59710693359375, -0.5391693115234375, -0.481231689453125, -0.4232940673828125, -0.3653564453125, -0.3074188232421875, -0.249481201171875, -0.1915435791015625, -0.13360595703125, -0.0756683349609375, -0.017730712890625, 0.0402069091796875, 0.09814453125, 0.1560821533203125, 0.214019775390625, 0.2719573974609375, 0.32989501953125, 0.3878326416015625, 0.445770263671875, 0.5037078857421875, 0.5616455078125, 0.6195831298828125, 0.677520751953125, 0.7354583740234375, 0.79339599609375, 0.8513336181640625, 0.909271240234375, 0.9672088623046875, 1.025146484375, 1.0830841064453125, 1.141021728515625, 1.1989593505859375, 1.25689697265625, 1.3148345947265625, 1.372772216796875, 1.4307098388671875, 1.4886474609375, 1.5465850830078125, 1.604522705078125, 1.6624603271484375, 1.72039794921875, 1.7783355712890625, 1.836273193359375, 1.8942108154296875, 1.9521484375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 10.0, 10.0, 11.0, 24.0, 38.0, 41.0, 65.0, 112.0, 173.0, 313.0, 546.0, 896.0, 1563.0, 2795.0, 5105.0, 9623.0, 18285.0, 35355.0, 67475.0, 126055.0, 207198.0, 233113.0, 156432.0, 86900.0, 45411.0, 23828.0, 12432.0, 6618.0, 3505.0, 1958.0, 1120.0, 591.0, 339.0, 226.0, 136.0, 78.0, 56.0, 26.0, 20.0, 19.0, 18.0, 9.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3154296875, -1.2718658447265625, -1.228302001953125, -1.1847381591796875, -1.14117431640625, -1.0976104736328125, -1.054046630859375, -1.0104827880859375, -0.9669189453125, -0.9233551025390625, -0.879791259765625, -0.8362274169921875, -0.79266357421875, -0.7490997314453125, -0.705535888671875, -0.6619720458984375, -0.618408203125, -0.5748443603515625, -0.531280517578125, -0.4877166748046875, -0.44415283203125, -0.4005889892578125, -0.357025146484375, -0.3134613037109375, -0.2698974609375, -0.2263336181640625, -0.182769775390625, -0.1392059326171875, -0.09564208984375, -0.0520782470703125, -0.008514404296875, 0.0350494384765625, 0.07861328125, 0.1221771240234375, 0.165740966796875, 0.2093048095703125, 0.25286865234375, 0.2964324951171875, 0.339996337890625, 0.3835601806640625, 0.4271240234375, 0.4706878662109375, 0.514251708984375, 0.5578155517578125, 0.60137939453125, 0.6449432373046875, 0.688507080078125, 0.7320709228515625, 0.775634765625, 0.8191986083984375, 0.862762451171875, 0.9063262939453125, 0.94989013671875, 0.9934539794921875, 1.037017822265625, 1.0805816650390625, 1.1241455078125, 1.1677093505859375, 1.211273193359375, 1.2548370361328125, 1.29840087890625, 1.3419647216796875, 1.385528564453125, 1.4290924072265625, 1.47265625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 6.0, 10.0, 8.0, 19.0, 16.0, 26.0, 27.0, 27.0, 30.0, 39.0, 49.0, 44.0, 50.0, 92.0, 128.0, 299.0, 1399.0, 223.0, 108.0, 74.0, 55.0, 37.0, 42.0, 24.0, 29.0, 21.0, 29.0, 26.0, 22.0, 7.0, 11.0, 20.0, 15.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.93359375, -6.71893310546875, -6.5042724609375, -6.28961181640625, -6.074951171875, -5.86029052734375, -5.6456298828125, -5.43096923828125, -5.21630859375, -5.00164794921875, -4.7869873046875, -4.57232666015625, -4.357666015625, -4.14300537109375, -3.9283447265625, -3.71368408203125, -3.4990234375, -3.28436279296875, -3.0697021484375, -2.85504150390625, -2.640380859375, -2.42572021484375, -2.2110595703125, -1.99639892578125, -1.78173828125, -1.56707763671875, -1.3524169921875, -1.13775634765625, -0.923095703125, -0.70843505859375, -0.4937744140625, -0.27911376953125, -0.064453125, 0.15020751953125, 0.3648681640625, 0.57952880859375, 0.794189453125, 1.00885009765625, 1.2235107421875, 1.43817138671875, 1.65283203125, 1.86749267578125, 2.0821533203125, 2.29681396484375, 2.511474609375, 2.72613525390625, 2.9407958984375, 3.15545654296875, 3.3701171875, 3.58477783203125, 3.7994384765625, 4.01409912109375, 4.228759765625, 4.44342041015625, 4.6580810546875, 4.87274169921875, 5.08740234375, 5.30206298828125, 5.5167236328125, 5.73138427734375, 5.946044921875, 6.16070556640625, 6.3753662109375, 6.59002685546875, 6.8046875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 4.0, 17.0, 18.0, 32.0, 36.0, 44.0, 95.0, 150.0, 261.0, 696.0, 4027.0, 588031.0, 2543439.0, 7167.0, 898.0, 338.0, 155.0, 87.0, 65.0, 54.0, 21.0, 21.0, 14.0, 9.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.567626953125, -19.01025390625, -18.452880859375, -17.8955078125, -17.338134765625, -16.78076171875, -16.223388671875, -15.666015625, -15.108642578125, -14.55126953125, -13.993896484375, -13.4365234375, -12.879150390625, -12.32177734375, -11.764404296875, -11.20703125, -10.649658203125, -10.09228515625, -9.534912109375, -8.9775390625, -8.420166015625, -7.86279296875, -7.305419921875, -6.748046875, -6.190673828125, -5.63330078125, -5.075927734375, -4.5185546875, -3.961181640625, -3.40380859375, -2.846435546875, -2.2890625, -1.731689453125, -1.17431640625, -0.616943359375, -0.0595703125, 0.497802734375, 1.05517578125, 1.612548828125, 2.169921875, 2.727294921875, 3.28466796875, 3.842041015625, 4.3994140625, 4.956787109375, 5.51416015625, 6.071533203125, 6.62890625, 7.186279296875, 7.74365234375, 8.301025390625, 8.8583984375, 9.415771484375, 9.97314453125, 10.530517578125, 11.087890625, 11.645263671875, 12.20263671875, 12.760009765625, 13.3173828125, 13.874755859375, 14.43212890625, 14.989501953125, 15.546875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 25.0, 99.0, 228.0, 332.0, 221.0, 84.0, 15.0, 4.0], "bins": [-56.3259162902832, -55.37737274169922, -54.42882537841797, -53.48027801513672, -52.531734466552734, -51.58319091796875, -50.6346435546875, -49.68609619140625, -48.737552642822266, -47.78900909423828, -46.84046173095703, -45.89191436767578, -44.9433708190918, -43.99482727050781, -43.04627990722656, -42.09773254394531, -41.14918899536133, -40.200645446777344, -39.252098083496094, -38.303550720214844, -37.35500717163086, -36.406463623046875, -35.457916259765625, -34.509368896484375, -33.56082534790039, -32.612281799316406, -31.663734436035156, -30.71518898010254, -29.766643524169922, -28.818098068237305, -27.869552612304688, -26.92100715637207, -25.972461700439453, -25.023916244506836, -24.07537078857422, -23.1268253326416, -22.178279876708984, -21.229734420776367, -20.28118896484375, -19.332643508911133, -18.384098052978516, -17.4355525970459, -16.48700714111328, -15.538461685180664, -14.589916229248047, -13.64137077331543, -12.692825317382812, -11.744279861450195, -10.795734405517578, -9.847188949584961, -8.898643493652344, -7.950098037719727, -7.001552581787109, -6.053007125854492, -5.104461669921875, -4.155916213989258, -3.2073707580566406, -2.2588253021240234, -1.3102798461914062, -0.36173439025878906, 0.5868110656738281, 1.5353565216064453, 2.4839019775390625, 3.4324474334716797, 4.380992889404297]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 6.0, 15.0, 13.0, 9.0, 9.0, 15.0, 21.0, 16.0, 19.0, 22.0, 27.0, 30.0, 37.0, 40.0, 35.0, 38.0, 43.0, 53.0, 37.0, 36.0, 32.0, 44.0, 33.0, 41.0, 30.0, 21.0, 30.0, 34.0, 34.0, 27.0, 16.0, 19.0, 17.0, 15.0, 13.0, 9.0, 14.0, 4.0, 5.0, 8.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-21.65929412841797, -21.034812927246094, -20.41033363342285, -19.785852432250977, -19.161373138427734, -18.53689193725586, -17.912410736083984, -17.28792953491211, -16.663450241088867, -16.038969039916992, -15.41448974609375, -14.790008544921875, -14.165528297424316, -13.541048049926758, -12.916566848754883, -12.292086601257324, -11.667606353759766, -11.043126106262207, -10.418645858764648, -9.794164657592773, -9.169684410095215, -8.545204162597656, -7.9207234382629395, -7.296242713928223, -6.671762466430664, -6.0472822189331055, -5.422801494598389, -4.798320770263672, -4.173840522766113, -3.5493600368499756, -2.924879550933838, -2.300398826599121, -1.6759204864501953, -1.0514400005340576, -0.4269595146179199, 0.19752097129821777, 0.8220014572143555, 1.4464819431304932, 2.070962429046631, 2.6954431533813477, 3.3199234008789062, 3.944403886795044, 4.568884372711182, 5.193365097045898, 5.817845344543457, 6.442325592041016, 7.066806316375732, 7.691287040710449, 8.315767288208008, 8.940247535705566, 9.564727783203125, 10.189208984375, 10.813689231872559, 11.438169479370117, 12.062650680541992, 12.68713092803955, 13.31161117553711, 13.936091423034668, 14.560571670532227, 15.185052871704102, 15.80953311920166, 16.43401336669922, 17.058494567871094, 17.68297576904297, 18.30745506286621]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 5.0, 7.0, 17.0, 18.0, 14.0, 26.0, 30.0, 23.0, 42.0, 33.0, 36.0, 53.0, 43.0, 29.0, 45.0, 40.0, 41.0, 34.0, 51.0, 46.0, 27.0, 47.0, 36.0, 38.0, 26.0, 21.0, 19.0, 24.0, 26.0, 16.0, 19.0, 9.0, 10.0, 4.0, 11.0, 7.0, 3.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.865234375, -1.800689697265625, -1.73614501953125, -1.671600341796875, -1.6070556640625, -1.542510986328125, -1.47796630859375, -1.413421630859375, -1.348876953125, -1.284332275390625, -1.21978759765625, -1.155242919921875, -1.0906982421875, -1.026153564453125, -0.96160888671875, -0.897064208984375, -0.83251953125, -0.767974853515625, -0.70343017578125, -0.638885498046875, -0.5743408203125, -0.509796142578125, -0.44525146484375, -0.380706787109375, -0.316162109375, -0.251617431640625, -0.18707275390625, -0.122528076171875, -0.0579833984375, 0.006561279296875, 0.07110595703125, 0.135650634765625, 0.2001953125, 0.264739990234375, 0.32928466796875, 0.393829345703125, 0.4583740234375, 0.522918701171875, 0.58746337890625, 0.652008056640625, 0.716552734375, 0.781097412109375, 0.84564208984375, 0.910186767578125, 0.9747314453125, 1.039276123046875, 1.10382080078125, 1.168365478515625, 1.23291015625, 1.297454833984375, 1.36199951171875, 1.426544189453125, 1.4910888671875, 1.555633544921875, 1.62017822265625, 1.684722900390625, 1.749267578125, 1.813812255859375, 1.87835693359375, 1.942901611328125, 2.0074462890625, 2.071990966796875, 2.13653564453125, 2.201080322265625, 2.265625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 5.0, 7.0, 12.0, 7.0, 16.0, 14.0, 20.0, 32.0, 43.0, 61.0, 100.0, 174.0, 271.0, 616.0, 1485.0, 4632.0, 15957.0, 66123.0, 337695.0, 1714791.0, 1660259.0, 308070.0, 61061.0, 15323.0, 4550.0, 1506.0, 609.0, 325.0, 185.0, 89.0, 50.0, 48.0, 30.0, 27.0, 18.0, 18.0, 11.0, 9.0, 8.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.20703125, -4.07122802734375, -3.9354248046875, -3.79962158203125, -3.663818359375, -3.52801513671875, -3.3922119140625, -3.25640869140625, -3.12060546875, -2.98480224609375, -2.8489990234375, -2.71319580078125, -2.577392578125, -2.44158935546875, -2.3057861328125, -2.16998291015625, -2.0341796875, -1.89837646484375, -1.7625732421875, -1.62677001953125, -1.490966796875, -1.35516357421875, -1.2193603515625, -1.08355712890625, -0.94775390625, -0.81195068359375, -0.6761474609375, -0.54034423828125, -0.404541015625, -0.26873779296875, -0.1329345703125, 0.00286865234375, 0.138671875, 0.27447509765625, 0.4102783203125, 0.54608154296875, 0.681884765625, 0.81768798828125, 0.9534912109375, 1.08929443359375, 1.22509765625, 1.36090087890625, 1.4967041015625, 1.63250732421875, 1.768310546875, 1.90411376953125, 2.0399169921875, 2.17572021484375, 2.3115234375, 2.44732666015625, 2.5831298828125, 2.71893310546875, 2.854736328125, 2.99053955078125, 3.1263427734375, 3.26214599609375, 3.39794921875, 3.53375244140625, 3.6695556640625, 3.80535888671875, 3.941162109375, 4.07696533203125, 4.2127685546875, 4.34857177734375, 4.484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 8.0, 24.0, 27.0, 59.0, 82.0, 111.0, 164.0, 286.0, 444.0, 616.0, 730.0, 556.0, 368.0, 220.0, 128.0, 96.0, 58.0, 34.0, 23.0, 9.0, 5.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1796875, -9.92034912109375, -9.6610107421875, -9.40167236328125, -9.142333984375, -8.88299560546875, -8.6236572265625, -8.36431884765625, -8.10498046875, -7.84564208984375, -7.5863037109375, -7.32696533203125, -7.067626953125, -6.80828857421875, -6.5489501953125, -6.28961181640625, -6.0302734375, -5.77093505859375, -5.5115966796875, -5.25225830078125, -4.992919921875, -4.73358154296875, -4.4742431640625, -4.21490478515625, -3.95556640625, -3.69622802734375, -3.4368896484375, -3.17755126953125, -2.918212890625, -2.65887451171875, -2.3995361328125, -2.14019775390625, -1.880859375, -1.62152099609375, -1.3621826171875, -1.10284423828125, -0.843505859375, -0.58416748046875, -0.3248291015625, -0.06549072265625, 0.19384765625, 0.45318603515625, 0.7125244140625, 0.97186279296875, 1.231201171875, 1.49053955078125, 1.7498779296875, 2.00921630859375, 2.2685546875, 2.52789306640625, 2.7872314453125, 3.04656982421875, 3.305908203125, 3.56524658203125, 3.8245849609375, 4.08392333984375, 4.34326171875, 4.60260009765625, 4.8619384765625, 5.12127685546875, 5.380615234375, 5.63995361328125, 5.8992919921875, 6.15863037109375, 6.41796875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 12.0, 18.0, 33.0, 33.0, 71.0, 120.0, 237.0, 427.0, 835.0, 1914.0, 6828.0, 48712.0, 653972.0, 3051337.0, 390375.0, 31113.0, 5022.0, 1581.0, 716.0, 391.0, 218.0, 120.0, 73.0, 35.0, 24.0, 19.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.6607666015625, -8.305908203125, -7.9510498046875, -7.59619140625, -7.2413330078125, -6.886474609375, -6.5316162109375, -6.1767578125, -5.8218994140625, -5.467041015625, -5.1121826171875, -4.75732421875, -4.4024658203125, -4.047607421875, -3.6927490234375, -3.337890625, -2.9830322265625, -2.628173828125, -2.2733154296875, -1.91845703125, -1.5635986328125, -1.208740234375, -0.8538818359375, -0.4990234375, -0.1441650390625, 0.210693359375, 0.5655517578125, 0.92041015625, 1.2752685546875, 1.630126953125, 1.9849853515625, 2.33984375, 2.6947021484375, 3.049560546875, 3.4044189453125, 3.75927734375, 4.1141357421875, 4.468994140625, 4.8238525390625, 5.1787109375, 5.5335693359375, 5.888427734375, 6.2432861328125, 6.59814453125, 6.9530029296875, 7.307861328125, 7.6627197265625, 8.017578125, 8.3724365234375, 8.727294921875, 9.0821533203125, 9.43701171875, 9.7918701171875, 10.146728515625, 10.5015869140625, 10.8564453125, 11.2113037109375, 11.566162109375, 11.9210205078125, 12.27587890625, 12.6307373046875, 12.985595703125, 13.3404541015625, 13.6953125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 19.0, 66.0, 135.0, 253.0, 242.0, 161.0, 90.0, 29.0, 9.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.59773254394531, -42.5008659362793, -40.40399932861328, -38.30712890625, -36.210262298583984, -34.11339569091797, -32.01652526855469, -29.919658660888672, -27.822792053222656, -25.72592544555664, -23.629056930541992, -21.532188415527344, -19.435321807861328, -17.338455200195312, -15.241586685180664, -13.144719123840332, -11.0478515625, -8.950984001159668, -6.854116439819336, -4.757248878479004, -2.660381317138672, -0.5635137557983398, 1.5333538055419922, 3.630221366882324, 5.727088928222656, 7.823956489562988, 9.92082405090332, 12.017691612243652, 14.114559173583984, 16.21142578125, 18.30829429626465, 20.405162811279297, 22.502029418945312, 24.598896026611328, 26.695764541625977, 28.792633056640625, 30.88949966430664, 32.986366271972656, 35.08323669433594, 37.18010330200195, 39.27696990966797, 41.373836517333984, 43.470703125, 45.56757354736328, 47.6644401550293, 49.76130676269531, 51.858177185058594, 53.95504379272461, 56.051910400390625, 58.14877700805664, 60.245643615722656, 62.34251403808594, 64.43937683105469, 66.53624725341797, 68.63311767578125, 70.72998046875, 72.82685089111328, 74.92372131347656, 77.02058410644531, 79.1174545288086, 81.21432495117188, 83.31118774414062, 85.4080581665039, 87.50492095947266, 89.60179138183594]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 10.0, 7.0, 11.0, 11.0, 15.0, 12.0, 13.0, 12.0, 17.0, 24.0, 25.0, 32.0, 26.0, 33.0, 34.0, 43.0, 49.0, 46.0, 37.0, 46.0, 36.0, 36.0, 36.0, 36.0, 39.0, 40.0, 34.0, 29.0, 37.0, 26.0, 26.0, 24.0, 18.0, 16.0, 11.0, 9.0, 10.0, 9.0, 5.0, 9.0, 1.0, 0.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.118377685546875, -19.504465103149414, -18.890554428100586, -18.276641845703125, -17.662731170654297, -17.048818588256836, -16.434906005859375, -15.82099437713623, -15.207082748413086, -14.593171119689941, -13.979259490966797, -13.365346908569336, -12.751435279846191, -12.137523651123047, -11.523611068725586, -10.909699440002441, -10.295787811279297, -9.681876182556152, -9.067964553833008, -8.454051971435547, -7.840140342712402, -7.226228713989258, -6.612316608428955, -5.998404502868652, -5.384492874145508, -4.770581245422363, -4.1566691398620605, -3.542757272720337, -2.9288454055786133, -2.3149335384368896, -1.701021671295166, -1.0871095657348633, -0.47319793701171875, 0.14071393013000488, 0.7546257972717285, 1.3685376644134521, 1.9824495315551758, 2.5963613986968994, 3.210273265838623, 3.824185371398926, 4.43809700012207, 5.052008628845215, 5.665920734405518, 6.27983283996582, 6.893744468688965, 7.507656097412109, 8.12156867980957, 8.735480308532715, 9.34939193725586, 9.963303565979004, 10.577215194702148, 11.19112777709961, 11.805039405822754, 12.418951034545898, 13.03286361694336, 13.646775245666504, 14.260686874389648, 14.874598503112793, 15.488510131835938, 16.1024227142334, 16.71633529663086, 17.330245971679688, 17.94415855407715, 18.55807113647461, 19.171981811523438]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 3.0, 9.0, 5.0, 7.0, 8.0, 8.0, 18.0, 13.0, 22.0, 25.0, 28.0, 29.0, 25.0, 36.0, 28.0, 29.0, 37.0, 39.0, 27.0, 34.0, 46.0, 36.0, 36.0, 38.0, 37.0, 36.0, 36.0, 30.0, 27.0, 31.0, 35.0, 26.0, 24.0, 12.0, 19.0, 17.0, 16.0, 12.0, 12.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.6920318603515625, -1.633087158203125, -1.5741424560546875, -1.51519775390625, -1.4562530517578125, -1.397308349609375, -1.3383636474609375, -1.2794189453125, -1.2204742431640625, -1.161529541015625, -1.1025848388671875, -1.04364013671875, -0.9846954345703125, -0.925750732421875, -0.8668060302734375, -0.807861328125, -0.7489166259765625, -0.689971923828125, -0.6310272216796875, -0.57208251953125, -0.5131378173828125, -0.454193115234375, -0.3952484130859375, -0.3363037109375, -0.2773590087890625, -0.218414306640625, -0.1594696044921875, -0.10052490234375, -0.0415802001953125, 0.017364501953125, 0.0763092041015625, 0.13525390625, 0.1941986083984375, 0.253143310546875, 0.3120880126953125, 0.37103271484375, 0.4299774169921875, 0.488922119140625, 0.5478668212890625, 0.6068115234375, 0.6657562255859375, 0.724700927734375, 0.7836456298828125, 0.84259033203125, 0.9015350341796875, 0.960479736328125, 1.0194244384765625, 1.078369140625, 1.1373138427734375, 1.196258544921875, 1.2552032470703125, 1.31414794921875, 1.3730926513671875, 1.432037353515625, 1.4909820556640625, 1.5499267578125, 1.6088714599609375, 1.667816162109375, 1.7267608642578125, 1.78570556640625, 1.8446502685546875, 1.903594970703125, 1.9625396728515625, 2.021484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 25.0, 26.0, 48.0, 72.0, 80.0, 146.0, 197.0, 341.0, 553.0, 828.0, 1247.0, 1908.0, 2873.0, 4402.0, 7093.0, 10736.0, 17465.0, 28265.0, 46717.0, 77269.0, 127927.0, 195102.0, 195737.0, 127887.0, 77386.0, 47114.0, 28679.0, 17401.0, 10984.0, 7062.0, 4461.0, 2968.0, 1954.0, 1243.0, 823.0, 533.0, 325.0, 235.0, 168.0, 95.0, 66.0, 29.0, 18.0, 22.0, 13.0, 3.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.2462158203125, -0.2387561798095703, -0.23129653930664062, -0.22383689880371094, -0.21637725830078125, -0.20891761779785156, -0.20145797729492188, -0.1939983367919922, -0.1865386962890625, -0.1790790557861328, -0.17161941528320312, -0.16415977478027344, -0.15670013427734375, -0.14924049377441406, -0.14178085327148438, -0.1343212127685547, -0.126861572265625, -0.11940193176269531, -0.11194229125976562, -0.10448265075683594, -0.09702301025390625, -0.08956336975097656, -0.08210372924804688, -0.07464408874511719, -0.0671844482421875, -0.05972480773925781, -0.052265167236328125, -0.04480552673339844, -0.03734588623046875, -0.029886245727539062, -0.022426605224609375, -0.014966964721679688, -0.00750732421875, -4.76837158203125e-05, 0.007411956787109375, 0.014871597290039062, 0.02233123779296875, 0.029790878295898438, 0.037250518798828125, 0.04471015930175781, 0.0521697998046875, 0.05962944030761719, 0.06708908081054688, 0.07454872131347656, 0.08200836181640625, 0.08946800231933594, 0.09692764282226562, 0.10438728332519531, 0.111846923828125, 0.11930656433105469, 0.12676620483398438, 0.13422584533691406, 0.14168548583984375, 0.14914512634277344, 0.15660476684570312, 0.1640644073486328, 0.1715240478515625, 0.1789836883544922, 0.18644332885742188, 0.19390296936035156, 0.20136260986328125, 0.20882225036621094, 0.21628189086914062, 0.2237415313720703, 0.231201171875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 9.0, 10.0, 7.0, 12.0, 8.0, 17.0, 13.0, 17.0, 18.0, 17.0, 31.0, 22.0, 31.0, 36.0, 51.0, 43.0, 34.0, 40.0, 47.0, 1070.0, 44.0, 35.0, 45.0, 35.0, 42.0, 30.0, 27.0, 25.0, 31.0, 24.0, 17.0, 20.0, 17.0, 10.0, 11.0, 12.0, 13.0, 11.0, 10.0, 9.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3076171875, -1.2667236328125, -1.225830078125, -1.1849365234375, -1.14404296875, -1.1031494140625, -1.062255859375, -1.0213623046875, -0.98046875, -0.9395751953125, -0.898681640625, -0.8577880859375, -0.81689453125, -0.7760009765625, -0.735107421875, -0.6942138671875, -0.6533203125, -0.6124267578125, -0.571533203125, -0.5306396484375, -0.48974609375, -0.4488525390625, -0.407958984375, -0.3670654296875, -0.326171875, -0.2852783203125, -0.244384765625, -0.2034912109375, -0.16259765625, -0.1217041015625, -0.080810546875, -0.0399169921875, 0.0009765625, 0.0418701171875, 0.082763671875, 0.1236572265625, 0.16455078125, 0.2054443359375, 0.246337890625, 0.2872314453125, 0.328125, 0.3690185546875, 0.409912109375, 0.4508056640625, 0.49169921875, 0.5325927734375, 0.573486328125, 0.6143798828125, 0.6552734375, 0.6961669921875, 0.737060546875, 0.7779541015625, 0.81884765625, 0.8597412109375, 0.900634765625, 0.9415283203125, 0.982421875, 1.0233154296875, 1.064208984375, 1.1051025390625, 1.14599609375, 1.1868896484375, 1.227783203125, 1.2686767578125, 1.3095703125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 5.0, 10.0, 9.0, 17.0, 48.0, 40.0, 64.0, 78.0, 102.0, 132.0, 233.0, 305.0, 403.0, 538.0, 714.0, 1031.0, 1442.0, 1894.0, 2772.0, 3745.0, 5234.0, 7243.0, 10576.0, 14633.0, 20615.0, 28856.0, 40900.0, 57034.0, 78854.0, 107173.0, 332835.0, 977157.0, 111686.0, 83208.0, 59843.0, 42498.0, 30241.0, 21602.0, 15357.0, 10830.0, 7740.0, 5467.0, 3868.0, 2807.0, 1990.0, 1450.0, 1080.0, 763.0, 586.0, 387.0, 307.0, 205.0, 163.0, 104.0, 79.0, 60.0, 43.0, 27.0, 21.0, 24.0, 7.0, 8.0, 4.0], "bins": [-0.11614990234375, -0.11252880096435547, -0.10890769958496094, -0.1052865982055664, -0.10166549682617188, -0.09804439544677734, -0.09442329406738281, -0.09080219268798828, -0.08718109130859375, -0.08355998992919922, -0.07993888854980469, -0.07631778717041016, -0.07269668579101562, -0.0690755844116211, -0.06545448303222656, -0.06183338165283203, -0.0582122802734375, -0.05459117889404297, -0.05097007751464844, -0.047348976135253906, -0.043727874755859375, -0.040106773376464844, -0.03648567199707031, -0.03286457061767578, -0.02924346923828125, -0.02562236785888672, -0.022001266479492188, -0.018380165100097656, -0.014759063720703125, -0.011137962341308594, -0.0075168609619140625, -0.0038957595825195312, -0.000274658203125, 0.0033464431762695312, 0.0069675445556640625, 0.010588645935058594, 0.014209747314453125, 0.017830848693847656, 0.021451950073242188, 0.02507305145263672, 0.02869415283203125, 0.03231525421142578, 0.03593635559082031, 0.039557456970214844, 0.043178558349609375, 0.046799659729003906, 0.05042076110839844, 0.05404186248779297, 0.0576629638671875, 0.06128406524658203, 0.06490516662597656, 0.0685262680053711, 0.07214736938476562, 0.07576847076416016, 0.07938957214355469, 0.08301067352294922, 0.08663177490234375, 0.09025287628173828, 0.09387397766113281, 0.09749507904052734, 0.10111618041992188, 0.1047372817993164, 0.10835838317871094, 0.11197948455810547, 0.1156005859375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 7.0, 11.0, 13.0, 17.0, 26.0, 25.0, 33.0, 45.0, 63.0, 96.0, 110.0, 133.0, 106.0, 75.0, 56.0, 34.0, 28.0, 22.0, 16.0, 16.0, 9.0, 6.0, 5.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0060272216796875, -0.00585561990737915, -0.005684018135070801, -0.005512416362762451, -0.0053408145904541016, -0.005169212818145752, -0.004997611045837402, -0.004826009273529053, -0.004654407501220703, -0.0044828057289123535, -0.004311203956604004, -0.004139602184295654, -0.003968000411987305, -0.003796398639678955, -0.0036247968673706055, -0.003453195095062256, -0.0032815933227539062, -0.0031099915504455566, -0.002938389778137207, -0.0027667880058288574, -0.002595186233520508, -0.002423584461212158, -0.0022519826889038086, -0.002080380916595459, -0.0019087791442871094, -0.0017371773719787598, -0.0015655755996704102, -0.0013939738273620605, -0.001222372055053711, -0.0010507702827453613, -0.0008791685104370117, -0.0007075667381286621, -0.0005359649658203125, -0.0003643631935119629, -0.00019276142120361328, -2.1159648895263672e-05, 0.00015044212341308594, 0.00032204389572143555, 0.0004936456680297852, 0.0006652474403381348, 0.0008368492126464844, 0.001008450984954834, 0.0011800527572631836, 0.0013516545295715332, 0.0015232563018798828, 0.0016948580741882324, 0.001866459846496582, 0.0020380616188049316, 0.0022096633911132812, 0.002381265163421631, 0.0025528669357299805, 0.00272446870803833, 0.0028960704803466797, 0.0030676722526550293, 0.003239274024963379, 0.0034108757972717285, 0.003582477569580078, 0.0037540793418884277, 0.003925681114196777, 0.004097282886505127, 0.0042688846588134766, 0.004440486431121826, 0.004612088203430176, 0.004783689975738525, 0.004955291748046875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 9.0, 4.0, 7.0, 12.0, 19.0, 31.0, 32.0, 52.0, 76.0, 122.0, 182.0, 326.0, 737.0, 39118.0, 999760.0, 6832.0, 496.0, 279.0, 144.0, 95.0, 65.0, 38.0, 29.0, 21.0, 14.0, 14.0, 12.0, 3.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0849609375, -0.08196353912353516, -0.07896614074707031, -0.07596874237060547, -0.07297134399414062, -0.06997394561767578, -0.06697654724121094, -0.0639791488647461, -0.06098175048828125, -0.057984352111816406, -0.05498695373535156, -0.05198955535888672, -0.048992156982421875, -0.04599475860595703, -0.04299736022949219, -0.039999961853027344, -0.0370025634765625, -0.034005165100097656, -0.031007766723632812, -0.02801036834716797, -0.025012969970703125, -0.02201557159423828, -0.019018173217773438, -0.016020774841308594, -0.01302337646484375, -0.010025978088378906, -0.0070285797119140625, -0.004031181335449219, -0.001033782958984375, 0.0019636154174804688, 0.0049610137939453125, 0.007958412170410156, 0.010955810546875, 0.013953208923339844, 0.016950607299804688, 0.01994800567626953, 0.022945404052734375, 0.02594280242919922, 0.028940200805664062, 0.031937599182128906, 0.03493499755859375, 0.037932395935058594, 0.04092979431152344, 0.04392719268798828, 0.046924591064453125, 0.04992198944091797, 0.05291938781738281, 0.055916786193847656, 0.0589141845703125, 0.061911582946777344, 0.06490898132324219, 0.06790637969970703, 0.07090377807617188, 0.07390117645263672, 0.07689857482910156, 0.0798959732055664, 0.08289337158203125, 0.0858907699584961, 0.08888816833496094, 0.09188556671142578, 0.09488296508789062, 0.09788036346435547, 0.10087776184082031, 0.10387516021728516, 0.10687255859375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 62.0, 756.0, 171.0, 23.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03756740316748619, -0.03647802025079727, -0.03538864105939865, -0.03429925814270973, -0.03320987522602081, -0.03212049603462219, -0.031031113117933273, -0.029941730201244354, -0.028852349147200584, -0.027762968093156815, -0.026673585176467896, -0.025584204122424126, -0.024494823068380356, -0.023405440151691437, -0.022316059097647667, -0.021226678043603897, -0.020137295126914978, -0.019047914072871208, -0.01795853115618229, -0.01686915010213852, -0.0157797671854496, -0.01469038613140583, -0.01360100507736206, -0.012511623091995716, -0.011422241106629372, -0.010332859121263027, -0.009243477135896683, -0.008154096081852913, -0.0070647140964865685, -0.005975332111120224, -0.004885950591415167, -0.0037965690717101097, -0.0027071870863437653, -0.0016178053338080645, -0.0005284235812723637, 0.0005609581712633371, 0.001650339923799038, 0.0027397219091653824, 0.0038291034288704395, 0.004918484948575497, 0.006007866933941841, 0.007097248919308186, 0.00818663090467453, 0.0092760119587183, 0.010365393944084644, 0.011454775929450989, 0.012544156983494759, 0.013633538968861103, 0.014722920954227448, 0.015812302008271217, 0.016901684924960136, 0.017991065979003906, 0.019080448895692825, 0.020169829949736595, 0.021259211003780365, 0.022348593920469284, 0.023437974974513054, 0.024527356028556824, 0.025616738945245743, 0.026706119999289513, 0.027795501053333282, 0.0288848839700222, 0.02997426502406597, 0.03106364607810974, 0.03215302899479866]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 8.0, 13.0, 12.0, 19.0, 18.0, 28.0, 14.0, 30.0, 27.0, 30.0, 36.0, 50.0, 53.0, 49.0, 48.0, 44.0, 49.0, 56.0, 49.0, 53.0, 30.0, 47.0, 37.0, 30.0, 36.0, 20.0, 24.0, 21.0, 14.0, 11.0, 10.0, 9.0, 6.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034987926483154297, -0.0033738669008016586, -0.0032489411532878876, -0.0031240154057741165, -0.0029990896582603455, -0.0028741639107465744, -0.0027492381632328033, -0.0026243124157190323, -0.0024993866682052612, -0.00237446092069149, -0.002249535173177719, -0.002124609425663948, -0.001999683678150177, -0.001874757930636406, -0.0017498321831226349, -0.0016249064356088638, -0.0014999806880950928, -0.0013750549405813217, -0.0012501291930675507, -0.0011252034455537796, -0.0010002776980400085, -0.0008753519505262375, -0.0007504262030124664, -0.0006255004554986954, -0.0005005747079849243, -0.00037564896047115326, -0.0002507232129573822, -0.00012579746544361115, -8.717179298400879e-07, 0.00012405402958393097, 0.000248979777097702, 0.0003739055246114731, 0.0004988312721252441, 0.0006237570196390152, 0.0007486827671527863, 0.0008736085146665573, 0.0009985342621803284, 0.0011234600096940994, 0.0012483857572078705, 0.0013733115047216415, 0.0014982372522354126, 0.0016231629997491837, 0.0017480887472629547, 0.0018730144947767258, 0.001997940242290497, 0.002122865989804268, 0.002247791737318039, 0.00237271748483181, 0.002497643232345581, 0.002622568979859352, 0.002747494727373123, 0.0028724204748868942, 0.0029973462224006653, 0.0031222719699144363, 0.0032471977174282074, 0.0033721234649419785, 0.0034970492124557495, 0.0036219749599695206, 0.0037469007074832916, 0.0038718264549970627, 0.003996752202510834, 0.004121677950024605, 0.004246603697538376, 0.004371529445052147, 0.004496455192565918]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 3.0, 9.0, 5.0, 7.0, 8.0, 8.0, 18.0, 13.0, 22.0, 25.0, 28.0, 29.0, 25.0, 36.0, 28.0, 29.0, 37.0, 39.0, 27.0, 34.0, 46.0, 36.0, 36.0, 38.0, 37.0, 36.0, 36.0, 30.0, 27.0, 31.0, 35.0, 26.0, 24.0, 12.0, 19.0, 17.0, 16.0, 12.0, 12.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.6920318603515625, -1.633087158203125, -1.5741424560546875, -1.51519775390625, -1.4562530517578125, -1.397308349609375, -1.3383636474609375, -1.2794189453125, -1.2204742431640625, -1.161529541015625, -1.1025848388671875, -1.04364013671875, -0.9846954345703125, -0.925750732421875, -0.8668060302734375, -0.807861328125, -0.7489166259765625, -0.689971923828125, -0.6310272216796875, -0.57208251953125, -0.5131378173828125, -0.454193115234375, -0.3952484130859375, -0.3363037109375, -0.2773590087890625, -0.218414306640625, -0.1594696044921875, -0.10052490234375, -0.0415802001953125, 0.017364501953125, 0.0763092041015625, 0.13525390625, 0.1941986083984375, 0.253143310546875, 0.3120880126953125, 0.37103271484375, 0.4299774169921875, 0.488922119140625, 0.5478668212890625, 0.6068115234375, 0.6657562255859375, 0.724700927734375, 0.7836456298828125, 0.84259033203125, 0.9015350341796875, 0.960479736328125, 1.0194244384765625, 1.078369140625, 1.1373138427734375, 1.196258544921875, 1.2552032470703125, 1.31414794921875, 1.3730926513671875, 1.432037353515625, 1.4909820556640625, 1.5499267578125, 1.6088714599609375, 1.667816162109375, 1.7267608642578125, 1.78570556640625, 1.8446502685546875, 1.903594970703125, 1.9625396728515625, 2.021484375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 5.0, 3.0, 8.0, 9.0, 22.0, 32.0, 45.0, 56.0, 89.0, 94.0, 175.0, 220.0, 357.0, 559.0, 924.0, 1485.0, 2574.0, 4520.0, 8045.0, 15140.0, 30920.0, 69231.0, 171740.0, 394650.0, 197573.0, 77829.0, 34641.0, 16786.0, 8588.0, 4985.0, 2703.0, 1595.0, 1048.0, 632.0, 435.0, 269.0, 189.0, 109.0, 92.0, 55.0, 31.0, 39.0, 12.0, 8.0, 7.0, 7.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.843048095703125, -2.75836181640625, -2.673675537109375, -2.5889892578125, -2.504302978515625, -2.41961669921875, -2.334930419921875, -2.250244140625, -2.165557861328125, -2.08087158203125, -1.996185302734375, -1.9114990234375, -1.826812744140625, -1.74212646484375, -1.657440185546875, -1.57275390625, -1.488067626953125, -1.40338134765625, -1.318695068359375, -1.2340087890625, -1.149322509765625, -1.06463623046875, -0.979949951171875, -0.895263671875, -0.810577392578125, -0.72589111328125, -0.641204833984375, -0.5565185546875, -0.471832275390625, -0.38714599609375, -0.302459716796875, -0.2177734375, -0.133087158203125, -0.04840087890625, 0.036285400390625, 0.1209716796875, 0.205657958984375, 0.29034423828125, 0.375030517578125, 0.459716796875, 0.544403076171875, 0.62908935546875, 0.713775634765625, 0.7984619140625, 0.883148193359375, 0.96783447265625, 1.052520751953125, 1.13720703125, 1.221893310546875, 1.30657958984375, 1.391265869140625, 1.4759521484375, 1.560638427734375, 1.64532470703125, 1.730010986328125, 1.814697265625, 1.899383544921875, 1.98406982421875, 2.068756103515625, 2.1534423828125, 2.238128662109375, 2.32281494140625, 2.407501220703125, 2.4921875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 2.0, 2.0, 9.0, 12.0, 16.0, 15.0, 18.0, 25.0, 23.0, 39.0, 23.0, 26.0, 37.0, 42.0, 46.0, 45.0, 89.0, 146.0, 305.0, 1411.0, 209.0, 92.0, 58.0, 52.0, 49.0, 37.0, 28.0, 29.0, 27.0, 23.0, 15.0, 17.0, 9.0, 23.0, 9.0, 8.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.56640625, -7.33868408203125, -7.1109619140625, -6.88323974609375, -6.655517578125, -6.42779541015625, -6.2000732421875, -5.97235107421875, -5.74462890625, -5.51690673828125, -5.2891845703125, -5.06146240234375, -4.833740234375, -4.60601806640625, -4.3782958984375, -4.15057373046875, -3.9228515625, -3.69512939453125, -3.4674072265625, -3.23968505859375, -3.011962890625, -2.78424072265625, -2.5565185546875, -2.32879638671875, -2.10107421875, -1.87335205078125, -1.6456298828125, -1.41790771484375, -1.190185546875, -0.96246337890625, -0.7347412109375, -0.50701904296875, -0.279296875, -0.05157470703125, 0.1761474609375, 0.40386962890625, 0.631591796875, 0.85931396484375, 1.0870361328125, 1.31475830078125, 1.54248046875, 1.77020263671875, 1.9979248046875, 2.22564697265625, 2.453369140625, 2.68109130859375, 2.9088134765625, 3.13653564453125, 3.3642578125, 3.59197998046875, 3.8197021484375, 4.04742431640625, 4.275146484375, 4.50286865234375, 4.7305908203125, 4.95831298828125, 5.18603515625, 5.41375732421875, 5.6414794921875, 5.86920166015625, 6.096923828125, 6.32464599609375, 6.5523681640625, 6.78009033203125, 7.0078125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 2.0, 7.0, 9.0, 8.0, 15.0, 18.0, 22.0, 44.0, 54.0, 72.0, 109.0, 195.0, 297.0, 804.0, 4921.0, 173933.0, 2926097.0, 35534.0, 2224.0, 550.0, 259.0, 172.0, 90.0, 55.0, 47.0, 39.0, 20.0, 27.0, 14.0, 16.0, 9.0, 3.0, 12.0, 5.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.918212890625, -16.32080078125, -15.723388671875, -15.1259765625, -14.528564453125, -13.93115234375, -13.333740234375, -12.736328125, -12.138916015625, -11.54150390625, -10.944091796875, -10.3466796875, -9.749267578125, -9.15185546875, -8.554443359375, -7.95703125, -7.359619140625, -6.76220703125, -6.164794921875, -5.5673828125, -4.969970703125, -4.37255859375, -3.775146484375, -3.177734375, -2.580322265625, -1.98291015625, -1.385498046875, -0.7880859375, -0.190673828125, 0.40673828125, 1.004150390625, 1.6015625, 2.198974609375, 2.79638671875, 3.393798828125, 3.9912109375, 4.588623046875, 5.18603515625, 5.783447265625, 6.380859375, 6.978271484375, 7.57568359375, 8.173095703125, 8.7705078125, 9.367919921875, 9.96533203125, 10.562744140625, 11.16015625, 11.757568359375, 12.35498046875, 12.952392578125, 13.5498046875, 14.147216796875, 14.74462890625, 15.342041015625, 15.939453125, 16.536865234375, 17.13427734375, 17.731689453125, 18.3291015625, 18.926513671875, 19.52392578125, 20.121337890625, 20.71875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 247.0, 647.0, 107.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.783203125, -164.63406372070312, -161.48492431640625, -158.33578491210938, -155.18666076660156, -152.0375213623047, -148.8883819580078, -145.73924255371094, -142.59010314941406, -139.4409637451172, -136.2918243408203, -133.1427001953125, -129.99356079101562, -126.84442138671875, -123.69528198242188, -120.546142578125, -117.39701080322266, -114.24787139892578, -111.09873962402344, -107.94960021972656, -104.80046081542969, -101.65132141113281, -98.50218963623047, -95.3530502319336, -92.20391845703125, -89.05477905273438, -85.90564727783203, -82.75650787353516, -79.60736846923828, -76.45823669433594, -73.30909729003906, -70.15995788574219, -67.01081848144531, -63.8616828918457, -60.71254348754883, -57.56340789794922, -54.414268493652344, -51.265132904052734, -48.115997314453125, -44.96685791015625, -41.817718505859375, -38.668582916259766, -35.51944351196289, -32.37030792236328, -29.22117042541504, -26.072032928466797, -22.922897338867188, -19.773759841918945, -16.624622344970703, -13.475484848022461, -10.326348304748535, -7.177211761474609, -4.028074264526367, -0.878936767578125, 2.2701988220214844, 5.419336318969727, 8.568473815917969, 11.717611312866211, 14.866747856140137, 18.015884399414062, 21.165021896362305, 24.314159393310547, 27.463294982910156, 30.6124324798584, 33.76156997680664]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 7.0, 8.0, 6.0, 15.0, 13.0, 16.0, 12.0, 25.0, 22.0, 26.0, 29.0, 24.0, 34.0, 33.0, 41.0, 37.0, 40.0, 27.0, 55.0, 49.0, 47.0, 49.0, 34.0, 50.0, 43.0, 33.0, 31.0, 26.0, 27.0, 16.0, 21.0, 17.0, 16.0, 10.0, 9.0, 4.0, 16.0, 7.0, 7.0, 7.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.582107543945312, -20.904064178466797, -20.22602081298828, -19.547977447509766, -18.86993408203125, -18.191890716552734, -17.51384735107422, -16.835803985595703, -16.157760620117188, -15.479717254638672, -14.801673889160156, -14.12363052368164, -13.445587158203125, -12.76754379272461, -12.089499473571777, -11.411456108093262, -10.73341178894043, -10.055368423461914, -9.377325057983398, -8.699281692504883, -8.021238327026367, -7.343194484710693, -6.6651506423950195, -5.987107276916504, -5.309063911437988, -4.631020545959473, -3.952976942062378, -3.274933338165283, -2.5968899726867676, -1.918846607208252, -1.2408027648925781, -0.5627593994140625, 0.11528396606445312, 0.7933274507522583, 1.4713709354400635, 2.149414539337158, 2.827457904815674, 3.5055012702941895, 4.183545112609863, 4.861588478088379, 5.5396318435668945, 6.21767520904541, 6.895718574523926, 7.5737624168396, 8.251806259155273, 8.929849624633789, 9.607892990112305, 10.28593635559082, 10.963979721069336, 11.642023086547852, 12.320066452026367, 12.998109817504883, 13.676153182983398, 14.354196548461914, 15.032240867614746, 15.710284233093262, 16.388328552246094, 17.06637191772461, 17.744415283203125, 18.42245864868164, 19.100502014160156, 19.778545379638672, 20.456588745117188, 21.134632110595703, 21.81267547607422]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 5.0, 1.0, 10.0, 9.0, 8.0, 12.0, 24.0, 22.0, 26.0, 21.0, 19.0, 21.0, 38.0, 26.0, 40.0, 38.0, 37.0, 34.0, 40.0, 42.0, 45.0, 40.0, 36.0, 39.0, 34.0, 37.0, 32.0, 34.0, 24.0, 24.0, 25.0, 22.0, 19.0, 25.0, 16.0, 14.0, 8.0, 8.0, 11.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.853515625, -1.788909912109375, -1.72430419921875, -1.659698486328125, -1.5950927734375, -1.530487060546875, -1.46588134765625, -1.401275634765625, -1.336669921875, -1.272064208984375, -1.20745849609375, -1.142852783203125, -1.0782470703125, -1.013641357421875, -0.94903564453125, -0.884429931640625, -0.81982421875, -0.755218505859375, -0.69061279296875, -0.626007080078125, -0.5614013671875, -0.496795654296875, -0.43218994140625, -0.367584228515625, -0.302978515625, -0.238372802734375, -0.17376708984375, -0.109161376953125, -0.0445556640625, 0.020050048828125, 0.08465576171875, 0.149261474609375, 0.2138671875, 0.278472900390625, 0.34307861328125, 0.407684326171875, 0.4722900390625, 0.536895751953125, 0.60150146484375, 0.666107177734375, 0.730712890625, 0.795318603515625, 0.85992431640625, 0.924530029296875, 0.9891357421875, 1.053741455078125, 1.11834716796875, 1.182952880859375, 1.24755859375, 1.312164306640625, 1.37677001953125, 1.441375732421875, 1.5059814453125, 1.570587158203125, 1.63519287109375, 1.699798583984375, 1.764404296875, 1.829010009765625, 1.89361572265625, 1.958221435546875, 2.0228271484375, 2.087432861328125, 2.15203857421875, 2.216644287109375, 2.28125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 11.0, 14.0, 28.0, 29.0, 42.0, 71.0, 97.0, 141.0, 224.0, 362.0, 658.0, 1260.0, 2434.0, 5220.0, 11840.0, 28439.0, 72953.0, 204736.0, 588378.0, 1303727.0, 1206256.0, 493497.0, 169017.0, 60951.0, 24044.0, 10178.0, 4545.0, 2203.0, 1200.0, 658.0, 362.0, 247.0, 137.0, 89.0, 66.0, 50.0, 23.0, 23.0, 17.0, 19.0, 3.0, 12.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-3.076171875, -2.988067626953125, -2.89996337890625, -2.811859130859375, -2.7237548828125, -2.635650634765625, -2.54754638671875, -2.459442138671875, -2.371337890625, -2.283233642578125, -2.19512939453125, -2.107025146484375, -2.0189208984375, -1.930816650390625, -1.84271240234375, -1.754608154296875, -1.66650390625, -1.578399658203125, -1.49029541015625, -1.402191162109375, -1.3140869140625, -1.225982666015625, -1.13787841796875, -1.049774169921875, -0.961669921875, -0.873565673828125, -0.78546142578125, -0.697357177734375, -0.6092529296875, -0.521148681640625, -0.43304443359375, -0.344940185546875, -0.2568359375, -0.168731689453125, -0.08062744140625, 0.007476806640625, 0.0955810546875, 0.183685302734375, 0.27178955078125, 0.359893798828125, 0.447998046875, 0.536102294921875, 0.62420654296875, 0.712310791015625, 0.8004150390625, 0.888519287109375, 0.97662353515625, 1.064727783203125, 1.15283203125, 1.240936279296875, 1.32904052734375, 1.417144775390625, 1.5052490234375, 1.593353271484375, 1.68145751953125, 1.769561767578125, 1.857666015625, 1.945770263671875, 2.03387451171875, 2.121978759765625, 2.2100830078125, 2.298187255859375, 2.38629150390625, 2.474395751953125, 2.5625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 8.0, 8.0, 11.0, 19.0, 24.0, 30.0, 51.0, 77.0, 102.0, 135.0, 252.0, 322.0, 436.0, 549.0, 527.0, 477.0, 303.0, 221.0, 176.0, 112.0, 93.0, 38.0, 31.0, 28.0, 17.0, 9.0, 5.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.30792236328125, -8.0767822265625, -7.84564208984375, -7.614501953125, -7.38336181640625, -7.1522216796875, -6.92108154296875, -6.68994140625, -6.45880126953125, -6.2276611328125, -5.99652099609375, -5.765380859375, -5.53424072265625, -5.3031005859375, -5.07196044921875, -4.8408203125, -4.60968017578125, -4.3785400390625, -4.14739990234375, -3.916259765625, -3.68511962890625, -3.4539794921875, -3.22283935546875, -2.99169921875, -2.76055908203125, -2.5294189453125, -2.29827880859375, -2.067138671875, -1.83599853515625, -1.6048583984375, -1.37371826171875, -1.142578125, -0.91143798828125, -0.6802978515625, -0.44915771484375, -0.218017578125, 0.01312255859375, 0.2442626953125, 0.47540283203125, 0.70654296875, 0.93768310546875, 1.1688232421875, 1.39996337890625, 1.631103515625, 1.86224365234375, 2.0933837890625, 2.32452392578125, 2.5556640625, 2.78680419921875, 3.0179443359375, 3.24908447265625, 3.480224609375, 3.71136474609375, 3.9425048828125, 4.17364501953125, 4.40478515625, 4.63592529296875, 4.8670654296875, 5.09820556640625, 5.329345703125, 5.56048583984375, 5.7916259765625, 6.02276611328125, 6.25390625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 4.0, 12.0, 21.0, 19.0, 48.0, 50.0, 78.0, 136.0, 201.0, 373.0, 859.0, 2341.0, 10909.0, 82518.0, 839611.0, 2772324.0, 430522.0, 44655.0, 6477.0, 1669.0, 640.0, 313.0, 173.0, 115.0, 75.0, 34.0, 33.0, 22.0, 16.0, 12.0, 8.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.5234375, -8.2000732421875, -7.876708984375, -7.5533447265625, -7.22998046875, -6.9066162109375, -6.583251953125, -6.2598876953125, -5.9365234375, -5.6131591796875, -5.289794921875, -4.9664306640625, -4.64306640625, -4.3197021484375, -3.996337890625, -3.6729736328125, -3.349609375, -3.0262451171875, -2.702880859375, -2.3795166015625, -2.05615234375, -1.7327880859375, -1.409423828125, -1.0860595703125, -0.7626953125, -0.4393310546875, -0.115966796875, 0.2073974609375, 0.53076171875, 0.8541259765625, 1.177490234375, 1.5008544921875, 1.82421875, 2.1475830078125, 2.470947265625, 2.7943115234375, 3.11767578125, 3.4410400390625, 3.764404296875, 4.0877685546875, 4.4111328125, 4.7344970703125, 5.057861328125, 5.3812255859375, 5.70458984375, 6.0279541015625, 6.351318359375, 6.6746826171875, 6.998046875, 7.3214111328125, 7.644775390625, 7.9681396484375, 8.29150390625, 8.6148681640625, 8.938232421875, 9.2615966796875, 9.5849609375, 9.9083251953125, 10.231689453125, 10.5550537109375, 10.87841796875, 11.2017822265625, 11.525146484375, 11.8485107421875, 12.171875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 10.0, 26.0, 58.0, 139.0, 153.0, 198.0, 187.0, 131.0, 66.0, 25.0, 9.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.074621200561523, -23.458099365234375, -21.84157943725586, -20.22505760192871, -18.608535766601562, -16.992015838623047, -15.375494003295898, -13.758973121643066, -12.142452239990234, -10.525931358337402, -8.90941047668457, -7.292888641357422, -5.67636775970459, -4.059846878051758, -2.4433250427246094, -0.8268041610717773, 0.7897167205810547, 2.406237840652466, 4.022758960723877, 5.639280319213867, 7.255801200866699, 8.872322082519531, 10.48884391784668, 12.105364799499512, 13.721885681152344, 15.338406562805176, 16.954927444458008, 18.571449279785156, 20.187969207763672, 21.80449104309082, 23.42101287841797, 25.037532806396484, 26.654052734375, 28.27057456970215, 29.887094497680664, 31.503616333007812, 33.12013626098633, 34.736656188964844, 36.353179931640625, 37.96969985961914, 39.586219787597656, 41.20273971557617, 42.81926345825195, 44.43578338623047, 46.052303314208984, 47.6688232421875, 49.28534698486328, 50.9018669128418, 52.51839065551758, 54.134910583496094, 55.751434326171875, 57.36795425415039, 58.984474182128906, 60.60099792480469, 62.2175178527832, 63.83403778076172, 65.4505615234375, 67.06708526611328, 68.68360137939453, 70.30012512207031, 71.9166488647461, 73.53316497802734, 75.14968872070312, 76.7662124633789, 78.38272857666016]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 11.0, 14.0, 11.0, 21.0, 13.0, 20.0, 16.0, 17.0, 14.0, 22.0, 27.0, 31.0, 37.0, 44.0, 43.0, 45.0, 37.0, 37.0, 41.0, 45.0, 44.0, 45.0, 39.0, 36.0, 34.0, 30.0, 29.0, 20.0, 19.0, 27.0, 20.0, 14.0, 18.0, 6.0, 10.0, 7.0, 10.0, 7.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-20.340396881103516, -19.748149871826172, -19.155900955200195, -18.56365394592285, -17.971406936645508, -17.37915802001953, -16.786911010742188, -16.194664001464844, -15.602415084838867, -15.010167121887207, -14.417920112609863, -13.825672149658203, -13.233424186706543, -12.641176223754883, -12.048929214477539, -11.456681251525879, -10.864434242248535, -10.272186279296875, -9.679939270019531, -9.087691307067871, -8.495443344116211, -7.903195858001709, -7.310948371887207, -6.718700408935547, -6.126452922821045, -5.534205436706543, -4.941957473754883, -4.349709987640381, -3.7574622631073, -3.1652145385742188, -2.572967052459717, -1.9807190895080566, -1.3884716033935547, -0.7962239384651184, -0.20397627353668213, 0.3882713317871094, 0.9805190563201904, 1.5727667808532715, 2.1650142669677734, 2.7572622299194336, 3.3495097160339355, 3.9417574405670166, 4.534005165100098, 5.1262526512146, 5.718500137329102, 6.310748100280762, 6.902995586395264, 7.495243549346924, 8.087491035461426, 8.679738998413086, 9.27198600769043, 9.86423397064209, 10.45648193359375, 11.048728942871094, 11.640976905822754, 12.233224868774414, 12.825471878051758, 13.417719841003418, 14.009966850280762, 14.602214813232422, 15.194462776184082, 15.786710739135742, 16.378957748413086, 16.971206665039062, 17.563453674316406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 1.0, 9.0, 13.0, 9.0, 4.0, 12.0, 17.0, 17.0, 18.0, 25.0, 27.0, 23.0, 28.0, 28.0, 25.0, 26.0, 37.0, 36.0, 52.0, 37.0, 44.0, 41.0, 35.0, 43.0, 32.0, 39.0, 26.0, 27.0, 31.0, 33.0, 26.0, 19.0, 17.0, 27.0, 16.0, 21.0, 8.0, 16.0, 7.0, 7.0, 8.0, 6.0, 6.0, 4.0, 4.0, 1.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.025390625, -1.960723876953125, -1.89605712890625, -1.831390380859375, -1.7667236328125, -1.702056884765625, -1.63739013671875, -1.572723388671875, -1.508056640625, -1.443389892578125, -1.37872314453125, -1.314056396484375, -1.2493896484375, -1.184722900390625, -1.12005615234375, -1.055389404296875, -0.99072265625, -0.926055908203125, -0.86138916015625, -0.796722412109375, -0.7320556640625, -0.667388916015625, -0.60272216796875, -0.538055419921875, -0.473388671875, -0.408721923828125, -0.34405517578125, -0.279388427734375, -0.2147216796875, -0.150054931640625, -0.08538818359375, -0.020721435546875, 0.0439453125, 0.108612060546875, 0.17327880859375, 0.237945556640625, 0.3026123046875, 0.367279052734375, 0.43194580078125, 0.496612548828125, 0.561279296875, 0.625946044921875, 0.69061279296875, 0.755279541015625, 0.8199462890625, 0.884613037109375, 0.94927978515625, 1.013946533203125, 1.07861328125, 1.143280029296875, 1.20794677734375, 1.272613525390625, 1.3372802734375, 1.401947021484375, 1.46661376953125, 1.531280517578125, 1.595947265625, 1.660614013671875, 1.72528076171875, 1.789947509765625, 1.8546142578125, 1.919281005859375, 1.98394775390625, 2.048614501953125, 2.11328125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 8.0, 13.0, 11.0, 26.0, 42.0, 59.0, 80.0, 127.0, 206.0, 274.0, 421.0, 600.0, 787.0, 1224.0, 1778.0, 2673.0, 3691.0, 5720.0, 8443.0, 12780.0, 19459.0, 30433.0, 47517.0, 76065.0, 119999.0, 181455.0, 186968.0, 125237.0, 79555.0, 50062.0, 31669.0, 20576.0, 13514.0, 8809.0, 5863.0, 3875.0, 2695.0, 1780.0, 1269.0, 885.0, 614.0, 397.0, 298.0, 194.0, 136.0, 112.0, 68.0, 38.0, 22.0, 9.0, 10.0, 5.0, 5.0, 3.0, 4.0, 1.0], "bins": [-0.25341796875, -0.24597549438476562, -0.23853302001953125, -0.23109054565429688, -0.2236480712890625, -0.21620559692382812, -0.20876312255859375, -0.20132064819335938, -0.193878173828125, -0.18643569946289062, -0.17899322509765625, -0.17155075073242188, -0.1641082763671875, -0.15666580200195312, -0.14922332763671875, -0.14178085327148438, -0.13433837890625, -0.12689590454101562, -0.11945343017578125, -0.11201095581054688, -0.1045684814453125, -0.09712600708007812, -0.08968353271484375, -0.08224105834960938, -0.074798583984375, -0.06735610961914062, -0.05991363525390625, -0.052471160888671875, -0.0450286865234375, -0.037586212158203125, -0.03014373779296875, -0.022701263427734375, -0.0152587890625, -0.007816314697265625, -0.00037384033203125, 0.007068634033203125, 0.0145111083984375, 0.021953582763671875, 0.02939605712890625, 0.036838531494140625, 0.044281005859375, 0.051723480224609375, 0.05916595458984375, 0.06660842895507812, 0.0740509033203125, 0.08149337768554688, 0.08893585205078125, 0.09637832641601562, 0.10382080078125, 0.11126327514648438, 0.11870574951171875, 0.12614822387695312, 0.1335906982421875, 0.14103317260742188, 0.14847564697265625, 0.15591812133789062, 0.163360595703125, 0.17080307006835938, 0.17824554443359375, 0.18568801879882812, 0.1931304931640625, 0.20057296752929688, 0.20801544189453125, 0.21545791625976562, 0.222900390625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 12.0, 10.0, 13.0, 14.0, 19.0, 25.0, 19.0, 32.0, 26.0, 25.0, 30.0, 43.0, 42.0, 42.0, 43.0, 46.0, 44.0, 1052.0, 35.0, 42.0, 37.0, 42.0, 41.0, 40.0, 34.0, 28.0, 29.0, 15.0, 22.0, 18.0, 15.0, 14.0, 14.0, 10.0, 9.0, 3.0, 7.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.228515625, -1.1830291748046875, -1.137542724609375, -1.0920562744140625, -1.04656982421875, -1.0010833740234375, -0.955596923828125, -0.9101104736328125, -0.8646240234375, -0.8191375732421875, -0.773651123046875, -0.7281646728515625, -0.68267822265625, -0.6371917724609375, -0.591705322265625, -0.5462188720703125, -0.500732421875, -0.4552459716796875, -0.409759521484375, -0.3642730712890625, -0.31878662109375, -0.2733001708984375, -0.227813720703125, -0.1823272705078125, -0.1368408203125, -0.0913543701171875, -0.045867919921875, -0.0003814697265625, 0.04510498046875, 0.0905914306640625, 0.136077880859375, 0.1815643310546875, 0.22705078125, 0.2725372314453125, 0.318023681640625, 0.3635101318359375, 0.40899658203125, 0.4544830322265625, 0.499969482421875, 0.5454559326171875, 0.5909423828125, 0.6364288330078125, 0.681915283203125, 0.7274017333984375, 0.77288818359375, 0.8183746337890625, 0.863861083984375, 0.9093475341796875, 0.954833984375, 1.0003204345703125, 1.045806884765625, 1.0912933349609375, 1.13677978515625, 1.1822662353515625, 1.227752685546875, 1.2732391357421875, 1.3187255859375, 1.3642120361328125, 1.409698486328125, 1.4551849365234375, 1.50067138671875, 1.5461578369140625, 1.591644287109375, 1.6371307373046875, 1.6826171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 14.0, 6.0, 13.0, 30.0, 40.0, 59.0, 56.0, 113.0, 119.0, 244.0, 325.0, 447.0, 653.0, 943.0, 1396.0, 2031.0, 3062.0, 4546.0, 6931.0, 10534.0, 16378.0, 24891.0, 37873.0, 58389.0, 89631.0, 133324.0, 1168709.0, 205998.0, 113353.0, 75243.0, 48781.0, 31953.0, 20843.0, 13520.0, 8792.0, 5814.0, 3831.0, 2686.0, 1738.0, 1235.0, 768.0, 545.0, 411.0, 277.0, 198.0, 115.0, 91.0, 67.0, 36.0, 31.0, 27.0, 7.0, 10.0, 9.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.156494140625, -0.15157127380371094, -0.14664840698242188, -0.1417255401611328, -0.13680267333984375, -0.1318798065185547, -0.12695693969726562, -0.12203407287597656, -0.1171112060546875, -0.11218833923339844, -0.10726547241210938, -0.10234260559082031, -0.09741973876953125, -0.09249687194824219, -0.08757400512695312, -0.08265113830566406, -0.077728271484375, -0.07280540466308594, -0.06788253784179688, -0.06295967102050781, -0.05803680419921875, -0.05311393737792969, -0.048191070556640625, -0.04326820373535156, -0.0383453369140625, -0.03342247009277344, -0.028499603271484375, -0.023576736450195312, -0.01865386962890625, -0.013731002807617188, -0.008808135986328125, -0.0038852691650390625, 0.00103759765625, 0.0059604644775390625, 0.010883331298828125, 0.015806198120117188, 0.02072906494140625, 0.025651931762695312, 0.030574798583984375, 0.03549766540527344, 0.0404205322265625, 0.04534339904785156, 0.050266265869140625, 0.05518913269042969, 0.06011199951171875, 0.06503486633300781, 0.06995773315429688, 0.07488059997558594, 0.079803466796875, 0.08472633361816406, 0.08964920043945312, 0.09457206726074219, 0.09949493408203125, 0.10441780090332031, 0.10934066772460938, 0.11426353454589844, 0.1191864013671875, 0.12410926818847656, 0.12903213500976562, 0.1339550018310547, 0.13887786865234375, 0.1438007354736328, 0.14872360229492188, 0.15364646911621094, 0.1585693359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 8.0, 12.0, 8.0, 18.0, 18.0, 14.0, 15.0, 26.0, 24.0, 18.0, 31.0, 48.0, 36.0, 50.0, 84.0, 103.0, 107.0, 73.0, 41.0, 33.0, 32.0, 29.0, 20.0, 23.0, 23.0, 15.0, 17.0, 7.0, 10.0, 5.0, 5.0, 7.0, 8.0, 6.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044097900390625, -0.004250943660736084, -0.004092097282409668, -0.003933250904083252, -0.003774404525756836, -0.00361555814743042, -0.003456711769104004, -0.003297865390777588, -0.003139019012451172, -0.002980172634124756, -0.00282132625579834, -0.002662479877471924, -0.002503633499145508, -0.002344787120819092, -0.0021859407424926758, -0.0020270943641662598, -0.0018682479858398438, -0.0017094016075134277, -0.0015505552291870117, -0.0013917088508605957, -0.0012328624725341797, -0.0010740160942077637, -0.0009151697158813477, -0.0007563233375549316, -0.0005974769592285156, -0.0004386305809020996, -0.0002797842025756836, -0.00012093782424926758, 3.790855407714844e-05, 0.00019675493240356445, 0.00035560131072998047, 0.0005144476890563965, 0.0006732940673828125, 0.0008321404457092285, 0.0009909868240356445, 0.0011498332023620605, 0.0013086795806884766, 0.0014675259590148926, 0.0016263723373413086, 0.0017852187156677246, 0.0019440650939941406, 0.0021029114723205566, 0.0022617578506469727, 0.0024206042289733887, 0.0025794506072998047, 0.0027382969856262207, 0.0028971433639526367, 0.0030559897422790527, 0.0032148361206054688, 0.0033736824989318848, 0.0035325288772583008, 0.003691375255584717, 0.003850221633911133, 0.004009068012237549, 0.004167914390563965, 0.004326760768890381, 0.004485607147216797, 0.004644453525543213, 0.004803299903869629, 0.004962146282196045, 0.005120992660522461, 0.005279839038848877, 0.005438685417175293, 0.005597531795501709, 0.005756378173828125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 5.0, 9.0, 8.0, 9.0, 16.0, 25.0, 34.0, 46.0, 58.0, 78.0, 118.0, 136.0, 191.0, 287.0, 455.0, 1917.0, 91047.0, 938670.0, 13356.0, 842.0, 358.0, 214.0, 153.0, 122.0, 98.0, 56.0, 51.0, 51.0, 28.0, 28.0, 28.0, 11.0, 9.0, 10.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0859375, -0.08335590362548828, -0.08077430725097656, -0.07819271087646484, -0.07561111450195312, -0.0730295181274414, -0.07044792175292969, -0.06786632537841797, -0.06528472900390625, -0.06270313262939453, -0.06012153625488281, -0.057539939880371094, -0.054958343505859375, -0.052376747131347656, -0.04979515075683594, -0.04721355438232422, -0.0446319580078125, -0.04205036163330078, -0.03946876525878906, -0.036887168884277344, -0.034305572509765625, -0.031723976135253906, -0.029142379760742188, -0.02656078338623047, -0.02397918701171875, -0.02139759063720703, -0.018815994262695312, -0.016234397888183594, -0.013652801513671875, -0.011071205139160156, -0.008489608764648438, -0.005908012390136719, -0.003326416015625, -0.0007448196411132812, 0.0018367767333984375, 0.004418373107910156, 0.006999969482421875, 0.009581565856933594, 0.012163162231445312, 0.014744758605957031, 0.01732635498046875, 0.01990795135498047, 0.022489547729492188, 0.025071144104003906, 0.027652740478515625, 0.030234336853027344, 0.03281593322753906, 0.03539752960205078, 0.0379791259765625, 0.04056072235107422, 0.04314231872558594, 0.045723915100097656, 0.048305511474609375, 0.050887107849121094, 0.05346870422363281, 0.05605030059814453, 0.05863189697265625, 0.06121349334716797, 0.06379508972167969, 0.0663766860961914, 0.06895828247070312, 0.07153987884521484, 0.07412147521972656, 0.07670307159423828, 0.07928466796875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 24.0, 662.0, 287.0, 36.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020383179187774658, -0.019163617864251137, -0.017944056540727615, -0.016724495217204094, -0.015504933893680573, -0.014285372570157051, -0.013065812177956104, -0.011846250854432583, -0.010626689530909061, -0.00940712820738554, -0.008187566883862019, -0.0069680060259997845, -0.005748444702476263, -0.004528883378952742, -0.0033093225210905075, -0.002089761197566986, -0.0008701998740434647, 0.00034936133306473494, 0.0015689225401729345, 0.0027884836308658123, 0.004008044954389334, 0.005227606277912855, 0.006447167135775089, 0.007666728459298611, 0.008886289782822132, 0.010105851106345654, 0.011325412429869175, 0.012544972822070122, 0.013764534145593643, 0.014984095469117165, 0.016203656792640686, 0.017423218116164207, 0.01864277943968773, 0.01986234076321125, 0.02108190208673477, 0.022301463410258293, 0.023521024733781815, 0.024740586057305336, 0.025960147380828857, 0.02717970684170723, 0.0283992700278759, 0.02961883135139942, 0.030838392674922943, 0.032057952135801315, 0.033277515321969986, 0.03449707478284836, 0.03571663796901703, 0.0369361974298954, 0.03815575689077377, 0.039375316351652145, 0.040594879537820816, 0.04181443899869919, 0.04303400218486786, 0.04425356164574623, 0.0454731248319149, 0.046692684292793274, 0.047912247478961945, 0.04913180693984032, 0.05035137012600899, 0.05157092958688736, 0.05279049277305603, 0.0540100522339344, 0.05522961542010307, 0.056449174880981445, 0.057668738067150116]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 6.0, 4.0, 10.0, 8.0, 16.0, 13.0, 25.0, 17.0, 25.0, 37.0, 34.0, 39.0, 39.0, 34.0, 43.0, 45.0, 49.0, 52.0, 56.0, 50.0, 41.0, 45.0, 39.0, 41.0, 44.0, 29.0, 32.0, 28.0, 22.0, 16.0, 18.0, 8.0, 10.0, 7.0, 4.0, 7.0, 4.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005774140357971191, -0.005610007792711258, -0.0054458752274513245, -0.005281742662191391, -0.0051176100969314575, -0.004953477531671524, -0.004789344966411591, -0.004625212401151657, -0.004461079835891724, -0.00429694727063179, -0.004132814705371857, -0.003968682140111923, -0.0038045495748519897, -0.0036404170095920563, -0.003476284444332123, -0.0033121518790721893, -0.003148019313812256, -0.0029838867485523224, -0.002819754183292389, -0.0026556216180324554, -0.002491489052772522, -0.0023273564875125885, -0.002163223922252655, -0.0019990913569927216, -0.001834958791732788, -0.0016708262264728546, -0.0015066936612129211, -0.0013425610959529877, -0.0011784285306930542, -0.0010142959654331207, -0.0008501634001731873, -0.0006860308349132538, -0.0005218982696533203, -0.00035776570439338684, -0.00019363313913345337, -2.9500573873519897e-05, 0.00013463199138641357, 0.00029876455664634705, 0.0004628971219062805, 0.000627029687166214, 0.0007911622524261475, 0.0009552948176860809, 0.0011194273829460144, 0.0012835599482059479, 0.0014476925134658813, 0.0016118250787258148, 0.0017759576439857483, 0.0019400902092456818, 0.0021042227745056152, 0.0022683553397655487, 0.002432487905025482, 0.0025966204702854156, 0.002760753035545349, 0.0029248856008052826, 0.003089018166065216, 0.0032531507313251495, 0.003417283296585083, 0.0035814158618450165, 0.00374554842710495, 0.003909680992364883, 0.004073813557624817, 0.00423794612288475, 0.004402078688144684, 0.004566211253404617, 0.004730343818664551]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 1.0, 9.0, 13.0, 9.0, 4.0, 12.0, 17.0, 17.0, 18.0, 25.0, 27.0, 23.0, 28.0, 28.0, 25.0, 26.0, 37.0, 36.0, 52.0, 37.0, 44.0, 41.0, 34.0, 44.0, 32.0, 39.0, 26.0, 27.0, 31.0, 33.0, 26.0, 19.0, 17.0, 27.0, 16.0, 21.0, 8.0, 16.0, 7.0, 7.0, 8.0, 6.0, 6.0, 4.0, 4.0, 1.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.025390625, -1.960723876953125, -1.89605712890625, -1.831390380859375, -1.7667236328125, -1.702056884765625, -1.63739013671875, -1.572723388671875, -1.508056640625, -1.443389892578125, -1.37872314453125, -1.314056396484375, -1.2493896484375, -1.184722900390625, -1.12005615234375, -1.055389404296875, -0.99072265625, -0.926055908203125, -0.86138916015625, -0.796722412109375, -0.7320556640625, -0.667388916015625, -0.60272216796875, -0.538055419921875, -0.473388671875, -0.408721923828125, -0.34405517578125, -0.279388427734375, -0.2147216796875, -0.150054931640625, -0.08538818359375, -0.020721435546875, 0.0439453125, 0.108612060546875, 0.17327880859375, 0.237945556640625, 0.3026123046875, 0.367279052734375, 0.43194580078125, 0.496612548828125, 0.561279296875, 0.625946044921875, 0.69061279296875, 0.755279541015625, 0.8199462890625, 0.884613037109375, 0.94927978515625, 1.013946533203125, 1.07861328125, 1.143280029296875, 1.20794677734375, 1.272613525390625, 1.3372802734375, 1.401947021484375, 1.46661376953125, 1.531280517578125, 1.595947265625, 1.660614013671875, 1.72528076171875, 1.789947509765625, 1.8546142578125, 1.919281005859375, 1.98394775390625, 2.048614501953125, 2.11328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 13.0, 11.0, 17.0, 24.0, 28.0, 55.0, 39.0, 100.0, 106.0, 139.0, 267.0, 337.0, 526.0, 836.0, 1148.0, 1843.0, 2712.0, 4386.0, 7064.0, 11898.0, 20890.0, 41017.0, 92905.0, 217514.0, 321987.0, 171622.0, 72752.0, 33163.0, 17601.0, 10160.0, 6164.0, 3878.0, 2446.0, 1601.0, 1063.0, 681.0, 477.0, 314.0, 237.0, 154.0, 114.0, 83.0, 48.0, 44.0, 28.0, 19.0, 13.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.1640625, -2.0927734375, -2.021484375, -1.9501953125, -1.87890625, -1.8076171875, -1.736328125, -1.6650390625, -1.59375, -1.5224609375, -1.451171875, -1.3798828125, -1.30859375, -1.2373046875, -1.166015625, -1.0947265625, -1.0234375, -0.9521484375, -0.880859375, -0.8095703125, -0.73828125, -0.6669921875, -0.595703125, -0.5244140625, -0.453125, -0.3818359375, -0.310546875, -0.2392578125, -0.16796875, -0.0966796875, -0.025390625, 0.0458984375, 0.1171875, 0.1884765625, 0.259765625, 0.3310546875, 0.40234375, 0.4736328125, 0.544921875, 0.6162109375, 0.6875, 0.7587890625, 0.830078125, 0.9013671875, 0.97265625, 1.0439453125, 1.115234375, 1.1865234375, 1.2578125, 1.3291015625, 1.400390625, 1.4716796875, 1.54296875, 1.6142578125, 1.685546875, 1.7568359375, 1.828125, 1.8994140625, 1.970703125, 2.0419921875, 2.11328125, 2.1845703125, 2.255859375, 2.3271484375, 2.3984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 5.0, 2.0, 7.0, 13.0, 12.0, 16.0, 17.0, 14.0, 25.0, 25.0, 26.0, 40.0, 43.0, 50.0, 67.0, 113.0, 135.0, 1392.0, 364.0, 165.0, 108.0, 64.0, 51.0, 53.0, 41.0, 34.0, 35.0, 19.0, 28.0, 16.0, 23.0, 8.0, 8.0, 6.0, 5.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3675537109375, -8.078857421875, -7.7901611328125, -7.50146484375, -7.2127685546875, -6.924072265625, -6.6353759765625, -6.3466796875, -6.0579833984375, -5.769287109375, -5.4805908203125, -5.19189453125, -4.9031982421875, -4.614501953125, -4.3258056640625, -4.037109375, -3.7484130859375, -3.459716796875, -3.1710205078125, -2.88232421875, -2.5936279296875, -2.304931640625, -2.0162353515625, -1.7275390625, -1.4388427734375, -1.150146484375, -0.8614501953125, -0.57275390625, -0.2840576171875, 0.004638671875, 0.2933349609375, 0.58203125, 0.8707275390625, 1.159423828125, 1.4481201171875, 1.73681640625, 2.0255126953125, 2.314208984375, 2.6029052734375, 2.8916015625, 3.1802978515625, 3.468994140625, 3.7576904296875, 4.04638671875, 4.3350830078125, 4.623779296875, 4.9124755859375, 5.201171875, 5.4898681640625, 5.778564453125, 6.0672607421875, 6.35595703125, 6.6446533203125, 6.933349609375, 7.2220458984375, 7.5107421875, 7.7994384765625, 8.088134765625, 8.3768310546875, 8.66552734375, 8.9542236328125, 9.242919921875, 9.5316162109375, 9.8203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 7.0, 14.0, 18.0, 27.0, 41.0, 68.0, 91.0, 181.0, 331.0, 843.0, 10002.0, 3077145.0, 54640.0, 1393.0, 378.0, 213.0, 114.0, 56.0, 42.0, 27.0, 16.0, 12.0, 12.0, 9.0, 10.0, 2.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.25, -32.232177734375, -31.21435546875, -30.196533203125, -29.1787109375, -28.160888671875, -27.14306640625, -26.125244140625, -25.107421875, -24.089599609375, -23.07177734375, -22.053955078125, -21.0361328125, -20.018310546875, -19.00048828125, -17.982666015625, -16.96484375, -15.947021484375, -14.92919921875, -13.911376953125, -12.8935546875, -11.875732421875, -10.85791015625, -9.840087890625, -8.822265625, -7.804443359375, -6.78662109375, -5.768798828125, -4.7509765625, -3.733154296875, -2.71533203125, -1.697509765625, -0.6796875, 0.338134765625, 1.35595703125, 2.373779296875, 3.3916015625, 4.409423828125, 5.42724609375, 6.445068359375, 7.462890625, 8.480712890625, 9.49853515625, 10.516357421875, 11.5341796875, 12.552001953125, 13.56982421875, 14.587646484375, 15.60546875, 16.623291015625, 17.64111328125, 18.658935546875, 19.6767578125, 20.694580078125, 21.71240234375, 22.730224609375, 23.748046875, 24.765869140625, 25.78369140625, 26.801513671875, 27.8193359375, 28.837158203125, 29.85498046875, 30.872802734375, 31.890625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 335.0, 659.0, 20.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.099002838134766, -49.07429122924805, -45.049583435058594, -41.024871826171875, -37.000160217285156, -32.9754524230957, -28.950740814208984, -24.9260311126709, -20.901321411132812, -16.876611709594727, -12.851901054382324, -8.827190399169922, -4.802480697631836, -0.77777099609375, 3.2469406127929688, 7.271650314331055, 11.29636001586914, 15.321069717407227, 19.345779418945312, 23.37049102783203, 27.395200729370117, 31.419910430908203, 35.44462203979492, 39.469329833984375, 43.494041442871094, 47.51875305175781, 51.543460845947266, 55.568172454833984, 59.59288024902344, 63.617591857910156, 67.64230346679688, 71.6670150756836, 75.69171142578125, 79.71642303466797, 83.74113464355469, 87.76583862304688, 91.7905502319336, 95.81526184082031, 99.83997344970703, 103.86468505859375, 107.88938903808594, 111.91410064697266, 115.93881225585938, 119.96351623535156, 123.98822784423828, 128.012939453125, 132.03765869140625, 136.06236267089844, 140.08706665039062, 144.1117706298828, 148.13648986816406, 152.16119384765625, 156.1859130859375, 160.2106170654297, 164.23532104492188, 168.26004028320312, 172.28475952148438, 176.30946350097656, 180.3341827392578, 184.35888671875, 188.38360595703125, 192.40830993652344, 196.43301391601562, 200.45773315429688, 204.48243713378906]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 9.0, 13.0, 18.0, 14.0, 15.0, 29.0, 18.0, 27.0, 29.0, 37.0, 40.0, 53.0, 27.0, 38.0, 44.0, 51.0, 36.0, 40.0, 47.0, 37.0, 53.0, 40.0, 50.0, 33.0, 33.0, 18.0, 23.0, 24.0, 15.0, 19.0, 11.0, 7.0, 5.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.452285766601562, -18.810428619384766, -18.16857147216797, -17.526714324951172, -16.884857177734375, -16.24300193786621, -15.601144790649414, -14.959287643432617, -14.31743049621582, -13.675573348999023, -13.033716201782227, -12.391860008239746, -11.75000286102295, -11.108145713806152, -10.466289520263672, -9.824432373046875, -9.182575225830078, -8.540718078613281, -7.898861408233643, -7.257004737854004, -6.615147590637207, -5.97329044342041, -5.3314337730407715, -4.689577102661133, -4.047719955444336, -3.405863046646118, -2.7640061378479004, -2.1221492290496826, -1.4802923202514648, -0.8384354114532471, -0.1965785026550293, 0.4452781677246094, 1.0871353149414062, 1.728992223739624, 2.370849132537842, 3.0127060413360596, 3.6545629501342773, 4.296420097351074, 4.938276767730713, 5.580133438110352, 6.221990585327148, 6.863847732543945, 7.505704402923584, 8.147561073303223, 8.78941822052002, 9.431275367736816, 10.073131561279297, 10.714988708496094, 11.35684585571289, 11.998703002929688, 12.640560150146484, 13.282416343688965, 13.924273490905762, 14.566130638122559, 15.207986831665039, 15.849843978881836, 16.491701126098633, 17.13355827331543, 17.775415420532227, 18.417272567749023, 19.059127807617188, 19.700984954833984, 20.34284210205078, 20.984699249267578, 21.626556396484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 3.0, 3.0, 0.0, 5.0, 5.0, 8.0, 11.0, 7.0, 12.0, 13.0, 9.0, 15.0, 19.0, 17.0, 17.0, 24.0, 27.0, 27.0, 32.0, 22.0, 42.0, 34.0, 32.0, 32.0, 39.0, 39.0, 34.0, 38.0, 46.0, 39.0, 32.0, 20.0, 31.0, 32.0, 30.0, 22.0, 20.0, 26.0, 11.0, 22.0, 14.0, 14.0, 9.0, 14.0, 15.0, 7.0, 9.0, 5.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.927734375, -1.86212158203125, -1.7965087890625, -1.73089599609375, -1.665283203125, -1.59967041015625, -1.5340576171875, -1.46844482421875, -1.40283203125, -1.33721923828125, -1.2716064453125, -1.20599365234375, -1.140380859375, -1.07476806640625, -1.0091552734375, -0.94354248046875, -0.8779296875, -0.81231689453125, -0.7467041015625, -0.68109130859375, -0.615478515625, -0.54986572265625, -0.4842529296875, -0.41864013671875, -0.35302734375, -0.28741455078125, -0.2218017578125, -0.15618896484375, -0.090576171875, -0.02496337890625, 0.0406494140625, 0.10626220703125, 0.171875, 0.23748779296875, 0.3031005859375, 0.36871337890625, 0.434326171875, 0.49993896484375, 0.5655517578125, 0.63116455078125, 0.69677734375, 0.76239013671875, 0.8280029296875, 0.89361572265625, 0.959228515625, 1.02484130859375, 1.0904541015625, 1.15606689453125, 1.2216796875, 1.28729248046875, 1.3529052734375, 1.41851806640625, 1.484130859375, 1.54974365234375, 1.6153564453125, 1.68096923828125, 1.74658203125, 1.81219482421875, 1.8778076171875, 1.94342041015625, 2.009033203125, 2.07464599609375, 2.1402587890625, 2.20587158203125, 2.271484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 5.0, 9.0, 9.0, 8.0, 14.0, 22.0, 18.0, 26.0, 23.0, 40.0, 44.0, 37.0, 48.0, 44.0, 60.0, 95.0, 115.0, 197.0, 438.0, 1568.0, 10289.0, 126272.0, 2137958.0, 1807124.0, 98354.0, 8725.0, 1500.0, 455.0, 206.0, 107.0, 83.0, 51.0, 46.0, 48.0, 31.0, 40.0, 34.0, 24.0, 19.0, 19.0, 15.0, 15.0, 13.0, 11.0, 4.0, 6.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.7265625, -8.4534912109375, -8.180419921875, -7.9073486328125, -7.63427734375, -7.3612060546875, -7.088134765625, -6.8150634765625, -6.5419921875, -6.2689208984375, -5.995849609375, -5.7227783203125, -5.44970703125, -5.1766357421875, -4.903564453125, -4.6304931640625, -4.357421875, -4.0843505859375, -3.811279296875, -3.5382080078125, -3.26513671875, -2.9920654296875, -2.718994140625, -2.4459228515625, -2.1728515625, -1.8997802734375, -1.626708984375, -1.3536376953125, -1.08056640625, -0.8074951171875, -0.534423828125, -0.2613525390625, 0.01171875, 0.2847900390625, 0.557861328125, 0.8309326171875, 1.10400390625, 1.3770751953125, 1.650146484375, 1.9232177734375, 2.1962890625, 2.4693603515625, 2.742431640625, 3.0155029296875, 3.28857421875, 3.5616455078125, 3.834716796875, 4.1077880859375, 4.380859375, 4.6539306640625, 4.927001953125, 5.2000732421875, 5.47314453125, 5.7462158203125, 6.019287109375, 6.2923583984375, 6.5654296875, 6.8385009765625, 7.111572265625, 7.3846435546875, 7.65771484375, 7.9307861328125, 8.203857421875, 8.4769287109375, 8.75]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 6.0, 5.0, 8.0, 16.0, 14.0, 19.0, 31.0, 47.0, 75.0, 132.0, 213.0, 344.0, 461.0, 665.0, 630.0, 505.0, 311.0, 201.0, 151.0, 77.0, 55.0, 40.0, 24.0, 10.0, 18.0, 9.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9375, -11.65325927734375, -11.3690185546875, -11.08477783203125, -10.800537109375, -10.51629638671875, -10.2320556640625, -9.94781494140625, -9.66357421875, -9.37933349609375, -9.0950927734375, -8.81085205078125, -8.526611328125, -8.24237060546875, -7.9581298828125, -7.67388916015625, -7.3896484375, -7.10540771484375, -6.8211669921875, -6.53692626953125, -6.252685546875, -5.96844482421875, -5.6842041015625, -5.39996337890625, -5.11572265625, -4.83148193359375, -4.5472412109375, -4.26300048828125, -3.978759765625, -3.69451904296875, -3.4102783203125, -3.12603759765625, -2.841796875, -2.55755615234375, -2.2733154296875, -1.98907470703125, -1.704833984375, -1.42059326171875, -1.1363525390625, -0.85211181640625, -0.56787109375, -0.28363037109375, 0.0006103515625, 0.28485107421875, 0.569091796875, 0.85333251953125, 1.1375732421875, 1.42181396484375, 1.7060546875, 1.99029541015625, 2.2745361328125, 2.55877685546875, 2.843017578125, 3.12725830078125, 3.4114990234375, 3.69573974609375, 3.97998046875, 4.26422119140625, 4.5484619140625, 4.83270263671875, 5.116943359375, 5.40118408203125, 5.6854248046875, 5.96966552734375, 6.25390625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 11.0, 6.0, 17.0, 28.0, 46.0, 75.0, 121.0, 223.0, 427.0, 1187.0, 13949.0, 2252129.0, 1911957.0, 12090.0, 1156.0, 381.0, 207.0, 105.0, 65.0, 30.0, 23.0, 15.0, 10.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.214111328125, -14.41259765625, -13.611083984375, -12.8095703125, -12.008056640625, -11.20654296875, -10.405029296875, -9.603515625, -8.802001953125, -8.00048828125, -7.198974609375, -6.3974609375, -5.595947265625, -4.79443359375, -3.992919921875, -3.19140625, -2.389892578125, -1.58837890625, -0.786865234375, 0.0146484375, 0.816162109375, 1.61767578125, 2.419189453125, 3.220703125, 4.022216796875, 4.82373046875, 5.625244140625, 6.4267578125, 7.228271484375, 8.02978515625, 8.831298828125, 9.6328125, 10.434326171875, 11.23583984375, 12.037353515625, 12.8388671875, 13.640380859375, 14.44189453125, 15.243408203125, 16.044921875, 16.846435546875, 17.64794921875, 18.449462890625, 19.2509765625, 20.052490234375, 20.85400390625, 21.655517578125, 22.45703125, 23.258544921875, 24.06005859375, 24.861572265625, 25.6630859375, 26.464599609375, 27.26611328125, 28.067626953125, 28.869140625, 29.670654296875, 30.47216796875, 31.273681640625, 32.0751953125, 32.876708984375, 33.67822265625, 34.479736328125, 35.28125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 12.0, 13.0, 37.0, 29.0, 62.0, 79.0, 76.0, 111.0, 112.0, 117.0, 97.0, 88.0, 61.0, 38.0, 29.0, 21.0, 12.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.321203231811523, -12.275741577148438, -11.230279922485352, -10.184818267822266, -9.13935661315918, -8.093894958496094, -7.048433303833008, -6.002971649169922, -4.957509994506836, -3.91204833984375, -2.866586685180664, -1.8211250305175781, -0.7756633758544922, 0.26979827880859375, 1.3152599334716797, 2.3607215881347656, 3.4061832427978516, 4.4516448974609375, 5.497106552124023, 6.542568206787109, 7.588029861450195, 8.633491516113281, 9.678953170776367, 10.724414825439453, 11.769876480102539, 12.815338134765625, 13.860799789428711, 14.906261444091797, 15.951723098754883, 16.99718475341797, 18.042646408081055, 19.08810806274414, 20.133567810058594, 21.17902946472168, 22.224491119384766, 23.26995277404785, 24.315414428710938, 25.360876083374023, 26.40633773803711, 27.451799392700195, 28.49726104736328, 29.542722702026367, 30.588184356689453, 31.63364601135254, 32.679107666015625, 33.724571228027344, 34.7700309753418, 35.81549072265625, 36.86095428466797, 37.90641784667969, 38.95187759399414, 39.997337341308594, 41.04280090332031, 42.08826446533203, 43.133724212646484, 44.17918395996094, 45.224647521972656, 46.270111083984375, 47.31557083129883, 48.36103057861328, 49.406494140625, 50.45195770263672, 51.49741744995117, 52.542877197265625, 53.588340759277344]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 4.0, 7.0, 10.0, 20.0, 16.0, 21.0, 14.0, 24.0, 24.0, 23.0, 36.0, 27.0, 35.0, 33.0, 45.0, 40.0, 41.0, 46.0, 44.0, 37.0, 47.0, 38.0, 40.0, 44.0, 40.0, 16.0, 27.0, 24.0, 28.0, 28.0, 18.0, 12.0, 12.0, 20.0, 8.0, 12.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.31110382080078, -20.648548126220703, -19.985992431640625, -19.32343864440918, -18.6608829498291, -17.998327255249023, -17.335773468017578, -16.6732177734375, -16.010662078857422, -15.348106384277344, -14.685551643371582, -14.02299690246582, -13.360441207885742, -12.697885513305664, -12.035330772399902, -11.37277603149414, -10.710220336914062, -10.047664642333984, -9.385109901428223, -8.722555160522461, -8.059999465942383, -7.397444248199463, -6.734889030456543, -6.072333812713623, -5.409778594970703, -4.747223377227783, -4.084668159484863, -3.4221129417419434, -2.7595577239990234, -2.0970025062561035, -1.4344472885131836, -0.7718920707702637, -0.10933685302734375, 0.5532183647155762, 1.215773582458496, 1.878328800201416, 2.540884017944336, 3.203439235687256, 3.865994453430176, 4.528549671173096, 5.191104888916016, 5.8536601066589355, 6.5162153244018555, 7.178770542144775, 7.841325759887695, 8.503881454467773, 9.166436195373535, 9.828990936279297, 10.491546630859375, 11.154102325439453, 11.816657066345215, 12.479211807250977, 13.141767501831055, 13.804323196411133, 14.466877937316895, 15.129432678222656, 15.791988372802734, 16.454544067382812, 17.11709976196289, 17.779653549194336, 18.442209243774414, 19.104764938354492, 19.767318725585938, 20.429874420166016, 21.092430114746094]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 6.0, 6.0, 10.0, 14.0, 12.0, 19.0, 15.0, 23.0, 21.0, 32.0, 29.0, 32.0, 33.0, 33.0, 30.0, 31.0, 47.0, 43.0, 38.0, 34.0, 43.0, 37.0, 41.0, 39.0, 29.0, 23.0, 27.0, 25.0, 24.0, 24.0, 21.0, 22.0, 15.0, 21.0, 12.0, 12.0, 13.0, 13.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.197265625, -2.126922607421875, -2.05657958984375, -1.986236572265625, -1.9158935546875, -1.845550537109375, -1.77520751953125, -1.704864501953125, -1.634521484375, -1.564178466796875, -1.49383544921875, -1.423492431640625, -1.3531494140625, -1.282806396484375, -1.21246337890625, -1.142120361328125, -1.07177734375, -1.001434326171875, -0.93109130859375, -0.860748291015625, -0.7904052734375, -0.720062255859375, -0.64971923828125, -0.579376220703125, -0.509033203125, -0.438690185546875, -0.36834716796875, -0.298004150390625, -0.2276611328125, -0.157318115234375, -0.08697509765625, -0.016632080078125, 0.0537109375, 0.124053955078125, 0.19439697265625, 0.264739990234375, 0.3350830078125, 0.405426025390625, 0.47576904296875, 0.546112060546875, 0.616455078125, 0.686798095703125, 0.75714111328125, 0.827484130859375, 0.8978271484375, 0.968170166015625, 1.03851318359375, 1.108856201171875, 1.17919921875, 1.249542236328125, 1.31988525390625, 1.390228271484375, 1.4605712890625, 1.530914306640625, 1.60125732421875, 1.671600341796875, 1.741943359375, 1.812286376953125, 1.88262939453125, 1.952972412109375, 2.0233154296875, 2.093658447265625, 2.16400146484375, 2.234344482421875, 2.3046875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 16.0, 24.0, 28.0, 54.0, 71.0, 110.0, 169.0, 248.0, 310.0, 506.0, 692.0, 1014.0, 1495.0, 2223.0, 3160.0, 4867.0, 7194.0, 11167.0, 16923.0, 27231.0, 44250.0, 73761.0, 120876.0, 183323.0, 193965.0, 136114.0, 83033.0, 49944.0, 30338.0, 18868.0, 12091.0, 8055.0, 5237.0, 3537.0, 2396.0, 1678.0, 1124.0, 750.0, 531.0, 388.0, 242.0, 182.0, 122.0, 83.0, 50.0, 31.0, 25.0, 13.0, 13.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.2822265625, -0.27370452880859375, -0.2651824951171875, -0.25666046142578125, -0.248138427734375, -0.23961639404296875, -0.2310943603515625, -0.22257232666015625, -0.21405029296875, -0.20552825927734375, -0.1970062255859375, -0.18848419189453125, -0.179962158203125, -0.17144012451171875, -0.1629180908203125, -0.15439605712890625, -0.1458740234375, -0.13735198974609375, -0.1288299560546875, -0.12030792236328125, -0.111785888671875, -0.10326385498046875, -0.0947418212890625, -0.08621978759765625, -0.07769775390625, -0.06917572021484375, -0.0606536865234375, -0.05213165283203125, -0.043609619140625, -0.03508758544921875, -0.0265655517578125, -0.01804351806640625, -0.009521484375, -0.00099945068359375, 0.0075225830078125, 0.01604461669921875, 0.024566650390625, 0.03308868408203125, 0.0416107177734375, 0.05013275146484375, 0.05865478515625, 0.06717681884765625, 0.0756988525390625, 0.08422088623046875, 0.092742919921875, 0.10126495361328125, 0.1097869873046875, 0.11830902099609375, 0.1268310546875, 0.13535308837890625, 0.1438751220703125, 0.15239715576171875, 0.160919189453125, 0.16944122314453125, 0.1779632568359375, 0.18648529052734375, 0.19500732421875, 0.20352935791015625, 0.2120513916015625, 0.22057342529296875, 0.229095458984375, 0.23761749267578125, 0.2461395263671875, 0.25466156005859375, 0.26318359375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 1.0, 4.0, 9.0, 12.0, 3.0, 10.0, 16.0, 11.0, 18.0, 24.0, 21.0, 29.0, 38.0, 27.0, 34.0, 32.0, 38.0, 37.0, 40.0, 48.0, 37.0, 1063.0, 33.0, 51.0, 44.0, 33.0, 36.0, 33.0, 35.0, 27.0, 26.0, 23.0, 25.0, 14.0, 11.0, 16.0, 14.0, 10.0, 9.0, 4.0, 6.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.318359375, -1.2699127197265625, -1.221466064453125, -1.1730194091796875, -1.12457275390625, -1.0761260986328125, -1.027679443359375, -0.9792327880859375, -0.9307861328125, -0.8823394775390625, -0.833892822265625, -0.7854461669921875, -0.73699951171875, -0.6885528564453125, -0.640106201171875, -0.5916595458984375, -0.543212890625, -0.4947662353515625, -0.446319580078125, -0.3978729248046875, -0.34942626953125, -0.3009796142578125, -0.252532958984375, -0.2040863037109375, -0.1556396484375, -0.1071929931640625, -0.058746337890625, -0.0102996826171875, 0.03814697265625, 0.0865936279296875, 0.135040283203125, 0.1834869384765625, 0.23193359375, 0.2803802490234375, 0.328826904296875, 0.3772735595703125, 0.42572021484375, 0.4741668701171875, 0.522613525390625, 0.5710601806640625, 0.6195068359375, 0.6679534912109375, 0.716400146484375, 0.7648468017578125, 0.81329345703125, 0.8617401123046875, 0.910186767578125, 0.9586334228515625, 1.007080078125, 1.0555267333984375, 1.103973388671875, 1.1524200439453125, 1.20086669921875, 1.2493133544921875, 1.297760009765625, 1.3462066650390625, 1.3946533203125, 1.4430999755859375, 1.491546630859375, 1.5399932861328125, 1.58843994140625, 1.6368865966796875, 1.685333251953125, 1.7337799072265625, 1.7822265625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 18.0, 15.0, 35.0, 58.0, 85.0, 138.0, 164.0, 254.0, 332.0, 504.0, 725.0, 1078.0, 1559.0, 2252.0, 3336.0, 4684.0, 6898.0, 10238.0, 14954.0, 22031.0, 32684.0, 47537.0, 69414.0, 98790.0, 137154.0, 1191221.0, 135467.0, 98529.0, 68417.0, 47248.0, 32562.0, 21946.0, 14912.0, 10047.0, 6903.0, 4642.0, 3160.0, 2187.0, 1570.0, 1068.0, 717.0, 475.0, 348.0, 210.0, 189.0, 128.0, 86.0, 54.0, 45.0, 28.0, 20.0, 9.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.1546630859375, -0.14990234375, -0.1451416015625, -0.140380859375, -0.1356201171875, -0.130859375, -0.1260986328125, -0.121337890625, -0.1165771484375, -0.11181640625, -0.1070556640625, -0.102294921875, -0.0975341796875, -0.0927734375, -0.0880126953125, -0.083251953125, -0.0784912109375, -0.07373046875, -0.0689697265625, -0.064208984375, -0.0594482421875, -0.0546875, -0.0499267578125, -0.045166015625, -0.0404052734375, -0.03564453125, -0.0308837890625, -0.026123046875, -0.0213623046875, -0.0166015625, -0.0118408203125, -0.007080078125, -0.0023193359375, 0.00244140625, 0.0072021484375, 0.011962890625, 0.0167236328125, 0.021484375, 0.0262451171875, 0.031005859375, 0.0357666015625, 0.04052734375, 0.0452880859375, 0.050048828125, 0.0548095703125, 0.0595703125, 0.0643310546875, 0.069091796875, 0.0738525390625, 0.07861328125, 0.0833740234375, 0.088134765625, 0.0928955078125, 0.09765625, 0.1024169921875, 0.107177734375, 0.1119384765625, 0.11669921875, 0.1214599609375, 0.126220703125, 0.1309814453125, 0.1357421875, 0.1405029296875, 0.145263671875, 0.1500244140625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 4.0, 14.0, 11.0, 13.0, 11.0, 16.0, 20.0, 23.0, 23.0, 23.0, 33.0, 50.0, 48.0, 68.0, 83.0, 80.0, 77.0, 61.0, 41.0, 43.0, 45.0, 31.0, 27.0, 26.0, 20.0, 20.0, 13.0, 16.0, 8.0, 5.0, 10.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0036468505859375, -0.0035148262977600098, -0.0033828020095825195, -0.0032507777214050293, -0.003118753433227539, -0.002986729145050049, -0.0028547048568725586, -0.0027226805686950684, -0.002590656280517578, -0.002458631992340088, -0.0023266077041625977, -0.0021945834159851074, -0.002062559127807617, -0.001930534839630127, -0.0017985105514526367, -0.0016664862632751465, -0.0015344619750976562, -0.001402437686920166, -0.0012704133987426758, -0.0011383891105651855, -0.0010063648223876953, -0.0008743405342102051, -0.0007423162460327148, -0.0006102919578552246, -0.0004782676696777344, -0.00034624338150024414, -0.0002142190933227539, -8.219480514526367e-05, 4.982948303222656e-05, 0.0001818537712097168, 0.00031387805938720703, 0.00044590234756469727, 0.0005779266357421875, 0.0007099509239196777, 0.000841975212097168, 0.0009739995002746582, 0.0011060237884521484, 0.0012380480766296387, 0.001370072364807129, 0.0015020966529846191, 0.0016341209411621094, 0.0017661452293395996, 0.0018981695175170898, 0.00203019380569458, 0.0021622180938720703, 0.0022942423820495605, 0.0024262666702270508, 0.002558290958404541, 0.0026903152465820312, 0.0028223395347595215, 0.0029543638229370117, 0.003086388111114502, 0.003218412399291992, 0.0033504366874694824, 0.0034824609756469727, 0.003614485263824463, 0.003746509552001953, 0.0038785338401794434, 0.004010558128356934, 0.004142582416534424, 0.004274606704711914, 0.004406630992889404, 0.0045386552810668945, 0.004670679569244385, 0.004802703857421875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 7.0, 8.0, 13.0, 16.0, 30.0, 27.0, 41.0, 58.0, 87.0, 98.0, 141.0, 186.0, 320.0, 742.0, 6044.0, 265180.0, 760900.0, 12483.0, 999.0, 345.0, 219.0, 157.0, 102.0, 69.0, 55.0, 46.0, 29.0, 32.0, 19.0, 20.0, 17.0, 8.0, 13.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0784912109375, -0.07631778717041016, -0.07414436340332031, -0.07197093963623047, -0.06979751586914062, -0.06762409210205078, -0.06545066833496094, -0.0632772445678711, -0.06110382080078125, -0.058930397033691406, -0.05675697326660156, -0.05458354949951172, -0.052410125732421875, -0.05023670196533203, -0.04806327819824219, -0.045889854431152344, -0.0437164306640625, -0.041543006896972656, -0.03936958312988281, -0.03719615936279297, -0.035022735595703125, -0.03284931182861328, -0.030675888061523438, -0.028502464294433594, -0.02632904052734375, -0.024155616760253906, -0.021982192993164062, -0.01980876922607422, -0.017635345458984375, -0.015461921691894531, -0.013288497924804688, -0.011115074157714844, -0.008941650390625, -0.006768226623535156, -0.0045948028564453125, -0.0024213790893554688, -0.000247955322265625, 0.0019254684448242188, 0.0040988922119140625, 0.006272315979003906, 0.00844573974609375, 0.010619163513183594, 0.012792587280273438, 0.014966011047363281, 0.017139434814453125, 0.01931285858154297, 0.021486282348632812, 0.023659706115722656, 0.0258331298828125, 0.028006553649902344, 0.030179977416992188, 0.03235340118408203, 0.034526824951171875, 0.03670024871826172, 0.03887367248535156, 0.041047096252441406, 0.04322052001953125, 0.045393943786621094, 0.04756736755371094, 0.04974079132080078, 0.051914215087890625, 0.05408763885498047, 0.05626106262207031, 0.058434486389160156, 0.06060791015625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 5.0, 88.0, 610.0, 253.0, 47.0, 13.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032626560423523188, -0.002360634272918105, -0.0014586125034838915, -0.0005565907340496778, 0.0003454310353845358, 0.0012474528048187494, 0.002149474574252963, 0.0030514963436871767, 0.003953518345952034, 0.004855540115386248, 0.005757561884820461, 0.006659583654254675, 0.0075616054236888885, 0.008463626727461815, 0.009365648962557316, 0.010267671197652817, 0.011169692501425743, 0.01207171380519867, 0.01297373604029417, 0.013875758275389671, 0.014777779579162598, 0.015679800882935524, 0.01658182218670845, 0.017483845353126526, 0.018385866656899452, 0.01928788796067238, 0.020189911127090454, 0.02109193243086338, 0.021993953734636307, 0.022895975038409233, 0.02379799634218216, 0.024700019508600235, 0.025602038949728012, 0.02650406025350094, 0.027406081557273865, 0.02830810472369194, 0.029210126027464867, 0.030112147331237793, 0.03101417049765587, 0.031916189938783646, 0.03281821310520172, 0.0337202362716198, 0.034622255712747574, 0.03552427887916565, 0.036426298320293427, 0.0373283214867115, 0.03823034465312958, 0.039132364094257355, 0.04003438726067543, 0.040936410427093506, 0.04183842986822128, 0.04274045303463936, 0.043642476201057434, 0.04454449564218521, 0.04544651880860329, 0.046348538249731064, 0.04725056141614914, 0.048152584582567215, 0.04905460402369499, 0.04995662719011307, 0.050858646631240845, 0.05176066979765892, 0.052662692964076996, 0.05356471240520477, 0.05446673557162285]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 11.0, 17.0, 24.0, 15.0, 32.0, 39.0, 54.0, 45.0, 45.0, 71.0, 65.0, 51.0, 68.0, 55.0, 50.0, 56.0, 42.0, 58.0, 34.0, 35.0, 29.0, 21.0, 26.0, 15.0, 10.0, 10.0, 6.0, 5.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.005779087543487549, -0.005636661313474178, -0.005494235083460808, -0.005351808853447437, -0.005209382623434067, -0.005066956393420696, -0.004924530163407326, -0.004782103933393955, -0.004639677703380585, -0.004497251473367214, -0.004354825243353844, -0.004212399013340473, -0.004069972783327103, -0.003927546553313732, -0.0037851203233003616, -0.003642694093286991, -0.0035002678632736206, -0.00335784163326025, -0.0032154154032468796, -0.003072989173233509, -0.0029305629432201385, -0.002788136713206768, -0.0026457104831933975, -0.002503284253180027, -0.0023608580231666565, -0.002218431793153286, -0.0020760055631399155, -0.001933579333126545, -0.0017911531031131744, -0.001648726873099804, -0.0015063006430864334, -0.001363874413073063, -0.0012214481830596924, -0.0010790219530463219, -0.0009365957230329514, -0.0007941694930195808, -0.0006517432630062103, -0.0005093170329928398, -0.0003668908029794693, -0.00022446457296609879, -8.203834295272827e-05, 6.038788706064224e-05, 0.00020281411707401276, 0.00034524034708738327, 0.0004876665771007538, 0.0006300928071141243, 0.0007725190371274948, 0.0009149452671408653, 0.0010573714971542358, 0.0011997977271676064, 0.0013422239571809769, 0.0014846501871943474, 0.001627076417207718, 0.0017695026472210884, 0.001911928877234459, 0.0020543551072478294, 0.0021967813372612, 0.0023392075672745705, 0.002481633797287941, 0.0026240600273013115, 0.002766486257314682, 0.0029089124873280525, 0.003051338717341423, 0.0031937649473547935, 0.003336191177368164]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 6.0, 6.0, 10.0, 14.0, 12.0, 20.0, 14.0, 23.0, 22.0, 31.0, 29.0, 32.0, 33.0, 33.0, 30.0, 31.0, 47.0, 43.0, 38.0, 34.0, 43.0, 37.0, 41.0, 38.0, 31.0, 22.0, 27.0, 24.0, 25.0, 24.0, 21.0, 22.0, 15.0, 21.0, 12.0, 12.0, 13.0, 13.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.197265625, -2.126922607421875, -2.05657958984375, -1.986236572265625, -1.9158935546875, -1.845550537109375, -1.77520751953125, -1.704864501953125, -1.634521484375, -1.564178466796875, -1.49383544921875, -1.423492431640625, -1.3531494140625, -1.282806396484375, -1.21246337890625, -1.142120361328125, -1.07177734375, -1.001434326171875, -0.93109130859375, -0.860748291015625, -0.7904052734375, -0.720062255859375, -0.64971923828125, -0.579376220703125, -0.509033203125, -0.438690185546875, -0.36834716796875, -0.298004150390625, -0.2276611328125, -0.157318115234375, -0.08697509765625, -0.016632080078125, 0.0537109375, 0.124053955078125, 0.19439697265625, 0.264739990234375, 0.3350830078125, 0.405426025390625, 0.47576904296875, 0.546112060546875, 0.616455078125, 0.686798095703125, 0.75714111328125, 0.827484130859375, 0.8978271484375, 0.968170166015625, 1.03851318359375, 1.108856201171875, 1.17919921875, 1.249542236328125, 1.31988525390625, 1.390228271484375, 1.4605712890625, 1.530914306640625, 1.60125732421875, 1.671600341796875, 1.741943359375, 1.812286376953125, 1.88262939453125, 1.952972412109375, 2.0233154296875, 2.093658447265625, 2.16400146484375, 2.234344482421875, 2.3046875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 12.0, 21.0, 21.0, 18.0, 31.0, 56.0, 57.0, 122.0, 236.0, 453.0, 742.0, 1565.0, 2864.0, 5440.0, 10077.0, 18774.0, 34026.0, 67364.0, 161113.0, 337975.0, 224289.0, 89689.0, 42938.0, 23477.0, 12706.0, 6708.0, 3608.0, 1887.0, 1056.0, 533.0, 290.0, 165.0, 81.0, 55.0, 33.0, 20.0, 24.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.01885986328125, -1.9459228515625, -1.87298583984375, -1.800048828125, -1.72711181640625, -1.6541748046875, -1.58123779296875, -1.50830078125, -1.43536376953125, -1.3624267578125, -1.28948974609375, -1.216552734375, -1.14361572265625, -1.0706787109375, -0.99774169921875, -0.9248046875, -0.85186767578125, -0.7789306640625, -0.70599365234375, -0.633056640625, -0.56011962890625, -0.4871826171875, -0.41424560546875, -0.34130859375, -0.26837158203125, -0.1954345703125, -0.12249755859375, -0.049560546875, 0.02337646484375, 0.0963134765625, 0.16925048828125, 0.2421875, 0.31512451171875, 0.3880615234375, 0.46099853515625, 0.533935546875, 0.60687255859375, 0.6798095703125, 0.75274658203125, 0.82568359375, 0.89862060546875, 0.9715576171875, 1.04449462890625, 1.117431640625, 1.19036865234375, 1.2633056640625, 1.33624267578125, 1.4091796875, 1.48211669921875, 1.5550537109375, 1.62799072265625, 1.700927734375, 1.77386474609375, 1.8468017578125, 1.91973876953125, 1.99267578125, 2.06561279296875, 2.1385498046875, 2.21148681640625, 2.284423828125, 2.35736083984375, 2.4302978515625, 2.50323486328125, 2.576171875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 8.0, 10.0, 5.0, 7.0, 11.0, 8.0, 17.0, 22.0, 19.0, 23.0, 25.0, 34.0, 23.0, 41.0, 57.0, 43.0, 51.0, 88.0, 175.0, 1495.0, 292.0, 132.0, 77.0, 65.0, 39.0, 47.0, 37.0, 36.0, 31.0, 21.0, 19.0, 18.0, 17.0, 19.0, 7.0, 9.0, 4.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.296875, -9.9920654296875, -9.687255859375, -9.3824462890625, -9.07763671875, -8.7728271484375, -8.468017578125, -8.1632080078125, -7.8583984375, -7.5535888671875, -7.248779296875, -6.9439697265625, -6.63916015625, -6.3343505859375, -6.029541015625, -5.7247314453125, -5.419921875, -5.1151123046875, -4.810302734375, -4.5054931640625, -4.20068359375, -3.8958740234375, -3.591064453125, -3.2862548828125, -2.9814453125, -2.6766357421875, -2.371826171875, -2.0670166015625, -1.76220703125, -1.4573974609375, -1.152587890625, -0.8477783203125, -0.54296875, -0.2381591796875, 0.066650390625, 0.3714599609375, 0.67626953125, 0.9810791015625, 1.285888671875, 1.5906982421875, 1.8955078125, 2.2003173828125, 2.505126953125, 2.8099365234375, 3.11474609375, 3.4195556640625, 3.724365234375, 4.0291748046875, 4.333984375, 4.6387939453125, 4.943603515625, 5.2484130859375, 5.55322265625, 5.8580322265625, 6.162841796875, 6.4676513671875, 6.7724609375, 7.0772705078125, 7.382080078125, 7.6868896484375, 7.99169921875, 8.2965087890625, 8.601318359375, 8.9061279296875, 9.2109375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 6.0, 11.0, 6.0, 19.0, 20.0, 29.0, 52.0, 77.0, 151.0, 234.0, 508.0, 3001.0, 2982710.0, 156628.0, 1291.0, 410.0, 188.0, 122.0, 78.0, 36.0, 34.0, 25.0, 19.0, 10.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.71875, -43.43505859375, -42.1513671875, -40.86767578125, -39.583984375, -38.30029296875, -37.0166015625, -35.73291015625, -34.44921875, -33.16552734375, -31.8818359375, -30.59814453125, -29.314453125, -28.03076171875, -26.7470703125, -25.46337890625, -24.1796875, -22.89599609375, -21.6123046875, -20.32861328125, -19.044921875, -17.76123046875, -16.4775390625, -15.19384765625, -13.91015625, -12.62646484375, -11.3427734375, -10.05908203125, -8.775390625, -7.49169921875, -6.2080078125, -4.92431640625, -3.640625, -2.35693359375, -1.0732421875, 0.21044921875, 1.494140625, 2.77783203125, 4.0615234375, 5.34521484375, 6.62890625, 7.91259765625, 9.1962890625, 10.47998046875, 11.763671875, 13.04736328125, 14.3310546875, 15.61474609375, 16.8984375, 18.18212890625, 19.4658203125, 20.74951171875, 22.033203125, 23.31689453125, 24.6005859375, 25.88427734375, 27.16796875, 28.45166015625, 29.7353515625, 31.01904296875, 32.302734375, 33.58642578125, 34.8701171875, 36.15380859375, 37.4375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 16.0, 95.0, 286.0, 352.0, 191.0, 57.0, 15.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.50761604309082, -21.030540466308594, -19.553464889526367, -18.07638931274414, -16.599313735961914, -15.122238159179688, -13.645163536071777, -12.16808795928955, -10.691012382507324, -9.213936805725098, -7.736861228942871, -6.259786128997803, -4.782710552215576, -3.3056349754333496, -1.8285598754882812, -0.3514842987060547, 1.1255912780761719, 2.6026668548583984, 4.079742431640625, 5.556817531585693, 7.03389310836792, 8.510969161987305, 9.988043785095215, 11.465119361877441, 12.942194938659668, 14.419270515441895, 15.896346092224121, 17.37342071533203, 18.850496292114258, 20.327571868896484, 21.80464744567871, 23.281723022460938, 24.758800506591797, 26.235876083374023, 27.71295166015625, 29.190027236938477, 30.667102813720703, 32.1441764831543, 33.621253967285156, 35.09832763671875, 36.57540512084961, 38.0524787902832, 39.52955627441406, 41.006629943847656, 42.483707427978516, 43.96078109741211, 45.43785858154297, 46.91493225097656, 48.392005920410156, 49.86907958984375, 51.34615707397461, 52.8232307434082, 54.30030822753906, 55.777381896972656, 57.254459381103516, 58.73153305053711, 60.20861053466797, 61.68568420410156, 63.16276168823242, 64.63983917236328, 66.11691284179688, 67.59398651123047, 69.07106018066406, 70.54814147949219, 72.02521514892578]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 7.0, 8.0, 11.0, 13.0, 23.0, 14.0, 23.0, 31.0, 30.0, 30.0, 24.0, 46.0, 41.0, 48.0, 51.0, 43.0, 44.0, 36.0, 29.0, 49.0, 46.0, 43.0, 51.0, 39.0, 41.0, 37.0, 29.0, 26.0, 19.0, 8.0, 11.0, 13.0, 10.0, 4.0, 9.0, 4.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.62518310546875, -30.683149337768555, -29.74111557006836, -28.799081802368164, -27.85704803466797, -26.91501235961914, -25.972978591918945, -25.03094482421875, -24.088911056518555, -23.14687728881836, -22.204843521118164, -21.26280975341797, -20.32077407836914, -19.378742218017578, -18.43670654296875, -17.494672775268555, -16.55263900756836, -15.610605239868164, -14.668571472167969, -13.726536750793457, -12.784502983093262, -11.842469215393066, -10.900434494018555, -9.95840072631836, -9.016366958618164, -8.074333190917969, -7.132298946380615, -6.190264701843262, -5.248230934143066, -4.306197166442871, -3.3641629219055176, -2.422128677368164, -1.480093002319336, -0.5380589962005615, 0.4039750099182129, 1.3460090160369873, 2.2880430221557617, 3.230076789855957, 4.1721110343933105, 5.114145278930664, 6.056179046630859, 6.998212814331055, 7.940247058868408, 8.882281303405762, 9.824315071105957, 10.766348838806152, 11.708383560180664, 12.65041732788086, 13.592451095581055, 14.53448486328125, 15.476518630981445, 16.41855239868164, 17.36058807373047, 18.30261993408203, 19.24465560913086, 20.186689376831055, 21.12872314453125, 22.070756912231445, 23.01279067993164, 23.954824447631836, 24.89685821533203, 25.83889389038086, 26.780927658081055, 27.72296142578125, 28.664995193481445]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 8.0, 9.0, 7.0, 6.0, 8.0, 9.0, 15.0, 18.0, 12.0, 24.0, 25.0, 32.0, 31.0, 30.0, 30.0, 37.0, 38.0, 32.0, 29.0, 35.0, 31.0, 46.0, 47.0, 37.0, 34.0, 38.0, 30.0, 27.0, 29.0, 29.0, 17.0, 32.0, 24.0, 25.0, 15.0, 16.0, 21.0, 10.0, 16.0, 9.0, 8.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.5078125, -2.430694580078125, -2.35357666015625, -2.276458740234375, -2.1993408203125, -2.122222900390625, -2.04510498046875, -1.967987060546875, -1.890869140625, -1.813751220703125, -1.73663330078125, -1.659515380859375, -1.5823974609375, -1.505279541015625, -1.42816162109375, -1.351043701171875, -1.27392578125, -1.196807861328125, -1.11968994140625, -1.042572021484375, -0.9654541015625, -0.888336181640625, -0.81121826171875, -0.734100341796875, -0.656982421875, -0.579864501953125, -0.50274658203125, -0.425628662109375, -0.3485107421875, -0.271392822265625, -0.19427490234375, -0.117156982421875, -0.0400390625, 0.037078857421875, 0.11419677734375, 0.191314697265625, 0.2684326171875, 0.345550537109375, 0.42266845703125, 0.499786376953125, 0.576904296875, 0.654022216796875, 0.73114013671875, 0.808258056640625, 0.8853759765625, 0.962493896484375, 1.03961181640625, 1.116729736328125, 1.19384765625, 1.270965576171875, 1.34808349609375, 1.425201416015625, 1.5023193359375, 1.579437255859375, 1.65655517578125, 1.733673095703125, 1.810791015625, 1.887908935546875, 1.96502685546875, 2.042144775390625, 2.1192626953125, 2.196380615234375, 2.27349853515625, 2.350616455078125, 2.427734375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 6.0, 8.0, 8.0, 11.0, 9.0, 15.0, 19.0, 23.0, 35.0, 30.0, 50.0, 87.0, 142.0, 237.0, 440.0, 1112.0, 3222.0, 10817.0, 44745.0, 215470.0, 1028154.0, 1925689.0, 763955.0, 154192.0, 32731.0, 8509.0, 2518.0, 925.0, 421.0, 210.0, 156.0, 89.0, 42.0, 39.0, 26.0, 28.0, 23.0, 20.0, 9.0, 9.0, 9.0, 4.0, 3.0, 10.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.1328125, -4.98358154296875, -4.8343505859375, -4.68511962890625, -4.535888671875, -4.38665771484375, -4.2374267578125, -4.08819580078125, -3.93896484375, -3.78973388671875, -3.6405029296875, -3.49127197265625, -3.342041015625, -3.19281005859375, -3.0435791015625, -2.89434814453125, -2.7451171875, -2.59588623046875, -2.4466552734375, -2.29742431640625, -2.148193359375, -1.99896240234375, -1.8497314453125, -1.70050048828125, -1.55126953125, -1.40203857421875, -1.2528076171875, -1.10357666015625, -0.954345703125, -0.80511474609375, -0.6558837890625, -0.50665283203125, -0.357421875, -0.20819091796875, -0.0589599609375, 0.09027099609375, 0.239501953125, 0.38873291015625, 0.5379638671875, 0.68719482421875, 0.83642578125, 0.98565673828125, 1.1348876953125, 1.28411865234375, 1.433349609375, 1.58258056640625, 1.7318115234375, 1.88104248046875, 2.0302734375, 2.17950439453125, 2.3287353515625, 2.47796630859375, 2.627197265625, 2.77642822265625, 2.9256591796875, 3.07489013671875, 3.22412109375, 3.37335205078125, 3.5225830078125, 3.67181396484375, 3.821044921875, 3.97027587890625, 4.1195068359375, 4.26873779296875, 4.41796875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 3.0, 6.0, 14.0, 19.0, 21.0, 28.0, 50.0, 76.0, 97.0, 151.0, 212.0, 278.0, 380.0, 495.0, 507.0, 448.0, 332.0, 288.0, 191.0, 159.0, 98.0, 69.0, 47.0, 29.0, 17.0, 20.0, 13.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.90386962890625, -7.6671142578125, -7.43035888671875, -7.193603515625, -6.95684814453125, -6.7200927734375, -6.48333740234375, -6.24658203125, -6.00982666015625, -5.7730712890625, -5.53631591796875, -5.299560546875, -5.06280517578125, -4.8260498046875, -4.58929443359375, -4.3525390625, -4.11578369140625, -3.8790283203125, -3.64227294921875, -3.405517578125, -3.16876220703125, -2.9320068359375, -2.69525146484375, -2.45849609375, -2.22174072265625, -1.9849853515625, -1.74822998046875, -1.511474609375, -1.27471923828125, -1.0379638671875, -0.80120849609375, -0.564453125, -0.32769775390625, -0.0909423828125, 0.14581298828125, 0.382568359375, 0.61932373046875, 0.8560791015625, 1.09283447265625, 1.32958984375, 1.56634521484375, 1.8031005859375, 2.03985595703125, 2.276611328125, 2.51336669921875, 2.7501220703125, 2.98687744140625, 3.2236328125, 3.46038818359375, 3.6971435546875, 3.93389892578125, 4.170654296875, 4.40740966796875, 4.6441650390625, 4.88092041015625, 5.11767578125, 5.35443115234375, 5.5911865234375, 5.82794189453125, 6.064697265625, 6.30145263671875, 6.5382080078125, 6.77496337890625, 7.01171875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 6.0, 10.0, 9.0, 15.0, 23.0, 36.0, 40.0, 50.0, 80.0, 130.0, 158.0, 305.0, 568.0, 1427.0, 8737.0, 118822.0, 2065523.0, 1881897.0, 105896.0, 7906.0, 1331.0, 524.0, 283.0, 157.0, 95.0, 88.0, 50.0, 40.0, 25.0, 11.0, 12.0, 12.0, 7.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.953125, -11.5406494140625, -11.128173828125, -10.7156982421875, -10.30322265625, -9.8907470703125, -9.478271484375, -9.0657958984375, -8.6533203125, -8.2408447265625, -7.828369140625, -7.4158935546875, -7.00341796875, -6.5909423828125, -6.178466796875, -5.7659912109375, -5.353515625, -4.9410400390625, -4.528564453125, -4.1160888671875, -3.70361328125, -3.2911376953125, -2.878662109375, -2.4661865234375, -2.0537109375, -1.6412353515625, -1.228759765625, -0.8162841796875, -0.40380859375, 0.0086669921875, 0.421142578125, 0.8336181640625, 1.24609375, 1.6585693359375, 2.071044921875, 2.4835205078125, 2.89599609375, 3.3084716796875, 3.720947265625, 4.1334228515625, 4.5458984375, 4.9583740234375, 5.370849609375, 5.7833251953125, 6.19580078125, 6.6082763671875, 7.020751953125, 7.4332275390625, 7.845703125, 8.2581787109375, 8.670654296875, 9.0831298828125, 9.49560546875, 9.9080810546875, 10.320556640625, 10.7330322265625, 11.1455078125, 11.5579833984375, 11.970458984375, 12.3829345703125, 12.79541015625, 13.2078857421875, 13.620361328125, 14.0328369140625, 14.4453125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 13.0, 36.0, 73.0, 177.0, 204.0, 211.0, 153.0, 102.0, 22.0, 14.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.28544616699219, -80.37281799316406, -78.4601821899414, -76.54755401611328, -74.63492584228516, -72.7222900390625, -70.80966186523438, -68.89703369140625, -66.9843978881836, -65.07176971435547, -63.15913772583008, -61.24650573730469, -59.3338737487793, -57.421241760253906, -55.50861358642578, -53.59598159790039, -51.683353424072266, -49.770721435546875, -47.85809326171875, -45.94546127319336, -44.03282928466797, -42.120201110839844, -40.20756912231445, -38.29493713378906, -36.38230895996094, -34.46967697143555, -32.55704879760742, -30.64441680908203, -28.73178482055664, -26.819154739379883, -24.906524658203125, -22.993892669677734, -21.08126449584961, -19.16863441467285, -17.25600242614746, -15.343372344970703, -13.430741310119629, -11.518110275268555, -9.605480194091797, -7.692849159240723, -5.780218124389648, -3.8675873279571533, -1.9549565315246582, -0.04232597351074219, 1.870305061340332, 3.7829360961914062, 5.695566177368164, 7.608197212219238, 9.520828247070312, 11.433459281921387, 13.346090316772461, 15.258720397949219, 17.17135238647461, 19.083982467651367, 20.996612548828125, 22.909244537353516, 24.821874618530273, 26.73450469970703, 28.647136688232422, 30.55976676940918, 32.47239685058594, 34.38502883911133, 36.29766082763672, 38.210289001464844, 40.122920989990234]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 7.0, 12.0, 10.0, 10.0, 11.0, 17.0, 13.0, 23.0, 21.0, 30.0, 20.0, 38.0, 30.0, 34.0, 34.0, 31.0, 39.0, 43.0, 36.0, 52.0, 32.0, 44.0, 36.0, 33.0, 54.0, 34.0, 34.0, 31.0, 19.0, 13.0, 20.0, 17.0, 17.0, 20.0, 13.0, 8.0, 11.0, 9.0, 11.0, 5.0, 6.0, 2.0, 1.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.209890365600586, -18.562021255493164, -17.914152145385742, -17.26628303527832, -16.618412017822266, -15.97054386138916, -15.322673797607422, -14.6748046875, -14.026935577392578, -13.379066467285156, -12.731197357177734, -12.083327293395996, -11.435458183288574, -10.787589073181152, -10.139719009399414, -9.491849899291992, -8.84398078918457, -8.196111679077148, -7.548242092132568, -6.900372505187988, -6.252503395080566, -5.6046342849731445, -4.9567646980285645, -4.308895111083984, -3.6610260009765625, -3.0131566524505615, -2.3652873039245605, -1.7174179553985596, -1.0695486068725586, -0.4216792583465576, 0.22619009017944336, 0.8740596771240234, 1.5219306945800781, 2.169800043106079, 2.81766939163208, 3.465538740158081, 4.113408088684082, 4.761277198791504, 5.409146785736084, 6.057016372680664, 6.704885482788086, 7.352754592895508, 8.00062370300293, 8.648493766784668, 9.29636287689209, 9.944231986999512, 10.59210205078125, 11.239971160888672, 11.887840270996094, 12.535709381103516, 13.183578491210938, 13.831448554992676, 14.479317665100098, 15.12718677520752, 15.775056838989258, 16.42292594909668, 17.0707950592041, 17.718664169311523, 18.366533279418945, 19.014402389526367, 19.662273406982422, 20.310142517089844, 20.958011627197266, 21.605880737304688, 22.25374984741211]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 5.0, 7.0, 10.0, 8.0, 12.0, 11.0, 19.0, 13.0, 20.0, 30.0, 29.0, 21.0, 22.0, 44.0, 32.0, 33.0, 29.0, 41.0, 37.0, 45.0, 50.0, 33.0, 35.0, 40.0, 30.0, 41.0, 31.0, 28.0, 29.0, 31.0, 29.0, 29.0, 14.0, 15.0, 19.0, 17.0, 11.0, 11.0, 4.0, 6.0, 8.0, 9.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.592071533203125, -2.51226806640625, -2.432464599609375, -2.3526611328125, -2.272857666015625, -2.19305419921875, -2.113250732421875, -2.033447265625, -1.953643798828125, -1.87384033203125, -1.794036865234375, -1.7142333984375, -1.634429931640625, -1.55462646484375, -1.474822998046875, -1.39501953125, -1.315216064453125, -1.23541259765625, -1.155609130859375, -1.0758056640625, -0.996002197265625, -0.91619873046875, -0.836395263671875, -0.756591796875, -0.676788330078125, -0.59698486328125, -0.517181396484375, -0.4373779296875, -0.357574462890625, -0.27777099609375, -0.197967529296875, -0.1181640625, -0.038360595703125, 0.04144287109375, 0.121246337890625, 0.2010498046875, 0.280853271484375, 0.36065673828125, 0.440460205078125, 0.520263671875, 0.600067138671875, 0.67987060546875, 0.759674072265625, 0.8394775390625, 0.919281005859375, 0.99908447265625, 1.078887939453125, 1.15869140625, 1.238494873046875, 1.31829833984375, 1.398101806640625, 1.4779052734375, 1.557708740234375, 1.63751220703125, 1.717315673828125, 1.797119140625, 1.876922607421875, 1.95672607421875, 2.036529541015625, 2.1163330078125, 2.196136474609375, 2.27593994140625, 2.355743408203125, 2.435546875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 15.0, 16.0, 35.0, 35.0, 58.0, 88.0, 138.0, 209.0, 292.0, 480.0, 818.0, 1249.0, 1973.0, 3336.0, 5575.0, 9784.0, 17540.0, 31180.0, 58303.0, 108518.0, 189180.0, 244181.0, 167693.0, 93672.0, 50629.0, 27148.0, 15038.0, 8691.0, 4922.0, 2916.0, 1790.0, 1114.0, 696.0, 386.0, 291.0, 175.0, 132.0, 83.0, 60.0, 37.0, 24.0, 11.0, 14.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.380615234375, -0.3692131042480469, -0.35781097412109375, -0.3464088439941406, -0.3350067138671875, -0.3236045837402344, -0.31220245361328125, -0.3008003234863281, -0.289398193359375, -0.2779960632324219, -0.26659393310546875, -0.2551918029785156, -0.2437896728515625, -0.23238754272460938, -0.22098541259765625, -0.20958328247070312, -0.19818115234375, -0.18677902221679688, -0.17537689208984375, -0.16397476196289062, -0.1525726318359375, -0.14117050170898438, -0.12976837158203125, -0.11836624145507812, -0.106964111328125, -0.09556198120117188, -0.08415985107421875, -0.07275772094726562, -0.0613555908203125, -0.049953460693359375, -0.03855133056640625, -0.027149200439453125, -0.0157470703125, -0.004344940185546875, 0.00705718994140625, 0.018459320068359375, 0.0298614501953125, 0.041263580322265625, 0.05266571044921875, 0.06406784057617188, 0.075469970703125, 0.08687210083007812, 0.09827423095703125, 0.10967636108398438, 0.1210784912109375, 0.13248062133789062, 0.14388275146484375, 0.15528488159179688, 0.16668701171875, 0.17808914184570312, 0.18949127197265625, 0.20089340209960938, 0.2122955322265625, 0.22369766235351562, 0.23509979248046875, 0.24650192260742188, 0.257904052734375, 0.2693061828613281, 0.28070831298828125, 0.2921104431152344, 0.3035125732421875, 0.3149147033691406, 0.32631683349609375, 0.3377189636230469, 0.34912109375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 4.0, 5.0, 12.0, 9.0, 12.0, 12.0, 27.0, 18.0, 24.0, 23.0, 23.0, 27.0, 31.0, 42.0, 30.0, 48.0, 34.0, 32.0, 46.0, 1069.0, 32.0, 50.0, 36.0, 45.0, 32.0, 29.0, 38.0, 34.0, 23.0, 18.0, 23.0, 22.0, 22.0, 14.0, 8.0, 19.0, 13.0, 5.0, 7.0, 7.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.828125, -1.773681640625, -1.71923828125, -1.664794921875, -1.6103515625, -1.555908203125, -1.50146484375, -1.447021484375, -1.392578125, -1.338134765625, -1.28369140625, -1.229248046875, -1.1748046875, -1.120361328125, -1.06591796875, -1.011474609375, -0.95703125, -0.902587890625, -0.84814453125, -0.793701171875, -0.7392578125, -0.684814453125, -0.63037109375, -0.575927734375, -0.521484375, -0.467041015625, -0.41259765625, -0.358154296875, -0.3037109375, -0.249267578125, -0.19482421875, -0.140380859375, -0.0859375, -0.031494140625, 0.02294921875, 0.077392578125, 0.1318359375, 0.186279296875, 0.24072265625, 0.295166015625, 0.349609375, 0.404052734375, 0.45849609375, 0.512939453125, 0.5673828125, 0.621826171875, 0.67626953125, 0.730712890625, 0.78515625, 0.839599609375, 0.89404296875, 0.948486328125, 1.0029296875, 1.057373046875, 1.11181640625, 1.166259765625, 1.220703125, 1.275146484375, 1.32958984375, 1.384033203125, 1.4384765625, 1.492919921875, 1.54736328125, 1.601806640625, 1.65625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 4.0, 12.0, 16.0, 17.0, 13.0, 34.0, 56.0, 62.0, 90.0, 151.0, 223.0, 333.0, 492.0, 746.0, 987.0, 1568.0, 2357.0, 3608.0, 5365.0, 8073.0, 12544.0, 18564.0, 28871.0, 43530.0, 66464.0, 97503.0, 136442.0, 1195092.0, 152944.0, 106886.0, 72621.0, 48193.0, 31735.0, 20954.0, 13701.0, 9051.0, 5970.0, 3916.0, 2602.0, 1730.0, 1148.0, 791.0, 521.0, 355.0, 244.0, 183.0, 116.0, 80.0, 53.0, 42.0, 25.0, 26.0, 8.0, 7.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0], "bins": [-0.1751708984375, -0.1696319580078125, -0.164093017578125, -0.1585540771484375, -0.15301513671875, -0.1474761962890625, -0.141937255859375, -0.1363983154296875, -0.130859375, -0.1253204345703125, -0.119781494140625, -0.1142425537109375, -0.10870361328125, -0.1031646728515625, -0.097625732421875, -0.0920867919921875, -0.0865478515625, -0.0810089111328125, -0.075469970703125, -0.0699310302734375, -0.06439208984375, -0.0588531494140625, -0.053314208984375, -0.0477752685546875, -0.042236328125, -0.0366973876953125, -0.031158447265625, -0.0256195068359375, -0.02008056640625, -0.0145416259765625, -0.009002685546875, -0.0034637451171875, 0.0020751953125, 0.0076141357421875, 0.013153076171875, 0.0186920166015625, 0.02423095703125, 0.0297698974609375, 0.035308837890625, 0.0408477783203125, 0.04638671875, 0.0519256591796875, 0.057464599609375, 0.0630035400390625, 0.06854248046875, 0.0740814208984375, 0.079620361328125, 0.0851593017578125, 0.0906982421875, 0.0962371826171875, 0.101776123046875, 0.1073150634765625, 0.11285400390625, 0.1183929443359375, 0.123931884765625, 0.1294708251953125, 0.135009765625, 0.1405487060546875, 0.146087646484375, 0.1516265869140625, 0.15716552734375, 0.1627044677734375, 0.168243408203125, 0.1737823486328125, 0.1793212890625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 7.0, 6.0, 3.0, 2.0, 5.0, 12.0, 11.0, 20.0, 17.0, 11.0, 21.0, 27.0, 20.0, 35.0, 49.0, 92.0, 104.0, 98.0, 92.0, 67.0, 54.0, 45.0, 29.0, 32.0, 29.0, 17.0, 15.0, 7.0, 16.0, 10.0, 7.0, 5.0, 7.0, 11.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00662994384765625, -0.006454288959503174, -0.006278634071350098, -0.0061029791831970215, -0.005927324295043945, -0.005751669406890869, -0.005576014518737793, -0.005400359630584717, -0.005224704742431641, -0.0050490498542785645, -0.004873394966125488, -0.004697740077972412, -0.004522085189819336, -0.00434643030166626, -0.004170775413513184, -0.003995120525360107, -0.0038194656372070312, -0.003643810749053955, -0.003468155860900879, -0.0032925009727478027, -0.0031168460845947266, -0.0029411911964416504, -0.0027655363082885742, -0.002589881420135498, -0.002414226531982422, -0.0022385716438293457, -0.0020629167556762695, -0.0018872618675231934, -0.0017116069793701172, -0.001535952091217041, -0.0013602972030639648, -0.0011846423149108887, -0.0010089874267578125, -0.0008333325386047363, -0.0006576776504516602, -0.000482022762298584, -0.0003063678741455078, -0.00013071298599243164, 4.494190216064453e-05, 0.0002205967903137207, 0.0003962516784667969, 0.000571906566619873, 0.0007475614547729492, 0.0009232163429260254, 0.0010988712310791016, 0.0012745261192321777, 0.001450181007385254, 0.00162583589553833, 0.0018014907836914062, 0.0019771456718444824, 0.0021528005599975586, 0.0023284554481506348, 0.002504110336303711, 0.002679765224456787, 0.0028554201126098633, 0.0030310750007629395, 0.0032067298889160156, 0.003382384777069092, 0.003558039665222168, 0.003733694553375244, 0.00390934944152832, 0.0040850043296813965, 0.004260659217834473, 0.004436314105987549, 0.004611968994140625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 7.0, 9.0, 11.0, 2.0, 13.0, 10.0, 17.0, 20.0, 40.0, 39.0, 59.0, 81.0, 153.0, 177.0, 396.0, 1138.0, 93082.0, 947383.0, 4511.0, 603.0, 256.0, 159.0, 107.0, 83.0, 36.0, 23.0, 39.0, 21.0, 22.0, 9.0, 6.0, 6.0, 3.0, 7.0, 8.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0853271484375, -0.08207416534423828, -0.07882118225097656, -0.07556819915771484, -0.07231521606445312, -0.0690622329711914, -0.06580924987792969, -0.06255626678466797, -0.05930328369140625, -0.05605030059814453, -0.05279731750488281, -0.049544334411621094, -0.046291351318359375, -0.043038368225097656, -0.03978538513183594, -0.03653240203857422, -0.0332794189453125, -0.03002643585205078, -0.026773452758789062, -0.023520469665527344, -0.020267486572265625, -0.017014503479003906, -0.013761520385742188, -0.010508537292480469, -0.00725555419921875, -0.004002571105957031, -0.0007495880126953125, 0.0025033950805664062, 0.005756378173828125, 0.009009361267089844, 0.012262344360351562, 0.015515327453613281, 0.018768310546875, 0.02202129364013672, 0.025274276733398438, 0.028527259826660156, 0.031780242919921875, 0.035033226013183594, 0.03828620910644531, 0.04153919219970703, 0.04479217529296875, 0.04804515838623047, 0.05129814147949219, 0.054551124572753906, 0.057804107666015625, 0.061057090759277344, 0.06431007385253906, 0.06756305694580078, 0.0708160400390625, 0.07406902313232422, 0.07732200622558594, 0.08057498931884766, 0.08382797241210938, 0.0870809555053711, 0.09033393859863281, 0.09358692169189453, 0.09683990478515625, 0.10009288787841797, 0.10334587097167969, 0.1065988540649414, 0.10985183715820312, 0.11310482025146484, 0.11635780334472656, 0.11961078643798828, 0.12286376953125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [35.0, 736.0, 215.0, 25.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021249116398394108, -0.0008498249808326364, 0.00042526167817413807, 0.0017003482207655907, 0.002975434996187687, 0.004250521771609783, 0.005525608081370592, 0.006800694856792688, 0.008075781166553497, 0.009350867941975594, 0.01062595471739769, 0.011901041492819786, 0.013176128268241882, 0.014451215043663979, 0.015726301819086075, 0.017001386731863022, 0.018276475369930267, 0.019551562145352364, 0.02082664892077446, 0.022101735696196556, 0.023376822471618652, 0.02465190924704075, 0.025926996022462845, 0.027202080935239792, 0.028477167710661888, 0.029752254486083984, 0.03102734126150608, 0.03230242803692818, 0.033577512949705124, 0.03485260158777237, 0.036127686500549316, 0.03740277513861656, 0.03867786005139351, 0.039952944964170456, 0.0412280336022377, 0.04250311851501465, 0.043778207153081894, 0.04505329206585884, 0.046328380703926086, 0.04760346561670303, 0.04887855425477028, 0.050153639167547226, 0.05142872780561447, 0.05270381271839142, 0.053978901356458664, 0.05525398626923561, 0.056529074907302856, 0.0578041598200798, 0.05907924473285675, 0.0603543296456337, 0.06162941828370094, 0.06290450692176819, 0.06417959183454514, 0.06545467674732208, 0.06672976166009903, 0.06800485402345657, 0.06927993893623352, 0.07055502384901047, 0.07183010876178741, 0.07310520112514496, 0.0743802860379219, 0.07565537095069885, 0.0769304558634758, 0.07820554822683334, 0.07948063313961029]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 8.0, 12.0, 10.0, 23.0, 27.0, 39.0, 32.0, 35.0, 42.0, 66.0, 70.0, 64.0, 62.0, 72.0, 58.0, 75.0, 61.0, 52.0, 59.0, 33.0, 34.0, 22.0, 22.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007820487022399902, -0.007613399066030979, -0.007406311109662056, -0.007199223153293133, -0.00699213519692421, -0.006785047240555286, -0.006577959284186363, -0.00637087132781744, -0.006163783371448517, -0.005956695415079594, -0.0057496074587106705, -0.005542519502341747, -0.005335431545972824, -0.005128343589603901, -0.004921255633234978, -0.0047141676768660545, -0.004507079720497131, -0.004299991764128208, -0.004092903807759285, -0.003885815851390362, -0.0036787278950214386, -0.0034716399386525154, -0.0032645519822835922, -0.003057464025914669, -0.002850376069545746, -0.0026432881131768227, -0.0024362001568078995, -0.0022291122004389763, -0.002022024244070053, -0.00181493628770113, -0.0016078483313322067, -0.0014007603749632835, -0.0011936724185943604, -0.0009865844622254372, -0.000779496505856514, -0.0005724085494875908, -0.0003653205931186676, -0.00015823263674974442, 4.885531961917877e-05, 0.00025594327598810196, 0.00046303123235702515, 0.0006701191887259483, 0.0008772071450948715, 0.0010842951014637947, 0.001291383057832718, 0.001498471014201641, 0.0017055589705705643, 0.0019126469269394875, 0.0021197348833084106, 0.002326822839677334, 0.002533910796046257, 0.00274099875241518, 0.0029480867087841034, 0.0031551746651530266, 0.0033622626215219498, 0.003569350577890873, 0.003776438534259796, 0.003983526490628719, 0.0041906144469976425, 0.004397702403366566, 0.004604790359735489, 0.004811878316104412, 0.005018966272473335, 0.0052260542288422585, 0.005433142185211182]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 5.0, 7.0, 10.0, 8.0, 12.0, 11.0, 19.0, 13.0, 20.0, 30.0, 29.0, 21.0, 22.0, 44.0, 32.0, 33.0, 29.0, 41.0, 37.0, 45.0, 50.0, 32.0, 36.0, 40.0, 30.0, 41.0, 31.0, 28.0, 29.0, 31.0, 29.0, 29.0, 14.0, 15.0, 19.0, 17.0, 11.0, 11.0, 4.0, 6.0, 8.0, 9.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.592071533203125, -2.51226806640625, -2.432464599609375, -2.3526611328125, -2.272857666015625, -2.19305419921875, -2.113250732421875, -2.033447265625, -1.953643798828125, -1.87384033203125, -1.794036865234375, -1.7142333984375, -1.634429931640625, -1.55462646484375, -1.474822998046875, -1.39501953125, -1.315216064453125, -1.23541259765625, -1.155609130859375, -1.0758056640625, -0.996002197265625, -0.91619873046875, -0.836395263671875, -0.756591796875, -0.676788330078125, -0.59698486328125, -0.517181396484375, -0.4373779296875, -0.357574462890625, -0.27777099609375, -0.197967529296875, -0.1181640625, -0.038360595703125, 0.04144287109375, 0.121246337890625, 0.2010498046875, 0.280853271484375, 0.36065673828125, 0.440460205078125, 0.520263671875, 0.600067138671875, 0.67987060546875, 0.759674072265625, 0.8394775390625, 0.919281005859375, 0.99908447265625, 1.078887939453125, 1.15869140625, 1.238494873046875, 1.31829833984375, 1.398101806640625, 1.4779052734375, 1.557708740234375, 1.63751220703125, 1.717315673828125, 1.797119140625, 1.876922607421875, 1.95672607421875, 2.036529541015625, 2.1163330078125, 2.196136474609375, 2.27593994140625, 2.355743408203125, 2.435546875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 19.0, 25.0, 45.0, 77.0, 102.0, 186.0, 263.0, 486.0, 803.0, 1455.0, 2650.0, 5086.0, 9451.0, 18584.0, 36980.0, 75035.0, 155089.0, 270027.0, 233572.0, 119859.0, 58083.0, 29240.0, 14820.0, 7576.0, 4034.0, 2076.0, 1138.0, 678.0, 415.0, 226.0, 157.0, 115.0, 53.0, 45.0, 23.0, 22.0, 11.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.716796875, -2.636474609375, -2.55615234375, -2.475830078125, -2.3955078125, -2.315185546875, -2.23486328125, -2.154541015625, -2.07421875, -1.993896484375, -1.91357421875, -1.833251953125, -1.7529296875, -1.672607421875, -1.59228515625, -1.511962890625, -1.431640625, -1.351318359375, -1.27099609375, -1.190673828125, -1.1103515625, -1.030029296875, -0.94970703125, -0.869384765625, -0.7890625, -0.708740234375, -0.62841796875, -0.548095703125, -0.4677734375, -0.387451171875, -0.30712890625, -0.226806640625, -0.146484375, -0.066162109375, 0.01416015625, 0.094482421875, 0.1748046875, 0.255126953125, 0.33544921875, 0.415771484375, 0.49609375, 0.576416015625, 0.65673828125, 0.737060546875, 0.8173828125, 0.897705078125, 0.97802734375, 1.058349609375, 1.138671875, 1.218994140625, 1.29931640625, 1.379638671875, 1.4599609375, 1.540283203125, 1.62060546875, 1.700927734375, 1.78125, 1.861572265625, 1.94189453125, 2.022216796875, 2.1025390625, 2.182861328125, 2.26318359375, 2.343505859375, 2.423828125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 4.0, 7.0, 9.0, 7.0, 11.0, 10.0, 15.0, 18.0, 26.0, 24.0, 33.0, 30.0, 21.0, 40.0, 44.0, 62.0, 67.0, 117.0, 223.0, 1401.0, 294.0, 121.0, 82.0, 53.0, 52.0, 34.0, 31.0, 25.0, 36.0, 25.0, 28.0, 17.0, 16.0, 15.0, 15.0, 8.0, 8.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.890625, -10.5667724609375, -10.242919921875, -9.9190673828125, -9.59521484375, -9.2713623046875, -8.947509765625, -8.6236572265625, -8.2998046875, -7.9759521484375, -7.652099609375, -7.3282470703125, -7.00439453125, -6.6805419921875, -6.356689453125, -6.0328369140625, -5.708984375, -5.3851318359375, -5.061279296875, -4.7374267578125, -4.41357421875, -4.0897216796875, -3.765869140625, -3.4420166015625, -3.1181640625, -2.7943115234375, -2.470458984375, -2.1466064453125, -1.82275390625, -1.4989013671875, -1.175048828125, -0.8511962890625, -0.52734375, -0.2034912109375, 0.120361328125, 0.4442138671875, 0.76806640625, 1.0919189453125, 1.415771484375, 1.7396240234375, 2.0634765625, 2.3873291015625, 2.711181640625, 3.0350341796875, 3.35888671875, 3.6827392578125, 4.006591796875, 4.3304443359375, 4.654296875, 4.9781494140625, 5.302001953125, 5.6258544921875, 5.94970703125, 6.2735595703125, 6.597412109375, 6.9212646484375, 7.2451171875, 7.5689697265625, 7.892822265625, 8.2166748046875, 8.54052734375, 8.8643798828125, 9.188232421875, 9.5120849609375, 9.8359375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 3.0, 11.0, 19.0, 34.0, 35.0, 46.0, 55.0, 84.0, 99.0, 192.0, 269.0, 445.0, 1552.0, 27904.0, 3073162.0, 38738.0, 1668.0, 490.0, 272.0, 171.0, 108.0, 109.0, 62.0, 46.0, 34.0, 25.0, 16.0, 15.0, 8.0, 13.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.625, -26.65673828125, -25.6884765625, -24.72021484375, -23.751953125, -22.78369140625, -21.8154296875, -20.84716796875, -19.87890625, -18.91064453125, -17.9423828125, -16.97412109375, -16.005859375, -15.03759765625, -14.0693359375, -13.10107421875, -12.1328125, -11.16455078125, -10.1962890625, -9.22802734375, -8.259765625, -7.29150390625, -6.3232421875, -5.35498046875, -4.38671875, -3.41845703125, -2.4501953125, -1.48193359375, -0.513671875, 0.45458984375, 1.4228515625, 2.39111328125, 3.359375, 4.32763671875, 5.2958984375, 6.26416015625, 7.232421875, 8.20068359375, 9.1689453125, 10.13720703125, 11.10546875, 12.07373046875, 13.0419921875, 14.01025390625, 14.978515625, 15.94677734375, 16.9150390625, 17.88330078125, 18.8515625, 19.81982421875, 20.7880859375, 21.75634765625, 22.724609375, 23.69287109375, 24.6611328125, 25.62939453125, 26.59765625, 27.56591796875, 28.5341796875, 29.50244140625, 30.470703125, 31.43896484375, 32.4072265625, 33.37548828125, 34.34375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 22.0, 738.0, 258.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.9682502746582, -34.8353157043457, -29.702383041381836, -24.56945037841797, -19.43651580810547, -14.303581237792969, -9.170648574829102, -4.037715911865234, 1.0952186584472656, 6.228152275085449, 11.361085891723633, 16.4940185546875, 21.626953125, 26.7598876953125, 31.892820358276367, 37.025753021240234, 42.158687591552734, 47.291622161865234, 52.42455291748047, 57.55748748779297, 62.69042205810547, 67.82335662841797, 72.95629119873047, 78.08921813964844, 83.22215270996094, 88.35508728027344, 93.48802185058594, 98.62095642089844, 103.75389099121094, 108.88682556152344, 114.0197525024414, 119.1526870727539, 124.28561401367188, 129.41854858398438, 134.55148315429688, 139.68441772460938, 144.81735229492188, 149.95028686523438, 155.08322143554688, 160.21615600585938, 165.34909057617188, 170.48202514648438, 175.61495971679688, 180.74789428710938, 185.88082885742188, 191.01376342773438, 196.14669799804688, 201.27963256835938, 206.4125518798828, 211.5454864501953, 216.6784210205078, 221.8113555908203, 226.9442901611328, 232.0772247314453, 237.2101593017578, 242.34307861328125, 247.47601318359375, 252.60894775390625, 257.74188232421875, 262.87481689453125, 268.00775146484375, 273.14068603515625, 278.27362060546875, 283.40655517578125, 288.53948974609375]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 4.0, 1.0, 5.0, 7.0, 10.0, 6.0, 11.0, 16.0, 15.0, 5.0, 24.0, 16.0, 22.0, 31.0, 32.0, 28.0, 24.0, 27.0, 38.0, 39.0, 35.0, 35.0, 43.0, 35.0, 34.0, 34.0, 37.0, 40.0, 40.0, 38.0, 24.0, 27.0, 24.0, 23.0, 24.0, 21.0, 20.0, 15.0, 14.0, 14.0, 11.0, 9.0, 13.0, 6.0, 6.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.11534881591797, -21.422685623168945, -20.73002052307129, -20.037357330322266, -19.34469223022461, -18.652029037475586, -17.959365844726562, -17.266700744628906, -16.574037551879883, -15.881373405456543, -15.188709259033203, -14.49604606628418, -13.80338191986084, -13.1107177734375, -12.418054580688477, -11.725390434265137, -11.032726287841797, -10.340062141418457, -9.647397994995117, -8.954734802246094, -8.262070655822754, -7.569406509399414, -6.876742839813232, -6.184079170227051, -5.491415023803711, -4.798750877380371, -4.1060872077941895, -3.4134232997894287, -2.720759391784668, -2.0280954837799072, -1.3354315757751465, -0.6427679061889648, 0.049896240234375, 0.7425601482391357, 1.4352240562438965, 2.1278879642486572, 2.820551872253418, 3.5132157802581787, 4.2058796882629395, 4.898543357849121, 5.591207504272461, 6.283871650695801, 6.976535320281982, 7.669198989868164, 8.361863136291504, 9.054527282714844, 9.747190475463867, 10.439854621887207, 11.132518768310547, 11.825182914733887, 12.517847061157227, 13.21051025390625, 13.90317440032959, 14.59583854675293, 15.288501739501953, 15.981165885925293, 16.673830032348633, 17.366493225097656, 18.059158325195312, 18.751821517944336, 19.44448471069336, 20.137149810791016, 20.82981300354004, 21.522476196289062, 22.21514129638672]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 4.0, 9.0, 4.0, 14.0, 13.0, 15.0, 15.0, 18.0, 16.0, 21.0, 20.0, 24.0, 35.0, 26.0, 29.0, 38.0, 43.0, 29.0, 34.0, 49.0, 36.0, 36.0, 40.0, 34.0, 38.0, 29.0, 31.0, 34.0, 20.0, 32.0, 28.0, 28.0, 19.0, 18.0, 12.0, 9.0, 12.0, 19.0, 11.0, 7.0, 10.0, 15.0, 4.0, 5.0, 6.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.632354736328125, -2.54986572265625, -2.467376708984375, -2.3848876953125, -2.302398681640625, -2.21990966796875, -2.137420654296875, -2.054931640625, -1.972442626953125, -1.88995361328125, -1.807464599609375, -1.7249755859375, -1.642486572265625, -1.55999755859375, -1.477508544921875, -1.39501953125, -1.312530517578125, -1.23004150390625, -1.147552490234375, -1.0650634765625, -0.982574462890625, -0.90008544921875, -0.817596435546875, -0.735107421875, -0.652618408203125, -0.57012939453125, -0.487640380859375, -0.4051513671875, -0.322662353515625, -0.24017333984375, -0.157684326171875, -0.0751953125, 0.007293701171875, 0.08978271484375, 0.172271728515625, 0.2547607421875, 0.337249755859375, 0.41973876953125, 0.502227783203125, 0.584716796875, 0.667205810546875, 0.74969482421875, 0.832183837890625, 0.9146728515625, 0.997161865234375, 1.07965087890625, 1.162139892578125, 1.24462890625, 1.327117919921875, 1.40960693359375, 1.492095947265625, 1.5745849609375, 1.657073974609375, 1.73956298828125, 1.822052001953125, 1.904541015625, 1.987030029296875, 2.06951904296875, 2.152008056640625, 2.2344970703125, 2.316986083984375, 2.39947509765625, 2.481964111328125, 2.564453125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 7.0, 3.0, 7.0, 7.0, 10.0, 8.0, 8.0, 16.0, 14.0, 19.0, 13.0, 23.0, 27.0, 35.0, 24.0, 51.0, 81.0, 154.0, 430.0, 1417.0, 9509.0, 132522.0, 1885645.0, 2002805.0, 148217.0, 10554.0, 1633.0, 447.0, 195.0, 93.0, 60.0, 48.0, 26.0, 21.0, 16.0, 25.0, 13.0, 17.0, 17.0, 18.0, 13.0, 12.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.2662353515625, -8.985595703125, -8.7049560546875, -8.42431640625, -8.1436767578125, -7.863037109375, -7.5823974609375, -7.3017578125, -7.0211181640625, -6.740478515625, -6.4598388671875, -6.17919921875, -5.8985595703125, -5.617919921875, -5.3372802734375, -5.056640625, -4.7760009765625, -4.495361328125, -4.2147216796875, -3.93408203125, -3.6534423828125, -3.372802734375, -3.0921630859375, -2.8115234375, -2.5308837890625, -2.250244140625, -1.9696044921875, -1.68896484375, -1.4083251953125, -1.127685546875, -0.8470458984375, -0.56640625, -0.2857666015625, -0.005126953125, 0.2755126953125, 0.55615234375, 0.8367919921875, 1.117431640625, 1.3980712890625, 1.6787109375, 1.9593505859375, 2.239990234375, 2.5206298828125, 2.80126953125, 3.0819091796875, 3.362548828125, 3.6431884765625, 3.923828125, 4.2044677734375, 4.485107421875, 4.7657470703125, 5.04638671875, 5.3270263671875, 5.607666015625, 5.8883056640625, 6.1689453125, 6.4495849609375, 6.730224609375, 7.0108642578125, 7.29150390625, 7.5721435546875, 7.852783203125, 8.1334228515625, 8.4140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 19.0, 23.0, 24.0, 37.0, 53.0, 50.0, 89.0, 106.0, 166.0, 193.0, 267.0, 330.0, 348.0, 394.0, 417.0, 307.0, 297.0, 210.0, 165.0, 142.0, 87.0, 89.0, 61.0, 40.0, 32.0, 24.0, 13.0, 20.0, 9.0, 8.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.06640625, -5.87451171875, -5.6826171875, -5.49072265625, -5.298828125, -5.10693359375, -4.9150390625, -4.72314453125, -4.53125, -4.33935546875, -4.1474609375, -3.95556640625, -3.763671875, -3.57177734375, -3.3798828125, -3.18798828125, -2.99609375, -2.80419921875, -2.6123046875, -2.42041015625, -2.228515625, -2.03662109375, -1.8447265625, -1.65283203125, -1.4609375, -1.26904296875, -1.0771484375, -0.88525390625, -0.693359375, -0.50146484375, -0.3095703125, -0.11767578125, 0.07421875, 0.26611328125, 0.4580078125, 0.64990234375, 0.841796875, 1.03369140625, 1.2255859375, 1.41748046875, 1.609375, 1.80126953125, 1.9931640625, 2.18505859375, 2.376953125, 2.56884765625, 2.7607421875, 2.95263671875, 3.14453125, 3.33642578125, 3.5283203125, 3.72021484375, 3.912109375, 4.10400390625, 4.2958984375, 4.48779296875, 4.6796875, 4.87158203125, 5.0634765625, 5.25537109375, 5.447265625, 5.63916015625, 5.8310546875, 6.02294921875, 6.21484375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 12.0, 10.0, 12.0, 21.0, 24.0, 39.0, 54.0, 86.0, 81.0, 149.0, 198.0, 306.0, 610.0, 2062.0, 18517.0, 413205.0, 3306067.0, 430402.0, 18781.0, 2107.0, 577.0, 296.0, 202.0, 116.0, 92.0, 65.0, 50.0, 31.0, 30.0, 19.0, 17.0, 11.0, 10.0, 7.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.4375, -13.979248046875, -13.52099609375, -13.062744140625, -12.6044921875, -12.146240234375, -11.68798828125, -11.229736328125, -10.771484375, -10.313232421875, -9.85498046875, -9.396728515625, -8.9384765625, -8.480224609375, -8.02197265625, -7.563720703125, -7.10546875, -6.647216796875, -6.18896484375, -5.730712890625, -5.2724609375, -4.814208984375, -4.35595703125, -3.897705078125, -3.439453125, -2.981201171875, -2.52294921875, -2.064697265625, -1.6064453125, -1.148193359375, -0.68994140625, -0.231689453125, 0.2265625, 0.684814453125, 1.14306640625, 1.601318359375, 2.0595703125, 2.517822265625, 2.97607421875, 3.434326171875, 3.892578125, 4.350830078125, 4.80908203125, 5.267333984375, 5.7255859375, 6.183837890625, 6.64208984375, 7.100341796875, 7.55859375, 8.016845703125, 8.47509765625, 8.933349609375, 9.3916015625, 9.849853515625, 10.30810546875, 10.766357421875, 11.224609375, 11.682861328125, 12.14111328125, 12.599365234375, 13.0576171875, 13.515869140625, 13.97412109375, 14.432373046875, 14.890625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 21.0, 66.0, 127.0, 275.0, 237.0, 174.0, 87.0, 16.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.227203369140625, -31.95541000366211, -29.683616638183594, -27.41182518005371, -25.140031814575195, -22.86823844909668, -20.596446990966797, -18.32465362548828, -16.052860260009766, -13.78106689453125, -11.50927448272705, -9.237482070922852, -6.965688705444336, -4.69389533996582, -2.422102928161621, -0.15031051635742188, 2.1214828491210938, 4.393275737762451, 6.665068626403809, 8.936861038208008, 11.208654403686523, 13.480447769165039, 15.752240180969238, 18.024032592773438, 20.295825958251953, 22.56761932373047, 24.839412689208984, 27.111204147338867, 29.382997512817383, 31.6547908782959, 33.92658233642578, 36.1983757019043, 38.47016143798828, 40.7419548034668, 43.01374816894531, 45.28554153442383, 47.557334899902344, 49.829124450683594, 52.10091781616211, 54.372711181640625, 56.64450454711914, 58.916297912597656, 61.18809127807617, 63.45988464355469, 65.73167419433594, 68.00347137451172, 70.27526092529297, 72.54705810546875, 74.81884765625, 77.09063720703125, 79.36243438720703, 81.63422393798828, 83.90602111816406, 86.17781066894531, 88.4496078491211, 90.72139739990234, 92.99319458007812, 95.26498413085938, 97.53678131103516, 99.8085708618164, 102.08036804199219, 104.35215759277344, 106.62395477294922, 108.89574432373047, 111.16753387451172]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 1.0, 8.0, 9.0, 13.0, 18.0, 17.0, 13.0, 21.0, 25.0, 28.0, 25.0, 31.0, 27.0, 30.0, 44.0, 33.0, 42.0, 42.0, 42.0, 39.0, 33.0, 37.0, 33.0, 34.0, 46.0, 40.0, 25.0, 24.0, 35.0, 25.0, 22.0, 23.0, 20.0, 25.0, 21.0, 14.0, 9.0, 4.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.351171493530273, -21.68994903564453, -21.028724670410156, -20.36750030517578, -19.70627784729004, -19.045055389404297, -18.383831024169922, -17.722606658935547, -17.061384201049805, -16.400161743164062, -15.738937377929688, -15.077713966369629, -14.41649055480957, -13.755267143249512, -13.094043731689453, -12.432820320129395, -11.771596908569336, -11.110373497009277, -10.449150085449219, -9.78792667388916, -9.126703262329102, -8.465479850769043, -7.804256439208984, -7.143033027648926, -6.481809616088867, -5.820586204528809, -5.15936279296875, -4.498139381408691, -3.836915969848633, -3.175692558288574, -2.5144691467285156, -1.853245735168457, -1.1920242309570312, -0.5308008193969727, 0.13042259216308594, 0.7916460037231445, 1.4528694152832031, 2.1140928268432617, 2.7753162384033203, 3.436539649963379, 4.0977630615234375, 4.758986473083496, 5.420209884643555, 6.081433296203613, 6.742656707763672, 7.4038801193237305, 8.065103530883789, 8.726326942443848, 9.387550354003906, 10.048773765563965, 10.709997177124023, 11.371220588684082, 12.03244400024414, 12.6936674118042, 13.354890823364258, 14.016114234924316, 14.677337646484375, 15.338561058044434, 15.999784469604492, 16.661006927490234, 17.32223129272461, 17.983455657958984, 18.644678115844727, 19.30590057373047, 19.967124938964844]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 6.0, 9.0, 8.0, 7.0, 9.0, 5.0, 17.0, 14.0, 15.0, 14.0, 19.0, 32.0, 13.0, 21.0, 27.0, 31.0, 34.0, 32.0, 47.0, 40.0, 38.0, 37.0, 35.0, 46.0, 47.0, 45.0, 30.0, 36.0, 32.0, 29.0, 29.0, 22.0, 20.0, 16.0, 13.0, 19.0, 14.0, 13.0, 10.0, 13.0, 10.0, 10.0, 12.0, 7.0, 2.0, 6.0, 0.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.666015625, -2.583404541015625, -2.50079345703125, -2.418182373046875, -2.3355712890625, -2.252960205078125, -2.17034912109375, -2.087738037109375, -2.005126953125, -1.922515869140625, -1.83990478515625, -1.757293701171875, -1.6746826171875, -1.592071533203125, -1.50946044921875, -1.426849365234375, -1.34423828125, -1.261627197265625, -1.17901611328125, -1.096405029296875, -1.0137939453125, -0.931182861328125, -0.84857177734375, -0.765960693359375, -0.683349609375, -0.600738525390625, -0.51812744140625, -0.435516357421875, -0.3529052734375, -0.270294189453125, -0.18768310546875, -0.105072021484375, -0.0224609375, 0.060150146484375, 0.14276123046875, 0.225372314453125, 0.3079833984375, 0.390594482421875, 0.47320556640625, 0.555816650390625, 0.638427734375, 0.721038818359375, 0.80364990234375, 0.886260986328125, 0.9688720703125, 1.051483154296875, 1.13409423828125, 1.216705322265625, 1.29931640625, 1.381927490234375, 1.46453857421875, 1.547149658203125, 1.6297607421875, 1.712371826171875, 1.79498291015625, 1.877593994140625, 1.960205078125, 2.042816162109375, 2.12542724609375, 2.208038330078125, 2.2906494140625, 2.373260498046875, 2.45587158203125, 2.538482666015625, 2.62109375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 14.0, 9.0, 20.0, 19.0, 26.0, 45.0, 64.0, 111.0, 140.0, 198.0, 320.0, 476.0, 718.0, 1097.0, 1826.0, 2826.0, 4750.0, 8121.0, 14401.0, 25679.0, 48199.0, 92402.0, 175744.0, 258334.0, 191587.0, 102303.0, 52681.0, 28212.0, 15625.0, 8897.0, 5187.0, 3108.0, 1913.0, 1190.0, 780.0, 485.0, 320.0, 253.0, 158.0, 104.0, 65.0, 44.0, 26.0, 22.0, 20.0, 7.0, 10.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.4169921875, -0.40378570556640625, -0.3905792236328125, -0.37737274169921875, -0.364166259765625, -0.35095977783203125, -0.3377532958984375, -0.32454681396484375, -0.31134033203125, -0.29813385009765625, -0.2849273681640625, -0.27172088623046875, -0.258514404296875, -0.24530792236328125, -0.2321014404296875, -0.21889495849609375, -0.2056884765625, -0.19248199462890625, -0.1792755126953125, -0.16606903076171875, -0.152862548828125, -0.13965606689453125, -0.1264495849609375, -0.11324310302734375, -0.10003662109375, -0.08683013916015625, -0.0736236572265625, -0.06041717529296875, -0.047210693359375, -0.03400421142578125, -0.0207977294921875, -0.00759124755859375, 0.005615234375, 0.01882171630859375, 0.0320281982421875, 0.04523468017578125, 0.058441162109375, 0.07164764404296875, 0.0848541259765625, 0.09806060791015625, 0.11126708984375, 0.12447357177734375, 0.1376800537109375, 0.15088653564453125, 0.164093017578125, 0.17729949951171875, 0.1905059814453125, 0.20371246337890625, 0.2169189453125, 0.23012542724609375, 0.2433319091796875, 0.25653839111328125, 0.269744873046875, 0.28295135498046875, 0.2961578369140625, 0.30936431884765625, 0.32257080078125, 0.33577728271484375, 0.3489837646484375, 0.36219024658203125, 0.375396728515625, 0.38860321044921875, 0.4018096923828125, 0.41501617431640625, 0.42822265625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 14.0, 7.0, 9.0, 7.0, 9.0, 16.0, 12.0, 10.0, 28.0, 22.0, 16.0, 23.0, 30.0, 21.0, 26.0, 39.0, 33.0, 38.0, 39.0, 32.0, 31.0, 1054.0, 36.0, 36.0, 37.0, 26.0, 24.0, 40.0, 34.0, 32.0, 28.0, 28.0, 24.0, 28.0, 20.0, 15.0, 13.0, 17.0, 9.0, 13.0, 11.0, 7.0, 4.0, 8.0, 3.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.547943115234375, -1.49432373046875, -1.440704345703125, -1.3870849609375, -1.333465576171875, -1.27984619140625, -1.226226806640625, -1.172607421875, -1.118988037109375, -1.06536865234375, -1.011749267578125, -0.9581298828125, -0.904510498046875, -0.85089111328125, -0.797271728515625, -0.74365234375, -0.690032958984375, -0.63641357421875, -0.582794189453125, -0.5291748046875, -0.475555419921875, -0.42193603515625, -0.368316650390625, -0.314697265625, -0.261077880859375, -0.20745849609375, -0.153839111328125, -0.1002197265625, -0.046600341796875, 0.00701904296875, 0.060638427734375, 0.1142578125, 0.167877197265625, 0.22149658203125, 0.275115966796875, 0.3287353515625, 0.382354736328125, 0.43597412109375, 0.489593505859375, 0.543212890625, 0.596832275390625, 0.65045166015625, 0.704071044921875, 0.7576904296875, 0.811309814453125, 0.86492919921875, 0.918548583984375, 0.97216796875, 1.025787353515625, 1.07940673828125, 1.133026123046875, 1.1866455078125, 1.240264892578125, 1.29388427734375, 1.347503662109375, 1.401123046875, 1.454742431640625, 1.50836181640625, 1.561981201171875, 1.6156005859375, 1.669219970703125, 1.72283935546875, 1.776458740234375, 1.830078125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 16.0, 37.0, 48.0, 77.0, 116.0, 147.0, 222.0, 331.0, 463.0, 640.0, 910.0, 1237.0, 1864.0, 2701.0, 3963.0, 5808.0, 8469.0, 12163.0, 17714.0, 25996.0, 37456.0, 53869.0, 76833.0, 106223.0, 162769.0, 1162507.0, 119990.0, 89164.0, 63390.0, 44172.0, 30643.0, 20816.0, 14404.0, 9961.0, 6913.0, 4657.0, 3115.0, 2275.0, 1501.0, 1123.0, 759.0, 490.0, 365.0, 256.0, 181.0, 133.0, 85.0, 48.0, 40.0, 24.0, 14.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.1680908203125, -0.1628742218017578, -0.15765762329101562, -0.15244102478027344, -0.14722442626953125, -0.14200782775878906, -0.13679122924804688, -0.1315746307373047, -0.1263580322265625, -0.12114143371582031, -0.11592483520507812, -0.11070823669433594, -0.10549163818359375, -0.10027503967285156, -0.09505844116210938, -0.08984184265136719, -0.084625244140625, -0.07940864562988281, -0.07419204711914062, -0.06897544860839844, -0.06375885009765625, -0.05854225158691406, -0.053325653076171875, -0.04810905456542969, -0.0428924560546875, -0.03767585754394531, -0.032459259033203125, -0.027242660522460938, -0.02202606201171875, -0.016809463500976562, -0.011592864990234375, -0.0063762664794921875, -0.00115966796875, 0.0040569305419921875, 0.009273529052734375, 0.014490127563476562, 0.01970672607421875, 0.024923324584960938, 0.030139923095703125, 0.03535652160644531, 0.0405731201171875, 0.04578971862792969, 0.051006317138671875, 0.05622291564941406, 0.06143951416015625, 0.06665611267089844, 0.07187271118164062, 0.07708930969238281, 0.082305908203125, 0.08752250671386719, 0.09273910522460938, 0.09795570373535156, 0.10317230224609375, 0.10838890075683594, 0.11360549926757812, 0.11882209777832031, 0.1240386962890625, 0.1292552947998047, 0.13447189331054688, 0.13968849182128906, 0.14490509033203125, 0.15012168884277344, 0.15533828735351562, 0.1605548858642578, 0.165771484375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 16.0, 11.0, 6.0, 17.0, 28.0, 32.0, 35.0, 34.0, 43.0, 69.0, 84.0, 112.0, 109.0, 87.0, 63.0, 40.0, 30.0, 35.0, 21.0, 20.0, 17.0, 8.0, 3.0, 10.0, 10.0, 4.0, 8.0, 10.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004810333251953125, -0.004660069942474365, -0.0045098066329956055, -0.004359543323516846, -0.004209280014038086, -0.004059016704559326, -0.003908753395080566, -0.0037584900856018066, -0.003608226776123047, -0.003457963466644287, -0.0033077001571655273, -0.0031574368476867676, -0.003007173538208008, -0.002856910228729248, -0.0027066469192504883, -0.0025563836097717285, -0.0024061203002929688, -0.002255856990814209, -0.0021055936813354492, -0.0019553303718566895, -0.0018050670623779297, -0.00165480375289917, -0.0015045404434204102, -0.0013542771339416504, -0.0012040138244628906, -0.0010537505149841309, -0.0009034872055053711, -0.0007532238960266113, -0.0006029605865478516, -0.0004526972770690918, -0.00030243396759033203, -0.00015217065811157227, -1.9073486328125e-06, 0.00014835596084594727, 0.00029861927032470703, 0.0004488825798034668, 0.0005991458892822266, 0.0007494091987609863, 0.0008996725082397461, 0.0010499358177185059, 0.0012001991271972656, 0.0013504624366760254, 0.0015007257461547852, 0.001650989055633545, 0.0018012523651123047, 0.0019515156745910645, 0.0021017789840698242, 0.002252042293548584, 0.0024023056030273438, 0.0025525689125061035, 0.0027028322219848633, 0.002853095531463623, 0.003003358840942383, 0.0031536221504211426, 0.0033038854598999023, 0.003454148769378662, 0.003604412078857422, 0.0037546753883361816, 0.0039049386978149414, 0.004055202007293701, 0.004205465316772461, 0.004355728626251221, 0.0045059919357299805, 0.00465625524520874, 0.0048065185546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 9.0, 9.0, 10.0, 9.0, 9.0, 16.0, 14.0, 33.0, 43.0, 55.0, 65.0, 114.0, 191.0, 392.0, 2268.0, 401548.0, 639928.0, 2806.0, 386.0, 205.0, 127.0, 84.0, 62.0, 42.0, 31.0, 18.0, 18.0, 17.0, 15.0, 3.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09478759765625, -0.0918283462524414, -0.08886909484863281, -0.08590984344482422, -0.08295059204101562, -0.07999134063720703, -0.07703208923339844, -0.07407283782958984, -0.07111358642578125, -0.06815433502197266, -0.06519508361816406, -0.06223583221435547, -0.059276580810546875, -0.05631732940673828, -0.05335807800292969, -0.050398826599121094, -0.0474395751953125, -0.044480323791503906, -0.04152107238769531, -0.03856182098388672, -0.035602569580078125, -0.03264331817626953, -0.029684066772460938, -0.026724815368652344, -0.02376556396484375, -0.020806312561035156, -0.017847061157226562, -0.014887809753417969, -0.011928558349609375, -0.008969306945800781, -0.0060100555419921875, -0.0030508041381835938, -9.1552734375e-05, 0.0028676986694335938, 0.0058269500732421875, 0.008786201477050781, 0.011745452880859375, 0.014704704284667969, 0.017663955688476562, 0.020623207092285156, 0.02358245849609375, 0.026541709899902344, 0.029500961303710938, 0.03246021270751953, 0.035419464111328125, 0.03837871551513672, 0.04133796691894531, 0.044297218322753906, 0.0472564697265625, 0.050215721130371094, 0.05317497253417969, 0.05613422393798828, 0.059093475341796875, 0.06205272674560547, 0.06501197814941406, 0.06797122955322266, 0.07093048095703125, 0.07388973236083984, 0.07684898376464844, 0.07980823516845703, 0.08276748657226562, 0.08572673797607422, 0.08868598937988281, 0.0916452407836914, 0.0946044921875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 12.0, 503.0, 454.0, 39.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036411816254258156, -0.002398015931248665, -0.0011548504699021578, 8.831499144434929e-05, 0.0013314806856215, 0.0025746463797986507, 0.003817811608314514, 0.005060977302491665, 0.006304142996668816, 0.007547308690845966, 0.008790474385023117, 0.010033639147877693, 0.011276805773377419, 0.012519970536231995, 0.013763136230409145, 0.015006301924586296, 0.016249466687440872, 0.01749263145029545, 0.018735798075795174, 0.01997896283864975, 0.021222129464149475, 0.02246529422700405, 0.023708458989858627, 0.024951625615358353, 0.026194792240858078, 0.027437957003712654, 0.02868112362921238, 0.029924288392066956, 0.03116745501756668, 0.032410621643066406, 0.03365378454327583, 0.03489695116877556, 0.036140117794275284, 0.03738328441977501, 0.038626447319984436, 0.03986961394548416, 0.04111278057098389, 0.04235594719648361, 0.04359911009669304, 0.044842276722192764, 0.04608544334769249, 0.047328609973192215, 0.04857177287340164, 0.04981493949890137, 0.05105810612440109, 0.05230127274990082, 0.053544435650110245, 0.05478760227560997, 0.0560307651758194, 0.05727393180131912, 0.05851709470152855, 0.059760261327028275, 0.061003427952528, 0.062246594578027725, 0.06348975747823715, 0.06473292410373688, 0.0659760907292366, 0.06721925735473633, 0.06846242398023605, 0.06970559060573578, 0.07094874978065491, 0.07219191640615463, 0.07343508303165436, 0.07467824965715408, 0.07592141628265381]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 12.0, 15.0, 18.0, 22.0, 33.0, 36.0, 38.0, 45.0, 61.0, 59.0, 73.0, 65.0, 89.0, 79.0, 64.0, 50.0, 53.0, 51.0, 40.0, 27.0, 28.0, 14.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0064484477043151855, -0.006268625147640705, -0.006088802590966225, -0.005908980034291744, -0.005729157477617264, -0.005549334920942783, -0.005369512364268303, -0.0051896898075938225, -0.005009867250919342, -0.004830044694244862, -0.004650222137570381, -0.004470399580895901, -0.00429057702422142, -0.00411075446754694, -0.003930931910872459, -0.003751109354197979, -0.0035712867975234985, -0.003391464240849018, -0.0032116416841745377, -0.0030318191275000572, -0.0028519965708255768, -0.0026721740141510963, -0.002492351457476616, -0.0023125289008021355, -0.002132706344127655, -0.0019528837874531746, -0.0017730612307786942, -0.0015932386741042137, -0.0014134161174297333, -0.0012335935607552528, -0.0010537710040807724, -0.000873948447406292, -0.0006941258907318115, -0.0005143033340573311, -0.00033448077738285065, -0.0001546582207083702, 2.516433596611023e-05, 0.00020498689264059067, 0.0003848094493150711, 0.0005646320059895515, 0.000744454562664032, 0.0009242771193385124, 0.0011040996760129929, 0.0012839222326874733, 0.0014637447893619537, 0.0016435673460364342, 0.0018233899027109146, 0.002003212459385395, 0.0021830350160598755, 0.002362857572734356, 0.0025426801294088364, 0.002722502686083317, 0.0029023252427577972, 0.0030821477994322777, 0.003261970356106758, 0.0034417929127812386, 0.003621615469455719, 0.0038014380261301994, 0.00398126058280468, 0.00416108313947916, 0.004340905696153641, 0.004520728252828121, 0.004700550809502602, 0.004880373366177082, 0.0050601959228515625]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 6.0, 9.0, 8.0, 7.0, 9.0, 5.0, 17.0, 14.0, 15.0, 13.0, 20.0, 32.0, 13.0, 21.0, 27.0, 31.0, 34.0, 32.0, 47.0, 40.0, 38.0, 37.0, 35.0, 46.0, 47.0, 45.0, 30.0, 36.0, 32.0, 29.0, 29.0, 22.0, 20.0, 16.0, 12.0, 20.0, 14.0, 13.0, 10.0, 13.0, 10.0, 10.0, 12.0, 7.0, 2.0, 6.0, 0.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.666015625, -2.583404541015625, -2.50079345703125, -2.418182373046875, -2.3355712890625, -2.252960205078125, -2.17034912109375, -2.087738037109375, -2.005126953125, -1.922515869140625, -1.83990478515625, -1.757293701171875, -1.6746826171875, -1.592071533203125, -1.50946044921875, -1.426849365234375, -1.34423828125, -1.261627197265625, -1.17901611328125, -1.096405029296875, -1.0137939453125, -0.931182861328125, -0.84857177734375, -0.765960693359375, -0.683349609375, -0.600738525390625, -0.51812744140625, -0.435516357421875, -0.3529052734375, -0.270294189453125, -0.18768310546875, -0.105072021484375, -0.0224609375, 0.060150146484375, 0.14276123046875, 0.225372314453125, 0.3079833984375, 0.390594482421875, 0.47320556640625, 0.555816650390625, 0.638427734375, 0.721038818359375, 0.80364990234375, 0.886260986328125, 0.9688720703125, 1.051483154296875, 1.13409423828125, 1.216705322265625, 1.29931640625, 1.381927490234375, 1.46453857421875, 1.547149658203125, 1.6297607421875, 1.712371826171875, 1.79498291015625, 1.877593994140625, 1.960205078125, 2.042816162109375, 2.12542724609375, 2.208038330078125, 2.2906494140625, 2.373260498046875, 2.45587158203125, 2.538482666015625, 2.62109375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 12.0, 23.0, 32.0, 42.0, 78.0, 125.0, 284.0, 630.0, 1422.0, 3471.0, 8061.0, 19612.0, 46201.0, 109440.0, 267014.0, 339665.0, 145378.0, 61932.0, 26130.0, 10958.0, 4473.0, 1853.0, 872.0, 405.0, 185.0, 101.0, 54.0, 32.0, 20.0, 14.0, 9.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.39453125, -4.279388427734375, -4.16424560546875, -4.049102783203125, -3.9339599609375, -3.818817138671875, -3.70367431640625, -3.588531494140625, -3.473388671875, -3.358245849609375, -3.24310302734375, -3.127960205078125, -3.0128173828125, -2.897674560546875, -2.78253173828125, -2.667388916015625, -2.55224609375, -2.437103271484375, -2.32196044921875, -2.206817626953125, -2.0916748046875, -1.976531982421875, -1.86138916015625, -1.746246337890625, -1.631103515625, -1.515960693359375, -1.40081787109375, -1.285675048828125, -1.1705322265625, -1.055389404296875, -0.94024658203125, -0.825103759765625, -0.7099609375, -0.594818115234375, -0.47967529296875, -0.364532470703125, -0.2493896484375, -0.134246826171875, -0.01910400390625, 0.096038818359375, 0.211181640625, 0.326324462890625, 0.44146728515625, 0.556610107421875, 0.6717529296875, 0.786895751953125, 0.90203857421875, 1.017181396484375, 1.13232421875, 1.247467041015625, 1.36260986328125, 1.477752685546875, 1.5928955078125, 1.708038330078125, 1.82318115234375, 1.938323974609375, 2.053466796875, 2.168609619140625, 2.28375244140625, 2.398895263671875, 2.5140380859375, 2.629180908203125, 2.74432373046875, 2.859466552734375, 2.974609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 10.0, 12.0, 6.0, 11.0, 13.0, 19.0, 22.0, 23.0, 33.0, 33.0, 29.0, 48.0, 68.0, 73.0, 110.0, 216.0, 1461.0, 252.0, 138.0, 95.0, 52.0, 56.0, 42.0, 32.0, 29.0, 33.0, 28.0, 18.0, 9.0, 12.0, 14.0, 12.0, 4.0, 7.0, 5.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.921875, -9.5855712890625, -9.249267578125, -8.9129638671875, -8.57666015625, -8.2403564453125, -7.904052734375, -7.5677490234375, -7.2314453125, -6.8951416015625, -6.558837890625, -6.2225341796875, -5.88623046875, -5.5499267578125, -5.213623046875, -4.8773193359375, -4.541015625, -4.2047119140625, -3.868408203125, -3.5321044921875, -3.19580078125, -2.8594970703125, -2.523193359375, -2.1868896484375, -1.8505859375, -1.5142822265625, -1.177978515625, -0.8416748046875, -0.50537109375, -0.1690673828125, 0.167236328125, 0.5035400390625, 0.83984375, 1.1761474609375, 1.512451171875, 1.8487548828125, 2.18505859375, 2.5213623046875, 2.857666015625, 3.1939697265625, 3.5302734375, 3.8665771484375, 4.202880859375, 4.5391845703125, 4.87548828125, 5.2117919921875, 5.548095703125, 5.8843994140625, 6.220703125, 6.5570068359375, 6.893310546875, 7.2296142578125, 7.56591796875, 7.9022216796875, 8.238525390625, 8.5748291015625, 8.9111328125, 9.2474365234375, 9.583740234375, 9.9200439453125, 10.25634765625, 10.5926513671875, 10.928955078125, 11.2652587890625, 11.6015625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 8.0, 5.0, 9.0, 12.0, 17.0, 25.0, 34.0, 41.0, 49.0, 66.0, 90.0, 111.0, 212.0, 266.0, 513.0, 1599.0, 68830.0, 3052449.0, 18954.0, 1147.0, 418.0, 232.0, 145.0, 104.0, 93.0, 63.0, 46.0, 39.0, 27.0, 27.0, 8.0, 18.0, 12.0, 5.0, 4.0, 6.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.109375, -22.161865234375, -21.21435546875, -20.266845703125, -19.3193359375, -18.371826171875, -17.42431640625, -16.476806640625, -15.529296875, -14.581787109375, -13.63427734375, -12.686767578125, -11.7392578125, -10.791748046875, -9.84423828125, -8.896728515625, -7.94921875, -7.001708984375, -6.05419921875, -5.106689453125, -4.1591796875, -3.211669921875, -2.26416015625, -1.316650390625, -0.369140625, 0.578369140625, 1.52587890625, 2.473388671875, 3.4208984375, 4.368408203125, 5.31591796875, 6.263427734375, 7.2109375, 8.158447265625, 9.10595703125, 10.053466796875, 11.0009765625, 11.948486328125, 12.89599609375, 13.843505859375, 14.791015625, 15.738525390625, 16.68603515625, 17.633544921875, 18.5810546875, 19.528564453125, 20.47607421875, 21.423583984375, 22.37109375, 23.318603515625, 24.26611328125, 25.213623046875, 26.1611328125, 27.108642578125, 28.05615234375, 29.003662109375, 29.951171875, 30.898681640625, 31.84619140625, 32.793701171875, 33.7412109375, 34.688720703125, 35.63623046875, 36.583740234375, 37.53125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 19.0, 99.0, 366.0, 396.0, 121.0, 11.0, 4.0], "bins": [-123.5738296508789, -121.51334381103516, -119.4528579711914, -117.39237213134766, -115.3318862915039, -113.27140045166016, -111.2109146118164, -109.15042877197266, -107.0899429321289, -105.02945709228516, -102.9689712524414, -100.90848541259766, -98.8479995727539, -96.78751373291016, -94.7270278930664, -92.66654205322266, -90.60604858398438, -88.54556274414062, -86.48507690429688, -84.42459106445312, -82.36410522460938, -80.30361938476562, -78.24313354492188, -76.18264770507812, -74.12216186523438, -72.06167602539062, -70.00119018554688, -67.94070434570312, -65.88021850585938, -63.819732666015625, -61.759246826171875, -59.698760986328125, -57.638267517089844, -55.577781677246094, -53.517295837402344, -51.456809997558594, -49.396324157714844, -47.335838317871094, -45.275352478027344, -43.214866638183594, -41.154380798339844, -39.093894958496094, -37.033409118652344, -34.972923278808594, -32.912437438964844, -30.851951599121094, -28.79146385192871, -26.73097801208496, -24.67049217224121, -22.61000633239746, -20.54952049255371, -18.489032745361328, -16.428546905517578, -14.368062019348145, -12.307575225830078, -10.247089385986328, -8.186603546142578, -6.126117706298828, -4.06563138961792, -2.0051450729370117, 0.05534076690673828, 2.1158266067504883, 4.176313400268555, 6.236799240112305, 8.297285079956055]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 4.0, 8.0, 13.0, 15.0, 20.0, 22.0, 16.0, 26.0, 33.0, 38.0, 30.0, 36.0, 30.0, 32.0, 41.0, 40.0, 45.0, 50.0, 39.0, 42.0, 37.0, 34.0, 41.0, 30.0, 32.0, 36.0, 30.0, 23.0, 21.0, 16.0, 15.0, 22.0, 17.0, 12.0, 10.0, 16.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.9287166595459, -27.018306732177734, -26.10789680480957, -25.197486877441406, -24.28707504272461, -23.376665115356445, -22.46625518798828, -21.555845260620117, -20.645435333251953, -19.73502540588379, -18.824615478515625, -17.914203643798828, -17.003793716430664, -16.0933837890625, -15.182973861694336, -14.272563934326172, -13.362153053283691, -12.451743125915527, -11.541332244873047, -10.630922317504883, -9.720512390136719, -8.810102462768555, -7.899691581726074, -6.98928165435791, -6.078871250152588, -5.168460845947266, -4.258050918579102, -3.3476405143737793, -2.437230348587036, -1.526820182800293, -0.6164097785949707, 0.29400014877319336, 1.2044105529785156, 2.114820718765259, 3.025230884552002, 3.935641288757324, 4.846051216125488, 5.7564616203308105, 6.666872024536133, 7.577281951904297, 8.487691879272461, 9.398101806640625, 10.308512687683105, 11.21892261505127, 12.129332542419434, 13.039743423461914, 13.950153350830078, 14.860563278198242, 15.770974159240723, 16.681385040283203, 17.591794967651367, 18.50220489501953, 19.412614822387695, 20.32302474975586, 21.233436584472656, 22.143844604492188, 23.054256439208984, 23.96466636657715, 24.875076293945312, 25.78548812866211, 26.695898056030273, 27.606307983398438, 28.5167179107666, 29.427127838134766, 30.33753776550293]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 2.0, 5.0, 9.0, 5.0, 13.0, 10.0, 13.0, 15.0, 18.0, 11.0, 17.0, 24.0, 24.0, 28.0, 27.0, 26.0, 33.0, 36.0, 37.0, 44.0, 37.0, 44.0, 53.0, 38.0, 51.0, 39.0, 32.0, 35.0, 33.0, 29.0, 25.0, 23.0, 23.0, 16.0, 15.0, 11.0, 17.0, 12.0, 9.0, 16.0, 11.0, 7.0, 8.0, 3.0, 6.0, 5.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.951171875, -2.853363037109375, -2.75555419921875, -2.657745361328125, -2.5599365234375, -2.462127685546875, -2.36431884765625, -2.266510009765625, -2.168701171875, -2.070892333984375, -1.97308349609375, -1.875274658203125, -1.7774658203125, -1.679656982421875, -1.58184814453125, -1.484039306640625, -1.38623046875, -1.288421630859375, -1.19061279296875, -1.092803955078125, -0.9949951171875, -0.897186279296875, -0.79937744140625, -0.701568603515625, -0.603759765625, -0.505950927734375, -0.40814208984375, -0.310333251953125, -0.2125244140625, -0.114715576171875, -0.01690673828125, 0.080902099609375, 0.1787109375, 0.276519775390625, 0.37432861328125, 0.472137451171875, 0.5699462890625, 0.667755126953125, 0.76556396484375, 0.863372802734375, 0.961181640625, 1.058990478515625, 1.15679931640625, 1.254608154296875, 1.3524169921875, 1.450225830078125, 1.54803466796875, 1.645843505859375, 1.74365234375, 1.841461181640625, 1.93927001953125, 2.037078857421875, 2.1348876953125, 2.232696533203125, 2.33050537109375, 2.428314208984375, 2.526123046875, 2.623931884765625, 2.72174072265625, 2.819549560546875, 2.9173583984375, 3.015167236328125, 3.11297607421875, 3.210784912109375, 3.30859375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 6.0, 5.0, 8.0, 11.0, 20.0, 15.0, 16.0, 15.0, 30.0, 31.0, 30.0, 48.0, 78.0, 126.0, 348.0, 938.0, 3916.0, 37362.0, 613608.0, 2816951.0, 673208.0, 41274.0, 4441.0, 959.0, 319.0, 136.0, 82.0, 53.0, 35.0, 37.0, 31.0, 22.0, 12.0, 16.0, 14.0, 14.0, 7.0, 15.0, 6.0, 9.0, 5.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.2760009765625, -8.981689453125, -8.6873779296875, -8.39306640625, -8.0987548828125, -7.804443359375, -7.5101318359375, -7.2158203125, -6.9215087890625, -6.627197265625, -6.3328857421875, -6.03857421875, -5.7442626953125, -5.449951171875, -5.1556396484375, -4.861328125, -4.5670166015625, -4.272705078125, -3.9783935546875, -3.68408203125, -3.3897705078125, -3.095458984375, -2.8011474609375, -2.5068359375, -2.2125244140625, -1.918212890625, -1.6239013671875, -1.32958984375, -1.0352783203125, -0.740966796875, -0.4466552734375, -0.15234375, 0.1419677734375, 0.436279296875, 0.7305908203125, 1.02490234375, 1.3192138671875, 1.613525390625, 1.9078369140625, 2.2021484375, 2.4964599609375, 2.790771484375, 3.0850830078125, 3.37939453125, 3.6737060546875, 3.968017578125, 4.2623291015625, 4.556640625, 4.8509521484375, 5.145263671875, 5.4395751953125, 5.73388671875, 6.0281982421875, 6.322509765625, 6.6168212890625, 6.9111328125, 7.2054443359375, 7.499755859375, 7.7940673828125, 8.08837890625, 8.3826904296875, 8.677001953125, 8.9713134765625, 9.265625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 4.0, 9.0, 14.0, 19.0, 17.0, 28.0, 38.0, 63.0, 84.0, 93.0, 128.0, 170.0, 233.0, 338.0, 362.0, 466.0, 437.0, 351.0, 304.0, 241.0, 177.0, 129.0, 103.0, 73.0, 42.0, 44.0, 25.0, 27.0, 14.0, 9.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40625, -7.18115234375, -6.9560546875, -6.73095703125, -6.505859375, -6.28076171875, -6.0556640625, -5.83056640625, -5.60546875, -5.38037109375, -5.1552734375, -4.93017578125, -4.705078125, -4.47998046875, -4.2548828125, -4.02978515625, -3.8046875, -3.57958984375, -3.3544921875, -3.12939453125, -2.904296875, -2.67919921875, -2.4541015625, -2.22900390625, -2.00390625, -1.77880859375, -1.5537109375, -1.32861328125, -1.103515625, -0.87841796875, -0.6533203125, -0.42822265625, -0.203125, 0.02197265625, 0.2470703125, 0.47216796875, 0.697265625, 0.92236328125, 1.1474609375, 1.37255859375, 1.59765625, 1.82275390625, 2.0478515625, 2.27294921875, 2.498046875, 2.72314453125, 2.9482421875, 3.17333984375, 3.3984375, 3.62353515625, 3.8486328125, 4.07373046875, 4.298828125, 4.52392578125, 4.7490234375, 4.97412109375, 5.19921875, 5.42431640625, 5.6494140625, 5.87451171875, 6.099609375, 6.32470703125, 6.5498046875, 6.77490234375, 7.0]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 2.0, 2.0, 4.0, 18.0, 12.0, 18.0, 33.0, 35.0, 46.0, 67.0, 115.0, 160.0, 200.0, 297.0, 560.0, 2308.0, 86070.0, 3709588.0, 387901.0, 4951.0, 730.0, 352.0, 231.0, 161.0, 120.0, 78.0, 64.0, 45.0, 27.0, 21.0, 15.0, 13.0, 9.0, 7.0, 5.0, 1.0, 8.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.546875, -21.811279296875, -21.07568359375, -20.340087890625, -19.6044921875, -18.868896484375, -18.13330078125, -17.397705078125, -16.662109375, -15.926513671875, -15.19091796875, -14.455322265625, -13.7197265625, -12.984130859375, -12.24853515625, -11.512939453125, -10.77734375, -10.041748046875, -9.30615234375, -8.570556640625, -7.8349609375, -7.099365234375, -6.36376953125, -5.628173828125, -4.892578125, -4.156982421875, -3.42138671875, -2.685791015625, -1.9501953125, -1.214599609375, -0.47900390625, 0.256591796875, 0.9921875, 1.727783203125, 2.46337890625, 3.198974609375, 3.9345703125, 4.670166015625, 5.40576171875, 6.141357421875, 6.876953125, 7.612548828125, 8.34814453125, 9.083740234375, 9.8193359375, 10.554931640625, 11.29052734375, 12.026123046875, 12.76171875, 13.497314453125, 14.23291015625, 14.968505859375, 15.7041015625, 16.439697265625, 17.17529296875, 17.910888671875, 18.646484375, 19.382080078125, 20.11767578125, 20.853271484375, 21.5888671875, 22.324462890625, 23.06005859375, 23.795654296875, 24.53125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 27.0, 68.0, 157.0, 208.0, 246.0, 180.0, 83.0, 22.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.91522216796875, -97.7030029296875, -95.49077606201172, -93.27855682373047, -91.06633758544922, -88.85411071777344, -86.64189147949219, -84.42967224121094, -82.21745300292969, -80.00523376464844, -77.79300689697266, -75.5807876586914, -73.36856842041016, -71.15634155273438, -68.94412231445312, -66.73190307617188, -64.5196762084961, -62.30745315551758, -60.09523391723633, -57.88301086425781, -55.67079162597656, -53.45856857299805, -51.24634552001953, -49.03412628173828, -46.821903228759766, -44.60968017578125, -42.3974609375, -40.185237884521484, -37.97301483154297, -35.76079559326172, -33.5485725402832, -31.33635139465332, -29.124134063720703, -26.91191291809082, -24.699691772460938, -22.487468719482422, -20.27524757385254, -18.063026428222656, -15.850804328918457, -13.638582229614258, -11.426361083984375, -9.214139938354492, -7.001917839050293, -4.789696216583252, -2.577474594116211, -0.3652534484863281, 1.846968650817871, 4.05919075012207, 6.271411895751953, 8.483633041381836, 10.695855140686035, 12.908077239990234, 15.120298385620117, 17.33251953125, 19.544742584228516, 21.7569637298584, 23.96918487548828, 26.181406021118164, 28.393627166748047, 30.605850219726562, 32.81806945800781, 35.03029251098633, 37.242515563964844, 39.454734802246094, 41.66695785522461]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 4.0, 4.0, 7.0, 3.0, 11.0, 9.0, 11.0, 16.0, 13.0, 15.0, 24.0, 17.0, 27.0, 20.0, 29.0, 33.0, 28.0, 35.0, 29.0, 44.0, 34.0, 40.0, 35.0, 35.0, 43.0, 35.0, 54.0, 50.0, 34.0, 42.0, 37.0, 24.0, 22.0, 23.0, 13.0, 13.0, 18.0, 9.0, 9.0, 13.0, 11.0, 7.0, 3.0, 6.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.811996459960938, -21.090408325195312, -20.368820190429688, -19.647233963012695, -18.92564582824707, -18.204057693481445, -17.482471466064453, -16.760883331298828, -16.039295196533203, -15.317707061767578, -14.59611988067627, -13.874532699584961, -13.152944564819336, -12.431356430053711, -11.709769248962402, -10.988182067871094, -10.266593933105469, -9.545005798339844, -8.823418617248535, -8.101831436157227, -7.380243301391602, -6.658655643463135, -5.937067985534668, -5.215480327606201, -4.493892669677734, -3.7723050117492676, -3.050717353820801, -2.329129695892334, -1.6075420379638672, -0.8859543800354004, -0.1643667221069336, 0.5572209358215332, 1.27880859375, 2.000396251678467, 2.7219839096069336, 3.4435715675354004, 4.165159225463867, 4.886746883392334, 5.608334541320801, 6.329922199249268, 7.051509857177734, 7.773097515106201, 8.494685173034668, 9.216272354125977, 9.937860488891602, 10.659448623657227, 11.381035804748535, 12.102622985839844, 12.824211120605469, 13.545799255371094, 14.267386436462402, 14.988973617553711, 15.710561752319336, 16.43214988708496, 17.153736114501953, 17.875324249267578, 18.596912384033203, 19.318500518798828, 20.040088653564453, 20.761674880981445, 21.48326301574707, 22.204851150512695, 22.926437377929688, 23.648025512695312, 24.369613647460938]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 4.0, 3.0, 7.0, 5.0, 6.0, 6.0, 18.0, 13.0, 17.0, 19.0, 20.0, 22.0, 12.0, 35.0, 25.0, 36.0, 42.0, 30.0, 42.0, 27.0, 38.0, 40.0, 34.0, 43.0, 43.0, 36.0, 40.0, 41.0, 27.0, 19.0, 28.0, 23.0, 30.0, 19.0, 19.0, 18.0, 14.0, 18.0, 7.0, 13.0, 12.0, 7.0, 7.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.828125, -2.738739013671875, -2.64935302734375, -2.559967041015625, -2.4705810546875, -2.381195068359375, -2.29180908203125, -2.202423095703125, -2.113037109375, -2.023651123046875, -1.93426513671875, -1.844879150390625, -1.7554931640625, -1.666107177734375, -1.57672119140625, -1.487335205078125, -1.39794921875, -1.308563232421875, -1.21917724609375, -1.129791259765625, -1.0404052734375, -0.951019287109375, -0.86163330078125, -0.772247314453125, -0.682861328125, -0.593475341796875, -0.50408935546875, -0.414703369140625, -0.3253173828125, -0.235931396484375, -0.14654541015625, -0.057159423828125, 0.0322265625, 0.121612548828125, 0.21099853515625, 0.300384521484375, 0.3897705078125, 0.479156494140625, 0.56854248046875, 0.657928466796875, 0.747314453125, 0.836700439453125, 0.92608642578125, 1.015472412109375, 1.1048583984375, 1.194244384765625, 1.28363037109375, 1.373016357421875, 1.46240234375, 1.551788330078125, 1.64117431640625, 1.730560302734375, 1.8199462890625, 1.909332275390625, 1.99871826171875, 2.088104248046875, 2.177490234375, 2.266876220703125, 2.35626220703125, 2.445648193359375, 2.5350341796875, 2.624420166015625, 2.71380615234375, 2.803192138671875, 2.892578125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 14.0, 17.0, 22.0, 47.0, 60.0, 97.0, 158.0, 252.0, 354.0, 670.0, 1124.0, 2018.0, 3316.0, 6113.0, 11242.0, 20255.0, 38135.0, 73567.0, 146718.0, 260372.0, 230079.0, 121397.0, 61891.0, 31870.0, 17100.0, 9341.0, 5254.0, 2881.0, 1653.0, 993.0, 557.0, 340.0, 210.0, 129.0, 91.0, 64.0, 38.0, 31.0, 19.0, 16.0, 8.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.5060844421386719, -0.49068450927734375, -0.4752845764160156, -0.4598846435546875, -0.4444847106933594, -0.42908477783203125, -0.4136848449707031, -0.398284912109375, -0.3828849792480469, -0.36748504638671875, -0.3520851135253906, -0.3366851806640625, -0.3212852478027344, -0.30588531494140625, -0.2904853820800781, -0.27508544921875, -0.2596855163574219, -0.24428558349609375, -0.22888565063476562, -0.2134857177734375, -0.19808578491210938, -0.18268585205078125, -0.16728591918945312, -0.151885986328125, -0.13648605346679688, -0.12108612060546875, -0.10568618774414062, -0.0902862548828125, -0.07488632202148438, -0.05948638916015625, -0.044086456298828125, -0.0286865234375, -0.013286590576171875, 0.00211334228515625, 0.017513275146484375, 0.0329132080078125, 0.048313140869140625, 0.06371307373046875, 0.07911300659179688, 0.094512939453125, 0.10991287231445312, 0.12531280517578125, 0.14071273803710938, 0.1561126708984375, 0.17151260375976562, 0.18691253662109375, 0.20231246948242188, 0.21771240234375, 0.23311233520507812, 0.24851226806640625, 0.2639122009277344, 0.2793121337890625, 0.2947120666503906, 0.31011199951171875, 0.3255119323730469, 0.340911865234375, 0.3563117980957031, 0.37171173095703125, 0.3871116638183594, 0.4025115966796875, 0.4179115295410156, 0.43331146240234375, 0.4487113952636719, 0.464111328125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 2.0, 7.0, 9.0, 16.0, 7.0, 13.0, 13.0, 18.0, 21.0, 27.0, 27.0, 35.0, 43.0, 30.0, 17.0, 31.0, 40.0, 41.0, 35.0, 1075.0, 49.0, 46.0, 47.0, 43.0, 36.0, 29.0, 35.0, 26.0, 29.0, 25.0, 18.0, 13.0, 23.0, 20.0, 11.0, 11.0, 15.0, 12.0, 8.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.232421875, -2.1665496826171875, -2.100677490234375, -2.0348052978515625, -1.96893310546875, -1.9030609130859375, -1.837188720703125, -1.7713165283203125, -1.7054443359375, -1.6395721435546875, -1.573699951171875, -1.5078277587890625, -1.44195556640625, -1.3760833740234375, -1.310211181640625, -1.2443389892578125, -1.178466796875, -1.1125946044921875, -1.046722412109375, -0.9808502197265625, -0.91497802734375, -0.8491058349609375, -0.783233642578125, -0.7173614501953125, -0.6514892578125, -0.5856170654296875, -0.519744873046875, -0.4538726806640625, -0.38800048828125, -0.3221282958984375, -0.256256103515625, -0.1903839111328125, -0.12451171875, -0.0586395263671875, 0.007232666015625, 0.0731048583984375, 0.13897705078125, 0.2048492431640625, 0.270721435546875, 0.3365936279296875, 0.4024658203125, 0.4683380126953125, 0.534210205078125, 0.6000823974609375, 0.66595458984375, 0.7318267822265625, 0.797698974609375, 0.8635711669921875, 0.929443359375, 0.9953155517578125, 1.061187744140625, 1.1270599365234375, 1.19293212890625, 1.2588043212890625, 1.324676513671875, 1.3905487060546875, 1.4564208984375, 1.5222930908203125, 1.588165283203125, 1.6540374755859375, 1.71990966796875, 1.7857818603515625, 1.851654052734375, 1.9175262451171875, 1.9833984375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 14.0, 21.0, 27.0, 30.0, 76.0, 92.0, 144.0, 189.0, 304.0, 457.0, 668.0, 979.0, 1519.0, 2191.0, 3372.0, 5039.0, 7644.0, 11424.0, 18002.0, 27520.0, 41680.0, 63408.0, 94791.0, 135625.0, 1205206.0, 155804.0, 108110.0, 72563.0, 47912.0, 31836.0, 20565.0, 13490.0, 8970.0, 5754.0, 3941.0, 2518.0, 1675.0, 1179.0, 769.0, 527.0, 337.0, 221.0, 180.0, 112.0, 72.0, 48.0, 34.0, 31.0, 22.0, 7.0, 8.0, 3.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.207275390625, -0.2005176544189453, -0.19375991821289062, -0.18700218200683594, -0.18024444580078125, -0.17348670959472656, -0.16672897338867188, -0.1599712371826172, -0.1532135009765625, -0.1464557647705078, -0.13969802856445312, -0.13294029235839844, -0.12618255615234375, -0.11942481994628906, -0.11266708374023438, -0.10590934753417969, -0.099151611328125, -0.09239387512207031, -0.08563613891601562, -0.07887840270996094, -0.07212066650390625, -0.06536293029785156, -0.058605194091796875, -0.05184745788574219, -0.0450897216796875, -0.03833198547363281, -0.031574249267578125, -0.024816513061523438, -0.01805877685546875, -0.011301040649414062, -0.004543304443359375, 0.0022144317626953125, 0.00897216796875, 0.015729904174804688, 0.022487640380859375, 0.029245376586914062, 0.03600311279296875, 0.04276084899902344, 0.049518585205078125, 0.05627632141113281, 0.0630340576171875, 0.06979179382324219, 0.07654953002929688, 0.08330726623535156, 0.09006500244140625, 0.09682273864746094, 0.10358047485351562, 0.11033821105957031, 0.117095947265625, 0.12385368347167969, 0.13061141967773438, 0.13736915588378906, 0.14412689208984375, 0.15088462829589844, 0.15764236450195312, 0.1644001007080078, 0.1711578369140625, 0.1779155731201172, 0.18467330932617188, 0.19143104553222656, 0.19818878173828125, 0.20494651794433594, 0.21170425415039062, 0.2184619903564453, 0.2252197265625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 7.0, 5.0, 9.0, 8.0, 13.0, 18.0, 18.0, 23.0, 25.0, 28.0, 53.0, 53.0, 72.0, 78.0, 101.0, 81.0, 91.0, 73.0, 60.0, 43.0, 29.0, 21.0, 10.0, 11.0, 13.0, 6.0, 7.0, 5.0, 11.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0049896240234375, -0.004822790622711182, -0.004655957221984863, -0.004489123821258545, -0.0043222904205322266, -0.004155457019805908, -0.00398862361907959, -0.0038217902183532715, -0.003654956817626953, -0.0034881234169006348, -0.0033212900161743164, -0.003154456615447998, -0.0029876232147216797, -0.0028207898139953613, -0.002653956413269043, -0.0024871230125427246, -0.0023202896118164062, -0.002153456211090088, -0.0019866228103637695, -0.0018197894096374512, -0.0016529560089111328, -0.0014861226081848145, -0.001319289207458496, -0.0011524558067321777, -0.0009856224060058594, -0.000818789005279541, -0.0006519556045532227, -0.0004851222038269043, -0.00031828880310058594, -0.00015145540237426758, 1.537799835205078e-05, 0.00018221139907836914, 0.0003490447998046875, 0.0005158782005310059, 0.0006827116012573242, 0.0008495450019836426, 0.001016378402709961, 0.0011832118034362793, 0.0013500452041625977, 0.001516878604888916, 0.0016837120056152344, 0.0018505454063415527, 0.002017378807067871, 0.0021842122077941895, 0.002351045608520508, 0.002517879009246826, 0.0026847124099731445, 0.002851545810699463, 0.0030183792114257812, 0.0031852126121520996, 0.003352046012878418, 0.0035188794136047363, 0.0036857128143310547, 0.003852546215057373, 0.004019379615783691, 0.00418621301651001, 0.004353046417236328, 0.0045198798179626465, 0.004686713218688965, 0.004853546619415283, 0.0050203800201416016, 0.00518721342086792, 0.005354046821594238, 0.005520880222320557, 0.005687713623046875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 5.0, 5.0, 6.0, 10.0, 11.0, 11.0, 12.0, 14.0, 28.0, 28.0, 35.0, 62.0, 90.0, 162.0, 316.0, 970.0, 58537.0, 980851.0, 6243.0, 478.0, 241.0, 119.0, 68.0, 60.0, 40.0, 33.0, 27.0, 29.0, 19.0, 8.0, 6.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1064453125, -0.1031484603881836, -0.09985160827636719, -0.09655475616455078, -0.09325790405273438, -0.08996105194091797, -0.08666419982910156, -0.08336734771728516, -0.08007049560546875, -0.07677364349365234, -0.07347679138183594, -0.07017993927001953, -0.06688308715820312, -0.06358623504638672, -0.06028938293457031, -0.056992530822753906, -0.0536956787109375, -0.050398826599121094, -0.04710197448730469, -0.04380512237548828, -0.040508270263671875, -0.03721141815185547, -0.03391456604003906, -0.030617713928222656, -0.02732086181640625, -0.024024009704589844, -0.020727157592773438, -0.01743030548095703, -0.014133453369140625, -0.010836601257324219, -0.0075397491455078125, -0.004242897033691406, -0.000946044921875, 0.0023508071899414062, 0.0056476593017578125, 0.008944511413574219, 0.012241363525390625, 0.015538215637207031, 0.018835067749023438, 0.022131919860839844, 0.02542877197265625, 0.028725624084472656, 0.03202247619628906, 0.03531932830810547, 0.038616180419921875, 0.04191303253173828, 0.04520988464355469, 0.048506736755371094, 0.0518035888671875, 0.055100440979003906, 0.05839729309082031, 0.06169414520263672, 0.06499099731445312, 0.06828784942626953, 0.07158470153808594, 0.07488155364990234, 0.07817840576171875, 0.08147525787353516, 0.08477210998535156, 0.08806896209716797, 0.09136581420898438, 0.09466266632080078, 0.09795951843261719, 0.1012563705444336, 0.10455322265625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 11.0, 91.0, 518.0, 292.0, 72.0, 22.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00397814204916358, -0.003284793347120285, -0.0025914444122463465, -0.001898095477372408, -0.001204746775329113, -0.0005113980732858181, 0.00018195109441876411, 0.000875299796462059, 0.001568648498505354, 0.002261997200548649, 0.0029553461354225874, 0.003648695070296526, 0.004342043772339821, 0.005035392474383116, 0.005728741642087698, 0.006422090344130993, 0.007115439046174288, 0.007808787748217583, 0.008502136915922165, 0.009195486083626747, 0.009888834320008755, 0.010582182556390762, 0.011275531724095345, 0.011968880891799927, 0.012662230059504509, 0.013355579227209091, 0.014048927463591099, 0.014742276631295681, 0.015435624867677689, 0.01612897403538227, 0.016822323203086853, 0.017515672370791435, 0.018209021538496017, 0.0189023707062006, 0.019595719873905182, 0.020289067178964615, 0.020982416346669197, 0.02167576551437378, 0.02236911468207836, 0.023062463849782944, 0.023755811154842377, 0.02444916032254696, 0.02514250949025154, 0.025835856795310974, 0.026529205963015556, 0.02722255513072014, 0.02791590429842472, 0.028609253466129303, 0.029302602633833885, 0.029995951801538467, 0.03068930096924305, 0.03138265013694763, 0.032075997442007065, 0.0327693447470665, 0.03346269577741623, 0.03415604308247566, 0.034849394112825394, 0.03554274141788483, 0.03623609244823456, 0.03692943975329399, 0.03762279078364372, 0.038316138088703156, 0.03900948911905289, 0.03970283642411232, 0.04039618372917175]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 7.0, 10.0, 7.0, 13.0, 15.0, 6.0, 16.0, 22.0, 31.0, 29.0, 28.0, 29.0, 40.0, 39.0, 41.0, 43.0, 34.0, 39.0, 41.0, 46.0, 45.0, 38.0, 43.0, 29.0, 30.0, 31.0, 30.0, 27.0, 32.0, 21.0, 21.0, 27.0, 14.0, 16.0, 12.0, 6.0, 5.0, 5.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0029751062393188477, -0.0028793727979063988, -0.00278363935649395, -0.002687905915081501, -0.002592172473669052, -0.0024964390322566032, -0.0024007055908441544, -0.0023049721494317055, -0.0022092387080192566, -0.0021135052666068077, -0.002017771825194359, -0.00192203838378191, -0.001826304942369461, -0.0017305715009570122, -0.0016348380595445633, -0.0015391046181321144, -0.0014433711767196655, -0.0013476377353072166, -0.0012519042938947678, -0.0011561708524823189, -0.00106043741106987, -0.0009647039696574211, -0.0008689705282449722, -0.0007732370868325233, -0.0006775036454200745, -0.0005817702040076256, -0.0004860367625951767, -0.0003903033211827278, -0.00029456987977027893, -0.00019883643835783005, -0.00010310299694538116, -7.3695555329322815e-06, 8.83638858795166e-05, 0.00018409732729196548, 0.00027983076870441437, 0.00037556421011686325, 0.00047129765152931213, 0.000567031092941761, 0.0006627645343542099, 0.0007584979757666588, 0.0008542314171791077, 0.0009499648585915565, 0.0010456983000040054, 0.0011414317414164543, 0.0012371651828289032, 0.001332898624241352, 0.001428632065653801, 0.0015243655070662498, 0.0016200989484786987, 0.0017158323898911476, 0.0018115658313035965, 0.0019072992727160454, 0.0020030327141284943, 0.002098766155540943, 0.002194499596953392, 0.002290233038365841, 0.00238596647977829, 0.0024816999211907387, 0.0025774333626031876, 0.0026731668040156364, 0.0027689002454280853, 0.002864633686840534, 0.002960367128252983, 0.003056100569665432, 0.003151834011077881]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 4.0, 3.0, 7.0, 5.0, 6.0, 6.0, 18.0, 13.0, 17.0, 19.0, 20.0, 22.0, 12.0, 35.0, 25.0, 36.0, 42.0, 30.0, 42.0, 26.0, 39.0, 40.0, 34.0, 43.0, 43.0, 36.0, 40.0, 41.0, 27.0, 19.0, 28.0, 23.0, 30.0, 19.0, 19.0, 18.0, 14.0, 18.0, 7.0, 13.0, 12.0, 7.0, 7.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.828125, -2.738739013671875, -2.64935302734375, -2.559967041015625, -2.4705810546875, -2.381195068359375, -2.29180908203125, -2.202423095703125, -2.113037109375, -2.023651123046875, -1.93426513671875, -1.844879150390625, -1.7554931640625, -1.666107177734375, -1.57672119140625, -1.487335205078125, -1.39794921875, -1.308563232421875, -1.21917724609375, -1.129791259765625, -1.0404052734375, -0.951019287109375, -0.86163330078125, -0.772247314453125, -0.682861328125, -0.593475341796875, -0.50408935546875, -0.414703369140625, -0.3253173828125, -0.235931396484375, -0.14654541015625, -0.057159423828125, 0.0322265625, 0.121612548828125, 0.21099853515625, 0.300384521484375, 0.3897705078125, 0.479156494140625, 0.56854248046875, 0.657928466796875, 0.747314453125, 0.836700439453125, 0.92608642578125, 1.015472412109375, 1.1048583984375, 1.194244384765625, 1.28363037109375, 1.373016357421875, 1.46240234375, 1.551788330078125, 1.64117431640625, 1.730560302734375, 1.8199462890625, 1.909332275390625, 1.99871826171875, 2.088104248046875, 2.177490234375, 2.266876220703125, 2.35626220703125, 2.445648193359375, 2.5350341796875, 2.624420166015625, 2.71380615234375, 2.803192138671875, 2.892578125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 11.0, 14.0, 35.0, 31.0, 70.0, 92.0, 125.0, 209.0, 324.0, 532.0, 932.0, 1651.0, 3091.0, 6069.0, 12466.0, 26340.0, 56989.0, 122302.0, 272640.0, 295791.0, 131848.0, 61239.0, 28303.0, 13407.0, 6439.0, 3312.0, 1759.0, 969.0, 610.0, 375.0, 200.0, 127.0, 65.0, 67.0, 41.0, 19.0, 16.0, 14.0, 11.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.18359375, -3.0810546875, -2.978515625, -2.8759765625, -2.7734375, -2.6708984375, -2.568359375, -2.4658203125, -2.36328125, -2.2607421875, -2.158203125, -2.0556640625, -1.953125, -1.8505859375, -1.748046875, -1.6455078125, -1.54296875, -1.4404296875, -1.337890625, -1.2353515625, -1.1328125, -1.0302734375, -0.927734375, -0.8251953125, -0.72265625, -0.6201171875, -0.517578125, -0.4150390625, -0.3125, -0.2099609375, -0.107421875, -0.0048828125, 0.09765625, 0.2001953125, 0.302734375, 0.4052734375, 0.5078125, 0.6103515625, 0.712890625, 0.8154296875, 0.91796875, 1.0205078125, 1.123046875, 1.2255859375, 1.328125, 1.4306640625, 1.533203125, 1.6357421875, 1.73828125, 1.8408203125, 1.943359375, 2.0458984375, 2.1484375, 2.2509765625, 2.353515625, 2.4560546875, 2.55859375, 2.6611328125, 2.763671875, 2.8662109375, 2.96875, 3.0712890625, 3.173828125, 3.2763671875, 3.37890625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 6.0, 3.0, 9.0, 8.0, 6.0, 9.0, 16.0, 25.0, 19.0, 20.0, 34.0, 33.0, 40.0, 40.0, 48.0, 69.0, 98.0, 131.0, 252.0, 1402.0, 188.0, 105.0, 78.0, 60.0, 41.0, 39.0, 35.0, 35.0, 28.0, 29.0, 18.0, 19.0, 23.0, 18.0, 9.0, 10.0, 7.0, 4.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-11.1015625, -10.7864990234375, -10.471435546875, -10.1563720703125, -9.84130859375, -9.5262451171875, -9.211181640625, -8.8961181640625, -8.5810546875, -8.2659912109375, -7.950927734375, -7.6358642578125, -7.32080078125, -7.0057373046875, -6.690673828125, -6.3756103515625, -6.060546875, -5.7454833984375, -5.430419921875, -5.1153564453125, -4.80029296875, -4.4852294921875, -4.170166015625, -3.8551025390625, -3.5400390625, -3.2249755859375, -2.909912109375, -2.5948486328125, -2.27978515625, -1.9647216796875, -1.649658203125, -1.3345947265625, -1.01953125, -0.7044677734375, -0.389404296875, -0.0743408203125, 0.24072265625, 0.5557861328125, 0.870849609375, 1.1859130859375, 1.5009765625, 1.8160400390625, 2.131103515625, 2.4461669921875, 2.76123046875, 3.0762939453125, 3.391357421875, 3.7064208984375, 4.021484375, 4.3365478515625, 4.651611328125, 4.9666748046875, 5.28173828125, 5.5968017578125, 5.911865234375, 6.2269287109375, 6.5419921875, 6.8570556640625, 7.172119140625, 7.4871826171875, 7.80224609375, 8.1173095703125, 8.432373046875, 8.7474365234375, 9.0625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 15.0, 8.0, 28.0, 44.0, 35.0, 67.0, 86.0, 185.0, 280.0, 565.0, 2137.0, 3003638.0, 136496.0, 986.0, 433.0, 247.0, 151.0, 82.0, 48.0, 43.0, 22.0, 25.0, 16.0, 19.0, 8.0, 2.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.59375, -53.90087890625, -52.2080078125, -50.51513671875, -48.822265625, -47.12939453125, -45.4365234375, -43.74365234375, -42.05078125, -40.35791015625, -38.6650390625, -36.97216796875, -35.279296875, -33.58642578125, -31.8935546875, -30.20068359375, -28.5078125, -26.81494140625, -25.1220703125, -23.42919921875, -21.736328125, -20.04345703125, -18.3505859375, -16.65771484375, -14.96484375, -13.27197265625, -11.5791015625, -9.88623046875, -8.193359375, -6.50048828125, -4.8076171875, -3.11474609375, -1.421875, 0.27099609375, 1.9638671875, 3.65673828125, 5.349609375, 7.04248046875, 8.7353515625, 10.42822265625, 12.12109375, 13.81396484375, 15.5068359375, 17.19970703125, 18.892578125, 20.58544921875, 22.2783203125, 23.97119140625, 25.6640625, 27.35693359375, 29.0498046875, 30.74267578125, 32.435546875, 34.12841796875, 35.8212890625, 37.51416015625, 39.20703125, 40.89990234375, 42.5927734375, 44.28564453125, 45.978515625, 47.67138671875, 49.3642578125, 51.05712890625, 52.75]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 50.0, 672.0, 286.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-232.76841735839844, -228.51593017578125, -224.263427734375, -220.0109405517578, -215.75845336914062, -211.50595092773438, -207.2534637451172, -203.00096130371094, -198.74847412109375, -194.49598693847656, -190.2434844970703, -185.99099731445312, -181.73849487304688, -177.4860076904297, -173.2335205078125, -168.98101806640625, -164.72853088378906, -160.47604370117188, -156.22354125976562, -151.97105407714844, -147.71856689453125, -143.466064453125, -139.2135772705078, -134.96107482910156, -130.70858764648438, -126.45609283447266, -122.20359802246094, -117.95111083984375, -113.69861602783203, -109.44612121582031, -105.19363403320312, -100.9411392211914, -96.68863677978516, -92.43614196777344, -88.18365478515625, -83.93115997314453, -79.67866516113281, -75.4261703491211, -71.17367553710938, -66.92118835449219, -62.66869354248047, -58.41619873046875, -54.1637077331543, -49.911216735839844, -45.658721923828125, -41.406227111816406, -37.15373611450195, -32.9012451171875, -28.64875030517578, -24.396257400512695, -20.14376449584961, -15.891271591186523, -11.638778686523438, -7.386285781860352, -3.1337928771972656, 1.1187000274658203, 5.371192932128906, 9.623685836791992, 13.876178741455078, 18.128671646118164, 22.38116455078125, 26.633657455444336, 30.886150360107422, 35.138641357421875, 39.391136169433594]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 5.0, 5.0, 4.0, 11.0, 19.0, 18.0, 18.0, 27.0, 32.0, 30.0, 36.0, 25.0, 49.0, 31.0, 32.0, 47.0, 45.0, 44.0, 39.0, 49.0, 50.0, 52.0, 43.0, 32.0, 41.0, 29.0, 31.0, 27.0, 36.0, 22.0, 22.0, 10.0, 13.0, 5.0, 6.0, 7.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-32.968597412109375, -32.02206039428711, -31.075519561767578, -30.128982543945312, -29.182443618774414, -28.235904693603516, -27.289365768432617, -26.34282684326172, -25.39628791809082, -24.449748992919922, -23.503210067749023, -22.556671142578125, -21.61013412475586, -20.66359519958496, -19.717056274414062, -18.770517349243164, -17.823978424072266, -16.877439498901367, -15.930901527404785, -14.984362602233887, -14.037823677062988, -13.091285705566406, -12.144746780395508, -11.19820785522461, -10.251670837402344, -9.305131912231445, -8.358593940734863, -7.412055015563965, -6.465516090393066, -5.518977642059326, -4.572439193725586, -3.6259002685546875, -2.679361343383789, -1.7328226566314697, -0.7862840890884399, 0.16025447845458984, 1.1067931652069092, 2.0533318519592285, 2.9998703002929688, 3.946409225463867, 4.892947673797607, 5.839486122131348, 6.786025047302246, 7.732563495635986, 8.679101943969727, 9.625640869140625, 10.572179794311523, 11.518718719482422, 12.465256690979004, 13.411795616149902, 14.358333587646484, 15.304872512817383, 16.25141143798828, 17.19795036315918, 18.144489288330078, 19.091026306152344, 20.037565231323242, 20.98410415649414, 21.93064308166504, 22.877182006835938, 23.823719024658203, 24.7702579498291, 25.716796875, 26.6633358001709, 27.609874725341797]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 4.0, 4.0, 6.0, 5.0, 11.0, 10.0, 11.0, 12.0, 26.0, 20.0, 19.0, 24.0, 24.0, 26.0, 33.0, 26.0, 38.0, 31.0, 30.0, 42.0, 42.0, 39.0, 41.0, 45.0, 40.0, 32.0, 21.0, 31.0, 25.0, 30.0, 31.0, 31.0, 16.0, 29.0, 24.0, 11.0, 12.0, 18.0, 11.0, 13.0, 7.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0], "bins": [-3.2421875, -3.141876220703125, -3.04156494140625, -2.941253662109375, -2.8409423828125, -2.740631103515625, -2.64031982421875, -2.540008544921875, -2.439697265625, -2.339385986328125, -2.23907470703125, -2.138763427734375, -2.0384521484375, -1.938140869140625, -1.83782958984375, -1.737518310546875, -1.63720703125, -1.536895751953125, -1.43658447265625, -1.336273193359375, -1.2359619140625, -1.135650634765625, -1.03533935546875, -0.935028076171875, -0.834716796875, -0.734405517578125, -0.63409423828125, -0.533782958984375, -0.4334716796875, -0.333160400390625, -0.23284912109375, -0.132537841796875, -0.0322265625, 0.068084716796875, 0.16839599609375, 0.268707275390625, 0.3690185546875, 0.469329833984375, 0.56964111328125, 0.669952392578125, 0.770263671875, 0.870574951171875, 0.97088623046875, 1.071197509765625, 1.1715087890625, 1.271820068359375, 1.37213134765625, 1.472442626953125, 1.57275390625, 1.673065185546875, 1.77337646484375, 1.873687744140625, 1.9739990234375, 2.074310302734375, 2.17462158203125, 2.274932861328125, 2.375244140625, 2.475555419921875, 2.57586669921875, 2.676177978515625, 2.7764892578125, 2.876800537109375, 2.97711181640625, 3.077423095703125, 3.177734375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 5.0, 8.0, 10.0, 25.0, 14.0, 17.0, 32.0, 32.0, 54.0, 66.0, 101.0, 130.0, 197.0, 392.0, 842.0, 2725.0, 11736.0, 77068.0, 556125.0, 1990638.0, 1290624.0, 223525.0, 31299.0, 5573.0, 1505.0, 583.0, 267.0, 181.0, 121.0, 102.0, 55.0, 48.0, 36.0, 35.0, 25.0, 19.0, 14.0, 6.0, 4.0, 4.0, 7.0, 2.0, 3.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.6328125, -6.42401123046875, -6.2152099609375, -6.00640869140625, -5.797607421875, -5.58880615234375, -5.3800048828125, -5.17120361328125, -4.96240234375, -4.75360107421875, -4.5447998046875, -4.33599853515625, -4.127197265625, -3.91839599609375, -3.7095947265625, -3.50079345703125, -3.2919921875, -3.08319091796875, -2.8743896484375, -2.66558837890625, -2.456787109375, -2.24798583984375, -2.0391845703125, -1.83038330078125, -1.62158203125, -1.41278076171875, -1.2039794921875, -0.99517822265625, -0.786376953125, -0.57757568359375, -0.3687744140625, -0.15997314453125, 0.048828125, 0.25762939453125, 0.4664306640625, 0.67523193359375, 0.884033203125, 1.09283447265625, 1.3016357421875, 1.51043701171875, 1.71923828125, 1.92803955078125, 2.1368408203125, 2.34564208984375, 2.554443359375, 2.76324462890625, 2.9720458984375, 3.18084716796875, 3.3896484375, 3.59844970703125, 3.8072509765625, 4.01605224609375, 4.224853515625, 4.43365478515625, 4.6424560546875, 4.85125732421875, 5.06005859375, 5.26885986328125, 5.4776611328125, 5.68646240234375, 5.895263671875, 6.10406494140625, 6.3128662109375, 6.52166748046875, 6.73046875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 16.0, 14.0, 14.0, 22.0, 19.0, 26.0, 35.0, 41.0, 65.0, 80.0, 102.0, 140.0, 175.0, 193.0, 245.0, 344.0, 381.0, 390.0, 321.0, 326.0, 268.0, 194.0, 161.0, 100.0, 103.0, 59.0, 52.0, 32.0, 40.0, 21.0, 24.0, 17.0, 10.0, 9.0, 7.0, 12.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.2578125, -7.063232421875, -6.86865234375, -6.674072265625, -6.4794921875, -6.284912109375, -6.09033203125, -5.895751953125, -5.701171875, -5.506591796875, -5.31201171875, -5.117431640625, -4.9228515625, -4.728271484375, -4.53369140625, -4.339111328125, -4.14453125, -3.949951171875, -3.75537109375, -3.560791015625, -3.3662109375, -3.171630859375, -2.97705078125, -2.782470703125, -2.587890625, -2.393310546875, -2.19873046875, -2.004150390625, -1.8095703125, -1.614990234375, -1.42041015625, -1.225830078125, -1.03125, -0.836669921875, -0.64208984375, -0.447509765625, -0.2529296875, -0.058349609375, 0.13623046875, 0.330810546875, 0.525390625, 0.719970703125, 0.91455078125, 1.109130859375, 1.3037109375, 1.498291015625, 1.69287109375, 1.887451171875, 2.08203125, 2.276611328125, 2.47119140625, 2.665771484375, 2.8603515625, 3.054931640625, 3.24951171875, 3.444091796875, 3.638671875, 3.833251953125, 4.02783203125, 4.222412109375, 4.4169921875, 4.611572265625, 4.80615234375, 5.000732421875, 5.1953125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 12.0, 7.0, 7.0, 17.0, 19.0, 30.0, 29.0, 50.0, 55.0, 64.0, 120.0, 151.0, 206.0, 306.0, 481.0, 1526.0, 53961.0, 3138324.0, 984773.0, 11956.0, 806.0, 394.0, 269.0, 174.0, 135.0, 107.0, 67.0, 59.0, 48.0, 32.0, 20.0, 17.0, 20.0, 12.0, 10.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.644775390625, -16.96142578125, -16.278076171875, -15.5947265625, -14.911376953125, -14.22802734375, -13.544677734375, -12.861328125, -12.177978515625, -11.49462890625, -10.811279296875, -10.1279296875, -9.444580078125, -8.76123046875, -8.077880859375, -7.39453125, -6.711181640625, -6.02783203125, -5.344482421875, -4.6611328125, -3.977783203125, -3.29443359375, -2.611083984375, -1.927734375, -1.244384765625, -0.56103515625, 0.122314453125, 0.8056640625, 1.489013671875, 2.17236328125, 2.855712890625, 3.5390625, 4.222412109375, 4.90576171875, 5.589111328125, 6.2724609375, 6.955810546875, 7.63916015625, 8.322509765625, 9.005859375, 9.689208984375, 10.37255859375, 11.055908203125, 11.7392578125, 12.422607421875, 13.10595703125, 13.789306640625, 14.47265625, 15.156005859375, 15.83935546875, 16.522705078125, 17.2060546875, 17.889404296875, 18.57275390625, 19.256103515625, 19.939453125, 20.622802734375, 21.30615234375, 21.989501953125, 22.6728515625, 23.356201171875, 24.03955078125, 24.722900390625, 25.40625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 39.0, 119.0, 212.0, 289.0, 212.0, 100.0, 30.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.07173156738281, -91.62750244140625, -89.18327331542969, -86.73904418945312, -84.29481506347656, -81.8505859375, -79.40635681152344, -76.96212768554688, -74.51789855957031, -72.07366943359375, -69.62944030761719, -67.18521118164062, -64.74098205566406, -62.2967529296875, -59.85251998901367, -57.40829086303711, -54.96405792236328, -52.51982879638672, -50.075599670410156, -47.631370544433594, -45.18714141845703, -42.74291229248047, -40.29867935180664, -37.85445022583008, -35.410221099853516, -32.96599197387695, -30.52176284790039, -28.077531814575195, -25.633302688598633, -23.18907356262207, -20.744842529296875, -18.300613403320312, -15.856391906738281, -13.412162780761719, -10.96793270111084, -8.523702621459961, -6.079473495483398, -3.635244369506836, -1.191014289855957, 1.2532157897949219, 3.6974449157714844, 6.141674518585205, 8.585904121398926, 11.030134201049805, 13.474363327026367, 15.91859245300293, 18.362823486328125, 20.807052612304688, 23.25128173828125, 25.695510864257812, 28.139739990234375, 30.58397102355957, 33.0281982421875, 35.47242736816406, 37.91666030883789, 40.36088943481445, 42.805118560791016, 45.24934768676758, 47.69357681274414, 50.1378059387207, 52.58203887939453, 55.026268005371094, 57.470497131347656, 59.91472625732422, 62.35895538330078]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 10.0, 3.0, 10.0, 17.0, 17.0, 23.0, 19.0, 24.0, 34.0, 25.0, 28.0, 34.0, 44.0, 30.0, 33.0, 39.0, 53.0, 50.0, 39.0, 48.0, 42.0, 35.0, 35.0, 40.0, 34.0, 24.0, 20.0, 25.0, 22.0, 31.0, 16.0, 21.0, 10.0, 18.0, 7.0, 7.0, 9.0, 8.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-29.03809356689453, -28.252334594726562, -27.466577529907227, -26.680818557739258, -25.895061492919922, -25.109302520751953, -24.323543548583984, -23.537784576416016, -22.75202751159668, -21.96626853942871, -21.180511474609375, -20.394752502441406, -19.608993530273438, -18.8232364654541, -18.037477493286133, -17.251720428466797, -16.465961456298828, -15.680203437805176, -14.894445419311523, -14.108686447143555, -13.322928428649902, -12.53717041015625, -11.751411437988281, -10.965653419494629, -10.179895401000977, -9.394137382507324, -8.608379364013672, -7.822620391845703, -7.036862373352051, -6.251104354858398, -5.465345859527588, -4.679587364196777, -3.893829345703125, -3.1080710887908936, -2.322312831878662, -1.5365545749664307, -0.7507963180541992, 0.03496193885803223, 0.8207201957702637, 1.6064786911010742, 2.3922367095947266, 3.177994966506958, 3.9637532234191895, 4.74951171875, 5.535269737243652, 6.321027755737305, 7.106786251068115, 7.892544746398926, 8.678302764892578, 9.46406078338623, 10.249818801879883, 11.035577774047852, 11.821335792541504, 12.607093811035156, 13.392852783203125, 14.178610801696777, 14.96436882019043, 15.750126838684082, 16.535884857177734, 17.321643829345703, 18.107402801513672, 18.893159866333008, 19.678918838500977, 20.464675903320312, 21.25043487548828]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 2.0, 6.0, 15.0, 11.0, 9.0, 14.0, 11.0, 15.0, 24.0, 26.0, 26.0, 25.0, 35.0, 29.0, 33.0, 44.0, 42.0, 40.0, 39.0, 40.0, 33.0, 40.0, 36.0, 48.0, 29.0, 35.0, 28.0, 42.0, 29.0, 34.0, 23.0, 14.0, 19.0, 15.0, 18.0, 3.0, 17.0, 7.0, 6.0, 5.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.48828125, -3.385406494140625, -3.28253173828125, -3.179656982421875, -3.0767822265625, -2.973907470703125, -2.87103271484375, -2.768157958984375, -2.665283203125, -2.562408447265625, -2.45953369140625, -2.356658935546875, -2.2537841796875, -2.150909423828125, -2.04803466796875, -1.945159912109375, -1.84228515625, -1.739410400390625, -1.63653564453125, -1.533660888671875, -1.4307861328125, -1.327911376953125, -1.22503662109375, -1.122161865234375, -1.019287109375, -0.916412353515625, -0.81353759765625, -0.710662841796875, -0.6077880859375, -0.504913330078125, -0.40203857421875, -0.299163818359375, -0.1962890625, -0.093414306640625, 0.00946044921875, 0.112335205078125, 0.2152099609375, 0.318084716796875, 0.42095947265625, 0.523834228515625, 0.626708984375, 0.729583740234375, 0.83245849609375, 0.935333251953125, 1.0382080078125, 1.141082763671875, 1.24395751953125, 1.346832275390625, 1.44970703125, 1.552581787109375, 1.65545654296875, 1.758331298828125, 1.8612060546875, 1.964080810546875, 2.06695556640625, 2.169830322265625, 2.272705078125, 2.375579833984375, 2.47845458984375, 2.581329345703125, 2.6842041015625, 2.787078857421875, 2.88995361328125, 2.992828369140625, 3.095703125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 3.0, 6.0, 2.0, 8.0, 14.0, 17.0, 23.0, 33.0, 51.0, 93.0, 139.0, 269.0, 453.0, 841.0, 1499.0, 2659.0, 4740.0, 9036.0, 17293.0, 35290.0, 76704.0, 170277.0, 304023.0, 225535.0, 103873.0, 47692.0, 22689.0, 11602.0, 6152.0, 3266.0, 1853.0, 1040.0, 585.0, 339.0, 156.0, 114.0, 57.0, 33.0, 30.0, 12.0, 13.0, 9.0, 5.0, 4.0, 5.0, 2.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5732421875, -0.5545654296875, -0.535888671875, -0.5172119140625, -0.49853515625, -0.4798583984375, -0.461181640625, -0.4425048828125, -0.423828125, -0.4051513671875, -0.386474609375, -0.3677978515625, -0.34912109375, -0.3304443359375, -0.311767578125, -0.2930908203125, -0.2744140625, -0.2557373046875, -0.237060546875, -0.2183837890625, -0.19970703125, -0.1810302734375, -0.162353515625, -0.1436767578125, -0.125, -0.1063232421875, -0.087646484375, -0.0689697265625, -0.05029296875, -0.0316162109375, -0.012939453125, 0.0057373046875, 0.0244140625, 0.0430908203125, 0.061767578125, 0.0804443359375, 0.09912109375, 0.1177978515625, 0.136474609375, 0.1551513671875, 0.173828125, 0.1925048828125, 0.211181640625, 0.2298583984375, 0.24853515625, 0.2672119140625, 0.285888671875, 0.3045654296875, 0.3232421875, 0.3419189453125, 0.360595703125, 0.3792724609375, 0.39794921875, 0.4166259765625, 0.435302734375, 0.4539794921875, 0.47265625, 0.4913330078125, 0.510009765625, 0.5286865234375, 0.54736328125, 0.5660400390625, 0.584716796875, 0.6033935546875, 0.6220703125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 2.0, 9.0, 9.0, 6.0, 13.0, 14.0, 12.0, 14.0, 18.0, 19.0, 20.0, 32.0, 28.0, 40.0, 38.0, 30.0, 47.0, 43.0, 42.0, 38.0, 1078.0, 46.0, 33.0, 46.0, 37.0, 38.0, 23.0, 38.0, 28.0, 20.0, 29.0, 24.0, 22.0, 14.0, 18.0, 6.0, 11.0, 5.0, 10.0, 6.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.455078125, -2.381866455078125, -2.30865478515625, -2.235443115234375, -2.1622314453125, -2.089019775390625, -2.01580810546875, -1.942596435546875, -1.869384765625, -1.796173095703125, -1.72296142578125, -1.649749755859375, -1.5765380859375, -1.503326416015625, -1.43011474609375, -1.356903076171875, -1.28369140625, -1.210479736328125, -1.13726806640625, -1.064056396484375, -0.9908447265625, -0.917633056640625, -0.84442138671875, -0.771209716796875, -0.697998046875, -0.624786376953125, -0.55157470703125, -0.478363037109375, -0.4051513671875, -0.331939697265625, -0.25872802734375, -0.185516357421875, -0.1123046875, -0.039093017578125, 0.03411865234375, 0.107330322265625, 0.1805419921875, 0.253753662109375, 0.32696533203125, 0.400177001953125, 0.473388671875, 0.546600341796875, 0.61981201171875, 0.693023681640625, 0.7662353515625, 0.839447021484375, 0.91265869140625, 0.985870361328125, 1.05908203125, 1.132293701171875, 1.20550537109375, 1.278717041015625, 1.3519287109375, 1.425140380859375, 1.49835205078125, 1.571563720703125, 1.644775390625, 1.717987060546875, 1.79119873046875, 1.864410400390625, 1.9376220703125, 2.010833740234375, 2.08404541015625, 2.157257080078125, 2.23046875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 13.0, 24.0, 29.0, 53.0, 77.0, 99.0, 151.0, 207.0, 338.0, 565.0, 872.0, 1329.0, 1963.0, 2963.0, 4579.0, 7015.0, 10805.0, 16451.0, 25667.0, 39487.0, 60665.0, 93531.0, 135746.0, 1205362.0, 166106.0, 112137.0, 74527.0, 47885.0, 30734.0, 20298.0, 13060.0, 8462.0, 5531.0, 3642.0, 2294.0, 1510.0, 1010.0, 690.0, 410.0, 274.0, 188.0, 123.0, 84.0, 55.0, 33.0, 29.0, 20.0, 12.0, 6.0, 1.0, 8.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.2359619140625, -0.22852516174316406, -0.22108840942382812, -0.2136516571044922, -0.20621490478515625, -0.1987781524658203, -0.19134140014648438, -0.18390464782714844, -0.1764678955078125, -0.16903114318847656, -0.16159439086914062, -0.1541576385498047, -0.14672088623046875, -0.1392841339111328, -0.13184738159179688, -0.12441062927246094, -0.116973876953125, -0.10953712463378906, -0.10210037231445312, -0.09466361999511719, -0.08722686767578125, -0.07979011535644531, -0.07235336303710938, -0.06491661071777344, -0.0574798583984375, -0.05004310607910156, -0.042606353759765625, -0.03516960144042969, -0.02773284912109375, -0.020296096801757812, -0.012859344482421875, -0.0054225921630859375, 0.00201416015625, 0.009450912475585938, 0.016887664794921875, 0.024324417114257812, 0.03176116943359375, 0.03919792175292969, 0.046634674072265625, 0.05407142639160156, 0.0615081787109375, 0.06894493103027344, 0.07638168334960938, 0.08381843566894531, 0.09125518798828125, 0.09869194030761719, 0.10612869262695312, 0.11356544494628906, 0.121002197265625, 0.12843894958496094, 0.13587570190429688, 0.1433124542236328, 0.15074920654296875, 0.1581859588623047, 0.16562271118164062, 0.17305946350097656, 0.1804962158203125, 0.18793296813964844, 0.19536972045898438, 0.2028064727783203, 0.21024322509765625, 0.2176799774169922, 0.22511672973632812, 0.23255348205566406, 0.239990234375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 10.0, 16.0, 15.0, 20.0, 19.0, 41.0, 48.0, 73.0, 106.0, 107.0, 123.0, 99.0, 55.0, 42.0, 39.0, 30.0, 20.0, 23.0, 14.0, 15.0, 7.0, 3.0, 10.0, 2.0, 10.0, 5.0, 6.0, 5.0, 2.0, 1.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00750732421875, -0.007273674011230469, -0.0070400238037109375, -0.006806373596191406, -0.006572723388671875, -0.006339073181152344, -0.0061054229736328125, -0.005871772766113281, -0.00563812255859375, -0.005404472351074219, -0.0051708221435546875, -0.004937171936035156, -0.004703521728515625, -0.004469871520996094, -0.0042362213134765625, -0.004002571105957031, -0.0037689208984375, -0.0035352706909179688, -0.0033016204833984375, -0.0030679702758789062, -0.002834320068359375, -0.0026006698608398438, -0.0023670196533203125, -0.0021333694458007812, -0.00189971923828125, -0.0016660690307617188, -0.0014324188232421875, -0.0011987686157226562, -0.000965118408203125, -0.0007314682006835938, -0.0004978179931640625, -0.00026416778564453125, -3.0517578125e-05, 0.00020313262939453125, 0.0004367828369140625, 0.0006704330444335938, 0.000904083251953125, 0.0011377334594726562, 0.0013713836669921875, 0.0016050338745117188, 0.00183868408203125, 0.0020723342895507812, 0.0023059844970703125, 0.0025396347045898438, 0.002773284912109375, 0.0030069351196289062, 0.0032405853271484375, 0.0034742355346679688, 0.0037078857421875, 0.003941535949707031, 0.0041751861572265625, 0.004408836364746094, 0.004642486572265625, 0.004876136779785156, 0.0051097869873046875, 0.005343437194824219, 0.00557708740234375, 0.005810737609863281, 0.0060443878173828125, 0.006278038024902344, 0.006511688232421875, 0.006745338439941406, 0.0069789886474609375, 0.007212638854980469, 0.0074462890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 8.0, 4.0, 7.0, 15.0, 9.0, 11.0, 9.0, 26.0, 31.0, 33.0, 42.0, 66.0, 96.0, 140.0, 324.0, 1235.0, 884121.0, 160801.0, 834.0, 304.0, 133.0, 91.0, 56.0, 38.0, 19.0, 31.0, 14.0, 8.0, 10.0, 6.0, 6.0, 1.0, 5.0, 4.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1441650390625, -0.13934326171875, -0.134521484375, -0.12969970703125, -0.1248779296875, -0.12005615234375, -0.115234375, -0.11041259765625, -0.1055908203125, -0.10076904296875, -0.095947265625, -0.09112548828125, -0.0863037109375, -0.08148193359375, -0.07666015625, -0.07183837890625, -0.0670166015625, -0.06219482421875, -0.057373046875, -0.05255126953125, -0.0477294921875, -0.04290771484375, -0.0380859375, -0.03326416015625, -0.0284423828125, -0.02362060546875, -0.018798828125, -0.01397705078125, -0.0091552734375, -0.00433349609375, 0.00048828125, 0.00531005859375, 0.0101318359375, 0.01495361328125, 0.019775390625, 0.02459716796875, 0.0294189453125, 0.03424072265625, 0.0390625, 0.04388427734375, 0.0487060546875, 0.05352783203125, 0.058349609375, 0.06317138671875, 0.0679931640625, 0.07281494140625, 0.07763671875, 0.08245849609375, 0.0872802734375, 0.09210205078125, 0.096923828125, 0.10174560546875, 0.1065673828125, 0.11138916015625, 0.1162109375, 0.12103271484375, 0.1258544921875, 0.13067626953125, 0.135498046875, 0.14031982421875, 0.1451416015625, 0.14996337890625, 0.15478515625, 0.15960693359375, 0.1644287109375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 20.0, 164.0, 557.0, 199.0, 49.0, 23.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011133488267660141, -0.010367042385041714, -0.009600597433745861, -0.008834151551127434, -0.008067706599831581, -0.007301260717213154, -0.006534815300256014, -0.005768369883298874, -0.005001924466341734, -0.004235479049384594, -0.003469033632427454, -0.0027025879826396704, -0.0019361425656825304, -0.0011696971487253904, -0.0004032514989376068, 0.00036319391801953316, 0.0011296393349766731, 0.001896084751933813, 0.002662530168890953, 0.0034289758186787367, 0.004195421002805233, 0.00496186688542366, 0.0057283123023808, 0.00649475771933794, 0.00726120313629508, 0.00802764855325222, 0.008794094435870647, 0.0095605393871665, 0.010326985269784927, 0.01109343022108078, 0.011859876103699207, 0.012626321986317635, 0.013392766937613487, 0.014159212820231915, 0.014925657771527767, 0.015692103654146194, 0.016458548605442047, 0.0172249935567379, 0.0179914403706789, 0.018757885321974754, 0.019524330273270607, 0.02029077522456646, 0.02105722203850746, 0.021823666989803314, 0.022590111941099167, 0.02335655689239502, 0.02412300370633602, 0.024889448657631874, 0.025655895471572876, 0.02642234042286873, 0.02718878723680973, 0.027955232188105583, 0.028721677139401436, 0.02948812209069729, 0.03025456890463829, 0.031021013855934143, 0.031787458807229996, 0.03255390375852585, 0.0333203487098217, 0.034086793661117554, 0.034853242337703705, 0.03561968728899956, 0.03638613224029541, 0.03715257719159126, 0.037919022142887115]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 2.0, 3.0, 6.0, 9.0, 7.0, 11.0, 10.0, 16.0, 16.0, 26.0, 19.0, 18.0, 28.0, 29.0, 28.0, 41.0, 35.0, 47.0, 44.0, 35.0, 43.0, 44.0, 33.0, 42.0, 50.0, 39.0, 31.0, 37.0, 41.0, 33.0, 28.0, 27.0, 23.0, 23.0, 15.0, 14.0, 9.0, 9.0, 13.0, 5.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004331350326538086, -0.0042100828140974045, -0.004088815301656723, -0.0039675477892160416, -0.00384628027677536, -0.0037250127643346786, -0.003603745251893997, -0.0034824777394533157, -0.0033612102270126343, -0.003239942714571953, -0.0031186752021312714, -0.00299740768969059, -0.0028761401772499084, -0.002754872664809227, -0.0026336051523685455, -0.002512337639927864, -0.0023910701274871826, -0.002269802615046501, -0.0021485351026058197, -0.0020272675901651382, -0.0019060000777244568, -0.0017847325652837753, -0.0016634650528430939, -0.0015421975404024124, -0.001420930027961731, -0.0012996625155210495, -0.001178395003080368, -0.0010571274906396866, -0.0009358599781990051, -0.0008145924657583237, -0.0006933249533176422, -0.0005720574408769608, -0.0004507899284362793, -0.00032952241599559784, -0.00020825490355491638, -8.698739111423492e-05, 3.428012132644653e-05, 0.000155547633767128, 0.00027681514620780945, 0.0003980826586484909, 0.0005193501710891724, 0.0006406176835298538, 0.0007618851959705353, 0.0008831527084112167, 0.0010044202208518982, 0.0011256877332925797, 0.001246955245733261, 0.0013682227581739426, 0.001489490270614624, 0.0016107577830553055, 0.001732025295495987, 0.0018532928079366684, 0.00197456032037735, 0.0020958278328180313, 0.0022170953452587128, 0.0023383628576993942, 0.0024596303701400757, 0.002580897882580757, 0.0027021653950214386, 0.00282343290746212, 0.0029447004199028015, 0.003065967932343483, 0.0031872354447841644, 0.003308502957224846, 0.0034297704696655273]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 2.0, 6.0, 15.0, 11.0, 9.0, 14.0, 11.0, 15.0, 24.0, 26.0, 26.0, 25.0, 35.0, 29.0, 33.0, 44.0, 42.0, 40.0, 39.0, 40.0, 33.0, 40.0, 36.0, 48.0, 29.0, 35.0, 28.0, 42.0, 29.0, 34.0, 23.0, 14.0, 18.0, 16.0, 18.0, 3.0, 17.0, 7.0, 6.0, 5.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.48828125, -3.385406494140625, -3.28253173828125, -3.179656982421875, -3.0767822265625, -2.973907470703125, -2.87103271484375, -2.768157958984375, -2.665283203125, -2.562408447265625, -2.45953369140625, -2.356658935546875, -2.2537841796875, -2.150909423828125, -2.04803466796875, -1.945159912109375, -1.84228515625, -1.739410400390625, -1.63653564453125, -1.533660888671875, -1.4307861328125, -1.327911376953125, -1.22503662109375, -1.122161865234375, -1.019287109375, -0.916412353515625, -0.81353759765625, -0.710662841796875, -0.6077880859375, -0.504913330078125, -0.40203857421875, -0.299163818359375, -0.1962890625, -0.093414306640625, 0.00946044921875, 0.112335205078125, 0.2152099609375, 0.318084716796875, 0.42095947265625, 0.523834228515625, 0.626708984375, 0.729583740234375, 0.83245849609375, 0.935333251953125, 1.0382080078125, 1.141082763671875, 1.24395751953125, 1.346832275390625, 1.44970703125, 1.552581787109375, 1.65545654296875, 1.758331298828125, 1.8612060546875, 1.964080810546875, 2.06695556640625, 2.169830322265625, 2.272705078125, 2.375579833984375, 2.47845458984375, 2.581329345703125, 2.6842041015625, 2.787078857421875, 2.88995361328125, 2.992828369140625, 3.095703125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 13.0, 12.0, 12.0, 14.0, 36.0, 49.0, 57.0, 81.0, 121.0, 187.0, 322.0, 506.0, 982.0, 1980.0, 4152.0, 9199.0, 21798.0, 52024.0, 125233.0, 309893.0, 307080.0, 124130.0, 51649.0, 21123.0, 9220.0, 4120.0, 2076.0, 1033.0, 535.0, 320.0, 177.0, 122.0, 70.0, 61.0, 44.0, 30.0, 18.0, 17.0, 9.0, 19.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.205841064453125, -3.09527587890625, -2.984710693359375, -2.8741455078125, -2.763580322265625, -2.65301513671875, -2.542449951171875, -2.431884765625, -2.321319580078125, -2.21075439453125, -2.100189208984375, -1.9896240234375, -1.879058837890625, -1.76849365234375, -1.657928466796875, -1.54736328125, -1.436798095703125, -1.32623291015625, -1.215667724609375, -1.1051025390625, -0.994537353515625, -0.88397216796875, -0.773406982421875, -0.662841796875, -0.552276611328125, -0.44171142578125, -0.331146240234375, -0.2205810546875, -0.110015869140625, 0.00054931640625, 0.111114501953125, 0.2216796875, 0.332244873046875, 0.44281005859375, 0.553375244140625, 0.6639404296875, 0.774505615234375, 0.88507080078125, 0.995635986328125, 1.106201171875, 1.216766357421875, 1.32733154296875, 1.437896728515625, 1.5484619140625, 1.659027099609375, 1.76959228515625, 1.880157470703125, 1.99072265625, 2.101287841796875, 2.21185302734375, 2.322418212890625, 2.4329833984375, 2.543548583984375, 2.65411376953125, 2.764678955078125, 2.875244140625, 2.985809326171875, 3.09637451171875, 3.206939697265625, 3.3175048828125, 3.428070068359375, 3.53863525390625, 3.649200439453125, 3.759765625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 9.0, 10.0, 12.0, 16.0, 19.0, 29.0, 18.0, 23.0, 35.0, 36.0, 44.0, 53.0, 62.0, 73.0, 141.0, 347.0, 1391.0, 205.0, 86.0, 66.0, 36.0, 53.0, 38.0, 36.0, 32.0, 29.0, 24.0, 20.0, 19.0, 10.0, 14.0, 11.0, 8.0, 8.0, 6.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.535400390625, -11.12548828125, -10.715576171875, -10.3056640625, -9.895751953125, -9.48583984375, -9.075927734375, -8.666015625, -8.256103515625, -7.84619140625, -7.436279296875, -7.0263671875, -6.616455078125, -6.20654296875, -5.796630859375, -5.38671875, -4.976806640625, -4.56689453125, -4.156982421875, -3.7470703125, -3.337158203125, -2.92724609375, -2.517333984375, -2.107421875, -1.697509765625, -1.28759765625, -0.877685546875, -0.4677734375, -0.057861328125, 0.35205078125, 0.761962890625, 1.171875, 1.581787109375, 1.99169921875, 2.401611328125, 2.8115234375, 3.221435546875, 3.63134765625, 4.041259765625, 4.451171875, 4.861083984375, 5.27099609375, 5.680908203125, 6.0908203125, 6.500732421875, 6.91064453125, 7.320556640625, 7.73046875, 8.140380859375, 8.55029296875, 8.960205078125, 9.3701171875, 9.780029296875, 10.18994140625, 10.599853515625, 11.009765625, 11.419677734375, 11.82958984375, 12.239501953125, 12.6494140625, 13.059326171875, 13.46923828125, 13.879150390625, 14.2890625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 4.0, 14.0, 19.0, 21.0, 44.0, 69.0, 121.0, 197.0, 416.0, 1411.0, 47633.0, 3091575.0, 2987.0, 589.0, 230.0, 131.0, 91.0, 49.0, 27.0, 26.0, 14.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.23046875, -60.0234375, -57.81640625, -55.609375, -53.40234375, -51.1953125, -48.98828125, -46.78125, -44.57421875, -42.3671875, -40.16015625, -37.953125, -35.74609375, -33.5390625, -31.33203125, -29.125, -26.91796875, -24.7109375, -22.50390625, -20.296875, -18.08984375, -15.8828125, -13.67578125, -11.46875, -9.26171875, -7.0546875, -4.84765625, -2.640625, -0.43359375, 1.7734375, 3.98046875, 6.1875, 8.39453125, 10.6015625, 12.80859375, 15.015625, 17.22265625, 19.4296875, 21.63671875, 23.84375, 26.05078125, 28.2578125, 30.46484375, 32.671875, 34.87890625, 37.0859375, 39.29296875, 41.5, 43.70703125, 45.9140625, 48.12109375, 50.328125, 52.53515625, 54.7421875, 56.94921875, 59.15625, 61.36328125, 63.5703125, 65.77734375, 67.984375, 70.19140625, 72.3984375, 74.60546875, 76.8125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 97.0, 794.0, 120.0], "bins": [-266.9373474121094, -262.6640319824219, -258.3907165527344, -254.11740112304688, -249.84408569335938, -245.57077026367188, -241.29745483398438, -237.02415466308594, -232.75083923339844, -228.47752380371094, -224.20420837402344, -219.93089294433594, -215.65757751464844, -211.38427734375, -207.1109619140625, -202.837646484375, -198.5643310546875, -194.291015625, -190.0177001953125, -185.744384765625, -181.4710693359375, -177.19775390625, -172.9244384765625, -168.65113830566406, -164.3778076171875, -160.1044921875, -155.8311767578125, -151.557861328125, -147.2845458984375, -143.01123046875, -138.7379150390625, -134.46461486816406, -130.19131469726562, -125.91799926757812, -121.64468383789062, -117.37136840820312, -113.09806060791016, -108.82474517822266, -104.55142974853516, -100.27811431884766, -96.00479888916016, -91.73148345947266, -87.45816802978516, -83.18486022949219, -78.91154479980469, -74.63822937011719, -70.36491394042969, -66.09159851074219, -61.81828689575195, -57.54497146606445, -53.27165985107422, -48.99834442138672, -44.72502899169922, -40.451717376708984, -36.178401947021484, -31.905088424682617, -27.631776809692383, -23.358463287353516, -19.085147857666016, -14.811834335327148, -10.538520812988281, -6.265207290649414, -1.991891860961914, 2.281421661376953, 6.5547356605529785]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 6.0, 12.0, 10.0, 16.0, 14.0, 21.0, 21.0, 23.0, 30.0, 19.0, 30.0, 29.0, 34.0, 30.0, 29.0, 30.0, 33.0, 43.0, 38.0, 29.0, 51.0, 25.0, 53.0, 33.0, 43.0, 25.0, 29.0, 27.0, 28.0, 24.0, 16.0, 14.0, 30.0, 16.0, 12.0, 13.0, 14.0, 14.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-27.907957077026367, -27.000696182250977, -26.093433380126953, -25.186172485351562, -24.27890968322754, -23.37164878845215, -22.464385986328125, -21.557125091552734, -20.649864196777344, -19.742603302001953, -18.83534049987793, -17.92807960510254, -17.020816802978516, -16.113555908203125, -15.206294059753418, -14.299032211303711, -13.391769409179688, -12.48450756072998, -11.577245712280273, -10.669984817504883, -9.76272201538086, -8.855461120605469, -7.948199272155762, -7.040937423706055, -6.133675575256348, -5.226413726806641, -4.319151878356934, -3.4118905067443848, -2.5046286582946777, -1.5973668098449707, -0.6901054382324219, 0.21715641021728516, 1.1244182586669922, 2.031680107116699, 2.938941717147827, 3.846203327178955, 4.753465175628662, 5.660727024078369, 6.567988395690918, 7.475250244140625, 8.382512092590332, 9.289773941040039, 10.197035789489746, 11.104297637939453, 12.011558532714844, 12.918821334838867, 13.826082229614258, 14.733344078063965, 15.640605926513672, 16.547866821289062, 17.455129623413086, 18.362390518188477, 19.2696533203125, 20.17691421508789, 21.08417510986328, 21.991437911987305, 22.898700714111328, 23.80596160888672, 24.713224411010742, 25.620485305786133, 26.527748107910156, 27.435009002685547, 28.342269897460938, 29.24953269958496, 30.15679359436035]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 7.0, 3.0, 9.0, 9.0, 22.0, 7.0, 9.0, 14.0, 21.0, 15.0, 15.0, 27.0, 27.0, 36.0, 28.0, 38.0, 32.0, 40.0, 30.0, 49.0, 31.0, 37.0, 37.0, 39.0, 40.0, 37.0, 28.0, 26.0, 37.0, 31.0, 25.0, 31.0, 24.0, 22.0, 12.0, 22.0, 10.0, 13.0, 10.0, 8.0, 7.0, 6.0, 6.0, 5.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.35546875, -3.248748779296875, -3.14202880859375, -3.035308837890625, -2.9285888671875, -2.821868896484375, -2.71514892578125, -2.608428955078125, -2.501708984375, -2.394989013671875, -2.28826904296875, -2.181549072265625, -2.0748291015625, -1.968109130859375, -1.86138916015625, -1.754669189453125, -1.64794921875, -1.541229248046875, -1.43450927734375, -1.327789306640625, -1.2210693359375, -1.114349365234375, -1.00762939453125, -0.900909423828125, -0.794189453125, -0.687469482421875, -0.58074951171875, -0.474029541015625, -0.3673095703125, -0.260589599609375, -0.15386962890625, -0.047149658203125, 0.0595703125, 0.166290283203125, 0.27301025390625, 0.379730224609375, 0.4864501953125, 0.593170166015625, 0.69989013671875, 0.806610107421875, 0.913330078125, 1.020050048828125, 1.12677001953125, 1.233489990234375, 1.3402099609375, 1.446929931640625, 1.55364990234375, 1.660369873046875, 1.76708984375, 1.873809814453125, 1.98052978515625, 2.087249755859375, 2.1939697265625, 2.300689697265625, 2.40740966796875, 2.514129638671875, 2.620849609375, 2.727569580078125, 2.83428955078125, 2.941009521484375, 3.0477294921875, 3.154449462890625, 3.26116943359375, 3.367889404296875, 3.474609375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 6.0, 5.0, 9.0, 5.0, 8.0, 10.0, 12.0, 19.0, 19.0, 23.0, 30.0, 47.0, 41.0, 58.0, 63.0, 87.0, 109.0, 238.0, 402.0, 1140.0, 3927.0, 19149.0, 131364.0, 887368.0, 2145588.0, 852187.0, 127244.0, 18909.0, 3831.0, 1131.0, 428.0, 224.0, 164.0, 91.0, 75.0, 49.0, 50.0, 30.0, 30.0, 23.0, 25.0, 10.0, 9.0, 17.0, 8.0, 1.0, 13.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-7.44140625, -7.22564697265625, -7.0098876953125, -6.79412841796875, -6.578369140625, -6.36260986328125, -6.1468505859375, -5.93109130859375, -5.71533203125, -5.49957275390625, -5.2838134765625, -5.06805419921875, -4.852294921875, -4.63653564453125, -4.4207763671875, -4.20501708984375, -3.9892578125, -3.77349853515625, -3.5577392578125, -3.34197998046875, -3.126220703125, -2.91046142578125, -2.6947021484375, -2.47894287109375, -2.26318359375, -2.04742431640625, -1.8316650390625, -1.61590576171875, -1.400146484375, -1.18438720703125, -0.9686279296875, -0.75286865234375, -0.537109375, -0.32135009765625, -0.1055908203125, 0.11016845703125, 0.325927734375, 0.54168701171875, 0.7574462890625, 0.97320556640625, 1.18896484375, 1.40472412109375, 1.6204833984375, 1.83624267578125, 2.052001953125, 2.26776123046875, 2.4835205078125, 2.69927978515625, 2.9150390625, 3.13079833984375, 3.3465576171875, 3.56231689453125, 3.778076171875, 3.99383544921875, 4.2095947265625, 4.42535400390625, 4.64111328125, 4.85687255859375, 5.0726318359375, 5.28839111328125, 5.504150390625, 5.71990966796875, 5.9356689453125, 6.15142822265625, 6.3671875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 3.0, 7.0, 7.0, 17.0, 15.0, 26.0, 32.0, 51.0, 48.0, 69.0, 95.0, 104.0, 143.0, 207.0, 282.0, 355.0, 398.0, 430.0, 423.0, 342.0, 266.0, 187.0, 151.0, 108.0, 88.0, 63.0, 38.0, 33.0, 26.0, 12.0, 17.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.1015625, -8.87042236328125, -8.6392822265625, -8.40814208984375, -8.177001953125, -7.94586181640625, -7.7147216796875, -7.48358154296875, -7.25244140625, -7.02130126953125, -6.7901611328125, -6.55902099609375, -6.327880859375, -6.09674072265625, -5.8656005859375, -5.63446044921875, -5.4033203125, -5.17218017578125, -4.9410400390625, -4.70989990234375, -4.478759765625, -4.24761962890625, -4.0164794921875, -3.78533935546875, -3.55419921875, -3.32305908203125, -3.0919189453125, -2.86077880859375, -2.629638671875, -2.39849853515625, -2.1673583984375, -1.93621826171875, -1.705078125, -1.47393798828125, -1.2427978515625, -1.01165771484375, -0.780517578125, -0.54937744140625, -0.3182373046875, -0.08709716796875, 0.14404296875, 0.37518310546875, 0.6063232421875, 0.83746337890625, 1.068603515625, 1.29974365234375, 1.5308837890625, 1.76202392578125, 1.9931640625, 2.22430419921875, 2.4554443359375, 2.68658447265625, 2.917724609375, 3.14886474609375, 3.3800048828125, 3.61114501953125, 3.84228515625, 4.07342529296875, 4.3045654296875, 4.53570556640625, 4.766845703125, 4.99798583984375, 5.2291259765625, 5.46026611328125, 5.69140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 11.0, 17.0, 18.0, 28.0, 32.0, 50.0, 72.0, 116.0, 163.0, 198.0, 322.0, 552.0, 4958.0, 2214441.0, 1967222.0, 4431.0, 559.0, 316.0, 201.0, 134.0, 114.0, 83.0, 54.0, 49.0, 31.0, 27.0, 21.0, 15.0, 11.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.52685546875, -23.4599609375, -22.39306640625, -21.326171875, -20.25927734375, -19.1923828125, -18.12548828125, -17.05859375, -15.99169921875, -14.9248046875, -13.85791015625, -12.791015625, -11.72412109375, -10.6572265625, -9.59033203125, -8.5234375, -7.45654296875, -6.3896484375, -5.32275390625, -4.255859375, -3.18896484375, -2.1220703125, -1.05517578125, 0.01171875, 1.07861328125, 2.1455078125, 3.21240234375, 4.279296875, 5.34619140625, 6.4130859375, 7.47998046875, 8.546875, 9.61376953125, 10.6806640625, 11.74755859375, 12.814453125, 13.88134765625, 14.9482421875, 16.01513671875, 17.08203125, 18.14892578125, 19.2158203125, 20.28271484375, 21.349609375, 22.41650390625, 23.4833984375, 24.55029296875, 25.6171875, 26.68408203125, 27.7509765625, 28.81787109375, 29.884765625, 30.95166015625, 32.0185546875, 33.08544921875, 34.15234375, 35.21923828125, 36.2861328125, 37.35302734375, 38.419921875, 39.48681640625, 40.5537109375, 41.62060546875, 42.6875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 24.0, 174.0, 440.0, 323.0, 53.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.8077392578125, -206.39984130859375, -201.99192810058594, -197.58401489257812, -193.17611694335938, -188.76821899414062, -184.3603057861328, -179.952392578125, -175.54449462890625, -171.1365966796875, -166.7286834716797, -162.32077026367188, -157.91287231445312, -153.50497436523438, -149.09706115722656, -144.68914794921875, -140.28125, -135.87335205078125, -131.46543884277344, -127.05753326416016, -122.64962768554688, -118.2417221069336, -113.83381652832031, -109.42591094970703, -105.01800537109375, -100.61009979248047, -96.20219421386719, -91.7942886352539, -87.38638305664062, -82.97847747802734, -78.57057189941406, -74.16266632080078, -69.75475311279297, -65.34684753417969, -60.938941955566406, -56.531036376953125, -52.123130798339844, -47.71522521972656, -43.30731964111328, -38.8994140625, -34.49150848388672, -30.083602905273438, -25.675697326660156, -21.267791748046875, -16.859886169433594, -12.451980590820312, -8.044075012207031, -3.63616943359375, 0.7717361450195312, 5.1796417236328125, 9.587547302246094, 13.995452880859375, 18.403358459472656, 22.811264038085938, 27.21916961669922, 31.6270751953125, 36.03498077392578, 40.44288635253906, 44.850791931152344, 49.258697509765625, 53.666603088378906, 58.07450866699219, 62.48241424560547, 66.89031982421875, 71.29822540283203]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 8.0, 5.0, 5.0, 11.0, 10.0, 9.0, 16.0, 10.0, 20.0, 19.0, 17.0, 22.0, 21.0, 32.0, 34.0, 30.0, 39.0, 33.0, 35.0, 44.0, 38.0, 42.0, 38.0, 34.0, 38.0, 26.0, 48.0, 39.0, 34.0, 31.0, 30.0, 23.0, 27.0, 23.0, 21.0, 6.0, 16.0, 9.0, 13.0, 8.0, 8.0, 7.0, 5.0, 8.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-22.873281478881836, -22.197052001953125, -21.520822525024414, -20.844593048095703, -20.168363571166992, -19.49213409423828, -18.815906524658203, -18.13967514038086, -17.46344757080078, -16.78721809387207, -16.11098861694336, -15.434759140014648, -14.758529663085938, -14.082300186157227, -13.406071662902832, -12.729842185974121, -12.053611755371094, -11.377382278442383, -10.701152801513672, -10.024923324584961, -9.34869384765625, -8.672464370727539, -7.9962358474731445, -7.320006370544434, -6.643776893615723, -5.967547416687012, -5.291317939758301, -4.615088939666748, -3.938859462738037, -3.262629985809326, -2.5864009857177734, -1.9101715087890625, -1.2339439392089844, -0.557714581489563, 0.1185147762298584, 0.7947440147399902, 1.4709734916687012, 2.147202968597412, 2.823431968688965, 3.499661445617676, 4.175890922546387, 4.852120399475098, 5.528349876403809, 6.204578876495361, 6.880808353424072, 7.557037830352783, 8.233266830444336, 8.909496307373047, 9.585725784301758, 10.261955261230469, 10.93818473815918, 11.61441421508789, 12.290643692016602, 12.966873168945312, 13.643101692199707, 14.319331169128418, 14.995560646057129, 15.67179012298584, 16.348018646240234, 17.024248123168945, 17.700477600097656, 18.376707077026367, 19.052936553955078, 19.72916603088379, 20.4053955078125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 4.0, 8.0, 8.0, 3.0, 8.0, 9.0, 22.0, 20.0, 18.0, 23.0, 32.0, 22.0, 23.0, 22.0, 36.0, 28.0, 30.0, 38.0, 42.0, 42.0, 41.0, 31.0, 32.0, 30.0, 45.0, 34.0, 47.0, 23.0, 26.0, 23.0, 30.0, 24.0, 26.0, 17.0, 15.0, 19.0, 19.0, 13.0, 10.0, 10.0, 5.0, 5.0, 4.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.236328125, -3.13580322265625, -3.0352783203125, -2.93475341796875, -2.834228515625, -2.73370361328125, -2.6331787109375, -2.53265380859375, -2.43212890625, -2.33160400390625, -2.2310791015625, -2.13055419921875, -2.030029296875, -1.92950439453125, -1.8289794921875, -1.72845458984375, -1.6279296875, -1.52740478515625, -1.4268798828125, -1.32635498046875, -1.225830078125, -1.12530517578125, -1.0247802734375, -0.92425537109375, -0.82373046875, -0.72320556640625, -0.6226806640625, -0.52215576171875, -0.421630859375, -0.32110595703125, -0.2205810546875, -0.12005615234375, -0.01953125, 0.08099365234375, 0.1815185546875, 0.28204345703125, 0.382568359375, 0.48309326171875, 0.5836181640625, 0.68414306640625, 0.78466796875, 0.88519287109375, 0.9857177734375, 1.08624267578125, 1.186767578125, 1.28729248046875, 1.3878173828125, 1.48834228515625, 1.5888671875, 1.68939208984375, 1.7899169921875, 1.89044189453125, 1.990966796875, 2.09149169921875, 2.1920166015625, 2.29254150390625, 2.39306640625, 2.49359130859375, 2.5941162109375, 2.69464111328125, 2.795166015625, 2.89569091796875, 2.9962158203125, 3.09674072265625, 3.197265625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 14.0, 28.0, 23.0, 44.0, 58.0, 91.0, 190.0, 332.0, 570.0, 1113.0, 2076.0, 3885.0, 7462.0, 14883.0, 30672.0, 66063.0, 144194.0, 279195.0, 257144.0, 127780.0, 58250.0, 26768.0, 13261.0, 6741.0, 3609.0, 1863.0, 994.0, 495.0, 282.0, 158.0, 105.0, 68.0, 39.0, 24.0, 18.0, 9.0, 12.0, 10.0, 9.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4546546936035156, -0.43640899658203125, -0.4181632995605469, -0.3999176025390625, -0.3816719055175781, -0.36342620849609375, -0.3451805114746094, -0.326934814453125, -0.3086891174316406, -0.29044342041015625, -0.2721977233886719, -0.2539520263671875, -0.23570632934570312, -0.21746063232421875, -0.19921493530273438, -0.18096923828125, -0.16272354125976562, -0.14447784423828125, -0.12623214721679688, -0.1079864501953125, -0.08974075317382812, -0.07149505615234375, -0.053249359130859375, -0.035003662109375, -0.016757965087890625, 0.00148773193359375, 0.019733428955078125, 0.0379791259765625, 0.056224822998046875, 0.07447052001953125, 0.09271621704101562, 0.1109619140625, 0.12920761108398438, 0.14745330810546875, 0.16569900512695312, 0.1839447021484375, 0.20219039916992188, 0.22043609619140625, 0.23868179321289062, 0.256927490234375, 0.2751731872558594, 0.29341888427734375, 0.3116645812988281, 0.3299102783203125, 0.3481559753417969, 0.36640167236328125, 0.3846473693847656, 0.40289306640625, 0.4211387634277344, 0.43938446044921875, 0.4576301574707031, 0.4758758544921875, 0.4941215515136719, 0.5123672485351562, 0.5306129455566406, 0.548858642578125, 0.5671043395996094, 0.5853500366210938, 0.6035957336425781, 0.6218414306640625, 0.6400871276855469, 0.6583328247070312, 0.6765785217285156, 0.69482421875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 5.0, 1.0, 8.0, 5.0, 9.0, 7.0, 12.0, 5.0, 12.0, 12.0, 18.0, 23.0, 23.0, 24.0, 28.0, 39.0, 28.0, 20.0, 36.0, 44.0, 49.0, 41.0, 1063.0, 44.0, 33.0, 43.0, 31.0, 41.0, 33.0, 40.0, 42.0, 29.0, 20.0, 17.0, 19.0, 20.0, 13.0, 19.0, 15.0, 14.0, 13.0, 10.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.435546875, -2.363494873046875, -2.29144287109375, -2.219390869140625, -2.1473388671875, -2.075286865234375, -2.00323486328125, -1.931182861328125, -1.859130859375, -1.787078857421875, -1.71502685546875, -1.642974853515625, -1.5709228515625, -1.498870849609375, -1.42681884765625, -1.354766845703125, -1.28271484375, -1.210662841796875, -1.13861083984375, -1.066558837890625, -0.9945068359375, -0.922454833984375, -0.85040283203125, -0.778350830078125, -0.706298828125, -0.634246826171875, -0.56219482421875, -0.490142822265625, -0.4180908203125, -0.346038818359375, -0.27398681640625, -0.201934814453125, -0.1298828125, -0.057830810546875, 0.01422119140625, 0.086273193359375, 0.1583251953125, 0.230377197265625, 0.30242919921875, 0.374481201171875, 0.446533203125, 0.518585205078125, 0.59063720703125, 0.662689208984375, 0.7347412109375, 0.806793212890625, 0.87884521484375, 0.950897216796875, 1.02294921875, 1.095001220703125, 1.16705322265625, 1.239105224609375, 1.3111572265625, 1.383209228515625, 1.45526123046875, 1.527313232421875, 1.599365234375, 1.671417236328125, 1.74346923828125, 1.815521240234375, 1.8875732421875, 1.959625244140625, 2.03167724609375, 2.103729248046875, 2.17578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 4.0, 17.0, 18.0, 24.0, 56.0, 85.0, 119.0, 206.0, 259.0, 379.0, 584.0, 885.0, 1325.0, 2023.0, 3030.0, 4497.0, 6728.0, 10199.0, 15365.0, 23077.0, 34241.0, 51077.0, 74033.0, 105919.0, 143195.0, 1195516.0, 129256.0, 95233.0, 65333.0, 44028.0, 30114.0, 20037.0, 13574.0, 9019.0, 6004.0, 3867.0, 2518.0, 1788.0, 1156.0, 765.0, 551.0, 382.0, 213.0, 140.0, 104.0, 56.0, 55.0, 36.0, 18.0, 17.0, 8.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.22119140625, -0.21435165405273438, -0.20751190185546875, -0.20067214965820312, -0.1938323974609375, -0.18699264526367188, -0.18015289306640625, -0.17331314086914062, -0.166473388671875, -0.15963363647460938, -0.15279388427734375, -0.14595413208007812, -0.1391143798828125, -0.13227462768554688, -0.12543487548828125, -0.11859512329101562, -0.11175537109375, -0.10491561889648438, -0.09807586669921875, -0.09123611450195312, -0.0843963623046875, -0.07755661010742188, -0.07071685791015625, -0.06387710571289062, -0.057037353515625, -0.050197601318359375, -0.04335784912109375, -0.036518096923828125, -0.0296783447265625, -0.022838592529296875, -0.01599884033203125, -0.009159088134765625, -0.0023193359375, 0.004520416259765625, 0.01136016845703125, 0.018199920654296875, 0.0250396728515625, 0.031879425048828125, 0.03871917724609375, 0.045558929443359375, 0.052398681640625, 0.059238433837890625, 0.06607818603515625, 0.07291793823242188, 0.0797576904296875, 0.08659744262695312, 0.09343719482421875, 0.10027694702148438, 0.10711669921875, 0.11395645141601562, 0.12079620361328125, 0.12763595581054688, 0.1344757080078125, 0.14131546020507812, 0.14815521240234375, 0.15499496459960938, 0.161834716796875, 0.16867446899414062, 0.17551422119140625, 0.18235397338867188, 0.1891937255859375, 0.19603347778320312, 0.20287322998046875, 0.20971298217773438, 0.216552734375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 3.0, 4.0, 8.0, 7.0, 6.0, 10.0, 10.0, 12.0, 13.0, 15.0, 29.0, 19.0, 28.0, 27.0, 35.0, 42.0, 39.0, 45.0, 41.0, 53.0, 53.0, 58.0, 50.0, 33.0, 51.0, 40.0, 37.0, 34.0, 19.0, 24.0, 35.0, 19.0, 20.0, 11.0, 16.0, 10.0, 8.0, 5.0, 10.0, 8.0, 7.0, 3.0, 8.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003582000732421875, -0.0034675002098083496, -0.0033529996871948242, -0.003238499164581299, -0.0031239986419677734, -0.003009498119354248, -0.0028949975967407227, -0.0027804970741271973, -0.002665996551513672, -0.0025514960289001465, -0.002436995506286621, -0.0023224949836730957, -0.0022079944610595703, -0.002093493938446045, -0.0019789934158325195, -0.0018644928932189941, -0.0017499923706054688, -0.0016354918479919434, -0.001520991325378418, -0.0014064908027648926, -0.0012919902801513672, -0.0011774897575378418, -0.0010629892349243164, -0.000948488712310791, -0.0008339881896972656, -0.0007194876670837402, -0.0006049871444702148, -0.0004904866218566895, -0.00037598609924316406, -0.00026148557662963867, -0.00014698505401611328, -3.248453140258789e-05, 8.20159912109375e-05, 0.0001965165138244629, 0.0003110170364379883, 0.00042551755905151367, 0.0005400180816650391, 0.0006545186042785645, 0.0007690191268920898, 0.0008835196495056152, 0.0009980201721191406, 0.001112520694732666, 0.0012270212173461914, 0.0013415217399597168, 0.0014560222625732422, 0.0015705227851867676, 0.001685023307800293, 0.0017995238304138184, 0.0019140243530273438, 0.002028524875640869, 0.0021430253982543945, 0.00225752592086792, 0.0023720264434814453, 0.0024865269660949707, 0.002601027488708496, 0.0027155280113220215, 0.002830028533935547, 0.0029445290565490723, 0.0030590295791625977, 0.003173530101776123, 0.0032880306243896484, 0.003402531147003174, 0.0035170316696166992, 0.0036315321922302246, 0.00374603271484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 3.0, 5.0, 8.0, 10.0, 6.0, 13.0, 10.0, 19.0, 21.0, 26.0, 27.0, 45.0, 49.0, 52.0, 68.0, 103.0, 147.0, 283.0, 558.0, 4660.0, 803739.0, 235223.0, 2182.0, 470.0, 216.0, 135.0, 114.0, 71.0, 52.0, 59.0, 30.0, 31.0, 21.0, 18.0, 13.0, 14.0, 16.0, 7.0, 7.0, 11.0, 2.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07916259765625, -0.07675552368164062, -0.07434844970703125, -0.07194137573242188, -0.0695343017578125, -0.06712722778320312, -0.06472015380859375, -0.062313079833984375, -0.059906005859375, -0.057498931884765625, -0.05509185791015625, -0.052684783935546875, -0.0502777099609375, -0.047870635986328125, -0.04546356201171875, -0.043056488037109375, -0.0406494140625, -0.038242340087890625, -0.03583526611328125, -0.033428192138671875, -0.0310211181640625, -0.028614044189453125, -0.02620697021484375, -0.023799896240234375, -0.021392822265625, -0.018985748291015625, -0.01657867431640625, -0.014171600341796875, -0.0117645263671875, -0.009357452392578125, -0.00695037841796875, -0.004543304443359375, -0.00213623046875, 0.000270843505859375, 0.00267791748046875, 0.005084991455078125, 0.0074920654296875, 0.009899139404296875, 0.01230621337890625, 0.014713287353515625, 0.017120361328125, 0.019527435302734375, 0.02193450927734375, 0.024341583251953125, 0.0267486572265625, 0.029155731201171875, 0.03156280517578125, 0.033969879150390625, 0.036376953125, 0.038784027099609375, 0.04119110107421875, 0.043598175048828125, 0.0460052490234375, 0.048412322998046875, 0.05081939697265625, 0.053226470947265625, 0.055633544921875, 0.058040618896484375, 0.06044769287109375, 0.06285476684570312, 0.0652618408203125, 0.06766891479492188, 0.07007598876953125, 0.07248306274414062, 0.07489013671875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 20.0, 46.0, 76.0, 195.0, 232.0, 208.0, 101.0, 59.0, 39.0, 11.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003941108472645283, -0.003715698141604662, -0.0034902875777333975, -0.0032648772466927767, -0.003039466915652156, -0.0028140563517808914, -0.0025886460207402706, -0.00236323568969965, -0.002137825358659029, -0.0019124149112030864, -0.0016870045801624656, -0.001461594132706523, -0.0012361838016659021, -0.0010107733542099595, -0.0007853629067540169, -0.0005599525757133961, -0.0003345420118421316, -0.00010913160804193467, 0.00011627879575826228, 0.00034168921411037445, 0.0005670996033586562, 0.0007925099926069379, 0.0010179204400628805, 0.0012433307711035013, 0.001468741218559444, 0.0016941516660153866, 0.0019195619970560074, 0.002144972328096628, 0.0023703828919678926, 0.0025957932230085135, 0.002821203786879778, 0.0030466141179203987, 0.0032720244489610195, 0.0034974347800016403, 0.0037228453438729048, 0.003948255442082882, 0.00417366623878479, 0.004399076569825411, 0.004624486900866032, 0.0048498972319066525, 0.005075307562947273, 0.005300717893987894, 0.005526128225028515, 0.005751539021730423, 0.005976949352771044, 0.006202359683811665, 0.006427770014852285, 0.006653180345892906, 0.006878591142594814, 0.007104001473635435, 0.007329411804676056, 0.007554822601377964, 0.007780232932418585, 0.008005643263459206, 0.008231053128838539, 0.008456463925540447, 0.00868187379091978, 0.008907284587621689, 0.009132694453001022, 0.00935810524970293, 0.009583515115082264, 0.009808925911784172, 0.010034335777163506, 0.010259746573865414, 0.010485157370567322]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 6.0, 14.0, 9.0, 8.0, 13.0, 19.0, 25.0, 18.0, 34.0, 24.0, 27.0, 24.0, 36.0, 43.0, 26.0, 31.0, 24.0, 33.0, 34.0, 33.0, 54.0, 30.0, 34.0, 39.0, 33.0, 34.0, 20.0, 24.0, 23.0, 20.0, 24.0, 27.0, 25.0, 14.0, 14.0, 12.0, 17.0, 6.0, 7.0, 9.0, 7.0, 7.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0019467473030090332, -0.001883956603705883, -0.0018211659044027328, -0.0017583752050995827, -0.0016955845057964325, -0.0016327938064932823, -0.0015700031071901321, -0.001507212407886982, -0.0014444217085838318, -0.0013816310092806816, -0.0013188403099775314, -0.0012560496106743813, -0.001193258911371231, -0.001130468212068081, -0.0010676775127649307, -0.0010048868134617805, -0.0009420961141586304, -0.0008793054148554802, -0.00081651471555233, -0.0007537240162491798, -0.0006909333169460297, -0.0006281426176428795, -0.0005653519183397293, -0.0005025612190365791, -0.00043977051973342896, -0.0003769798204302788, -0.0003141891211271286, -0.0002513984218239784, -0.00018860772252082825, -0.00012581702321767807, -6.302632391452789e-05, -2.3562461137771606e-07, 6.255507469177246e-05, 0.00012534577399492264, 0.00018813647329807281, 0.000250927172601223, 0.00031371787190437317, 0.00037650857120752335, 0.0004392992705106735, 0.0005020899698138237, 0.0005648806691169739, 0.000627671368420124, 0.0006904620677232742, 0.0007532527670264244, 0.0008160434663295746, 0.0008788341656327248, 0.0009416248649358749, 0.0010044155642390251, 0.0010672062635421753, 0.0011299969628453255, 0.0011927876621484756, 0.0012555783614516258, 0.001318369060754776, 0.0013811597600579262, 0.0014439504593610764, 0.0015067411586642265, 0.0015695318579673767, 0.0016323225572705269, 0.001695113256573677, 0.0017579039558768272, 0.0018206946551799774, 0.0018834853544831276, 0.0019462760537862778, 0.002009066753089428, 0.002071857452392578]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 4.0, 8.0, 8.0, 3.0, 8.0, 9.0, 22.0, 20.0, 19.0, 22.0, 32.0, 22.0, 23.0, 22.0, 36.0, 28.0, 30.0, 39.0, 41.0, 42.0, 41.0, 31.0, 32.0, 30.0, 45.0, 34.0, 47.0, 23.0, 26.0, 23.0, 30.0, 24.0, 26.0, 17.0, 14.0, 20.0, 19.0, 13.0, 10.0, 10.0, 5.0, 5.0, 4.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.236328125, -3.13580322265625, -3.0352783203125, -2.93475341796875, -2.834228515625, -2.73370361328125, -2.6331787109375, -2.53265380859375, -2.43212890625, -2.33160400390625, -2.2310791015625, -2.13055419921875, -2.030029296875, -1.92950439453125, -1.8289794921875, -1.72845458984375, -1.6279296875, -1.52740478515625, -1.4268798828125, -1.32635498046875, -1.225830078125, -1.12530517578125, -1.0247802734375, -0.92425537109375, -0.82373046875, -0.72320556640625, -0.6226806640625, -0.52215576171875, -0.421630859375, -0.32110595703125, -0.2205810546875, -0.12005615234375, -0.01953125, 0.08099365234375, 0.1815185546875, 0.28204345703125, 0.382568359375, 0.48309326171875, 0.5836181640625, 0.68414306640625, 0.78466796875, 0.88519287109375, 0.9857177734375, 1.08624267578125, 1.186767578125, 1.28729248046875, 1.3878173828125, 1.48834228515625, 1.5888671875, 1.68939208984375, 1.7899169921875, 1.89044189453125, 1.990966796875, 2.09149169921875, 2.1920166015625, 2.29254150390625, 2.39306640625, 2.49359130859375, 2.5941162109375, 2.69464111328125, 2.795166015625, 2.89569091796875, 2.9962158203125, 3.09674072265625, 3.197265625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 9.0, 7.0, 12.0, 8.0, 11.0, 15.0, 31.0, 37.0, 59.0, 87.0, 146.0, 292.0, 562.0, 998.0, 1943.0, 3601.0, 7005.0, 13254.0, 26384.0, 59046.0, 154251.0, 365473.0, 244748.0, 93463.0, 38427.0, 18393.0, 9377.0, 5170.0, 2681.0, 1376.0, 683.0, 422.0, 210.0, 117.0, 52.0, 65.0, 32.0, 23.0, 17.0, 10.0, 12.0, 9.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.51171875, -3.401092529296875, -3.29046630859375, -3.179840087890625, -3.0692138671875, -2.958587646484375, -2.84796142578125, -2.737335205078125, -2.626708984375, -2.516082763671875, -2.40545654296875, -2.294830322265625, -2.1842041015625, -2.073577880859375, -1.96295166015625, -1.852325439453125, -1.74169921875, -1.631072998046875, -1.52044677734375, -1.409820556640625, -1.2991943359375, -1.188568115234375, -1.07794189453125, -0.967315673828125, -0.856689453125, -0.746063232421875, -0.63543701171875, -0.524810791015625, -0.4141845703125, -0.303558349609375, -0.19293212890625, -0.082305908203125, 0.0283203125, 0.138946533203125, 0.24957275390625, 0.360198974609375, 0.4708251953125, 0.581451416015625, 0.69207763671875, 0.802703857421875, 0.913330078125, 1.023956298828125, 1.13458251953125, 1.245208740234375, 1.3558349609375, 1.466461181640625, 1.57708740234375, 1.687713623046875, 1.79833984375, 1.908966064453125, 2.01959228515625, 2.130218505859375, 2.2408447265625, 2.351470947265625, 2.46209716796875, 2.572723388671875, 2.683349609375, 2.793975830078125, 2.90460205078125, 3.015228271484375, 3.1258544921875, 3.236480712890625, 3.34710693359375, 3.457733154296875, 3.568359375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 3.0, 7.0, 5.0, 3.0, 5.0, 10.0, 13.0, 16.0, 15.0, 21.0, 29.0, 19.0, 28.0, 34.0, 28.0, 44.0, 55.0, 74.0, 92.0, 206.0, 1572.0, 265.0, 98.0, 76.0, 46.0, 56.0, 28.0, 27.0, 30.0, 24.0, 23.0, 21.0, 18.0, 20.0, 5.0, 14.0, 2.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-16.359375, -15.912109375, -15.46484375, -15.017578125, -14.5703125, -14.123046875, -13.67578125, -13.228515625, -12.78125, -12.333984375, -11.88671875, -11.439453125, -10.9921875, -10.544921875, -10.09765625, -9.650390625, -9.203125, -8.755859375, -8.30859375, -7.861328125, -7.4140625, -6.966796875, -6.51953125, -6.072265625, -5.625, -5.177734375, -4.73046875, -4.283203125, -3.8359375, -3.388671875, -2.94140625, -2.494140625, -2.046875, -1.599609375, -1.15234375, -0.705078125, -0.2578125, 0.189453125, 0.63671875, 1.083984375, 1.53125, 1.978515625, 2.42578125, 2.873046875, 3.3203125, 3.767578125, 4.21484375, 4.662109375, 5.109375, 5.556640625, 6.00390625, 6.451171875, 6.8984375, 7.345703125, 7.79296875, 8.240234375, 8.6875, 9.134765625, 9.58203125, 10.029296875, 10.4765625, 10.923828125, 11.37109375, 11.818359375, 12.265625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 4.0, 9.0, 4.0, 10.0, 11.0, 17.0, 19.0, 22.0, 25.0, 42.0, 50.0, 75.0, 106.0, 158.0, 202.0, 361.0, 806.0, 8823.0, 3036978.0, 94970.0, 1615.0, 447.0, 256.0, 163.0, 133.0, 93.0, 83.0, 48.0, 40.0, 28.0, 27.0, 12.0, 14.0, 9.0, 12.0, 7.0, 2.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.0, -37.80810546875, -36.6162109375, -35.42431640625, -34.232421875, -33.04052734375, -31.8486328125, -30.65673828125, -29.46484375, -28.27294921875, -27.0810546875, -25.88916015625, -24.697265625, -23.50537109375, -22.3134765625, -21.12158203125, -19.9296875, -18.73779296875, -17.5458984375, -16.35400390625, -15.162109375, -13.97021484375, -12.7783203125, -11.58642578125, -10.39453125, -9.20263671875, -8.0107421875, -6.81884765625, -5.626953125, -4.43505859375, -3.2431640625, -2.05126953125, -0.859375, 0.33251953125, 1.5244140625, 2.71630859375, 3.908203125, 5.10009765625, 6.2919921875, 7.48388671875, 8.67578125, 9.86767578125, 11.0595703125, 12.25146484375, 13.443359375, 14.63525390625, 15.8271484375, 17.01904296875, 18.2109375, 19.40283203125, 20.5947265625, 21.78662109375, 22.978515625, 24.17041015625, 25.3623046875, 26.55419921875, 27.74609375, 28.93798828125, 30.1298828125, 31.32177734375, 32.513671875, 33.70556640625, 34.8974609375, 36.08935546875, 37.28125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 380.0, 631.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.77734375, -289.5188293457031, -284.26031494140625, -279.0018005371094, -273.7432556152344, -268.4847412109375, -263.2262268066406, -257.96771240234375, -252.70919799804688, -247.45068359375, -242.19215393066406, -236.9336395263672, -231.6751251220703, -226.41659545898438, -221.1580810546875, -215.89956665039062, -210.6410369873047, -205.3825225830078, -200.12399291992188, -194.865478515625, -189.60696411132812, -184.34844970703125, -179.0899200439453, -173.83140563964844, -168.5728759765625, -163.31436157226562, -158.0558319091797, -152.7973175048828, -147.53880310058594, -142.2802734375, -137.02175903320312, -131.76324462890625, -126.50473022460938, -121.24620819091797, -115.9876937866211, -110.72917175292969, -105.47065734863281, -100.2121353149414, -94.95361328125, -89.69509887695312, -84.43658447265625, -79.17806243896484, -73.91954803466797, -68.66102600097656, -63.40250778198242, -58.14398956298828, -52.885467529296875, -47.626949310302734, -42.36842727661133, -37.10990905761719, -31.851388931274414, -26.59286880493164, -21.3343505859375, -16.07583236694336, -10.817312240600586, -5.5587921142578125, -0.3002738952636719, 4.958245277404785, 10.216764450073242, 15.4752836227417, 20.733802795410156, 25.992321014404297, 31.25084114074707, 36.509361267089844, 41.767879486083984]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 7.0, 6.0, 8.0, 14.0, 23.0, 22.0, 19.0, 19.0, 22.0, 28.0, 24.0, 27.0, 29.0, 29.0, 36.0, 40.0, 29.0, 52.0, 28.0, 35.0, 47.0, 34.0, 44.0, 33.0, 25.0, 37.0, 32.0, 24.0, 23.0, 33.0, 28.0, 17.0, 14.0, 11.0, 18.0, 10.0, 16.0, 7.0, 5.0, 9.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-29.192794799804688, -28.256088256835938, -27.319379806518555, -26.382673263549805, -25.445964813232422, -24.509258270263672, -23.572551727294922, -22.63584327697754, -21.69913673400879, -20.76243019104004, -19.825721740722656, -18.889015197753906, -17.952306747436523, -17.015600204467773, -16.07889175415039, -15.14218521118164, -14.205477714538574, -13.268770217895508, -12.332062721252441, -11.395355224609375, -10.458648681640625, -9.521941184997559, -8.585233688354492, -7.648526668548584, -6.711819171905518, -5.775111675262451, -4.838404655456543, -3.9016971588134766, -2.9649899005889893, -2.028282642364502, -1.0915751457214355, -0.15486812591552734, 0.7818393707275391, 1.7185466289520264, 2.6552538871765137, 3.59196138381958, 4.528668403625488, 5.465375900268555, 6.402083396911621, 7.338790416717529, 8.275497436523438, 9.212204933166504, 10.14891242980957, 11.08561897277832, 12.022326469421387, 12.959033966064453, 13.89574146270752, 14.832448959350586, 15.769156455993652, 16.70586395263672, 17.64257049560547, 18.57927894592285, 19.5159854888916, 20.452693939208984, 21.389400482177734, 22.326107025146484, 23.262815475463867, 24.199522018432617, 25.13623046875, 26.07293701171875, 27.009645462036133, 27.946352005004883, 28.883060455322266, 29.819766998291016, 30.756473541259766]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 8.0, 7.0, 10.0, 8.0, 8.0, 16.0, 18.0, 17.0, 31.0, 33.0, 29.0, 24.0, 22.0, 36.0, 41.0, 44.0, 33.0, 50.0, 35.0, 45.0, 38.0, 49.0, 41.0, 44.0, 38.0, 25.0, 37.0, 18.0, 25.0, 24.0, 26.0, 19.0, 16.0, 18.0, 14.0, 7.0, 9.0, 6.0, 8.0, 8.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.947998046875, -3.82177734375, -3.695556640625, -3.5693359375, -3.443115234375, -3.31689453125, -3.190673828125, -3.064453125, -2.938232421875, -2.81201171875, -2.685791015625, -2.5595703125, -2.433349609375, -2.30712890625, -2.180908203125, -2.0546875, -1.928466796875, -1.80224609375, -1.676025390625, -1.5498046875, -1.423583984375, -1.29736328125, -1.171142578125, -1.044921875, -0.918701171875, -0.79248046875, -0.666259765625, -0.5400390625, -0.413818359375, -0.28759765625, -0.161376953125, -0.03515625, 0.091064453125, 0.21728515625, 0.343505859375, 0.4697265625, 0.595947265625, 0.72216796875, 0.848388671875, 0.974609375, 1.100830078125, 1.22705078125, 1.353271484375, 1.4794921875, 1.605712890625, 1.73193359375, 1.858154296875, 1.984375, 2.110595703125, 2.23681640625, 2.363037109375, 2.4892578125, 2.615478515625, 2.74169921875, 2.867919921875, 2.994140625, 3.120361328125, 3.24658203125, 3.372802734375, 3.4990234375, 3.625244140625, 3.75146484375, 3.877685546875, 4.00390625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 1.0, 8.0, 9.0, 7.0, 5.0, 9.0, 12.0, 14.0, 24.0, 40.0, 40.0, 39.0, 55.0, 86.0, 120.0, 218.0, 419.0, 1334.0, 7496.0, 81855.0, 1146537.0, 2561271.0, 364366.0, 25475.0, 3126.0, 779.0, 300.0, 167.0, 116.0, 80.0, 67.0, 52.0, 38.0, 26.0, 23.0, 14.0, 9.0, 10.0, 11.0, 5.0, 5.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.3125, -11.0006103515625, -10.688720703125, -10.3768310546875, -10.06494140625, -9.7530517578125, -9.441162109375, -9.1292724609375, -8.8173828125, -8.5054931640625, -8.193603515625, -7.8817138671875, -7.56982421875, -7.2579345703125, -6.946044921875, -6.6341552734375, -6.322265625, -6.0103759765625, -5.698486328125, -5.3865966796875, -5.07470703125, -4.7628173828125, -4.450927734375, -4.1390380859375, -3.8271484375, -3.5152587890625, -3.203369140625, -2.8914794921875, -2.57958984375, -2.2677001953125, -1.955810546875, -1.6439208984375, -1.33203125, -1.0201416015625, -0.708251953125, -0.3963623046875, -0.08447265625, 0.2274169921875, 0.539306640625, 0.8511962890625, 1.1630859375, 1.4749755859375, 1.786865234375, 2.0987548828125, 2.41064453125, 2.7225341796875, 3.034423828125, 3.3463134765625, 3.658203125, 3.9700927734375, 4.281982421875, 4.5938720703125, 4.90576171875, 5.2176513671875, 5.529541015625, 5.8414306640625, 6.1533203125, 6.4652099609375, 6.777099609375, 7.0889892578125, 7.40087890625, 7.7127685546875, 8.024658203125, 8.3365478515625, 8.6484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 15.0, 12.0, 15.0, 25.0, 33.0, 38.0, 52.0, 77.0, 84.0, 110.0, 151.0, 207.0, 246.0, 255.0, 401.0, 399.0, 409.0, 334.0, 265.0, 209.0, 182.0, 131.0, 105.0, 80.0, 48.0, 19.0, 33.0, 33.0, 23.0, 15.0, 15.0, 8.0, 8.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.43994140625, -6.2236328125, -6.00732421875, -5.791015625, -5.57470703125, -5.3583984375, -5.14208984375, -4.92578125, -4.70947265625, -4.4931640625, -4.27685546875, -4.060546875, -3.84423828125, -3.6279296875, -3.41162109375, -3.1953125, -2.97900390625, -2.7626953125, -2.54638671875, -2.330078125, -2.11376953125, -1.8974609375, -1.68115234375, -1.46484375, -1.24853515625, -1.0322265625, -0.81591796875, -0.599609375, -0.38330078125, -0.1669921875, 0.04931640625, 0.265625, 0.48193359375, 0.6982421875, 0.91455078125, 1.130859375, 1.34716796875, 1.5634765625, 1.77978515625, 1.99609375, 2.21240234375, 2.4287109375, 2.64501953125, 2.861328125, 3.07763671875, 3.2939453125, 3.51025390625, 3.7265625, 3.94287109375, 4.1591796875, 4.37548828125, 4.591796875, 4.80810546875, 5.0244140625, 5.24072265625, 5.45703125, 5.67333984375, 5.8896484375, 6.10595703125, 6.322265625, 6.53857421875, 6.7548828125, 6.97119140625, 7.1875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 6.0, 6.0, 14.0, 9.0, 21.0, 37.0, 34.0, 25.0, 35.0, 61.0, 102.0, 144.0, 173.0, 236.0, 364.0, 856.0, 17857.0, 3280994.0, 886691.0, 4826.0, 574.0, 328.0, 217.0, 185.0, 104.0, 91.0, 67.0, 49.0, 42.0, 37.0, 17.0, 14.0, 14.0, 11.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.03125, -31.0849609375, -30.138671875, -29.1923828125, -28.24609375, -27.2998046875, -26.353515625, -25.4072265625, -24.4609375, -23.5146484375, -22.568359375, -21.6220703125, -20.67578125, -19.7294921875, -18.783203125, -17.8369140625, -16.890625, -15.9443359375, -14.998046875, -14.0517578125, -13.10546875, -12.1591796875, -11.212890625, -10.2666015625, -9.3203125, -8.3740234375, -7.427734375, -6.4814453125, -5.53515625, -4.5888671875, -3.642578125, -2.6962890625, -1.75, -0.8037109375, 0.142578125, 1.0888671875, 2.03515625, 2.9814453125, 3.927734375, 4.8740234375, 5.8203125, 6.7666015625, 7.712890625, 8.6591796875, 9.60546875, 10.5517578125, 11.498046875, 12.4443359375, 13.390625, 14.3369140625, 15.283203125, 16.2294921875, 17.17578125, 18.1220703125, 19.068359375, 20.0146484375, 20.9609375, 21.9072265625, 22.853515625, 23.7998046875, 24.74609375, 25.6923828125, 26.638671875, 27.5849609375, 28.53125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 21.0, 47.0, 87.0, 143.0, 200.0, 177.0, 147.0, 105.0, 46.0, 25.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.91415786743164, -52.18389129638672, -50.4536247253418, -48.723358154296875, -46.99308776855469, -45.262821197509766, -43.532554626464844, -41.80228805541992, -40.072021484375, -38.34175491333008, -36.611488342285156, -34.88121795654297, -33.15095138549805, -31.420684814453125, -29.690418243408203, -27.96015167236328, -26.229883193969727, -24.499616622924805, -22.76934814453125, -21.039081573486328, -19.308815002441406, -17.578548431396484, -15.84827995300293, -14.118013381958008, -12.38774585723877, -10.657478332519531, -8.92721176147461, -7.196944236755371, -5.466677188873291, -3.736410140991211, -2.0061426162719727, -0.2758760452270508, 1.4543914794921875, 3.1846585273742676, 4.914925575256348, 6.645193099975586, 8.375459671020508, 10.105727195739746, 11.835994720458984, 13.566261291503906, 15.296528816223145, 17.026796340942383, 18.757062911987305, 20.48733139038086, 22.21759796142578, 23.947864532470703, 25.678131103515625, 27.408397674560547, 29.1386661529541, 30.868932723999023, 32.59920120239258, 34.3294677734375, 36.05973434448242, 37.790000915527344, 39.52027130126953, 41.25053405761719, 42.980804443359375, 44.7110710144043, 46.44133758544922, 48.171607971191406, 49.90187454223633, 51.63214111328125, 53.36240768432617, 55.092674255371094, 56.822940826416016]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 7.0, 3.0, 10.0, 10.0, 12.0, 13.0, 14.0, 16.0, 19.0, 27.0, 25.0, 22.0, 27.0, 25.0, 30.0, 43.0, 40.0, 33.0, 40.0, 38.0, 50.0, 41.0, 29.0, 45.0, 30.0, 37.0, 42.0, 26.0, 25.0, 23.0, 25.0, 24.0, 22.0, 16.0, 14.0, 18.0, 12.0, 14.0, 6.0, 14.0, 10.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-24.63397216796875, -23.928255081176758, -23.222537994384766, -22.51681900024414, -21.81110191345215, -21.105384826660156, -20.39966583251953, -19.69394874572754, -18.988231658935547, -18.282514572143555, -17.576797485351562, -16.871078491210938, -16.165361404418945, -15.459644317626953, -14.753926277160645, -14.048208236694336, -13.342491149902344, -12.636774063110352, -11.931056022644043, -11.225337982177734, -10.519620895385742, -9.81390380859375, -9.108185768127441, -8.402467727661133, -7.696750640869141, -6.99103307723999, -6.28531551361084, -5.5795979499816895, -4.873880386352539, -4.168162822723389, -3.4624452590942383, -2.756727695465088, -2.0510101318359375, -1.345292568206787, -0.6395750045776367, 0.06614255905151367, 0.7718601226806641, 1.4775776863098145, 2.183295249938965, 2.8890128135681152, 3.5947303771972656, 4.300447940826416, 5.006165504455566, 5.711883068084717, 6.417600631713867, 7.123318195343018, 7.829035758972168, 8.534753799438477, 9.240470886230469, 9.946187973022461, 10.65190601348877, 11.357624053955078, 12.06334114074707, 12.769058227539062, 13.474776268005371, 14.18049430847168, 14.886211395263672, 15.591928482055664, 16.297645568847656, 17.00336456298828, 17.709081649780273, 18.414798736572266, 19.12051773071289, 19.826234817504883, 20.531951904296875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 13.0, 3.0, 6.0, 5.0, 6.0, 12.0, 16.0, 17.0, 16.0, 20.0, 30.0, 27.0, 24.0, 34.0, 35.0, 32.0, 31.0, 35.0, 45.0, 46.0, 44.0, 50.0, 38.0, 47.0, 30.0, 34.0, 49.0, 25.0, 26.0, 29.0, 15.0, 23.0, 12.0, 20.0, 23.0, 15.0, 17.0, 13.0, 15.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-4.19921875, -4.08270263671875, -3.9661865234375, -3.84967041015625, -3.733154296875, -3.61663818359375, -3.5001220703125, -3.38360595703125, -3.26708984375, -3.15057373046875, -3.0340576171875, -2.91754150390625, -2.801025390625, -2.68450927734375, -2.5679931640625, -2.45147705078125, -2.3349609375, -2.21844482421875, -2.1019287109375, -1.98541259765625, -1.868896484375, -1.75238037109375, -1.6358642578125, -1.51934814453125, -1.40283203125, -1.28631591796875, -1.1697998046875, -1.05328369140625, -0.936767578125, -0.82025146484375, -0.7037353515625, -0.58721923828125, -0.470703125, -0.35418701171875, -0.2376708984375, -0.12115478515625, -0.004638671875, 0.11187744140625, 0.2283935546875, 0.34490966796875, 0.46142578125, 0.57794189453125, 0.6944580078125, 0.81097412109375, 0.927490234375, 1.04400634765625, 1.1605224609375, 1.27703857421875, 1.3935546875, 1.51007080078125, 1.6265869140625, 1.74310302734375, 1.859619140625, 1.97613525390625, 2.0926513671875, 2.20916748046875, 2.32568359375, 2.44219970703125, 2.5587158203125, 2.67523193359375, 2.791748046875, 2.90826416015625, 3.0247802734375, 3.14129638671875, 3.2578125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 16.0, 18.0, 21.0, 53.0, 60.0, 105.0, 185.0, 281.0, 469.0, 927.0, 1618.0, 3056.0, 5380.0, 10297.0, 19490.0, 39358.0, 78845.0, 157149.0, 260675.0, 224806.0, 122159.0, 60671.0, 29628.0, 15381.0, 8041.0, 4499.0, 2365.0, 1325.0, 699.0, 370.0, 202.0, 136.0, 115.0, 57.0, 34.0, 19.0, 18.0, 12.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.483642578125, -0.4674186706542969, -0.45119476318359375, -0.4349708557128906, -0.4187469482421875, -0.4025230407714844, -0.38629913330078125, -0.3700752258300781, -0.353851318359375, -0.3376274108886719, -0.32140350341796875, -0.3051795959472656, -0.2889556884765625, -0.2727317810058594, -0.25650787353515625, -0.24028396606445312, -0.22406005859375, -0.20783615112304688, -0.19161224365234375, -0.17538833618164062, -0.1591644287109375, -0.14294052124023438, -0.12671661376953125, -0.11049270629882812, -0.094268798828125, -0.07804489135742188, -0.06182098388671875, -0.045597076416015625, -0.0293731689453125, -0.013149261474609375, 0.00307464599609375, 0.019298553466796875, 0.0355224609375, 0.051746368408203125, 0.06797027587890625, 0.08419418334960938, 0.1004180908203125, 0.11664199829101562, 0.13286590576171875, 0.14908981323242188, 0.165313720703125, 0.18153762817382812, 0.19776153564453125, 0.21398544311523438, 0.2302093505859375, 0.24643325805664062, 0.26265716552734375, 0.2788810729980469, 0.29510498046875, 0.3113288879394531, 0.32755279541015625, 0.3437767028808594, 0.3600006103515625, 0.3762245178222656, 0.39244842529296875, 0.4086723327636719, 0.424896240234375, 0.4411201477050781, 0.45734405517578125, 0.4735679626464844, 0.4897918701171875, 0.5060157775878906, 0.5222396850585938, 0.5384635925292969, 0.5546875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 5.0, 7.0, 14.0, 9.0, 21.0, 12.0, 14.0, 23.0, 15.0, 21.0, 18.0, 33.0, 29.0, 29.0, 33.0, 36.0, 36.0, 32.0, 30.0, 30.0, 1059.0, 31.0, 40.0, 36.0, 31.0, 35.0, 37.0, 30.0, 20.0, 34.0, 33.0, 31.0, 20.0, 20.0, 23.0, 12.0, 16.0, 8.0, 12.0, 16.0, 12.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.404296875, -2.335479736328125, -2.26666259765625, -2.197845458984375, -2.1290283203125, -2.060211181640625, -1.99139404296875, -1.922576904296875, -1.853759765625, -1.784942626953125, -1.71612548828125, -1.647308349609375, -1.5784912109375, -1.509674072265625, -1.44085693359375, -1.372039794921875, -1.30322265625, -1.234405517578125, -1.16558837890625, -1.096771240234375, -1.0279541015625, -0.959136962890625, -0.89031982421875, -0.821502685546875, -0.752685546875, -0.683868408203125, -0.61505126953125, -0.546234130859375, -0.4774169921875, -0.408599853515625, -0.33978271484375, -0.270965576171875, -0.2021484375, -0.133331298828125, -0.06451416015625, 0.004302978515625, 0.0731201171875, 0.141937255859375, 0.21075439453125, 0.279571533203125, 0.348388671875, 0.417205810546875, 0.48602294921875, 0.554840087890625, 0.6236572265625, 0.692474365234375, 0.76129150390625, 0.830108642578125, 0.89892578125, 0.967742919921875, 1.03656005859375, 1.105377197265625, 1.1741943359375, 1.243011474609375, 1.31182861328125, 1.380645751953125, 1.449462890625, 1.518280029296875, 1.58709716796875, 1.655914306640625, 1.7247314453125, 1.793548583984375, 1.86236572265625, 1.931182861328125, 2.0]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 17.0, 13.0, 21.0, 36.0, 58.0, 98.0, 105.0, 182.0, 228.0, 389.0, 513.0, 778.0, 1178.0, 1677.0, 2479.0, 3617.0, 5372.0, 8080.0, 12075.0, 18267.0, 27388.0, 40528.0, 59089.0, 85548.0, 116205.0, 823326.0, 509865.0, 115439.0, 84246.0, 58739.0, 39791.0, 27013.0, 18151.0, 11852.0, 7983.0, 5370.0, 3704.0, 2493.0, 1621.0, 1098.0, 760.0, 524.0, 378.0, 270.0, 195.0, 112.0, 77.0, 77.0, 41.0, 28.0, 19.0, 5.0, 7.0, 3.0, 4.0, 2.0, 2.0], "bins": [-0.227783203125, -0.22087669372558594, -0.21397018432617188, -0.2070636749267578, -0.20015716552734375, -0.1932506561279297, -0.18634414672851562, -0.17943763732910156, -0.1725311279296875, -0.16562461853027344, -0.15871810913085938, -0.1518115997314453, -0.14490509033203125, -0.1379985809326172, -0.13109207153320312, -0.12418556213378906, -0.117279052734375, -0.11037254333496094, -0.10346603393554688, -0.09655952453613281, -0.08965301513671875, -0.08274650573730469, -0.07583999633789062, -0.06893348693847656, -0.0620269775390625, -0.05512046813964844, -0.048213958740234375, -0.04130744934082031, -0.03440093994140625, -0.027494430541992188, -0.020587921142578125, -0.013681411743164062, -0.00677490234375, 0.0001316070556640625, 0.007038116455078125, 0.013944625854492188, 0.02085113525390625, 0.027757644653320312, 0.034664154052734375, 0.04157066345214844, 0.0484771728515625, 0.05538368225097656, 0.062290191650390625, 0.06919670104980469, 0.07610321044921875, 0.08300971984863281, 0.08991622924804688, 0.09682273864746094, 0.103729248046875, 0.11063575744628906, 0.11754226684570312, 0.12444877624511719, 0.13135528564453125, 0.1382617950439453, 0.14516830444335938, 0.15207481384277344, 0.1589813232421875, 0.16588783264160156, 0.17279434204101562, 0.1797008514404297, 0.18660736083984375, 0.1935138702392578, 0.20042037963867188, 0.20732688903808594, 0.2142333984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 5.0, 0.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 14.0, 20.0, 21.0, 24.0, 39.0, 41.0, 61.0, 69.0, 89.0, 106.0, 72.0, 80.0, 58.0, 58.0, 43.0, 42.0, 30.0, 15.0, 28.0, 12.0, 6.0, 4.0, 7.0, 4.0, 8.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.00628662109375, -0.006097197532653809, -0.005907773971557617, -0.005718350410461426, -0.005528926849365234, -0.005339503288269043, -0.0051500797271728516, -0.00496065616607666, -0.004771232604980469, -0.004581809043884277, -0.004392385482788086, -0.0042029619216918945, -0.004013538360595703, -0.0038241147994995117, -0.0036346912384033203, -0.003445267677307129, -0.0032558441162109375, -0.003066420555114746, -0.0028769969940185547, -0.0026875734329223633, -0.002498149871826172, -0.0023087263107299805, -0.002119302749633789, -0.0019298791885375977, -0.0017404556274414062, -0.0015510320663452148, -0.0013616085052490234, -0.001172184944152832, -0.0009827613830566406, -0.0007933378219604492, -0.0006039142608642578, -0.0004144906997680664, -0.000225067138671875, -3.5643577575683594e-05, 0.0001537799835205078, 0.0003432035446166992, 0.0005326271057128906, 0.000722050666809082, 0.0009114742279052734, 0.0011008977890014648, 0.0012903213500976562, 0.0014797449111938477, 0.001669168472290039, 0.0018585920333862305, 0.002048015594482422, 0.0022374391555786133, 0.0024268627166748047, 0.002616286277770996, 0.0028057098388671875, 0.002995133399963379, 0.0031845569610595703, 0.0033739805221557617, 0.003563404083251953, 0.0037528276443481445, 0.003942251205444336, 0.004131674766540527, 0.004321098327636719, 0.00451052188873291, 0.0046999454498291016, 0.004889369010925293, 0.005078792572021484, 0.005268216133117676, 0.005457639694213867, 0.005647063255310059, 0.00583648681640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 9.0, 7.0, 10.0, 6.0, 12.0, 14.0, 29.0, 44.0, 40.0, 85.0, 127.0, 153.0, 313.0, 725.0, 73341.0, 971016.0, 1513.0, 425.0, 218.0, 137.0, 82.0, 57.0, 42.0, 32.0, 25.0, 20.0, 10.0, 7.0, 7.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11846923828125, -0.1146707534790039, -0.11087226867675781, -0.10707378387451172, -0.10327529907226562, -0.09947681427001953, -0.09567832946777344, -0.09187984466552734, -0.08808135986328125, -0.08428287506103516, -0.08048439025878906, -0.07668590545654297, -0.07288742065429688, -0.06908893585205078, -0.06529045104980469, -0.061491966247558594, -0.0576934814453125, -0.053894996643066406, -0.05009651184082031, -0.04629802703857422, -0.042499542236328125, -0.03870105743408203, -0.03490257263183594, -0.031104087829589844, -0.02730560302734375, -0.023507118225097656, -0.019708633422851562, -0.01591014862060547, -0.012111663818359375, -0.008313179016113281, -0.0045146942138671875, -0.0007162094116210938, 0.003082275390625, 0.006880760192871094, 0.010679244995117188, 0.014477729797363281, 0.018276214599609375, 0.02207469940185547, 0.025873184204101562, 0.029671669006347656, 0.03347015380859375, 0.037268638610839844, 0.04106712341308594, 0.04486560821533203, 0.048664093017578125, 0.05246257781982422, 0.05626106262207031, 0.060059547424316406, 0.0638580322265625, 0.0676565170288086, 0.07145500183105469, 0.07525348663330078, 0.07905197143554688, 0.08285045623779297, 0.08664894104003906, 0.09044742584228516, 0.09424591064453125, 0.09804439544677734, 0.10184288024902344, 0.10564136505126953, 0.10943984985351562, 0.11323833465576172, 0.11703681945800781, 0.1208353042602539, 0.1246337890625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [40.0, 830.0, 139.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017441656673327088, -0.0006225272081792355, 0.0004991112509742379, 0.0016207498265430331, 0.0027423882856965065, 0.003864026628434658, 0.004985665436834097, 0.0061073037795722485, 0.0072289421223104, 0.008350580930709839, 0.00947221927344799, 0.010593857616186142, 0.011715495958924294, 0.012837134301662445, 0.013958772644400597, 0.015080410987138748, 0.0162020493298769, 0.01732368767261505, 0.018445326015353203, 0.019566964358091354, 0.020688602700829506, 0.021810241043567657, 0.022931881248950958, 0.02405351772904396, 0.02517515793442726, 0.026296796277165413, 0.027418434619903564, 0.028540072962641716, 0.029661711305379868, 0.03078334964811802, 0.03190498799085617, 0.03302662819623947, 0.034148264676332474, 0.035269904881715775, 0.03639154136180878, 0.03751318156719208, 0.03863481804728508, 0.03975645825266838, 0.04087809473276138, 0.041999734938144684, 0.043121371418237686, 0.04424301162362099, 0.04536464810371399, 0.04648628830909729, 0.04760792478919029, 0.04872956499457359, 0.049851201474666595, 0.050972841680049896, 0.0520944818854332, 0.0532161220908165, 0.0543377585709095, 0.0554593987762928, 0.0565810352563858, 0.057702675461769104, 0.058824311941862106, 0.05994595214724541, 0.06106758862733841, 0.06218922883272171, 0.06331086903810501, 0.06443250179290771, 0.06555414199829102, 0.06667578220367432, 0.06779742240905762, 0.06891905516386032, 0.07004069536924362]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 5.0, 9.0, 13.0, 19.0, 15.0, 27.0, 40.0, 34.0, 45.0, 45.0, 43.0, 60.0, 59.0, 69.0, 75.0, 71.0, 59.0, 51.0, 45.0, 29.0, 38.0, 27.0, 25.0, 26.0, 17.0, 6.0, 18.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004349350929260254, -0.004208815284073353, -0.004068279638886452, -0.003927743993699551, -0.0037872083485126495, -0.0036466727033257484, -0.0035061370581388474, -0.0033656014129519463, -0.003225065767765045, -0.003084530122578144, -0.002943994477391243, -0.002803458832204342, -0.002662923187017441, -0.0025223875418305397, -0.0023818518966436386, -0.0022413162514567375, -0.0021007806062698364, -0.0019602449610829353, -0.0018197093158960342, -0.0016791736707091331, -0.001538638025522232, -0.001398102380335331, -0.0012575667351484299, -0.0011170310899615288, -0.0009764954447746277, -0.0008359597995877266, -0.0006954241544008255, -0.0005548885092139244, -0.0004143528640270233, -0.0002738172188401222, -0.00013328157365322113, 7.254071533679962e-06, 0.00014778971672058105, 0.00028832536190748215, 0.00042886100709438324, 0.0005693966522812843, 0.0007099322974681854, 0.0008504679426550865, 0.0009910035878419876, 0.0011315392330288887, 0.0012720748782157898, 0.0014126105234026909, 0.001553146168589592, 0.001693681813776493, 0.0018342174589633942, 0.0019747531041502953, 0.0021152887493371964, 0.0022558243945240974, 0.0023963600397109985, 0.0025368956848978996, 0.0026774313300848007, 0.002817966975271702, 0.002958502620458603, 0.003099038265645504, 0.003239573910832405, 0.003380109556019306, 0.0035206452012062073, 0.0036611808463931084, 0.0038017164915800095, 0.0039422521367669106, 0.004082787781953812, 0.004223323427140713, 0.004363859072327614, 0.004504394717514515, 0.004644930362701416]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 13.0, 3.0, 6.0, 5.0, 6.0, 12.0, 16.0, 17.0, 16.0, 20.0, 30.0, 27.0, 24.0, 34.0, 35.0, 32.0, 31.0, 35.0, 45.0, 47.0, 43.0, 50.0, 38.0, 47.0, 30.0, 34.0, 49.0, 25.0, 26.0, 29.0, 15.0, 23.0, 12.0, 20.0, 23.0, 15.0, 17.0, 13.0, 15.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-4.19921875, -4.08270263671875, -3.9661865234375, -3.84967041015625, -3.733154296875, -3.61663818359375, -3.5001220703125, -3.38360595703125, -3.26708984375, -3.15057373046875, -3.0340576171875, -2.91754150390625, -2.801025390625, -2.68450927734375, -2.5679931640625, -2.45147705078125, -2.3349609375, -2.21844482421875, -2.1019287109375, -1.98541259765625, -1.868896484375, -1.75238037109375, -1.6358642578125, -1.51934814453125, -1.40283203125, -1.28631591796875, -1.1697998046875, -1.05328369140625, -0.936767578125, -0.82025146484375, -0.7037353515625, -0.58721923828125, -0.470703125, -0.35418701171875, -0.2376708984375, -0.12115478515625, -0.004638671875, 0.11187744140625, 0.2283935546875, 0.34490966796875, 0.46142578125, 0.57794189453125, 0.6944580078125, 0.81097412109375, 0.927490234375, 1.04400634765625, 1.1605224609375, 1.27703857421875, 1.3935546875, 1.51007080078125, 1.6265869140625, 1.74310302734375, 1.859619140625, 1.97613525390625, 2.0926513671875, 2.20916748046875, 2.32568359375, 2.44219970703125, 2.5587158203125, 2.67523193359375, 2.791748046875, 2.90826416015625, 3.0247802734375, 3.14129638671875, 3.2578125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 10.0, 13.0, 18.0, 15.0, 17.0, 19.0, 42.0, 53.0, 71.0, 92.0, 144.0, 215.0, 374.0, 710.0, 1536.0, 3245.0, 7278.0, 16452.0, 36881.0, 86182.0, 210144.0, 378496.0, 176682.0, 72445.0, 31497.0, 14025.0, 6158.0, 2894.0, 1230.0, 587.0, 309.0, 180.0, 131.0, 98.0, 61.0, 58.0, 50.0, 33.0, 30.0, 16.0, 14.0, 13.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-4.33984375, -4.217254638671875, -4.09466552734375, -3.972076416015625, -3.8494873046875, -3.726898193359375, -3.60430908203125, -3.481719970703125, -3.359130859375, -3.236541748046875, -3.11395263671875, -2.991363525390625, -2.8687744140625, -2.746185302734375, -2.62359619140625, -2.501007080078125, -2.37841796875, -2.255828857421875, -2.13323974609375, -2.010650634765625, -1.8880615234375, -1.765472412109375, -1.64288330078125, -1.520294189453125, -1.397705078125, -1.275115966796875, -1.15252685546875, -1.029937744140625, -0.9073486328125, -0.784759521484375, -0.66217041015625, -0.539581298828125, -0.4169921875, -0.294403076171875, -0.17181396484375, -0.049224853515625, 0.0733642578125, 0.195953369140625, 0.31854248046875, 0.441131591796875, 0.563720703125, 0.686309814453125, 0.80889892578125, 0.931488037109375, 1.0540771484375, 1.176666259765625, 1.29925537109375, 1.421844482421875, 1.54443359375, 1.667022705078125, 1.78961181640625, 1.912200927734375, 2.0347900390625, 2.157379150390625, 2.27996826171875, 2.402557373046875, 2.525146484375, 2.647735595703125, 2.77032470703125, 2.892913818359375, 3.0155029296875, 3.138092041015625, 3.26068115234375, 3.383270263671875, 3.505859375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 6.0, 8.0, 12.0, 10.0, 15.0, 17.0, 28.0, 25.0, 35.0, 30.0, 40.0, 58.0, 58.0, 96.0, 140.0, 1502.0, 408.0, 124.0, 69.0, 54.0, 49.0, 47.0, 49.0, 24.0, 24.0, 21.0, 29.0, 17.0, 18.0, 10.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0234375, -11.5596923828125, -11.095947265625, -10.6322021484375, -10.16845703125, -9.7047119140625, -9.240966796875, -8.7772216796875, -8.3134765625, -7.8497314453125, -7.385986328125, -6.9222412109375, -6.45849609375, -5.9947509765625, -5.531005859375, -5.0672607421875, -4.603515625, -4.1397705078125, -3.676025390625, -3.2122802734375, -2.74853515625, -2.2847900390625, -1.821044921875, -1.3572998046875, -0.8935546875, -0.4298095703125, 0.033935546875, 0.4976806640625, 0.96142578125, 1.4251708984375, 1.888916015625, 2.3526611328125, 2.81640625, 3.2801513671875, 3.743896484375, 4.2076416015625, 4.67138671875, 5.1351318359375, 5.598876953125, 6.0626220703125, 6.5263671875, 6.9901123046875, 7.453857421875, 7.9176025390625, 8.38134765625, 8.8450927734375, 9.308837890625, 9.7725830078125, 10.236328125, 10.7000732421875, 11.163818359375, 11.6275634765625, 12.09130859375, 12.5550537109375, 13.018798828125, 13.4825439453125, 13.9462890625, 14.4100341796875, 14.873779296875, 15.3375244140625, 15.80126953125, 16.2650146484375, 16.728759765625, 17.1925048828125, 17.65625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 4.0, 6.0, 5.0, 12.0, 29.0, 39.0, 36.0, 68.0, 91.0, 114.0, 196.0, 448.0, 1010.0, 7384.0, 3115869.0, 18046.0, 1226.0, 450.0, 235.0, 137.0, 94.0, 47.0, 46.0, 24.0, 28.0, 13.0, 10.0, 6.0, 3.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.90625, -49.34375, -47.78125, -46.21875, -44.65625, -43.09375, -41.53125, -39.96875, -38.40625, -36.84375, -35.28125, -33.71875, -32.15625, -30.59375, -29.03125, -27.46875, -25.90625, -24.34375, -22.78125, -21.21875, -19.65625, -18.09375, -16.53125, -14.96875, -13.40625, -11.84375, -10.28125, -8.71875, -7.15625, -5.59375, -4.03125, -2.46875, -0.90625, 0.65625, 2.21875, 3.78125, 5.34375, 6.90625, 8.46875, 10.03125, 11.59375, 13.15625, 14.71875, 16.28125, 17.84375, 19.40625, 20.96875, 22.53125, 24.09375, 25.65625, 27.21875, 28.78125, 30.34375, 31.90625, 33.46875, 35.03125, 36.59375, 38.15625, 39.71875, 41.28125, 42.84375, 44.40625, 45.96875, 47.53125, 49.09375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 81.0, 499.0, 380.0, 53.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0781831741333, -9.587721824645996, -7.09726095199585, -4.606800079345703, -2.1163387298583984, 0.37412261962890625, 2.8645830154418945, 5.355044364929199, 7.845505714416504, 10.335967063903809, 12.826427459716797, 15.316888809204102, 17.807350158691406, 20.29781150817871, 22.788272857666016, 25.278732299804688, 27.769195556640625, 30.25965690612793, 32.750118255615234, 35.240577697753906, 37.731040954589844, 40.221500396728516, 42.71195983886719, 45.202423095703125, 47.6928825378418, 50.18334197998047, 52.673805236816406, 55.16426467895508, 57.654727935791016, 60.14518737792969, 62.635650634765625, 65.12611389160156, 67.61656951904297, 70.1070327758789, 72.59748840332031, 75.08795166015625, 77.57841491699219, 80.06887817382812, 82.55933380126953, 85.04979705810547, 87.5402603149414, 90.03072357177734, 92.52117919921875, 95.01164245605469, 97.50210571289062, 99.99256896972656, 102.48302459716797, 104.9734878540039, 107.46394348144531, 109.95440673828125, 112.44486236572266, 114.9353256225586, 117.42578887939453, 119.91625213623047, 122.40670776367188, 124.89717102050781, 127.38763427734375, 129.8780975341797, 132.36856079101562, 134.85902404785156, 137.34947204589844, 139.83993530273438, 142.3303985595703, 144.82086181640625, 147.3113250732422]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 8.0, 4.0, 13.0, 10.0, 8.0, 12.0, 15.0, 20.0, 12.0, 22.0, 34.0, 30.0, 32.0, 31.0, 29.0, 27.0, 44.0, 40.0, 41.0, 29.0, 39.0, 47.0, 35.0, 43.0, 48.0, 33.0, 42.0, 41.0, 33.0, 38.0, 25.0, 17.0, 25.0, 15.0, 12.0, 5.0, 4.0, 18.0, 9.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.48008918762207, -29.532920837402344, -28.585750579833984, -27.638582229614258, -26.69141387939453, -25.744243621826172, -24.797075271606445, -23.84990692138672, -22.90273666381836, -21.955568313598633, -21.008398056030273, -20.061229705810547, -19.11406135559082, -18.166893005371094, -17.219722747802734, -16.272554397583008, -15.325386047363281, -14.378216743469238, -13.431048393249512, -12.483879089355469, -11.536710739135742, -10.5895414352417, -9.642372131347656, -8.69520378112793, -7.748034477233887, -6.800865650177002, -5.853696823120117, -4.906527519226074, -3.9593586921691895, -3.0121898651123047, -2.0650205612182617, -1.117851734161377, -0.170684814453125, 0.7764841318130493, 1.7236530780792236, 2.6708221435546875, 3.6179909706115723, 4.565159797668457, 5.5123291015625, 6.459497928619385, 7.4066667556762695, 8.353836059570312, 9.301004409790039, 10.248173713684082, 11.195343017578125, 12.142511367797852, 13.089680671691895, 14.036849975585938, 14.984018325805664, 15.931187629699707, 16.87835693359375, 17.825525283813477, 18.772693634033203, 19.719863891601562, 20.66703224182129, 21.614200592041016, 22.561370849609375, 23.5085391998291, 24.45570945739746, 25.402877807617188, 26.350046157836914, 27.29721450805664, 28.244384765625, 29.191553115844727, 30.138721466064453]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 10.0, 7.0, 8.0, 8.0, 15.0, 17.0, 16.0, 14.0, 24.0, 24.0, 30.0, 39.0, 29.0, 29.0, 34.0, 34.0, 41.0, 43.0, 47.0, 45.0, 55.0, 42.0, 29.0, 28.0, 31.0, 29.0, 30.0, 23.0, 22.0, 27.0, 20.0, 18.0, 18.0, 19.0, 13.0, 19.0, 13.0, 14.0, 6.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.375, -4.248870849609375, -4.12274169921875, -3.996612548828125, -3.8704833984375, -3.744354248046875, -3.61822509765625, -3.492095947265625, -3.365966796875, -3.239837646484375, -3.11370849609375, -2.987579345703125, -2.8614501953125, -2.735321044921875, -2.60919189453125, -2.483062744140625, -2.35693359375, -2.230804443359375, -2.10467529296875, -1.978546142578125, -1.8524169921875, -1.726287841796875, -1.60015869140625, -1.474029541015625, -1.347900390625, -1.221771240234375, -1.09564208984375, -0.969512939453125, -0.8433837890625, -0.717254638671875, -0.59112548828125, -0.464996337890625, -0.3388671875, -0.212738037109375, -0.08660888671875, 0.039520263671875, 0.1656494140625, 0.291778564453125, 0.41790771484375, 0.544036865234375, 0.670166015625, 0.796295166015625, 0.92242431640625, 1.048553466796875, 1.1746826171875, 1.300811767578125, 1.42694091796875, 1.553070068359375, 1.67919921875, 1.805328369140625, 1.93145751953125, 2.057586669921875, 2.1837158203125, 2.309844970703125, 2.43597412109375, 2.562103271484375, 2.688232421875, 2.814361572265625, 2.94049072265625, 3.066619873046875, 3.1927490234375, 3.318878173828125, 3.44500732421875, 3.571136474609375, 3.697265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 9.0, 8.0, 5.0, 13.0, 14.0, 14.0, 22.0, 16.0, 39.0, 36.0, 45.0, 45.0, 69.0, 96.0, 141.0, 227.0, 565.0, 2535.0, 19977.0, 280666.0, 2480121.0, 1308128.0, 90879.0, 8166.0, 1360.0, 401.0, 176.0, 107.0, 68.0, 63.0, 48.0, 43.0, 32.0, 30.0, 23.0, 18.0, 17.0, 15.0, 11.0, 12.0, 9.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-11.671875, -11.3458251953125, -11.019775390625, -10.6937255859375, -10.36767578125, -10.0416259765625, -9.715576171875, -9.3895263671875, -9.0634765625, -8.7374267578125, -8.411376953125, -8.0853271484375, -7.75927734375, -7.4332275390625, -7.107177734375, -6.7811279296875, -6.455078125, -6.1290283203125, -5.802978515625, -5.4769287109375, -5.15087890625, -4.8248291015625, -4.498779296875, -4.1727294921875, -3.8466796875, -3.5206298828125, -3.194580078125, -2.8685302734375, -2.54248046875, -2.2164306640625, -1.890380859375, -1.5643310546875, -1.23828125, -0.9122314453125, -0.586181640625, -0.2601318359375, 0.06591796875, 0.3919677734375, 0.718017578125, 1.0440673828125, 1.3701171875, 1.6961669921875, 2.022216796875, 2.3482666015625, 2.67431640625, 3.0003662109375, 3.326416015625, 3.6524658203125, 3.978515625, 4.3045654296875, 4.630615234375, 4.9566650390625, 5.28271484375, 5.6087646484375, 5.934814453125, 6.2608642578125, 6.5869140625, 6.9129638671875, 7.239013671875, 7.5650634765625, 7.89111328125, 8.2171630859375, 8.543212890625, 8.8692626953125, 9.1953125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 10.0, 14.0, 15.0, 23.0, 21.0, 29.0, 37.0, 64.0, 78.0, 112.0, 167.0, 218.0, 309.0, 379.0, 492.0, 499.0, 398.0, 323.0, 227.0, 166.0, 125.0, 80.0, 76.0, 53.0, 40.0, 30.0, 19.0, 22.0, 14.0, 9.0, 6.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.4375, -9.18359375, -8.9296875, -8.67578125, -8.421875, -8.16796875, -7.9140625, -7.66015625, -7.40625, -7.15234375, -6.8984375, -6.64453125, -6.390625, -6.13671875, -5.8828125, -5.62890625, -5.375, -5.12109375, -4.8671875, -4.61328125, -4.359375, -4.10546875, -3.8515625, -3.59765625, -3.34375, -3.08984375, -2.8359375, -2.58203125, -2.328125, -2.07421875, -1.8203125, -1.56640625, -1.3125, -1.05859375, -0.8046875, -0.55078125, -0.296875, -0.04296875, 0.2109375, 0.46484375, 0.71875, 0.97265625, 1.2265625, 1.48046875, 1.734375, 1.98828125, 2.2421875, 2.49609375, 2.75, 3.00390625, 3.2578125, 3.51171875, 3.765625, 4.01953125, 4.2734375, 4.52734375, 4.78125, 5.03515625, 5.2890625, 5.54296875, 5.796875, 6.05078125, 6.3046875, 6.55859375, 6.8125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 18.0, 9.0, 22.0, 24.0, 40.0, 46.0, 60.0, 73.0, 115.0, 144.0, 263.0, 363.0, 949.0, 70194.0, 4084120.0, 35825.0, 810.0, 387.0, 244.0, 165.0, 102.0, 84.0, 55.0, 34.0, 29.0, 17.0, 26.0, 18.0, 10.0, 7.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.25, -32.955078125, -31.66015625, -30.365234375, -29.0703125, -27.775390625, -26.48046875, -25.185546875, -23.890625, -22.595703125, -21.30078125, -20.005859375, -18.7109375, -17.416015625, -16.12109375, -14.826171875, -13.53125, -12.236328125, -10.94140625, -9.646484375, -8.3515625, -7.056640625, -5.76171875, -4.466796875, -3.171875, -1.876953125, -0.58203125, 0.712890625, 2.0078125, 3.302734375, 4.59765625, 5.892578125, 7.1875, 8.482421875, 9.77734375, 11.072265625, 12.3671875, 13.662109375, 14.95703125, 16.251953125, 17.546875, 18.841796875, 20.13671875, 21.431640625, 22.7265625, 24.021484375, 25.31640625, 26.611328125, 27.90625, 29.201171875, 30.49609375, 31.791015625, 33.0859375, 34.380859375, 35.67578125, 36.970703125, 38.265625, 39.560546875, 40.85546875, 42.150390625, 43.4453125, 44.740234375, 46.03515625, 47.330078125, 48.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 0.0, 6.0, 17.0, 26.0, 45.0, 44.0, 53.0, 75.0, 104.0, 98.0, 92.0, 97.0, 80.0, 63.0, 56.0, 51.0, 29.0, 24.0, 10.0, 13.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.58039093017578, -23.791807174682617, -23.003225326538086, -22.214641571044922, -21.42605972290039, -20.637475967407227, -19.848892211914062, -19.06031036376953, -18.271728515625, -17.483144760131836, -16.694562911987305, -15.90597915649414, -15.11739730834961, -14.328813552856445, -13.540230751037598, -12.75164794921875, -11.963064193725586, -11.174481391906738, -10.38589859008789, -9.597314834594727, -8.808732986450195, -8.020149230957031, -7.231566429138184, -6.442983627319336, -5.654400825500488, -4.865818023681641, -4.077235221862793, -3.288651943206787, -2.5000691413879395, -1.7114863395690918, -0.9229030609130859, -0.13432025909423828, 0.6542606353759766, 1.4428435564041138, 2.231426477432251, 3.0200095176696777, 3.8085923194885254, 4.597175121307373, 5.385758399963379, 6.174341201782227, 6.962924003601074, 7.751506805419922, 8.54008960723877, 9.328672409057617, 10.117256164550781, 10.905838012695312, 11.694421768188477, 12.483004570007324, 13.271587371826172, 14.06017017364502, 14.848752975463867, 15.637336730957031, 16.425918579101562, 17.214502334594727, 18.00308609008789, 18.791667938232422, 19.580249786376953, 20.368833541870117, 21.15741539001465, 21.945999145507812, 22.734580993652344, 23.523164749145508, 24.311748504638672, 25.100330352783203, 25.888914108276367]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 10.0, 9.0, 14.0, 6.0, 18.0, 29.0, 20.0, 17.0, 24.0, 27.0, 32.0, 35.0, 37.0, 56.0, 53.0, 46.0, 44.0, 41.0, 51.0, 52.0, 42.0, 29.0, 37.0, 28.0, 34.0, 35.0, 25.0, 20.0, 22.0, 14.0, 21.0, 8.0, 15.0, 15.0, 8.0, 7.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.19389533996582, -29.341651916503906, -28.48940658569336, -27.637161254882812, -26.7849178314209, -25.932674407958984, -25.080429077148438, -24.22818374633789, -23.375940322875977, -22.523696899414062, -21.671451568603516, -20.81920623779297, -19.966962814331055, -19.11471939086914, -18.262474060058594, -17.410228729248047, -16.557985305786133, -15.705740928649902, -14.853496551513672, -14.001252174377441, -13.149007797241211, -12.29676342010498, -11.44451904296875, -10.59227466583252, -9.740030288696289, -8.887785911560059, -8.035541534423828, -7.183297157287598, -6.331052780151367, -5.478808403015137, -4.626564025878906, -3.774319648742676, -2.922077178955078, -2.0698328018188477, -1.2175884246826172, -0.3653440475463867, 0.48690032958984375, 1.3391447067260742, 2.1913890838623047, 3.043633460998535, 3.8958778381347656, 4.748122215270996, 5.600366592407227, 6.452610969543457, 7.3048553466796875, 8.157099723815918, 9.009344100952148, 9.861588478088379, 10.71383285522461, 11.56607723236084, 12.41832160949707, 13.2705659866333, 14.122810363769531, 14.975054740905762, 15.827299118041992, 16.679542541503906, 17.531787872314453, 18.384033203125, 19.236276626586914, 20.088520050048828, 20.940765380859375, 21.793010711669922, 22.645254135131836, 23.49749755859375, 24.349742889404297]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 1.0, 7.0, 4.0, 7.0, 9.0, 6.0, 8.0, 12.0, 13.0, 15.0, 18.0, 18.0, 25.0, 24.0, 31.0, 26.0, 34.0, 41.0, 41.0, 32.0, 46.0, 41.0, 44.0, 32.0, 42.0, 39.0, 34.0, 33.0, 36.0, 33.0, 26.0, 15.0, 25.0, 17.0, 27.0, 18.0, 18.0, 19.0, 15.0, 17.0, 17.0, 7.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0], "bins": [-4.390625, -4.269561767578125, -4.14849853515625, -4.027435302734375, -3.9063720703125, -3.785308837890625, -3.66424560546875, -3.543182373046875, -3.422119140625, -3.301055908203125, -3.17999267578125, -3.058929443359375, -2.9378662109375, -2.816802978515625, -2.69573974609375, -2.574676513671875, -2.45361328125, -2.332550048828125, -2.21148681640625, -2.090423583984375, -1.9693603515625, -1.848297119140625, -1.72723388671875, -1.606170654296875, -1.485107421875, -1.364044189453125, -1.24298095703125, -1.121917724609375, -1.0008544921875, -0.879791259765625, -0.75872802734375, -0.637664794921875, -0.5166015625, -0.395538330078125, -0.27447509765625, -0.153411865234375, -0.0323486328125, 0.088714599609375, 0.20977783203125, 0.330841064453125, 0.451904296875, 0.572967529296875, 0.69403076171875, 0.815093994140625, 0.9361572265625, 1.057220458984375, 1.17828369140625, 1.299346923828125, 1.42041015625, 1.541473388671875, 1.66253662109375, 1.783599853515625, 1.9046630859375, 2.025726318359375, 2.14678955078125, 2.267852783203125, 2.388916015625, 2.509979248046875, 2.63104248046875, 2.752105712890625, 2.8731689453125, 2.994232177734375, 3.11529541015625, 3.236358642578125, 3.357421875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 11.0, 15.0, 21.0, 31.0, 49.0, 72.0, 119.0, 231.0, 386.0, 754.0, 1343.0, 2454.0, 4491.0, 8800.0, 17420.0, 36397.0, 76222.0, 159768.0, 290082.0, 231193.0, 113020.0, 53489.0, 25551.0, 12552.0, 6528.0, 3350.0, 1788.0, 978.0, 558.0, 350.0, 193.0, 126.0, 76.0, 39.0, 36.0, 18.0, 12.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.73291015625, -0.7124176025390625, -0.691925048828125, -0.6714324951171875, -0.65093994140625, -0.6304473876953125, -0.609954833984375, -0.5894622802734375, -0.5689697265625, -0.5484771728515625, -0.527984619140625, -0.5074920654296875, -0.48699951171875, -0.4665069580078125, -0.446014404296875, -0.4255218505859375, -0.405029296875, -0.3845367431640625, -0.364044189453125, -0.3435516357421875, -0.32305908203125, -0.3025665283203125, -0.282073974609375, -0.2615814208984375, -0.2410888671875, -0.2205963134765625, -0.200103759765625, -0.1796112060546875, -0.15911865234375, -0.1386260986328125, -0.118133544921875, -0.0976409912109375, -0.0771484375, -0.0566558837890625, -0.036163330078125, -0.0156707763671875, 0.00482177734375, 0.0253143310546875, 0.045806884765625, 0.0662994384765625, 0.0867919921875, 0.1072845458984375, 0.127777099609375, 0.1482696533203125, 0.16876220703125, 0.1892547607421875, 0.209747314453125, 0.2302398681640625, 0.250732421875, 0.2712249755859375, 0.291717529296875, 0.3122100830078125, 0.33270263671875, 0.3531951904296875, 0.373687744140625, 0.3941802978515625, 0.4146728515625, 0.4351654052734375, 0.455657958984375, 0.4761505126953125, 0.49664306640625, 0.5171356201171875, 0.537628173828125, 0.5581207275390625, 0.57861328125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 3.0, 3.0, 10.0, 8.0, 5.0, 10.0, 12.0, 14.0, 17.0, 20.0, 30.0, 19.0, 18.0, 27.0, 29.0, 30.0, 32.0, 39.0, 38.0, 38.0, 34.0, 32.0, 1062.0, 37.0, 35.0, 34.0, 36.0, 22.0, 40.0, 35.0, 31.0, 26.0, 34.0, 19.0, 21.0, 11.0, 17.0, 14.0, 14.0, 24.0, 4.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0], "bins": [-2.626953125, -2.550048828125, -2.47314453125, -2.396240234375, -2.3193359375, -2.242431640625, -2.16552734375, -2.088623046875, -2.01171875, -1.934814453125, -1.85791015625, -1.781005859375, -1.7041015625, -1.627197265625, -1.55029296875, -1.473388671875, -1.396484375, -1.319580078125, -1.24267578125, -1.165771484375, -1.0888671875, -1.011962890625, -0.93505859375, -0.858154296875, -0.78125, -0.704345703125, -0.62744140625, -0.550537109375, -0.4736328125, -0.396728515625, -0.31982421875, -0.242919921875, -0.166015625, -0.089111328125, -0.01220703125, 0.064697265625, 0.1416015625, 0.218505859375, 0.29541015625, 0.372314453125, 0.44921875, 0.526123046875, 0.60302734375, 0.679931640625, 0.7568359375, 0.833740234375, 0.91064453125, 0.987548828125, 1.064453125, 1.141357421875, 1.21826171875, 1.295166015625, 1.3720703125, 1.448974609375, 1.52587890625, 1.602783203125, 1.6796875, 1.756591796875, 1.83349609375, 1.910400390625, 1.9873046875, 2.064208984375, 2.14111328125, 2.218017578125, 2.294921875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 13.0, 14.0, 17.0, 35.0, 43.0, 70.0, 80.0, 143.0, 175.0, 270.0, 400.0, 585.0, 770.0, 1223.0, 1782.0, 2562.0, 3807.0, 5770.0, 8941.0, 13541.0, 20788.0, 32601.0, 51060.0, 77353.0, 115157.0, 182800.0, 1186776.0, 130609.0, 90708.0, 58905.0, 38561.0, 24724.0, 15932.0, 10374.0, 6748.0, 4437.0, 3041.0, 2002.0, 1343.0, 903.0, 649.0, 440.0, 310.0, 173.0, 148.0, 106.0, 79.0, 59.0, 35.0, 19.0, 23.0, 16.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0], "bins": [-0.285400390625, -0.2765312194824219, -0.26766204833984375, -0.2587928771972656, -0.2499237060546875, -0.24105453491210938, -0.23218536376953125, -0.22331619262695312, -0.214447021484375, -0.20557785034179688, -0.19670867919921875, -0.18783950805664062, -0.1789703369140625, -0.17010116577148438, -0.16123199462890625, -0.15236282348632812, -0.14349365234375, -0.13462448120117188, -0.12575531005859375, -0.11688613891601562, -0.1080169677734375, -0.09914779663085938, -0.09027862548828125, -0.08140945434570312, -0.072540283203125, -0.06367111206054688, -0.05480194091796875, -0.045932769775390625, -0.0370635986328125, -0.028194427490234375, -0.01932525634765625, -0.010456085205078125, -0.0015869140625, 0.007282257080078125, 0.01615142822265625, 0.025020599365234375, 0.0338897705078125, 0.042758941650390625, 0.05162811279296875, 0.060497283935546875, 0.069366455078125, 0.07823562622070312, 0.08710479736328125, 0.09597396850585938, 0.1048431396484375, 0.11371231079101562, 0.12258148193359375, 0.13145065307617188, 0.14031982421875, 0.14918899536132812, 0.15805816650390625, 0.16692733764648438, 0.1757965087890625, 0.18466567993164062, 0.19353485107421875, 0.20240402221679688, 0.211273193359375, 0.22014236450195312, 0.22901153564453125, 0.23788070678710938, 0.2467498779296875, 0.2556190490722656, 0.26448822021484375, 0.2733573913574219, 0.2822265625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 5.0, 15.0, 22.0, 36.0, 48.0, 39.0, 69.0, 88.0, 142.0, 106.0, 112.0, 83.0, 76.0, 33.0, 23.0, 18.0, 13.0, 10.0, 10.0, 8.0, 5.0, 4.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00782012939453125, -0.007546544075012207, -0.007272958755493164, -0.006999373435974121, -0.006725788116455078, -0.006452202796936035, -0.006178617477416992, -0.005905032157897949, -0.005631446838378906, -0.005357861518859863, -0.00508427619934082, -0.004810690879821777, -0.004537105560302734, -0.004263520240783691, -0.0039899349212646484, -0.0037163496017456055, -0.0034427642822265625, -0.0031691789627075195, -0.0028955936431884766, -0.0026220083236694336, -0.0023484230041503906, -0.0020748376846313477, -0.0018012523651123047, -0.0015276670455932617, -0.0012540817260742188, -0.0009804964065551758, -0.0007069110870361328, -0.00043332576751708984, -0.00015974044799804688, 0.0001138448715209961, 0.00038743019104003906, 0.000661015510559082, 0.000934600830078125, 0.001208186149597168, 0.001481771469116211, 0.001755356788635254, 0.002028942108154297, 0.00230252742767334, 0.002576112747192383, 0.0028496980667114258, 0.0031232833862304688, 0.0033968687057495117, 0.0036704540252685547, 0.003944039344787598, 0.004217624664306641, 0.004491209983825684, 0.0047647953033447266, 0.0050383806228637695, 0.0053119659423828125, 0.0055855512619018555, 0.0058591365814208984, 0.006132721900939941, 0.006406307220458984, 0.006679892539978027, 0.00695347785949707, 0.007227063179016113, 0.007500648498535156, 0.007774233818054199, 0.008047819137573242, 0.008321404457092285, 0.008594989776611328, 0.008868575096130371, 0.009142160415649414, 0.009415745735168457, 0.0096893310546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 14.0, 3.0, 7.0, 6.0, 13.0, 21.0, 20.0, 38.0, 62.0, 64.0, 163.0, 338.0, 1056.0, 782402.0, 262558.0, 1003.0, 286.0, 146.0, 123.0, 60.0, 60.0, 32.0, 18.0, 10.0, 10.0, 8.0, 10.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1964111328125, -0.190948486328125, -0.18548583984375, -0.180023193359375, -0.174560546875, -0.169097900390625, -0.16363525390625, -0.158172607421875, -0.1527099609375, -0.147247314453125, -0.14178466796875, -0.136322021484375, -0.130859375, -0.125396728515625, -0.11993408203125, -0.114471435546875, -0.1090087890625, -0.103546142578125, -0.09808349609375, -0.092620849609375, -0.087158203125, -0.081695556640625, -0.07623291015625, -0.070770263671875, -0.0653076171875, -0.059844970703125, -0.05438232421875, -0.048919677734375, -0.04345703125, -0.037994384765625, -0.03253173828125, -0.027069091796875, -0.0216064453125, -0.016143798828125, -0.01068115234375, -0.005218505859375, 0.000244140625, 0.005706787109375, 0.01116943359375, 0.016632080078125, 0.0220947265625, 0.027557373046875, 0.03302001953125, 0.038482666015625, 0.0439453125, 0.049407958984375, 0.05487060546875, 0.060333251953125, 0.0657958984375, 0.071258544921875, 0.07672119140625, 0.082183837890625, 0.087646484375, 0.093109130859375, 0.09857177734375, 0.104034423828125, 0.1094970703125, 0.114959716796875, 0.12042236328125, 0.125885009765625, 0.13134765625, 0.136810302734375, 0.14227294921875, 0.147735595703125, 0.1531982421875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 22.0, 515.0, 437.0, 34.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06322511285543442, -0.061849094927310944, -0.06047308072447777, -0.05909706652164459, -0.05772104859352112, -0.056345030665397644, -0.05496901646256447, -0.05359300225973129, -0.05221698433160782, -0.050840966403484344, -0.04946495220065117, -0.04808893799781799, -0.04671292006969452, -0.045336902141571045, -0.04396088793873787, -0.042584873735904694, -0.04120885580778122, -0.039832837879657745, -0.03845682367682457, -0.037080809473991394, -0.03570479154586792, -0.034328773617744446, -0.03295275941491127, -0.031576745212078094, -0.03020072728395462, -0.028824711218476295, -0.02744869515299797, -0.026072679087519646, -0.02469666302204132, -0.023320646956562996, -0.02194463089108467, -0.020568614825606346, -0.019192596897482872, -0.017816580832004547, -0.016440564766526222, -0.015064548701047897, -0.013688532635569572, -0.012312516570091248, -0.010936500504612923, -0.009560484439134598, -0.008184468373656273, -0.006808452308177948, -0.005432436242699623, -0.004056420177221298, -0.0026804041117429733, -0.0013043880462646484, 7.162801921367645e-05, 0.0014476440846920013, 0.0028236601501703262, 0.004199676215648651, 0.005575692281126976, 0.006951708346605301, 0.008327724412083626, 0.00970374047756195, 0.011079756543040276, 0.0124557726085186, 0.013831788673996925, 0.01520780473947525, 0.016583820804953575, 0.0179598368704319, 0.019335852935910225, 0.02071186900138855, 0.022087885066866875, 0.0234639011323452, 0.024839917197823524]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 15.0, 4.0, 6.0, 13.0, 9.0, 9.0, 15.0, 24.0, 26.0, 20.0, 31.0, 23.0, 38.0, 35.0, 36.0, 35.0, 42.0, 41.0, 37.0, 39.0, 49.0, 37.0, 40.0, 43.0, 29.0, 37.0, 31.0, 34.0, 24.0, 31.0, 23.0, 19.0, 20.0, 18.0, 17.0, 5.0, 10.0, 12.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003990352153778076, -0.0038534821942448616, -0.003716612234711647, -0.0035797422751784325, -0.003442872315645218, -0.0033060023561120033, -0.0031691323965787888, -0.003032262437045574, -0.0028953924775123596, -0.002758522517979145, -0.0026216525584459305, -0.002484782598912716, -0.0023479126393795013, -0.0022110426798462868, -0.002074172720313072, -0.0019373027607798576, -0.001800432801246643, -0.0016635628417134285, -0.001526692882180214, -0.0013898229226469994, -0.0012529529631137848, -0.0011160830035805702, -0.0009792130440473557, -0.0008423430845141411, -0.0007054731249809265, -0.0005686031654477119, -0.0004317332059144974, -0.0002948632463812828, -0.00015799328684806824, -2.1123327314853668e-05, 0.0001157466322183609, 0.00025261659175157547, 0.00038948655128479004, 0.0005263565108180046, 0.0006632264703512192, 0.0008000964298844337, 0.0009369663894176483, 0.0010738363489508629, 0.0012107063084840775, 0.001347576268017292, 0.0014844462275505066, 0.0016213161870837212, 0.0017581861466169357, 0.0018950561061501503, 0.002031926065683365, 0.0021687960252165794, 0.002305665984749794, 0.0024425359442830086, 0.002579405903816223, 0.0027162758633494377, 0.0028531458228826523, 0.002990015782415867, 0.0031268857419490814, 0.003263755701482296, 0.0034006256610155106, 0.003537495620548725, 0.0036743655800819397, 0.0038112355396151543, 0.003948105499148369, 0.004084975458681583, 0.004221845418214798, 0.0043587153777480125, 0.004495585337281227, 0.004632455296814442, 0.004769325256347656]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 1.0, 7.0, 4.0, 7.0, 9.0, 6.0, 8.0, 12.0, 13.0, 15.0, 18.0, 18.0, 25.0, 24.0, 31.0, 26.0, 34.0, 41.0, 40.0, 33.0, 46.0, 41.0, 44.0, 32.0, 42.0, 39.0, 34.0, 33.0, 36.0, 33.0, 26.0, 15.0, 25.0, 17.0, 27.0, 18.0, 18.0, 19.0, 15.0, 17.0, 17.0, 7.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0], "bins": [-4.390625, -4.269561767578125, -4.14849853515625, -4.027435302734375, -3.9063720703125, -3.785308837890625, -3.66424560546875, -3.543182373046875, -3.422119140625, -3.301055908203125, -3.17999267578125, -3.058929443359375, -2.9378662109375, -2.816802978515625, -2.69573974609375, -2.574676513671875, -2.45361328125, -2.332550048828125, -2.21148681640625, -2.090423583984375, -1.9693603515625, -1.848297119140625, -1.72723388671875, -1.606170654296875, -1.485107421875, -1.364044189453125, -1.24298095703125, -1.121917724609375, -1.0008544921875, -0.879791259765625, -0.75872802734375, -0.637664794921875, -0.5166015625, -0.395538330078125, -0.27447509765625, -0.153411865234375, -0.0323486328125, 0.088714599609375, 0.20977783203125, 0.330841064453125, 0.451904296875, 0.572967529296875, 0.69403076171875, 0.815093994140625, 0.9361572265625, 1.057220458984375, 1.17828369140625, 1.299346923828125, 1.42041015625, 1.541473388671875, 1.66253662109375, 1.783599853515625, 1.9046630859375, 2.025726318359375, 2.14678955078125, 2.267852783203125, 2.388916015625, 2.509979248046875, 2.63104248046875, 2.752105712890625, 2.8731689453125, 2.994232177734375, 3.11529541015625, 3.236358642578125, 3.357421875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 6.0, 12.0, 11.0, 15.0, 20.0, 20.0, 25.0, 37.0, 45.0, 69.0, 96.0, 122.0, 171.0, 286.0, 574.0, 1199.0, 3757.0, 14727.0, 59502.0, 337743.0, 522650.0, 79580.0, 19758.0, 5056.0, 1481.0, 574.0, 291.0, 178.0, 104.0, 90.0, 82.0, 54.0, 43.0, 34.0, 24.0, 22.0, 26.0, 16.0, 10.0, 10.0, 4.0, 8.0, 6.0, 0.0, 3.0, 1.0, 0.0, 5.0], "bins": [-8.3515625, -8.1202392578125, -7.888916015625, -7.6575927734375, -7.42626953125, -7.1949462890625, -6.963623046875, -6.7322998046875, -6.5009765625, -6.2696533203125, -6.038330078125, -5.8070068359375, -5.57568359375, -5.3443603515625, -5.113037109375, -4.8817138671875, -4.650390625, -4.4190673828125, -4.187744140625, -3.9564208984375, -3.72509765625, -3.4937744140625, -3.262451171875, -3.0311279296875, -2.7998046875, -2.5684814453125, -2.337158203125, -2.1058349609375, -1.87451171875, -1.6431884765625, -1.411865234375, -1.1805419921875, -0.94921875, -0.7178955078125, -0.486572265625, -0.2552490234375, -0.02392578125, 0.2073974609375, 0.438720703125, 0.6700439453125, 0.9013671875, 1.1326904296875, 1.364013671875, 1.5953369140625, 1.82666015625, 2.0579833984375, 2.289306640625, 2.5206298828125, 2.751953125, 2.9832763671875, 3.214599609375, 3.4459228515625, 3.67724609375, 3.9085693359375, 4.139892578125, 4.3712158203125, 4.6025390625, 4.8338623046875, 5.065185546875, 5.2965087890625, 5.52783203125, 5.7591552734375, 5.990478515625, 6.2218017578125, 6.453125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 13.0, 12.0, 14.0, 9.0, 15.0, 12.0, 15.0, 17.0, 24.0, 19.0, 29.0, 34.0, 35.0, 54.0, 61.0, 64.0, 102.0, 247.0, 1523.0, 193.0, 88.0, 72.0, 48.0, 45.0, 31.0, 31.0, 26.0, 34.0, 27.0, 26.0, 16.0, 15.0, 14.0, 15.0, 13.0, 10.0, 6.0, 6.0, 0.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1484375, -12.74267578125, -12.3369140625, -11.93115234375, -11.525390625, -11.11962890625, -10.7138671875, -10.30810546875, -9.90234375, -9.49658203125, -9.0908203125, -8.68505859375, -8.279296875, -7.87353515625, -7.4677734375, -7.06201171875, -6.65625, -6.25048828125, -5.8447265625, -5.43896484375, -5.033203125, -4.62744140625, -4.2216796875, -3.81591796875, -3.41015625, -3.00439453125, -2.5986328125, -2.19287109375, -1.787109375, -1.38134765625, -0.9755859375, -0.56982421875, -0.1640625, 0.24169921875, 0.6474609375, 1.05322265625, 1.458984375, 1.86474609375, 2.2705078125, 2.67626953125, 3.08203125, 3.48779296875, 3.8935546875, 4.29931640625, 4.705078125, 5.11083984375, 5.5166015625, 5.92236328125, 6.328125, 6.73388671875, 7.1396484375, 7.54541015625, 7.951171875, 8.35693359375, 8.7626953125, 9.16845703125, 9.57421875, 9.97998046875, 10.3857421875, 10.79150390625, 11.197265625, 11.60302734375, 12.0087890625, 12.41455078125, 12.8203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 8.0, 3.0, 10.0, 11.0, 9.0, 18.0, 13.0, 16.0, 29.0, 25.0, 47.0, 42.0, 71.0, 74.0, 100.0, 140.0, 278.0, 669.0, 2958.0, 26969.0, 3038349.0, 69595.0, 4399.0, 878.0, 317.0, 166.0, 118.0, 66.0, 52.0, 50.0, 32.0, 30.0, 24.0, 22.0, 23.0, 21.0, 17.0, 14.0, 11.0, 5.0, 7.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-42.9375, -41.66015625, -40.3828125, -39.10546875, -37.828125, -36.55078125, -35.2734375, -33.99609375, -32.71875, -31.44140625, -30.1640625, -28.88671875, -27.609375, -26.33203125, -25.0546875, -23.77734375, -22.5, -21.22265625, -19.9453125, -18.66796875, -17.390625, -16.11328125, -14.8359375, -13.55859375, -12.28125, -11.00390625, -9.7265625, -8.44921875, -7.171875, -5.89453125, -4.6171875, -3.33984375, -2.0625, -0.78515625, 0.4921875, 1.76953125, 3.046875, 4.32421875, 5.6015625, 6.87890625, 8.15625, 9.43359375, 10.7109375, 11.98828125, 13.265625, 14.54296875, 15.8203125, 17.09765625, 18.375, 19.65234375, 20.9296875, 22.20703125, 23.484375, 24.76171875, 26.0390625, 27.31640625, 28.59375, 29.87109375, 31.1484375, 32.42578125, 33.703125, 34.98046875, 36.2578125, 37.53515625, 38.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 17.0, 16.0, 63.0, 105.0, 187.0, 202.0, 182.0, 147.0, 45.0, 22.0, 13.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.219508171081543, -9.132844924926758, -8.046182632446289, -6.959519863128662, -5.872857093811035, -4.786194324493408, -3.6995315551757812, -2.6128687858581543, -1.5262060165405273, -0.4395432472229004, 0.6471195220947266, 1.7337822914123535, 2.8204450607299805, 3.9071078300476074, 4.993770599365234, 6.080433368682861, 7.167096138000488, 8.253759384155273, 9.340421676635742, 10.427083969116211, 11.513747215270996, 12.600410461425781, 13.68707275390625, 14.773735046386719, 15.860398292541504, 16.94706153869629, 18.033723831176758, 19.120386123657227, 20.207050323486328, 21.293712615966797, 22.380374908447266, 23.467037200927734, 24.55370330810547, 25.640365600585938, 26.727027893066406, 27.813692092895508, 28.900354385375977, 29.987016677856445, 31.073680877685547, 32.160343170166016, 33.247005462646484, 34.33366775512695, 35.42033004760742, 36.50699234008789, 37.593658447265625, 38.680320739746094, 39.76698303222656, 40.85364532470703, 41.9403076171875, 43.02696990966797, 44.11363220214844, 45.200294494628906, 46.286956787109375, 47.37362289428711, 48.46028518676758, 49.54694747924805, 50.633609771728516, 51.720272064208984, 52.80693435668945, 53.89359664916992, 54.980262756347656, 56.066925048828125, 57.153587341308594, 58.24024963378906, 59.32691192626953]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 5.0, 12.0, 4.0, 6.0, 10.0, 17.0, 16.0, 18.0, 16.0, 20.0, 30.0, 25.0, 27.0, 33.0, 22.0, 38.0, 35.0, 40.0, 33.0, 45.0, 41.0, 50.0, 42.0, 35.0, 41.0, 36.0, 35.0, 35.0, 27.0, 34.0, 28.0, 17.0, 16.0, 15.0, 17.0, 11.0, 11.0, 9.0, 10.0, 7.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.81783676147461, -35.67250061035156, -34.52716064453125, -33.3818244934082, -32.236488342285156, -31.09115219116211, -29.94581413269043, -28.80047607421875, -27.655139923095703, -26.509803771972656, -25.364465713500977, -24.219127655029297, -23.07379150390625, -21.928455352783203, -20.783117294311523, -19.637779235839844, -18.492443084716797, -17.34710693359375, -16.20176887512207, -15.056431770324707, -13.911094665527344, -12.76575756072998, -11.620420455932617, -10.475083351135254, -9.32974624633789, -8.184409141540527, -7.039072036743164, -5.893734931945801, -4.7483978271484375, -3.603060722351074, -2.457723617553711, -1.3123865127563477, -0.16704559326171875, 0.9782915115356445, 2.123628616333008, 3.268965721130371, 4.414302825927734, 5.559639930725098, 6.704977035522461, 7.850314140319824, 8.995651245117188, 10.14098834991455, 11.286325454711914, 12.431662559509277, 13.57699966430664, 14.722336769104004, 15.867673873901367, 17.013011932373047, 18.158348083496094, 19.30368423461914, 20.44902229309082, 21.5943603515625, 22.739696502685547, 23.885032653808594, 25.030370712280273, 26.175708770751953, 27.321044921875, 28.466381072998047, 29.611719131469727, 30.757057189941406, 31.902393341064453, 33.0477294921875, 34.19306945800781, 35.33840560913086, 36.483741760253906]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 7.0, 7.0, 7.0, 8.0, 9.0, 18.0, 19.0, 30.0, 22.0, 19.0, 32.0, 33.0, 28.0, 33.0, 33.0, 46.0, 44.0, 37.0, 55.0, 43.0, 47.0, 35.0, 24.0, 40.0, 33.0, 23.0, 38.0, 30.0, 20.0, 30.0, 18.0, 23.0, 15.0, 23.0, 15.0, 10.0, 11.0, 5.0, 2.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.453125, -4.306396484375, -4.15966796875, -4.012939453125, -3.8662109375, -3.719482421875, -3.57275390625, -3.426025390625, -3.279296875, -3.132568359375, -2.98583984375, -2.839111328125, -2.6923828125, -2.545654296875, -2.39892578125, -2.252197265625, -2.10546875, -1.958740234375, -1.81201171875, -1.665283203125, -1.5185546875, -1.371826171875, -1.22509765625, -1.078369140625, -0.931640625, -0.784912109375, -0.63818359375, -0.491455078125, -0.3447265625, -0.197998046875, -0.05126953125, 0.095458984375, 0.2421875, 0.388916015625, 0.53564453125, 0.682373046875, 0.8291015625, 0.975830078125, 1.12255859375, 1.269287109375, 1.416015625, 1.562744140625, 1.70947265625, 1.856201171875, 2.0029296875, 2.149658203125, 2.29638671875, 2.443115234375, 2.58984375, 2.736572265625, 2.88330078125, 3.030029296875, 3.1767578125, 3.323486328125, 3.47021484375, 3.616943359375, 3.763671875, 3.910400390625, 4.05712890625, 4.203857421875, 4.3505859375, 4.497314453125, 4.64404296875, 4.790771484375, 4.9375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 13.0, 13.0, 8.0, 17.0, 25.0, 30.0, 32.0, 60.0, 73.0, 133.0, 217.0, 384.0, 796.0, 1754.0, 4477.0, 12878.0, 44564.0, 171464.0, 610811.0, 1387844.0, 1275600.0, 496416.0, 133326.0, 35360.0, 10708.0, 3882.0, 1690.0, 726.0, 383.0, 187.0, 128.0, 73.0, 50.0, 36.0, 26.0, 28.0, 17.0, 14.0, 12.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9921875, -4.81951904296875, -4.6468505859375, -4.47418212890625, -4.301513671875, -4.12884521484375, -3.9561767578125, -3.78350830078125, -3.61083984375, -3.43817138671875, -3.2655029296875, -3.09283447265625, -2.920166015625, -2.74749755859375, -2.5748291015625, -2.40216064453125, -2.2294921875, -2.05682373046875, -1.8841552734375, -1.71148681640625, -1.538818359375, -1.36614990234375, -1.1934814453125, -1.02081298828125, -0.84814453125, -0.67547607421875, -0.5028076171875, -0.33013916015625, -0.157470703125, 0.01519775390625, 0.1878662109375, 0.36053466796875, 0.533203125, 0.70587158203125, 0.8785400390625, 1.05120849609375, 1.223876953125, 1.39654541015625, 1.5692138671875, 1.74188232421875, 1.91455078125, 2.08721923828125, 2.2598876953125, 2.43255615234375, 2.605224609375, 2.77789306640625, 2.9505615234375, 3.12322998046875, 3.2958984375, 3.46856689453125, 3.6412353515625, 3.81390380859375, 3.986572265625, 4.15924072265625, 4.3319091796875, 4.50457763671875, 4.67724609375, 4.84991455078125, 5.0225830078125, 5.19525146484375, 5.367919921875, 5.54058837890625, 5.7132568359375, 5.88592529296875, 6.05859375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 17.0, 24.0, 42.0, 30.0, 45.0, 66.0, 90.0, 136.0, 169.0, 242.0, 323.0, 424.0, 470.0, 479.0, 414.0, 298.0, 215.0, 155.0, 118.0, 73.0, 73.0, 47.0, 32.0, 20.0, 12.0, 14.0, 10.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.40625, -10.1246337890625, -9.843017578125, -9.5614013671875, -9.27978515625, -8.9981689453125, -8.716552734375, -8.4349365234375, -8.1533203125, -7.8717041015625, -7.590087890625, -7.3084716796875, -7.02685546875, -6.7452392578125, -6.463623046875, -6.1820068359375, -5.900390625, -5.6187744140625, -5.337158203125, -5.0555419921875, -4.77392578125, -4.4923095703125, -4.210693359375, -3.9290771484375, -3.6474609375, -3.3658447265625, -3.084228515625, -2.8026123046875, -2.52099609375, -2.2393798828125, -1.957763671875, -1.6761474609375, -1.39453125, -1.1129150390625, -0.831298828125, -0.5496826171875, -0.26806640625, 0.0135498046875, 0.295166015625, 0.5767822265625, 0.8583984375, 1.1400146484375, 1.421630859375, 1.7032470703125, 1.98486328125, 2.2664794921875, 2.548095703125, 2.8297119140625, 3.111328125, 3.3929443359375, 3.674560546875, 3.9561767578125, 4.23779296875, 4.5194091796875, 4.801025390625, 5.0826416015625, 5.3642578125, 5.6458740234375, 5.927490234375, 6.2091064453125, 6.49072265625, 6.7723388671875, 7.053955078125, 7.3355712890625, 7.6171875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 8.0, 13.0, 12.0, 15.0, 19.0, 50.0, 74.0, 93.0, 131.0, 236.0, 425.0, 792.0, 2180.0, 44102.0, 3847516.0, 291886.0, 4247.0, 1111.0, 516.0, 315.0, 201.0, 99.0, 56.0, 52.0, 45.0, 28.0, 19.0, 14.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.09375, -28.0791015625, -27.064453125, -26.0498046875, -25.03515625, -24.0205078125, -23.005859375, -21.9912109375, -20.9765625, -19.9619140625, -18.947265625, -17.9326171875, -16.91796875, -15.9033203125, -14.888671875, -13.8740234375, -12.859375, -11.8447265625, -10.830078125, -9.8154296875, -8.80078125, -7.7861328125, -6.771484375, -5.7568359375, -4.7421875, -3.7275390625, -2.712890625, -1.6982421875, -0.68359375, 0.3310546875, 1.345703125, 2.3603515625, 3.375, 4.3896484375, 5.404296875, 6.4189453125, 7.43359375, 8.4482421875, 9.462890625, 10.4775390625, 11.4921875, 12.5068359375, 13.521484375, 14.5361328125, 15.55078125, 16.5654296875, 17.580078125, 18.5947265625, 19.609375, 20.6240234375, 21.638671875, 22.6533203125, 23.66796875, 24.6826171875, 25.697265625, 26.7119140625, 27.7265625, 28.7412109375, 29.755859375, 30.7705078125, 31.78515625, 32.7998046875, 33.814453125, 34.8291015625, 35.84375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 211.0, 758.0, 45.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-397.21319580078125, -388.0487365722656, -378.88427734375, -369.7198486328125, -360.5553894042969, -351.39093017578125, -342.2264709472656, -333.06201171875, -323.8975830078125, -314.7331237792969, -305.56866455078125, -296.40423583984375, -287.2397766113281, -278.0753173828125, -268.9108581542969, -259.74639892578125, -250.58193969726562, -241.41748046875, -232.25303649902344, -223.0885772705078, -213.92413330078125, -204.75967407226562, -195.59521484375, -186.43075561523438, -177.2663116455078, -168.1018524169922, -158.93740844726562, -149.77294921875, -140.60848999023438, -131.4440460205078, -122.27958679199219, -113.1151351928711, -103.95066833496094, -94.78621673583984, -85.62176513671875, -76.45730590820312, -67.29285430908203, -58.12840270996094, -48.96394729614258, -39.79949188232422, -30.635040283203125, -21.4705867767334, -12.306133270263672, -3.1416797637939453, 6.022773742675781, 15.187225341796875, 24.351680755615234, 33.516136169433594, 42.68058776855469, 51.84503936767578, 61.00949478149414, 70.1739501953125, 79.3384017944336, 88.50285339355469, 97.66731262207031, 106.8317642211914, 115.9962158203125, 125.1606674194336, 134.3251190185547, 143.4895782470703, 152.65402221679688, 161.8184814453125, 170.98294067382812, 180.14739990234375, 189.3118438720703]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 5.0, 9.0, 8.0, 16.0, 15.0, 19.0, 17.0, 11.0, 31.0, 31.0, 27.0, 34.0, 28.0, 43.0, 46.0, 43.0, 65.0, 51.0, 58.0, 53.0, 36.0, 44.0, 41.0, 40.0, 34.0, 25.0, 25.0, 32.0, 25.0, 19.0, 23.0, 12.0, 6.0, 10.0, 8.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.778839111328125, -31.794004440307617, -30.80916976928711, -29.824337005615234, -28.839502334594727, -27.85466766357422, -26.869834899902344, -25.885000228881836, -24.900165557861328, -23.91533088684082, -22.930496215820312, -21.945663452148438, -20.96082878112793, -19.975994110107422, -18.991161346435547, -18.00632667541504, -17.02149200439453, -16.036657333374023, -15.051823616027832, -14.06698989868164, -13.082155227661133, -12.097320556640625, -11.112486839294434, -10.127653121948242, -9.142818450927734, -8.157983779907227, -7.173150062561035, -6.1883158683776855, -5.203481674194336, -4.218647480010986, -3.2338132858276367, -2.248979091644287, -1.2641448974609375, -0.2793107032775879, 0.7055234909057617, 1.6903576850891113, 2.675191879272461, 3.6600260734558105, 4.64486026763916, 5.62969446182251, 6.614528656005859, 7.599362850189209, 8.584197044372559, 9.56903076171875, 10.553865432739258, 11.538700103759766, 12.523533821105957, 13.508367538452148, 14.493202209472656, 15.478036880493164, 16.462871551513672, 17.447704315185547, 18.432538986206055, 19.417373657226562, 20.402206420898438, 21.387041091918945, 22.371875762939453, 23.35671043395996, 24.34154510498047, 25.326377868652344, 26.31121253967285, 27.29604721069336, 28.280879974365234, 29.265714645385742, 30.25054931640625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 6.0, 11.0, 9.0, 7.0, 11.0, 6.0, 20.0, 18.0, 25.0, 23.0, 21.0, 27.0, 36.0, 33.0, 46.0, 44.0, 43.0, 50.0, 50.0, 42.0, 39.0, 38.0, 34.0, 37.0, 36.0, 34.0, 42.0, 28.0, 29.0, 26.0, 16.0, 27.0, 13.0, 15.0, 11.0, 8.0, 11.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.6112060546875, -4.464599609375, -4.3179931640625, -4.17138671875, -4.0247802734375, -3.878173828125, -3.7315673828125, -3.5849609375, -3.4383544921875, -3.291748046875, -3.1451416015625, -2.99853515625, -2.8519287109375, -2.705322265625, -2.5587158203125, -2.412109375, -2.2655029296875, -2.118896484375, -1.9722900390625, -1.82568359375, -1.6790771484375, -1.532470703125, -1.3858642578125, -1.2392578125, -1.0926513671875, -0.946044921875, -0.7994384765625, -0.65283203125, -0.5062255859375, -0.359619140625, -0.2130126953125, -0.06640625, 0.0802001953125, 0.226806640625, 0.3734130859375, 0.52001953125, 0.6666259765625, 0.813232421875, 0.9598388671875, 1.1064453125, 1.2530517578125, 1.399658203125, 1.5462646484375, 1.69287109375, 1.8394775390625, 1.986083984375, 2.1326904296875, 2.279296875, 2.4259033203125, 2.572509765625, 2.7191162109375, 2.86572265625, 3.0123291015625, 3.158935546875, 3.3055419921875, 3.4521484375, 3.5987548828125, 3.745361328125, 3.8919677734375, 4.03857421875, 4.1851806640625, 4.331787109375, 4.4783935546875, 4.625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 4.0, 6.0, 8.0, 5.0, 10.0, 19.0, 22.0, 32.0, 38.0, 70.0, 81.0, 128.0, 201.0, 291.0, 426.0, 670.0, 1002.0, 1533.0, 2324.0, 3829.0, 5923.0, 9336.0, 14876.0, 24407.0, 39190.0, 66038.0, 110408.0, 175981.0, 209994.0, 148859.0, 91001.0, 54453.0, 32869.0, 20245.0, 12593.0, 7858.0, 4857.0, 3064.0, 2029.0, 1336.0, 846.0, 546.0, 347.0, 252.0, 170.0, 131.0, 61.0, 55.0, 39.0, 30.0, 27.0, 12.0, 5.0, 8.0, 9.0, 1.0, 8.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.476806640625, -0.461578369140625, -0.44635009765625, -0.431121826171875, -0.4158935546875, -0.400665283203125, -0.38543701171875, -0.370208740234375, -0.35498046875, -0.339752197265625, -0.32452392578125, -0.309295654296875, -0.2940673828125, -0.278839111328125, -0.26361083984375, -0.248382568359375, -0.233154296875, -0.217926025390625, -0.20269775390625, -0.187469482421875, -0.1722412109375, -0.157012939453125, -0.14178466796875, -0.126556396484375, -0.111328125, -0.096099853515625, -0.08087158203125, -0.065643310546875, -0.0504150390625, -0.035186767578125, -0.01995849609375, -0.004730224609375, 0.010498046875, 0.025726318359375, 0.04095458984375, 0.056182861328125, 0.0714111328125, 0.086639404296875, 0.10186767578125, 0.117095947265625, 0.13232421875, 0.147552490234375, 0.16278076171875, 0.178009033203125, 0.1932373046875, 0.208465576171875, 0.22369384765625, 0.238922119140625, 0.254150390625, 0.269378662109375, 0.28460693359375, 0.299835205078125, 0.3150634765625, 0.330291748046875, 0.34552001953125, 0.360748291015625, 0.3759765625, 0.391204833984375, 0.40643310546875, 0.421661376953125, 0.4368896484375, 0.452117919921875, 0.46734619140625, 0.482574462890625, 0.497802734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 7.0, 11.0, 15.0, 11.0, 11.0, 14.0, 25.0, 12.0, 25.0, 26.0, 30.0, 34.0, 38.0, 32.0, 36.0, 29.0, 36.0, 31.0, 40.0, 1059.0, 36.0, 37.0, 29.0, 27.0, 44.0, 33.0, 25.0, 36.0, 22.0, 20.0, 23.0, 23.0, 20.0, 12.0, 19.0, 16.0, 15.0, 10.0, 11.0, 3.0, 7.0, 1.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.515625, -2.4346923828125, -2.353759765625, -2.2728271484375, -2.19189453125, -2.1109619140625, -2.030029296875, -1.9490966796875, -1.8681640625, -1.7872314453125, -1.706298828125, -1.6253662109375, -1.54443359375, -1.4635009765625, -1.382568359375, -1.3016357421875, -1.220703125, -1.1397705078125, -1.058837890625, -0.9779052734375, -0.89697265625, -0.8160400390625, -0.735107421875, -0.6541748046875, -0.5732421875, -0.4923095703125, -0.411376953125, -0.3304443359375, -0.24951171875, -0.1685791015625, -0.087646484375, -0.0067138671875, 0.07421875, 0.1551513671875, 0.236083984375, 0.3170166015625, 0.39794921875, 0.4788818359375, 0.559814453125, 0.6407470703125, 0.7216796875, 0.8026123046875, 0.883544921875, 0.9644775390625, 1.04541015625, 1.1263427734375, 1.207275390625, 1.2882080078125, 1.369140625, 1.4500732421875, 1.531005859375, 1.6119384765625, 1.69287109375, 1.7738037109375, 1.854736328125, 1.9356689453125, 2.0166015625, 2.0975341796875, 2.178466796875, 2.2593994140625, 2.34033203125, 2.4212646484375, 2.502197265625, 2.5831298828125, 2.6640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 8.0, 9.0, 10.0, 12.0, 11.0, 31.0, 44.0, 56.0, 81.0, 110.0, 176.0, 270.0, 411.0, 581.0, 811.0, 1277.0, 1841.0, 2942.0, 4165.0, 6654.0, 10004.0, 15680.0, 24539.0, 38636.0, 60227.0, 92889.0, 136574.0, 1210959.0, 165187.0, 114020.0, 74655.0, 47754.0, 30393.0, 19507.0, 12693.0, 8212.0, 5193.0, 3517.0, 2273.0, 1582.0, 1048.0, 680.0, 478.0, 278.0, 195.0, 138.0, 105.0, 73.0, 49.0, 24.0, 26.0, 12.0, 12.0, 9.0, 6.0, 4.0, 4.0, 2.0, 5.0, 1.0], "bins": [-0.30419921875, -0.29461669921875, -0.2850341796875, -0.27545166015625, -0.265869140625, -0.25628662109375, -0.2467041015625, -0.23712158203125, -0.2275390625, -0.21795654296875, -0.2083740234375, -0.19879150390625, -0.189208984375, -0.17962646484375, -0.1700439453125, -0.16046142578125, -0.15087890625, -0.14129638671875, -0.1317138671875, -0.12213134765625, -0.112548828125, -0.10296630859375, -0.0933837890625, -0.08380126953125, -0.07421875, -0.06463623046875, -0.0550537109375, -0.04547119140625, -0.035888671875, -0.02630615234375, -0.0167236328125, -0.00714111328125, 0.00244140625, 0.01202392578125, 0.0216064453125, 0.03118896484375, 0.040771484375, 0.05035400390625, 0.0599365234375, 0.06951904296875, 0.0791015625, 0.08868408203125, 0.0982666015625, 0.10784912109375, 0.117431640625, 0.12701416015625, 0.1365966796875, 0.14617919921875, 0.15576171875, 0.16534423828125, 0.1749267578125, 0.18450927734375, 0.194091796875, 0.20367431640625, 0.2132568359375, 0.22283935546875, 0.232421875, 0.24200439453125, 0.2515869140625, 0.26116943359375, 0.270751953125, 0.28033447265625, 0.2899169921875, 0.29949951171875, 0.30908203125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 7.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 12.0, 12.0, 18.0, 20.0, 43.0, 69.0, 115.0, 173.0, 159.0, 129.0, 68.0, 45.0, 26.0, 16.0, 11.0, 11.0, 5.0, 6.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0107574462890625, -0.010411262512207031, -0.010065078735351562, -0.009718894958496094, -0.009372711181640625, -0.009026527404785156, -0.008680343627929688, -0.008334159851074219, -0.00798797607421875, -0.007641792297363281, -0.0072956085205078125, -0.006949424743652344, -0.006603240966796875, -0.006257057189941406, -0.0059108734130859375, -0.005564689636230469, -0.005218505859375, -0.004872322082519531, -0.0045261383056640625, -0.004179954528808594, -0.003833770751953125, -0.0034875869750976562, -0.0031414031982421875, -0.0027952194213867188, -0.00244903564453125, -0.0021028518676757812, -0.0017566680908203125, -0.0014104843139648438, -0.001064300537109375, -0.0007181167602539062, -0.0003719329833984375, -2.574920654296875e-05, 0.0003204345703125, 0.0006666183471679688, 0.0010128021240234375, 0.0013589859008789062, 0.001705169677734375, 0.0020513534545898438, 0.0023975372314453125, 0.0027437210083007812, 0.00308990478515625, 0.0034360885620117188, 0.0037822723388671875, 0.004128456115722656, 0.004474639892578125, 0.004820823669433594, 0.0051670074462890625, 0.005513191223144531, 0.005859375, 0.006205558776855469, 0.0065517425537109375, 0.006897926330566406, 0.007244110107421875, 0.007590293884277344, 0.007936477661132812, 0.008282661437988281, 0.00862884521484375, 0.008975028991699219, 0.009321212768554688, 0.009667396545410156, 0.010013580322265625, 0.010359764099121094, 0.010705947875976562, 0.011052131652832031, 0.0113983154296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 5.0, 7.0, 6.0, 8.0, 8.0, 10.0, 11.0, 9.0, 12.0, 31.0, 36.0, 52.0, 74.0, 181.0, 275.0, 1202.0, 530110.0, 514557.0, 1202.0, 292.0, 161.0, 84.0, 47.0, 44.0, 32.0, 20.0, 9.0, 8.0, 14.0, 5.0, 9.0, 6.0, 7.0, 4.0, 6.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20361328125, -0.19744300842285156, -0.19127273559570312, -0.1851024627685547, -0.17893218994140625, -0.1727619171142578, -0.16659164428710938, -0.16042137145996094, -0.1542510986328125, -0.14808082580566406, -0.14191055297851562, -0.1357402801513672, -0.12957000732421875, -0.12339973449707031, -0.11722946166992188, -0.11105918884277344, -0.104888916015625, -0.09871864318847656, -0.09254837036132812, -0.08637809753417969, -0.08020782470703125, -0.07403755187988281, -0.06786727905273438, -0.06169700622558594, -0.0555267333984375, -0.04935646057128906, -0.043186187744140625, -0.03701591491699219, -0.03084564208984375, -0.024675369262695312, -0.018505096435546875, -0.012334823608398438, -0.00616455078125, 5.7220458984375e-06, 0.006175994873046875, 0.012346267700195312, 0.01851654052734375, 0.024686813354492188, 0.030857086181640625, 0.03702735900878906, 0.0431976318359375, 0.04936790466308594, 0.055538177490234375, 0.06170845031738281, 0.06787872314453125, 0.07404899597167969, 0.08021926879882812, 0.08638954162597656, 0.092559814453125, 0.09873008728027344, 0.10490036010742188, 0.11107063293457031, 0.11724090576171875, 0.12341117858886719, 0.12958145141601562, 0.13575172424316406, 0.1419219970703125, 0.14809226989746094, 0.15426254272460938, 0.1604328155517578, 0.16660308837890625, 0.1727733612060547, 0.17894363403320312, 0.18511390686035156, 0.1912841796875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 9.0, 939.0, 67.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.1896173059940338, -0.18638519942760468, -0.18315309286117554, -0.1799209862947464, -0.17668887972831726, -0.17345677316188812, -0.17022466659545898, -0.16699256002902985, -0.1637604534626007, -0.16052834689617157, -0.15729624032974243, -0.1540641337633133, -0.15083202719688416, -0.14759992063045502, -0.14436781406402588, -0.14113570749759674, -0.1379035860300064, -0.13467147946357727, -0.13143937289714813, -0.128207266330719, -0.12497515976428986, -0.12174305319786072, -0.11851094663143158, -0.11527883261442184, -0.1120467334985733, -0.10881462693214417, -0.10558252036571503, -0.10235041379928589, -0.09911830723285675, -0.09588620066642761, -0.09265409409999847, -0.08942198008298874, -0.086189866065979, -0.08295775949954987, -0.07972565293312073, -0.07649354636669159, -0.07326143980026245, -0.07002933323383331, -0.06679722666740417, -0.06356511265039444, -0.0603330098092556, -0.05710090324282646, -0.053868796676397324, -0.05063668638467789, -0.04740457981824875, -0.04417247325181961, -0.04094036668539047, -0.037708260118961334, -0.034476153552532196, -0.031244046986103058, -0.02801193855702877, -0.024779831990599632, -0.021547723561525345, -0.018315616995096207, -0.015083510428667068, -0.011851401999592781, -0.008619293570518494, -0.005387186072766781, -0.0021550790406763554, 0.0010770279914140701, 0.004309135489165783, 0.007541242986917496, 0.010773349553346634, 0.014005457982420921, 0.01723756454885006]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 11.0, 9.0, 12.0, 17.0, 21.0, 28.0, 30.0, 35.0, 52.0, 44.0, 56.0, 41.0, 65.0, 59.0, 58.0, 49.0, 54.0, 46.0, 58.0, 29.0, 44.0, 33.0, 21.0, 23.0, 22.0, 22.0, 13.0, 8.0, 11.0, 12.0, 8.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005301833152770996, -0.005056959576904774, -0.004812086001038551, -0.004567212425172329, -0.004322338849306107, -0.004077465273439884, -0.003832591697573662, -0.0035877181217074394, -0.003342844545841217, -0.0030979709699749947, -0.0028530973941087723, -0.00260822381824255, -0.0023633502423763275, -0.002118476666510105, -0.0018736030906438828, -0.0016287295147776604, -0.001383855938911438, -0.0011389823630452156, -0.0008941087871789932, -0.0006492352113127708, -0.00040436163544654846, -0.00015948805958032608, 8.53855162858963e-05, 0.0003302590921521187, 0.0005751326680183411, 0.0008200062438845634, 0.0010648798197507858, 0.0013097533956170082, 0.0015546269714832306, 0.001799500547349453, 0.0020443741232156754, 0.0022892476990818977, 0.00253412127494812, 0.0027789948508143425, 0.003023868426680565, 0.0032687420025467873, 0.0035136155784130096, 0.003758489154279232, 0.004003362730145454, 0.004248236306011677, 0.004493109881877899, 0.0047379834577441216, 0.004982857033610344, 0.005227730609476566, 0.005472604185342789, 0.005717477761209011, 0.0059623513370752335, 0.006207224912941456, 0.006452098488807678, 0.006696972064673901, 0.006941845640540123, 0.007186719216406345, 0.007431592792272568, 0.00767646636813879, 0.007921339944005013, 0.008166213519871235, 0.008411087095737457, 0.00865596067160368, 0.008900834247469902, 0.009145707823336124, 0.009390581399202347, 0.00963545497506857, 0.009880328550934792, 0.010125202126801014, 0.010370075702667236]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 6.0, 11.0, 9.0, 8.0, 10.0, 7.0, 19.0, 20.0, 23.0, 24.0, 20.0, 30.0, 33.0, 34.0, 47.0, 44.0, 41.0, 51.0, 49.0, 42.0, 39.0, 39.0, 34.0, 37.0, 36.0, 33.0, 42.0, 28.0, 29.0, 26.0, 16.0, 27.0, 13.0, 15.0, 11.0, 8.0, 11.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75390625, -4.60736083984375, -4.4608154296875, -4.31427001953125, -4.167724609375, -4.02117919921875, -3.8746337890625, -3.72808837890625, -3.58154296875, -3.43499755859375, -3.2884521484375, -3.14190673828125, -2.995361328125, -2.84881591796875, -2.7022705078125, -2.55572509765625, -2.4091796875, -2.26263427734375, -2.1160888671875, -1.96954345703125, -1.822998046875, -1.67645263671875, -1.5299072265625, -1.38336181640625, -1.23681640625, -1.09027099609375, -0.9437255859375, -0.79718017578125, -0.650634765625, -0.50408935546875, -0.3575439453125, -0.21099853515625, -0.064453125, 0.08209228515625, 0.2286376953125, 0.37518310546875, 0.521728515625, 0.66827392578125, 0.8148193359375, 0.96136474609375, 1.10791015625, 1.25445556640625, 1.4010009765625, 1.54754638671875, 1.694091796875, 1.84063720703125, 1.9871826171875, 2.13372802734375, 2.2802734375, 2.42681884765625, 2.5733642578125, 2.71990966796875, 2.866455078125, 3.01300048828125, 3.1595458984375, 3.30609130859375, 3.45263671875, 3.59918212890625, 3.7457275390625, 3.89227294921875, 4.038818359375, 4.18536376953125, 4.3319091796875, 4.47845458984375, 4.625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 9.0, 8.0, 13.0, 7.0, 20.0, 38.0, 56.0, 80.0, 142.0, 290.0, 603.0, 1307.0, 2954.0, 6925.0, 16210.0, 37500.0, 97181.0, 278768.0, 369043.0, 144667.0, 53482.0, 22008.0, 9589.0, 4146.0, 1760.0, 817.0, 417.0, 183.0, 113.0, 64.0, 32.0, 28.0, 28.0, 8.0, 7.0, 10.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.124755859375, -4.96044921875, -4.796142578125, -4.6318359375, -4.467529296875, -4.30322265625, -4.138916015625, -3.974609375, -3.810302734375, -3.64599609375, -3.481689453125, -3.3173828125, -3.153076171875, -2.98876953125, -2.824462890625, -2.66015625, -2.495849609375, -2.33154296875, -2.167236328125, -2.0029296875, -1.838623046875, -1.67431640625, -1.510009765625, -1.345703125, -1.181396484375, -1.01708984375, -0.852783203125, -0.6884765625, -0.524169921875, -0.35986328125, -0.195556640625, -0.03125, 0.133056640625, 0.29736328125, 0.461669921875, 0.6259765625, 0.790283203125, 0.95458984375, 1.118896484375, 1.283203125, 1.447509765625, 1.61181640625, 1.776123046875, 1.9404296875, 2.104736328125, 2.26904296875, 2.433349609375, 2.59765625, 2.761962890625, 2.92626953125, 3.090576171875, 3.2548828125, 3.419189453125, 3.58349609375, 3.747802734375, 3.912109375, 4.076416015625, 4.24072265625, 4.405029296875, 4.5693359375, 4.733642578125, 4.89794921875, 5.062255859375, 5.2265625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 6.0, 9.0, 14.0, 23.0, 30.0, 18.0, 29.0, 29.0, 32.0, 31.0, 39.0, 42.0, 52.0, 53.0, 113.0, 224.0, 1430.0, 269.0, 131.0, 68.0, 40.0, 54.0, 46.0, 42.0, 33.0, 33.0, 18.0, 17.0, 21.0, 12.0, 12.0, 14.0, 18.0, 5.0, 5.0, 8.0, 4.0, 4.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.14453125, -15.6640625, -15.18359375, -14.703125, -14.22265625, -13.7421875, -13.26171875, -12.78125, -12.30078125, -11.8203125, -11.33984375, -10.859375, -10.37890625, -9.8984375, -9.41796875, -8.9375, -8.45703125, -7.9765625, -7.49609375, -7.015625, -6.53515625, -6.0546875, -5.57421875, -5.09375, -4.61328125, -4.1328125, -3.65234375, -3.171875, -2.69140625, -2.2109375, -1.73046875, -1.25, -0.76953125, -0.2890625, 0.19140625, 0.671875, 1.15234375, 1.6328125, 2.11328125, 2.59375, 3.07421875, 3.5546875, 4.03515625, 4.515625, 4.99609375, 5.4765625, 5.95703125, 6.4375, 6.91796875, 7.3984375, 7.87890625, 8.359375, 8.83984375, 9.3203125, 9.80078125, 10.28125, 10.76171875, 11.2421875, 11.72265625, 12.203125, 12.68359375, 13.1640625, 13.64453125, 14.125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 16.0, 11.0, 13.0, 13.0, 23.0, 26.0, 31.0, 38.0, 78.0, 75.0, 118.0, 217.0, 283.0, 562.0, 1366.0, 7476.0, 1016485.0, 2105467.0, 10259.0, 1515.0, 636.0, 289.0, 181.0, 148.0, 93.0, 69.0, 55.0, 29.0, 24.0, 15.0, 17.0, 12.0, 7.0, 8.0, 11.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-35.0625, -34.062255859375, -33.06201171875, -32.061767578125, -31.0615234375, -30.061279296875, -29.06103515625, -28.060791015625, -27.060546875, -26.060302734375, -25.06005859375, -24.059814453125, -23.0595703125, -22.059326171875, -21.05908203125, -20.058837890625, -19.05859375, -18.058349609375, -17.05810546875, -16.057861328125, -15.0576171875, -14.057373046875, -13.05712890625, -12.056884765625, -11.056640625, -10.056396484375, -9.05615234375, -8.055908203125, -7.0556640625, -6.055419921875, -5.05517578125, -4.054931640625, -3.0546875, -2.054443359375, -1.05419921875, -0.053955078125, 0.9462890625, 1.946533203125, 2.94677734375, 3.947021484375, 4.947265625, 5.947509765625, 6.94775390625, 7.947998046875, 8.9482421875, 9.948486328125, 10.94873046875, 11.948974609375, 12.94921875, 13.949462890625, 14.94970703125, 15.949951171875, 16.9501953125, 17.950439453125, 18.95068359375, 19.950927734375, 20.951171875, 21.951416015625, 22.95166015625, 23.951904296875, 24.9521484375, 25.952392578125, 26.95263671875, 27.952880859375, 28.953125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 22.0, 120.0, 383.0, 354.0, 111.0, 22.0, 2.0, 1.0, 0.0, 1.0], "bins": [-128.77508544921875, -126.50971984863281, -124.24435424804688, -121.97898864746094, -119.713623046875, -117.44825744628906, -115.18289184570312, -112.91753387451172, -110.65216827392578, -108.38680267333984, -106.1214370727539, -103.85607147216797, -101.59070587158203, -99.32534790039062, -97.05998229980469, -94.79461669921875, -92.52925109863281, -90.26388549804688, -87.99851989746094, -85.733154296875, -83.46778869628906, -81.20242309570312, -78.93705749511719, -76.67169952392578, -74.40632629394531, -72.14096069335938, -69.87559509277344, -67.6102294921875, -65.34486389160156, -63.07950210571289, -60.81413650512695, -58.548770904541016, -56.283409118652344, -54.018043518066406, -51.75267791748047, -49.48731231689453, -47.22195053100586, -44.95658493041992, -42.691219329833984, -40.42585372924805, -38.16048812866211, -35.89512252807617, -33.629756927490234, -31.36439323425293, -29.099029541015625, -26.833663940429688, -24.56829833984375, -22.302932739257812, -20.037569046020508, -17.77220344543457, -15.506839752197266, -13.241474151611328, -10.976109504699707, -8.710744857788086, -6.445379257202148, -4.180014610290527, -1.9146499633789062, 0.35071492195129395, 2.616079807281494, 4.881444931030273, 7.1468095779418945, 9.412174224853516, 11.677539825439453, 13.942904472351074, 16.208269119262695]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 9.0, 5.0, 5.0, 12.0, 10.0, 7.0, 11.0, 11.0, 17.0, 15.0, 28.0, 31.0, 31.0, 30.0, 33.0, 33.0, 36.0, 49.0, 36.0, 33.0, 40.0, 35.0, 32.0, 44.0, 44.0, 27.0, 35.0, 35.0, 37.0, 33.0, 26.0, 26.0, 13.0, 23.0, 22.0, 11.0, 13.0, 11.0, 8.0, 6.0, 5.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.420597076416016, -35.336246490478516, -34.25189971923828, -33.16754913330078, -32.08319854736328, -30.99884796142578, -29.914499282836914, -28.830150604248047, -27.745800018310547, -26.661449432373047, -25.57710075378418, -24.492752075195312, -23.408401489257812, -22.324050903320312, -21.239702224731445, -20.155353546142578, -19.071002960205078, -17.986652374267578, -16.90230369567871, -15.817954063415527, -14.733604431152344, -13.64925479888916, -12.564905166625977, -11.480555534362793, -10.39620590209961, -9.311856269836426, -8.227506637573242, -7.143157005310059, -6.058807373046875, -4.974457740783691, -3.890108108520508, -2.805758476257324, -1.7214126586914062, -0.6370630264282227, 0.44728660583496094, 1.5316362380981445, 2.615985870361328, 3.7003355026245117, 4.784685134887695, 5.869034767150879, 6.9533843994140625, 8.037734031677246, 9.12208366394043, 10.206433296203613, 11.290782928466797, 12.37513256072998, 13.459482192993164, 14.543831825256348, 15.628181457519531, 16.71253204345703, 17.7968807220459, 18.881229400634766, 19.965579986572266, 21.049930572509766, 22.134279251098633, 23.2186279296875, 24.302978515625, 25.3873291015625, 26.471677780151367, 27.556026458740234, 28.640377044677734, 29.724727630615234, 30.8090763092041, 31.89342498779297, 32.97777557373047]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 2.0, 9.0, 9.0, 16.0, 11.0, 13.0, 21.0, 17.0, 21.0, 28.0, 42.0, 37.0, 33.0, 39.0, 50.0, 35.0, 42.0, 50.0, 53.0, 41.0, 44.0, 42.0, 34.0, 39.0, 32.0, 25.0, 32.0, 33.0, 23.0, 19.0, 20.0, 14.0, 13.0, 11.0, 8.0, 8.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.25390625, -5.09564208984375, -4.9373779296875, -4.77911376953125, -4.620849609375, -4.46258544921875, -4.3043212890625, -4.14605712890625, -3.98779296875, -3.82952880859375, -3.6712646484375, -3.51300048828125, -3.354736328125, -3.19647216796875, -3.0382080078125, -2.87994384765625, -2.7216796875, -2.56341552734375, -2.4051513671875, -2.24688720703125, -2.088623046875, -1.93035888671875, -1.7720947265625, -1.61383056640625, -1.45556640625, -1.29730224609375, -1.1390380859375, -0.98077392578125, -0.822509765625, -0.66424560546875, -0.5059814453125, -0.34771728515625, -0.189453125, -0.03118896484375, 0.1270751953125, 0.28533935546875, 0.443603515625, 0.60186767578125, 0.7601318359375, 0.91839599609375, 1.07666015625, 1.23492431640625, 1.3931884765625, 1.55145263671875, 1.709716796875, 1.86798095703125, 2.0262451171875, 2.18450927734375, 2.3427734375, 2.50103759765625, 2.6593017578125, 2.81756591796875, 2.975830078125, 3.13409423828125, 3.2923583984375, 3.45062255859375, 3.60888671875, 3.76715087890625, 3.9254150390625, 4.08367919921875, 4.241943359375, 4.40020751953125, 4.5584716796875, 4.71673583984375, 4.875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 4.0, 7.0, 3.0, 11.0, 5.0, 7.0, 18.0, 24.0, 11.0, 26.0, 29.0, 39.0, 42.0, 61.0, 81.0, 156.0, 373.0, 1545.0, 9986.0, 131384.0, 1956813.0, 1946742.0, 133866.0, 10468.0, 1606.0, 425.0, 164.0, 85.0, 60.0, 46.0, 28.0, 29.0, 28.0, 20.0, 21.0, 17.0, 8.0, 8.0, 7.0, 8.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.314697265625, -10.94970703125, -10.584716796875, -10.2197265625, -9.854736328125, -9.48974609375, -9.124755859375, -8.759765625, -8.394775390625, -8.02978515625, -7.664794921875, -7.2998046875, -6.934814453125, -6.56982421875, -6.204833984375, -5.83984375, -5.474853515625, -5.10986328125, -4.744873046875, -4.3798828125, -4.014892578125, -3.64990234375, -3.284912109375, -2.919921875, -2.554931640625, -2.18994140625, -1.824951171875, -1.4599609375, -1.094970703125, -0.72998046875, -0.364990234375, 0.0, 0.364990234375, 0.72998046875, 1.094970703125, 1.4599609375, 1.824951171875, 2.18994140625, 2.554931640625, 2.919921875, 3.284912109375, 3.64990234375, 4.014892578125, 4.3798828125, 4.744873046875, 5.10986328125, 5.474853515625, 5.83984375, 6.204833984375, 6.56982421875, 6.934814453125, 7.2998046875, 7.664794921875, 8.02978515625, 8.394775390625, 8.759765625, 9.124755859375, 9.48974609375, 9.854736328125, 10.2197265625, 10.584716796875, 10.94970703125, 11.314697265625, 11.6796875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 10.0, 12.0, 13.0, 17.0, 20.0, 26.0, 43.0, 37.0, 57.0, 77.0, 105.0, 124.0, 173.0, 256.0, 372.0, 388.0, 448.0, 447.0, 353.0, 272.0, 207.0, 138.0, 113.0, 84.0, 66.0, 42.0, 38.0, 28.0, 26.0, 22.0, 9.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.56640625, -7.34814453125, -7.1298828125, -6.91162109375, -6.693359375, -6.47509765625, -6.2568359375, -6.03857421875, -5.8203125, -5.60205078125, -5.3837890625, -5.16552734375, -4.947265625, -4.72900390625, -4.5107421875, -4.29248046875, -4.07421875, -3.85595703125, -3.6376953125, -3.41943359375, -3.201171875, -2.98291015625, -2.7646484375, -2.54638671875, -2.328125, -2.10986328125, -1.8916015625, -1.67333984375, -1.455078125, -1.23681640625, -1.0185546875, -0.80029296875, -0.58203125, -0.36376953125, -0.1455078125, 0.07275390625, 0.291015625, 0.50927734375, 0.7275390625, 0.94580078125, 1.1640625, 1.38232421875, 1.6005859375, 1.81884765625, 2.037109375, 2.25537109375, 2.4736328125, 2.69189453125, 2.91015625, 3.12841796875, 3.3466796875, 3.56494140625, 3.783203125, 4.00146484375, 4.2197265625, 4.43798828125, 4.65625, 4.87451171875, 5.0927734375, 5.31103515625, 5.529296875, 5.74755859375, 5.9658203125, 6.18408203125, 6.40234375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 12.0, 20.0, 24.0, 31.0, 45.0, 66.0, 89.0, 104.0, 140.0, 255.0, 344.0, 679.0, 2541.0, 52063.0, 2939981.0, 1173490.0, 21108.0, 1641.0, 552.0, 331.0, 207.0, 137.0, 101.0, 68.0, 59.0, 43.0, 34.0, 21.0, 12.0, 19.0, 14.0, 4.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.609375, -21.8525390625, -21.095703125, -20.3388671875, -19.58203125, -18.8251953125, -18.068359375, -17.3115234375, -16.5546875, -15.7978515625, -15.041015625, -14.2841796875, -13.52734375, -12.7705078125, -12.013671875, -11.2568359375, -10.5, -9.7431640625, -8.986328125, -8.2294921875, -7.47265625, -6.7158203125, -5.958984375, -5.2021484375, -4.4453125, -3.6884765625, -2.931640625, -2.1748046875, -1.41796875, -0.6611328125, 0.095703125, 0.8525390625, 1.609375, 2.3662109375, 3.123046875, 3.8798828125, 4.63671875, 5.3935546875, 6.150390625, 6.9072265625, 7.6640625, 8.4208984375, 9.177734375, 9.9345703125, 10.69140625, 11.4482421875, 12.205078125, 12.9619140625, 13.71875, 14.4755859375, 15.232421875, 15.9892578125, 16.74609375, 17.5029296875, 18.259765625, 19.0166015625, 19.7734375, 20.5302734375, 21.287109375, 22.0439453125, 22.80078125, 23.5576171875, 24.314453125, 25.0712890625, 25.828125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 10.0, 39.0, 131.0, 253.0, 318.0, 173.0, 72.0, 18.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.6399154663086, -86.26260375976562, -83.88529205322266, -81.50798034667969, -79.13066864013672, -76.75335693359375, -74.37604522705078, -71.99873352050781, -69.62142944335938, -67.2441177368164, -64.86680603027344, -62.48949432373047, -60.1121826171875, -57.73487091064453, -55.35756301879883, -52.98025131225586, -50.602935791015625, -48.225624084472656, -45.84831237792969, -43.47100067138672, -41.09368896484375, -38.71637725830078, -36.33906936645508, -33.96175765991211, -31.58444595336914, -29.207134246826172, -26.829822540283203, -24.452512741088867, -22.0752010345459, -19.69788932800293, -17.320579528808594, -14.943267822265625, -12.565963745117188, -10.188652038574219, -7.811341285705566, -5.434030055999756, -3.0567188262939453, -0.6794071197509766, 1.6979036331176758, 4.075214385986328, 6.452526092529297, 8.829837799072266, 11.207148551940918, 13.58445930480957, 15.961771011352539, 18.339082717895508, 20.716392517089844, 23.093704223632812, 25.47101593017578, 27.84832763671875, 30.22563934326172, 32.60295104980469, 34.980262756347656, 37.357574462890625, 39.73488235473633, 42.1121940612793, 44.489505767822266, 46.866817474365234, 49.2441291809082, 51.62144088745117, 53.998748779296875, 56.376060485839844, 58.75337219238281, 61.13068389892578, 63.50799560546875]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 6.0, 9.0, 7.0, 13.0, 8.0, 15.0, 17.0, 21.0, 21.0, 24.0, 33.0, 21.0, 34.0, 26.0, 36.0, 43.0, 39.0, 49.0, 38.0, 46.0, 38.0, 48.0, 41.0, 38.0, 46.0, 28.0, 40.0, 25.0, 37.0, 19.0, 24.0, 24.0, 17.0, 10.0, 6.0, 12.0, 7.0, 10.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.472126007080078, -24.712486267089844, -23.95284652709961, -23.193206787109375, -22.43356704711914, -21.673927307128906, -20.914287567138672, -20.154647827148438, -19.395008087158203, -18.63536834716797, -17.875728607177734, -17.1160888671875, -16.356449127197266, -15.596809387207031, -14.837169647216797, -14.077529907226562, -13.317890167236328, -12.558250427246094, -11.79861068725586, -11.038970947265625, -10.27933120727539, -9.519691467285156, -8.760051727294922, -8.000411987304688, -7.240772247314453, -6.481132507324219, -5.721492767333984, -4.96185302734375, -4.202213287353516, -3.4425735473632812, -2.682933807373047, -1.9232940673828125, -1.1636543273925781, -0.40401458740234375, 0.3556251525878906, 1.115264892578125, 1.8749046325683594, 2.6345443725585938, 3.394184112548828, 4.1538238525390625, 4.913463592529297, 5.673103332519531, 6.432743072509766, 7.1923828125, 7.952022552490234, 8.711662292480469, 9.471302032470703, 10.230941772460938, 10.990581512451172, 11.750221252441406, 12.50986099243164, 13.269500732421875, 14.02914047241211, 14.788780212402344, 15.548419952392578, 16.308059692382812, 17.067699432373047, 17.82733917236328, 18.586978912353516, 19.34661865234375, 20.106258392333984, 20.86589813232422, 21.625537872314453, 22.385177612304688, 23.144817352294922]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 11.0, 15.0, 12.0, 26.0, 20.0, 23.0, 28.0, 21.0, 40.0, 33.0, 42.0, 37.0, 40.0, 42.0, 44.0, 47.0, 43.0, 45.0, 43.0, 31.0, 42.0, 39.0, 25.0, 35.0, 24.0, 21.0, 19.0, 18.0, 23.0, 15.0, 13.0, 10.0, 12.0, 7.0, 3.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.703125, -4.55908203125, -4.4150390625, -4.27099609375, -4.126953125, -3.98291015625, -3.8388671875, -3.69482421875, -3.55078125, -3.40673828125, -3.2626953125, -3.11865234375, -2.974609375, -2.83056640625, -2.6865234375, -2.54248046875, -2.3984375, -2.25439453125, -2.1103515625, -1.96630859375, -1.822265625, -1.67822265625, -1.5341796875, -1.39013671875, -1.24609375, -1.10205078125, -0.9580078125, -0.81396484375, -0.669921875, -0.52587890625, -0.3818359375, -0.23779296875, -0.09375, 0.05029296875, 0.1943359375, 0.33837890625, 0.482421875, 0.62646484375, 0.7705078125, 0.91455078125, 1.05859375, 1.20263671875, 1.3466796875, 1.49072265625, 1.634765625, 1.77880859375, 1.9228515625, 2.06689453125, 2.2109375, 2.35498046875, 2.4990234375, 2.64306640625, 2.787109375, 2.93115234375, 3.0751953125, 3.21923828125, 3.36328125, 3.50732421875, 3.6513671875, 3.79541015625, 3.939453125, 4.08349609375, 4.2275390625, 4.37158203125, 4.515625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 13.0, 18.0, 18.0, 23.0, 42.0, 63.0, 89.0, 169.0, 191.0, 328.0, 589.0, 971.0, 1563.0, 2624.0, 4482.0, 7968.0, 13795.0, 24434.0, 44600.0, 81900.0, 147439.0, 226588.0, 208116.0, 125901.0, 69598.0, 37734.0, 20909.0, 11785.0, 6788.0, 3880.0, 2259.0, 1358.0, 865.0, 511.0, 350.0, 202.0, 135.0, 102.0, 53.0, 32.0, 23.0, 16.0, 5.0, 8.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.5751953125, -0.5586967468261719, -0.5421981811523438, -0.5256996154785156, -0.5092010498046875, -0.4927024841308594, -0.47620391845703125, -0.4597053527832031, -0.443206787109375, -0.4267082214355469, -0.41020965576171875, -0.3937110900878906, -0.3772125244140625, -0.3607139587402344, -0.34421539306640625, -0.3277168273925781, -0.31121826171875, -0.2947196960449219, -0.27822113037109375, -0.2617225646972656, -0.2452239990234375, -0.22872543334960938, -0.21222686767578125, -0.19572830200195312, -0.179229736328125, -0.16273117065429688, -0.14623260498046875, -0.12973403930664062, -0.1132354736328125, -0.09673690795898438, -0.08023834228515625, -0.06373977661132812, -0.0472412109375, -0.030742645263671875, -0.01424407958984375, 0.002254486083984375, 0.0187530517578125, 0.035251617431640625, 0.05175018310546875, 0.06824874877929688, 0.084747314453125, 0.10124588012695312, 0.11774444580078125, 0.13424301147460938, 0.1507415771484375, 0.16724014282226562, 0.18373870849609375, 0.20023727416992188, 0.21673583984375, 0.23323440551757812, 0.24973297119140625, 0.2662315368652344, 0.2827301025390625, 0.2992286682128906, 0.31572723388671875, 0.3322257995605469, 0.348724365234375, 0.3652229309082031, 0.38172149658203125, 0.3982200622558594, 0.4147186279296875, 0.4312171936035156, 0.44771575927734375, 0.4642143249511719, 0.480712890625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 7.0, 10.0, 11.0, 12.0, 17.0, 20.0, 11.0, 27.0, 23.0, 32.0, 37.0, 31.0, 52.0, 30.0, 38.0, 31.0, 40.0, 41.0, 1058.0, 43.0, 33.0, 44.0, 34.0, 30.0, 35.0, 29.0, 30.0, 36.0, 17.0, 27.0, 16.0, 19.0, 17.0, 15.0, 10.0, 11.0, 8.0, 9.0, 5.0, 9.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.1953125, -3.10491943359375, -3.0145263671875, -2.92413330078125, -2.833740234375, -2.74334716796875, -2.6529541015625, -2.56256103515625, -2.47216796875, -2.38177490234375, -2.2913818359375, -2.20098876953125, -2.110595703125, -2.02020263671875, -1.9298095703125, -1.83941650390625, -1.7490234375, -1.65863037109375, -1.5682373046875, -1.47784423828125, -1.387451171875, -1.29705810546875, -1.2066650390625, -1.11627197265625, -1.02587890625, -0.93548583984375, -0.8450927734375, -0.75469970703125, -0.664306640625, -0.57391357421875, -0.4835205078125, -0.39312744140625, -0.302734375, -0.21234130859375, -0.1219482421875, -0.03155517578125, 0.058837890625, 0.14923095703125, 0.2396240234375, 0.33001708984375, 0.42041015625, 0.51080322265625, 0.6011962890625, 0.69158935546875, 0.781982421875, 0.87237548828125, 0.9627685546875, 1.05316162109375, 1.1435546875, 1.23394775390625, 1.3243408203125, 1.41473388671875, 1.505126953125, 1.59552001953125, 1.6859130859375, 1.77630615234375, 1.86669921875, 1.95709228515625, 2.0474853515625, 2.13787841796875, 2.228271484375, 2.31866455078125, 2.4090576171875, 2.49945068359375, 2.58984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 6.0, 4.0, 20.0, 21.0, 31.0, 50.0, 96.0, 102.0, 177.0, 226.0, 316.0, 436.0, 594.0, 938.0, 1260.0, 1737.0, 2470.0, 3583.0, 5115.0, 7318.0, 10625.0, 15274.0, 22148.0, 32633.0, 47083.0, 67356.0, 93478.0, 124041.0, 1187908.0, 132726.0, 101039.0, 72759.0, 51060.0, 35566.0, 24439.0, 16608.0, 11517.0, 7935.0, 5384.0, 3851.0, 2722.0, 1858.0, 1359.0, 971.0, 653.0, 535.0, 351.0, 254.0, 176.0, 115.0, 80.0, 52.0, 27.0, 25.0, 12.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.252197265625, -0.24422073364257812, -0.23624420166015625, -0.22826766967773438, -0.2202911376953125, -0.21231460571289062, -0.20433807373046875, -0.19636154174804688, -0.188385009765625, -0.18040847778320312, -0.17243194580078125, -0.16445541381835938, -0.1564788818359375, -0.14850234985351562, -0.14052581787109375, -0.13254928588867188, -0.12457275390625, -0.11659622192382812, -0.10861968994140625, -0.10064315795898438, -0.0926666259765625, -0.08469009399414062, -0.07671356201171875, -0.06873703002929688, -0.060760498046875, -0.052783966064453125, -0.04480743408203125, -0.036830902099609375, -0.0288543701171875, -0.020877838134765625, -0.01290130615234375, -0.004924774169921875, 0.0030517578125, 0.011028289794921875, 0.01900482177734375, 0.026981353759765625, 0.0349578857421875, 0.042934417724609375, 0.05091094970703125, 0.058887481689453125, 0.066864013671875, 0.07484054565429688, 0.08281707763671875, 0.09079360961914062, 0.0987701416015625, 0.10674667358398438, 0.11472320556640625, 0.12269973754882812, 0.13067626953125, 0.13865280151367188, 0.14662933349609375, 0.15460586547851562, 0.1625823974609375, 0.17055892944335938, 0.17853546142578125, 0.18651199340820312, 0.194488525390625, 0.20246505737304688, 0.21044158935546875, 0.21841812133789062, 0.2263946533203125, 0.23437118530273438, 0.24234771728515625, 0.2503242492675781, 0.25830078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 7.0, 10.0, 5.0, 10.0, 9.0, 11.0, 14.0, 25.0, 28.0, 50.0, 49.0, 98.0, 104.0, 123.0, 120.0, 70.0, 61.0, 42.0, 25.0, 28.0, 11.0, 10.0, 12.0, 9.0, 10.0, 7.0, 3.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005950927734375, -0.005760610103607178, -0.0055702924728393555, -0.005379974842071533, -0.005189657211303711, -0.004999339580535889, -0.004809021949768066, -0.004618704319000244, -0.004428386688232422, -0.0042380690574646, -0.004047751426696777, -0.003857433795928955, -0.003667116165161133, -0.0034767985343933105, -0.0032864809036254883, -0.003096163272857666, -0.0029058456420898438, -0.0027155280113220215, -0.0025252103805541992, -0.002334892749786377, -0.0021445751190185547, -0.0019542574882507324, -0.0017639398574829102, -0.0015736222267150879, -0.0013833045959472656, -0.0011929869651794434, -0.001002669334411621, -0.0008123517036437988, -0.0006220340728759766, -0.0004317164421081543, -0.00024139881134033203, -5.1081180572509766e-05, 0.0001392364501953125, 0.00032955408096313477, 0.000519871711730957, 0.0007101893424987793, 0.0009005069732666016, 0.0010908246040344238, 0.001281142234802246, 0.0014714598655700684, 0.0016617774963378906, 0.0018520951271057129, 0.002042412757873535, 0.0022327303886413574, 0.0024230480194091797, 0.002613365650177002, 0.0028036832809448242, 0.0029940009117126465, 0.0031843185424804688, 0.003374636173248291, 0.0035649538040161133, 0.0037552714347839355, 0.003945589065551758, 0.00413590669631958, 0.004326224327087402, 0.004516541957855225, 0.004706859588623047, 0.004897177219390869, 0.005087494850158691, 0.005277812480926514, 0.005468130111694336, 0.005658447742462158, 0.0058487653732299805, 0.006039083003997803, 0.006229400634765625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 4.0, 8.0, 16.0, 17.0, 15.0, 22.0, 27.0, 49.0, 48.0, 97.0, 172.0, 281.0, 761.0, 312645.0, 732629.0, 945.0, 293.0, 165.0, 92.0, 47.0, 44.0, 20.0, 29.0, 19.0, 19.0, 13.0, 7.0, 11.0, 9.0, 10.0, 5.0, 2.0, 7.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1400146484375, -0.13590145111083984, -0.1317882537841797, -0.12767505645751953, -0.12356185913085938, -0.11944866180419922, -0.11533546447753906, -0.1112222671508789, -0.10710906982421875, -0.1029958724975586, -0.09888267517089844, -0.09476947784423828, -0.09065628051757812, -0.08654308319091797, -0.08242988586425781, -0.07831668853759766, -0.0742034912109375, -0.07009029388427734, -0.06597709655761719, -0.06186389923095703, -0.057750701904296875, -0.05363750457763672, -0.04952430725097656, -0.045411109924316406, -0.04129791259765625, -0.037184715270996094, -0.03307151794433594, -0.02895832061767578, -0.024845123291015625, -0.02073192596435547, -0.016618728637695312, -0.012505531311035156, -0.008392333984375, -0.004279136657714844, -0.0001659393310546875, 0.003947257995605469, 0.008060455322265625, 0.012173652648925781, 0.016286849975585938, 0.020400047302246094, 0.02451324462890625, 0.028626441955566406, 0.03273963928222656, 0.03685283660888672, 0.040966033935546875, 0.04507923126220703, 0.04919242858886719, 0.053305625915527344, 0.0574188232421875, 0.061532020568847656, 0.06564521789550781, 0.06975841522216797, 0.07387161254882812, 0.07798480987548828, 0.08209800720214844, 0.0862112045288086, 0.09032440185546875, 0.0944375991821289, 0.09855079650878906, 0.10266399383544922, 0.10677719116210938, 0.11089038848876953, 0.11500358581542969, 0.11911678314208984, 0.12322998046875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [10.0, 89.0, 608.0, 271.0, 31.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018283004174008965, -0.0011512056225910783, -0.00047411082778126, 0.00020298396702855825, 0.0008800787618383765, 0.0015571735566481948, 0.002234268467873335, 0.002911363262683153, 0.0035884580574929714, 0.00426555285230279, 0.004942647647112608, 0.005619742441922426, 0.0062968372367322445, 0.006973932031542063, 0.007651026826351881, 0.008328121155500412, 0.00900521595031023, 0.009682310745120049, 0.010359405539929867, 0.011036500334739685, 0.011713595129549503, 0.012390689924359322, 0.01306778471916914, 0.013744879513978958, 0.014421974308788776, 0.015099069103598595, 0.015776164829730988, 0.01645325869321823, 0.017130352556705475, 0.017807448282837868, 0.01848454400897026, 0.019161637872457504, 0.019838731735944748, 0.02051582559943199, 0.021192921325564384, 0.021870017051696777, 0.02254711091518402, 0.023224204778671265, 0.023901300504803658, 0.02457839623093605, 0.025255490094423294, 0.025932583957910538, 0.02660967968404293, 0.027286775410175323, 0.027963869273662567, 0.02864096313714981, 0.029318058863282204, 0.029995154589414597, 0.03067224845290184, 0.031349342316389084, 0.032026439905166626, 0.03270353376865387, 0.03338062763214111, 0.03405772149562836, 0.0347348153591156, 0.03541191294789314, 0.036089006811380386, 0.03676610067486763, 0.03744319826364517, 0.038120292127132416, 0.03879738599061966, 0.0394744798541069, 0.04015157371759415, 0.04082867130637169, 0.04150576516985893]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 10.0, 8.0, 16.0, 20.0, 17.0, 16.0, 18.0, 23.0, 25.0, 28.0, 26.0, 36.0, 36.0, 39.0, 34.0, 40.0, 49.0, 29.0, 31.0, 41.0, 47.0, 39.0, 35.0, 43.0, 38.0, 30.0, 36.0, 24.0, 25.0, 17.0, 18.0, 15.0, 21.0, 14.0, 8.0, 7.0, 6.0, 10.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031104683876037598, -0.003012058325111866, -0.0029136482626199722, -0.0028152382001280785, -0.0027168281376361847, -0.002618418075144291, -0.002520008012652397, -0.0024215979501605034, -0.0023231878876686096, -0.002224777825176716, -0.002126367762684822, -0.0020279577001929283, -0.0019295476377010345, -0.0018311375752091408, -0.001732727512717247, -0.0016343174502253532, -0.0015359073877334595, -0.0014374973252415657, -0.001339087262749672, -0.0012406772002577782, -0.0011422671377658844, -0.0010438570752739906, -0.0009454470127820969, -0.0008470369502902031, -0.0007486268877983093, -0.0006502168253064156, -0.0005518067628145218, -0.000453396700322628, -0.00035498663783073425, -0.0002565765753388405, -0.00015816651284694672, -5.975645035505295e-05, 3.865361213684082e-05, 0.0001370636746287346, 0.00023547373712062836, 0.0003338837996125221, 0.0004322938621044159, 0.0005307039245963097, 0.0006291139870882034, 0.0007275240495800972, 0.000825934112071991, 0.0009243441745638847, 0.0010227542370557785, 0.0011211642995476723, 0.001219574362039566, 0.0013179844245314598, 0.0014163944870233536, 0.0015148045495152473, 0.0016132146120071411, 0.0017116246744990349, 0.0018100347369909286, 0.0019084447994828224, 0.002006854861974716, 0.00210526492446661, 0.0022036749869585037, 0.0023020850494503975, 0.0024004951119422913, 0.002498905174434185, 0.002597315236926079, 0.0026957252994179726, 0.0027941353619098663, 0.00289254542440176, 0.002990955486893654, 0.0030893655493855476, 0.0031877756118774414]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 11.0, 15.0, 12.0, 26.0, 20.0, 23.0, 28.0, 21.0, 40.0, 33.0, 42.0, 37.0, 40.0, 42.0, 44.0, 47.0, 43.0, 45.0, 43.0, 31.0, 42.0, 39.0, 25.0, 35.0, 24.0, 21.0, 19.0, 17.0, 24.0, 15.0, 13.0, 10.0, 12.0, 7.0, 3.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.703125, -4.55908203125, -4.4150390625, -4.27099609375, -4.126953125, -3.98291015625, -3.8388671875, -3.69482421875, -3.55078125, -3.40673828125, -3.2626953125, -3.11865234375, -2.974609375, -2.83056640625, -2.6865234375, -2.54248046875, -2.3984375, -2.25439453125, -2.1103515625, -1.96630859375, -1.822265625, -1.67822265625, -1.5341796875, -1.39013671875, -1.24609375, -1.10205078125, -0.9580078125, -0.81396484375, -0.669921875, -0.52587890625, -0.3818359375, -0.23779296875, -0.09375, 0.05029296875, 0.1943359375, 0.33837890625, 0.482421875, 0.62646484375, 0.7705078125, 0.91455078125, 1.05859375, 1.20263671875, 1.3466796875, 1.49072265625, 1.634765625, 1.77880859375, 1.9228515625, 2.06689453125, 2.2109375, 2.35498046875, 2.4990234375, 2.64306640625, 2.787109375, 2.93115234375, 3.0751953125, 3.21923828125, 3.36328125, 3.50732421875, 3.6513671875, 3.79541015625, 3.939453125, 4.08349609375, 4.2275390625, 4.37158203125, 4.515625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 7.0, 9.0, 15.0, 16.0, 19.0, 24.0, 35.0, 47.0, 74.0, 65.0, 107.0, 142.0, 205.0, 338.0, 650.0, 1729.0, 6949.0, 31052.0, 176923.0, 640838.0, 152157.0, 27748.0, 6189.0, 1562.0, 558.0, 304.0, 201.0, 136.0, 103.0, 74.0, 58.0, 57.0, 35.0, 26.0, 23.0, 17.0, 10.0, 13.0, 5.0, 6.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.125, -8.852294921875, -8.57958984375, -8.306884765625, -8.0341796875, -7.761474609375, -7.48876953125, -7.216064453125, -6.943359375, -6.670654296875, -6.39794921875, -6.125244140625, -5.8525390625, -5.579833984375, -5.30712890625, -5.034423828125, -4.76171875, -4.489013671875, -4.21630859375, -3.943603515625, -3.6708984375, -3.398193359375, -3.12548828125, -2.852783203125, -2.580078125, -2.307373046875, -2.03466796875, -1.761962890625, -1.4892578125, -1.216552734375, -0.94384765625, -0.671142578125, -0.3984375, -0.125732421875, 0.14697265625, 0.419677734375, 0.6923828125, 0.965087890625, 1.23779296875, 1.510498046875, 1.783203125, 2.055908203125, 2.32861328125, 2.601318359375, 2.8740234375, 3.146728515625, 3.41943359375, 3.692138671875, 3.96484375, 4.237548828125, 4.51025390625, 4.782958984375, 5.0556640625, 5.328369140625, 5.60107421875, 5.873779296875, 6.146484375, 6.419189453125, 6.69189453125, 6.964599609375, 7.2373046875, 7.510009765625, 7.78271484375, 8.055419921875, 8.328125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 10.0, 5.0, 3.0, 4.0, 1.0, 6.0, 10.0, 11.0, 8.0, 18.0, 23.0, 21.0, 22.0, 30.0, 26.0, 32.0, 46.0, 40.0, 60.0, 90.0, 189.0, 1491.0, 350.0, 113.0, 74.0, 44.0, 38.0, 47.0, 43.0, 37.0, 21.0, 30.0, 34.0, 20.0, 19.0, 9.0, 13.0, 2.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5, -13.995849609375, -13.49169921875, -12.987548828125, -12.4833984375, -11.979248046875, -11.47509765625, -10.970947265625, -10.466796875, -9.962646484375, -9.45849609375, -8.954345703125, -8.4501953125, -7.946044921875, -7.44189453125, -6.937744140625, -6.43359375, -5.929443359375, -5.42529296875, -4.921142578125, -4.4169921875, -3.912841796875, -3.40869140625, -2.904541015625, -2.400390625, -1.896240234375, -1.39208984375, -0.887939453125, -0.3837890625, 0.120361328125, 0.62451171875, 1.128662109375, 1.6328125, 2.136962890625, 2.64111328125, 3.145263671875, 3.6494140625, 4.153564453125, 4.65771484375, 5.161865234375, 5.666015625, 6.170166015625, 6.67431640625, 7.178466796875, 7.6826171875, 8.186767578125, 8.69091796875, 9.195068359375, 9.69921875, 10.203369140625, 10.70751953125, 11.211669921875, 11.7158203125, 12.219970703125, 12.72412109375, 13.228271484375, 13.732421875, 14.236572265625, 14.74072265625, 15.244873046875, 15.7490234375, 16.253173828125, 16.75732421875, 17.261474609375, 17.765625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 8.0, 13.0, 24.0, 31.0, 28.0, 52.0, 38.0, 50.0, 80.0, 110.0, 150.0, 249.0, 583.0, 1932.0, 26844.0, 3063242.0, 48428.0, 2332.0, 627.0, 275.0, 139.0, 108.0, 65.0, 53.0, 52.0, 28.0, 31.0, 24.0, 20.0, 16.0, 12.0, 6.0, 7.0, 4.0, 8.0, 3.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-38.0, -36.900390625, -35.80078125, -34.701171875, -33.6015625, -32.501953125, -31.40234375, -30.302734375, -29.203125, -28.103515625, -27.00390625, -25.904296875, -24.8046875, -23.705078125, -22.60546875, -21.505859375, -20.40625, -19.306640625, -18.20703125, -17.107421875, -16.0078125, -14.908203125, -13.80859375, -12.708984375, -11.609375, -10.509765625, -9.41015625, -8.310546875, -7.2109375, -6.111328125, -5.01171875, -3.912109375, -2.8125, -1.712890625, -0.61328125, 0.486328125, 1.5859375, 2.685546875, 3.78515625, 4.884765625, 5.984375, 7.083984375, 8.18359375, 9.283203125, 10.3828125, 11.482421875, 12.58203125, 13.681640625, 14.78125, 15.880859375, 16.98046875, 18.080078125, 19.1796875, 20.279296875, 21.37890625, 22.478515625, 23.578125, 24.677734375, 25.77734375, 26.876953125, 27.9765625, 29.076171875, 30.17578125, 31.275390625, 32.375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 9.0, 144.0, 711.0, 149.0, 4.0, 1.0], "bins": [-221.3907928466797, -217.72946166992188, -214.06814575195312, -210.4068145751953, -206.74549865722656, -203.08416748046875, -199.4228515625, -195.7615203857422, -192.10020446777344, -188.43887329101562, -184.77755737304688, -181.11622619628906, -177.4549102783203, -173.7935791015625, -170.13226318359375, -166.47093200683594, -162.80960083007812, -159.1482696533203, -155.48695373535156, -151.82562255859375, -148.164306640625, -144.5029754638672, -140.84165954589844, -137.18032836914062, -133.51901245117188, -129.85768127441406, -126.19636535644531, -122.53504180908203, -118.87371826171875, -115.21238708496094, -111.55107116699219, -107.88973999023438, -104.2284164428711, -100.56709289550781, -96.90576934814453, -93.24444580078125, -89.58312225341797, -85.92179870605469, -82.26046752929688, -78.5991439819336, -74.93782043457031, -71.27649688720703, -67.61517333984375, -63.95384979248047, -60.29252243041992, -56.63119888305664, -52.96987533569336, -49.30854797363281, -45.6472282409668, -41.985904693603516, -38.324581146240234, -34.66325378417969, -31.001930236816406, -27.340606689453125, -23.679283142089844, -20.01795768737793, -16.35663414001465, -12.69530963897705, -9.033985137939453, -5.372661590576172, -1.7113370895385742, 1.9499874114990234, 5.611310958862305, 9.272636413574219, 12.9339599609375]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 10.0, 8.0, 14.0, 16.0, 15.0, 25.0, 28.0, 23.0, 17.0, 31.0, 34.0, 38.0, 27.0, 45.0, 42.0, 44.0, 53.0, 35.0, 44.0, 49.0, 38.0, 50.0, 29.0, 30.0, 28.0, 30.0, 28.0, 28.0, 27.0, 20.0, 19.0, 15.0, 14.0, 9.0, 6.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.35503005981445, -37.15213394165039, -35.949241638183594, -34.74634552001953, -33.54344940185547, -32.34055709838867, -31.13766098022461, -29.93476676940918, -28.73187255859375, -27.52897834777832, -26.32608413696289, -25.123188018798828, -23.9202938079834, -22.71739959716797, -21.514503479003906, -20.311609268188477, -19.108715057373047, -17.905820846557617, -16.702926635742188, -15.500030517578125, -14.297136306762695, -13.094242095947266, -11.89134693145752, -10.688451766967773, -9.485557556152344, -8.282663345336914, -7.079768180847168, -5.87687349319458, -4.673978805541992, -3.4710841178894043, -2.2681894302368164, -1.0652942657470703, 0.13759994506835938, 1.3404946327209473, 2.543389320373535, 3.746284008026123, 4.949178695678711, 6.152073383331299, 7.354968070983887, 8.557863235473633, 9.760757446289062, 10.963651657104492, 12.166546821594238, 13.369441986083984, 14.572336196899414, 15.775230407714844, 16.978126525878906, 18.181020736694336, 19.383914947509766, 20.586809158325195, 21.789703369140625, 22.992599487304688, 24.195493698120117, 25.398387908935547, 26.60128402709961, 27.80417823791504, 29.00707244873047, 30.2099666595459, 31.412860870361328, 32.61575698852539, 33.81864929199219, 35.02154541015625, 36.22444152832031, 37.427337646484375, 38.63022994995117]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 8.0, 7.0, 13.0, 14.0, 13.0, 21.0, 20.0, 25.0, 26.0, 34.0, 40.0, 32.0, 37.0, 43.0, 57.0, 56.0, 47.0, 34.0, 48.0, 49.0, 40.0, 33.0, 35.0, 29.0, 23.0, 31.0, 31.0, 21.0, 24.0, 20.0, 10.0, 14.0, 16.0, 8.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.96484375, -4.80511474609375, -4.6453857421875, -4.48565673828125, -4.325927734375, -4.16619873046875, -4.0064697265625, -3.84674072265625, -3.68701171875, -3.52728271484375, -3.3675537109375, -3.20782470703125, -3.048095703125, -2.88836669921875, -2.7286376953125, -2.56890869140625, -2.4091796875, -2.24945068359375, -2.0897216796875, -1.92999267578125, -1.770263671875, -1.61053466796875, -1.4508056640625, -1.29107666015625, -1.13134765625, -0.97161865234375, -0.8118896484375, -0.65216064453125, -0.492431640625, -0.33270263671875, -0.1729736328125, -0.01324462890625, 0.146484375, 0.30621337890625, 0.4659423828125, 0.62567138671875, 0.785400390625, 0.94512939453125, 1.1048583984375, 1.26458740234375, 1.42431640625, 1.58404541015625, 1.7437744140625, 1.90350341796875, 2.063232421875, 2.22296142578125, 2.3826904296875, 2.54241943359375, 2.7021484375, 2.86187744140625, 3.0216064453125, 3.18133544921875, 3.341064453125, 3.50079345703125, 3.6605224609375, 3.82025146484375, 3.97998046875, 4.13970947265625, 4.2994384765625, 4.45916748046875, 4.618896484375, 4.77862548828125, 4.9383544921875, 5.09808349609375, 5.2578125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 7.0, 8.0, 9.0, 8.0, 12.0, 13.0, 11.0, 30.0, 24.0, 35.0, 58.0, 91.0, 138.0, 299.0, 623.0, 1602.0, 5234.0, 25440.0, 222248.0, 1807983.0, 1862719.0, 233617.0, 26148.0, 5036.0, 1550.0, 633.0, 270.0, 130.0, 82.0, 46.0, 35.0, 22.0, 26.0, 17.0, 13.0, 12.0, 15.0, 13.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4140625, -9.1104736328125, -8.806884765625, -8.5032958984375, -8.19970703125, -7.8961181640625, -7.592529296875, -7.2889404296875, -6.9853515625, -6.6817626953125, -6.378173828125, -6.0745849609375, -5.77099609375, -5.4674072265625, -5.163818359375, -4.8602294921875, -4.556640625, -4.2530517578125, -3.949462890625, -3.6458740234375, -3.34228515625, -3.0386962890625, -2.735107421875, -2.4315185546875, -2.1279296875, -1.8243408203125, -1.520751953125, -1.2171630859375, -0.91357421875, -0.6099853515625, -0.306396484375, -0.0028076171875, 0.30078125, 0.6043701171875, 0.907958984375, 1.2115478515625, 1.51513671875, 1.8187255859375, 2.122314453125, 2.4259033203125, 2.7294921875, 3.0330810546875, 3.336669921875, 3.6402587890625, 3.94384765625, 4.2474365234375, 4.551025390625, 4.8546142578125, 5.158203125, 5.4617919921875, 5.765380859375, 6.0689697265625, 6.37255859375, 6.6761474609375, 6.979736328125, 7.2833251953125, 7.5869140625, 7.8905029296875, 8.194091796875, 8.4976806640625, 8.80126953125, 9.1048583984375, 9.408447265625, 9.7120361328125, 10.015625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 5.0, 11.0, 12.0, 15.0, 18.0, 20.0, 42.0, 55.0, 70.0, 78.0, 134.0, 157.0, 230.0, 295.0, 325.0, 417.0, 486.0, 383.0, 298.0, 255.0, 191.0, 140.0, 107.0, 67.0, 69.0, 44.0, 36.0, 21.0, 21.0, 11.0, 10.0, 8.0, 4.0, 10.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.09375, -7.877685546875, -7.66162109375, -7.445556640625, -7.2294921875, -7.013427734375, -6.79736328125, -6.581298828125, -6.365234375, -6.149169921875, -5.93310546875, -5.717041015625, -5.5009765625, -5.284912109375, -5.06884765625, -4.852783203125, -4.63671875, -4.420654296875, -4.20458984375, -3.988525390625, -3.7724609375, -3.556396484375, -3.34033203125, -3.124267578125, -2.908203125, -2.692138671875, -2.47607421875, -2.260009765625, -2.0439453125, -1.827880859375, -1.61181640625, -1.395751953125, -1.1796875, -0.963623046875, -0.74755859375, -0.531494140625, -0.3154296875, -0.099365234375, 0.11669921875, 0.332763671875, 0.548828125, 0.764892578125, 0.98095703125, 1.197021484375, 1.4130859375, 1.629150390625, 1.84521484375, 2.061279296875, 2.27734375, 2.493408203125, 2.70947265625, 2.925537109375, 3.1416015625, 3.357666015625, 3.57373046875, 3.789794921875, 4.005859375, 4.221923828125, 4.43798828125, 4.654052734375, 4.8701171875, 5.086181640625, 5.30224609375, 5.518310546875, 5.734375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 9.0, 2.0, 7.0, 4.0, 15.0, 4.0, 16.0, 26.0, 38.0, 47.0, 57.0, 80.0, 100.0, 164.0, 221.0, 306.0, 638.0, 1471.0, 5849.0, 49892.0, 948522.0, 2987179.0, 180249.0, 14578.0, 2546.0, 894.0, 435.0, 290.0, 190.0, 142.0, 87.0, 56.0, 41.0, 30.0, 21.0, 16.0, 22.0, 14.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.15625, -13.636474609375, -13.11669921875, -12.596923828125, -12.0771484375, -11.557373046875, -11.03759765625, -10.517822265625, -9.998046875, -9.478271484375, -8.95849609375, -8.438720703125, -7.9189453125, -7.399169921875, -6.87939453125, -6.359619140625, -5.83984375, -5.320068359375, -4.80029296875, -4.280517578125, -3.7607421875, -3.240966796875, -2.72119140625, -2.201416015625, -1.681640625, -1.161865234375, -0.64208984375, -0.122314453125, 0.3974609375, 0.917236328125, 1.43701171875, 1.956787109375, 2.4765625, 2.996337890625, 3.51611328125, 4.035888671875, 4.5556640625, 5.075439453125, 5.59521484375, 6.114990234375, 6.634765625, 7.154541015625, 7.67431640625, 8.194091796875, 8.7138671875, 9.233642578125, 9.75341796875, 10.273193359375, 10.79296875, 11.312744140625, 11.83251953125, 12.352294921875, 12.8720703125, 13.391845703125, 13.91162109375, 14.431396484375, 14.951171875, 15.470947265625, 15.99072265625, 16.510498046875, 17.0302734375, 17.550048828125, 18.06982421875, 18.589599609375, 19.109375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 16.0, 36.0, 133.0, 240.0, 254.0, 190.0, 105.0, 29.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.32569694519043, -17.063838958740234, -14.801979064941406, -12.540121078491211, -10.2782621383667, -8.016403198242188, -5.754545211791992, -3.4926862716674805, -1.2308273315429688, 1.0310313701629639, 3.2928900718688965, 5.55474853515625, 7.816607475280762, 10.078466415405273, 12.340324401855469, 14.60218334197998, 16.864042282104492, 19.125900268554688, 21.387760162353516, 23.64961814880371, 25.911476135253906, 28.173336029052734, 30.43519401550293, 32.697052001953125, 34.95891189575195, 37.22077178955078, 39.482627868652344, 41.74448776245117, 44.00634765625, 46.26820373535156, 48.53006362915039, 50.79192352294922, 53.05378723144531, 55.31564712524414, 57.5775032043457, 59.83936309814453, 62.10122299194336, 64.36308288574219, 66.62493896484375, 68.88679504394531, 71.1486587524414, 73.41051483154297, 75.67237854003906, 77.93423461914062, 80.19609069824219, 82.45795440673828, 84.71981048583984, 86.9816665649414, 89.2435302734375, 91.50538635253906, 93.76725006103516, 96.02910614013672, 98.29096221923828, 100.55282592773438, 102.81468200683594, 105.0765380859375, 107.33839416503906, 109.60025024414062, 111.86211395263672, 114.12397003173828, 116.38582611083984, 118.64768981933594, 120.9095458984375, 123.17140197753906, 125.43326568603516]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 13.0, 4.0, 8.0, 9.0, 11.0, 6.0, 21.0, 17.0, 14.0, 25.0, 29.0, 21.0, 32.0, 25.0, 27.0, 35.0, 38.0, 39.0, 37.0, 40.0, 40.0, 32.0, 41.0, 40.0, 34.0, 36.0, 39.0, 24.0, 47.0, 21.0, 22.0, 24.0, 27.0, 20.0, 17.0, 11.0, 15.0, 9.0, 7.0, 6.0, 9.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.581222534179688, -23.817628860473633, -23.054035186767578, -22.290441513061523, -21.52684783935547, -20.763256072998047, -19.999662399291992, -19.236068725585938, -18.472475051879883, -17.708881378173828, -16.945287704467773, -16.18169403076172, -15.41810131072998, -14.654507637023926, -13.890914916992188, -13.127321243286133, -12.363727569580078, -11.600133895874023, -10.836540222167969, -10.07294750213623, -9.309353828430176, -8.545760154724121, -7.782166957855225, -7.018573760986328, -6.254980087280273, -5.491386413574219, -4.727793216705322, -3.9641997814178467, -3.200606346130371, -2.4370129108428955, -1.67341947555542, -0.9098262786865234, -0.14623260498046875, 0.6173608303070068, 1.3809542655944824, 2.144547700881958, 2.9081411361694336, 3.671734571456909, 4.435328006744385, 5.198921203613281, 5.962514877319336, 6.726108551025391, 7.489701747894287, 8.253294944763184, 9.016888618469238, 9.780482292175293, 10.544075012207031, 11.307668685913086, 12.07126235961914, 12.834856033325195, 13.59844970703125, 14.362042427062988, 15.125636100769043, 15.889229774475098, 16.652822494506836, 17.41641616821289, 18.180009841918945, 18.943603515625, 19.707197189331055, 20.47079086303711, 21.23438262939453, 21.997976303100586, 22.76156997680664, 23.525163650512695, 24.28875732421875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 7.0, 12.0, 14.0, 8.0, 13.0, 11.0, 27.0, 33.0, 30.0, 33.0, 45.0, 36.0, 47.0, 51.0, 46.0, 44.0, 55.0, 45.0, 41.0, 43.0, 30.0, 37.0, 39.0, 28.0, 31.0, 29.0, 25.0, 19.0, 25.0, 13.0, 14.0, 12.0, 15.0, 7.0, 9.0, 2.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.76788330078125, -4.6021728515625, -4.43646240234375, -4.270751953125, -4.10504150390625, -3.9393310546875, -3.77362060546875, -3.60791015625, -3.44219970703125, -3.2764892578125, -3.11077880859375, -2.945068359375, -2.77935791015625, -2.6136474609375, -2.44793701171875, -2.2822265625, -2.11651611328125, -1.9508056640625, -1.78509521484375, -1.619384765625, -1.45367431640625, -1.2879638671875, -1.12225341796875, -0.95654296875, -0.79083251953125, -0.6251220703125, -0.45941162109375, -0.293701171875, -0.12799072265625, 0.0377197265625, 0.20343017578125, 0.369140625, 0.53485107421875, 0.7005615234375, 0.86627197265625, 1.031982421875, 1.19769287109375, 1.3634033203125, 1.52911376953125, 1.69482421875, 1.86053466796875, 2.0262451171875, 2.19195556640625, 2.357666015625, 2.52337646484375, 2.6890869140625, 2.85479736328125, 3.0205078125, 3.18621826171875, 3.3519287109375, 3.51763916015625, 3.683349609375, 3.84906005859375, 4.0147705078125, 4.18048095703125, 4.34619140625, 4.51190185546875, 4.6776123046875, 4.84332275390625, 5.009033203125, 5.17474365234375, 5.3404541015625, 5.50616455078125, 5.671875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 7.0, 10.0, 21.0, 26.0, 34.0, 45.0, 77.0, 95.0, 158.0, 199.0, 284.0, 428.0, 574.0, 862.0, 1136.0, 1690.0, 2361.0, 3445.0, 5007.0, 7273.0, 10819.0, 15982.0, 23783.0, 34650.0, 50966.0, 74511.0, 107442.0, 143696.0, 155304.0, 125652.0, 89036.0, 61879.0, 41860.0, 28563.0, 19081.0, 12978.0, 8877.0, 6146.0, 4136.0, 2853.0, 1957.0, 1337.0, 993.0, 710.0, 463.0, 337.0, 237.0, 187.0, 156.0, 59.0, 67.0, 47.0, 26.0, 18.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 4.0], "bins": [-0.337646484375, -0.3268394470214844, -0.31603240966796875, -0.3052253723144531, -0.2944183349609375, -0.2836112976074219, -0.27280426025390625, -0.2619972229003906, -0.251190185546875, -0.24038314819335938, -0.22957611083984375, -0.21876907348632812, -0.2079620361328125, -0.19715499877929688, -0.18634796142578125, -0.17554092407226562, -0.16473388671875, -0.15392684936523438, -0.14311981201171875, -0.13231277465820312, -0.1215057373046875, -0.11069869995117188, -0.09989166259765625, -0.08908462524414062, -0.078277587890625, -0.06747055053710938, -0.05666351318359375, -0.045856475830078125, -0.0350494384765625, -0.024242401123046875, -0.01343536376953125, -0.002628326416015625, 0.0081787109375, 0.018985748291015625, 0.02979278564453125, 0.040599822998046875, 0.0514068603515625, 0.062213897705078125, 0.07302093505859375, 0.08382797241210938, 0.094635009765625, 0.10544204711914062, 0.11624908447265625, 0.12705612182617188, 0.1378631591796875, 0.14867019653320312, 0.15947723388671875, 0.17028427124023438, 0.18109130859375, 0.19189834594726562, 0.20270538330078125, 0.21351242065429688, 0.2243194580078125, 0.23512649536132812, 0.24593353271484375, 0.2567405700683594, 0.267547607421875, 0.2783546447753906, 0.28916168212890625, 0.2999687194824219, 0.3107757568359375, 0.3215827941894531, 0.33238983154296875, 0.3431968688964844, 0.35400390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 10.0, 5.0, 8.0, 12.0, 10.0, 10.0, 16.0, 18.0, 21.0, 18.0, 20.0, 23.0, 36.0, 22.0, 25.0, 35.0, 50.0, 40.0, 39.0, 39.0, 1076.0, 41.0, 32.0, 34.0, 39.0, 42.0, 25.0, 34.0, 33.0, 39.0, 28.0, 19.0, 17.0, 15.0, 12.0, 20.0, 10.0, 11.0, 10.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.380859375, -3.285308837890625, -3.18975830078125, -3.094207763671875, -2.9986572265625, -2.903106689453125, -2.80755615234375, -2.712005615234375, -2.616455078125, -2.520904541015625, -2.42535400390625, -2.329803466796875, -2.2342529296875, -2.138702392578125, -2.04315185546875, -1.947601318359375, -1.85205078125, -1.756500244140625, -1.66094970703125, -1.565399169921875, -1.4698486328125, -1.374298095703125, -1.27874755859375, -1.183197021484375, -1.087646484375, -0.992095947265625, -0.89654541015625, -0.800994873046875, -0.7054443359375, -0.609893798828125, -0.51434326171875, -0.418792724609375, -0.3232421875, -0.227691650390625, -0.13214111328125, -0.036590576171875, 0.0589599609375, 0.154510498046875, 0.25006103515625, 0.345611572265625, 0.441162109375, 0.536712646484375, 0.63226318359375, 0.727813720703125, 0.8233642578125, 0.918914794921875, 1.01446533203125, 1.110015869140625, 1.20556640625, 1.301116943359375, 1.39666748046875, 1.492218017578125, 1.5877685546875, 1.683319091796875, 1.77886962890625, 1.874420166015625, 1.969970703125, 2.065521240234375, 2.16107177734375, 2.256622314453125, 2.3521728515625, 2.447723388671875, 2.54327392578125, 2.638824462890625, 2.734375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 7.0, 5.0, 8.0, 13.0, 21.0, 19.0, 42.0, 53.0, 90.0, 118.0, 167.0, 269.0, 404.0, 625.0, 852.0, 1274.0, 1901.0, 2875.0, 4167.0, 6156.0, 9181.0, 13829.0, 19996.0, 29396.0, 42261.0, 62362.0, 87626.0, 118922.0, 1155798.0, 174946.0, 109506.0, 79366.0, 55067.0, 38522.0, 26112.0, 18049.0, 12007.0, 8036.0, 5533.0, 3749.0, 2591.0, 1714.0, 1128.0, 762.0, 511.0, 374.0, 229.0, 170.0, 93.0, 76.0, 56.0, 28.0, 24.0, 18.0, 14.0, 9.0, 9.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.259033203125, -0.2509002685546875, -0.242767333984375, -0.2346343994140625, -0.22650146484375, -0.2183685302734375, -0.210235595703125, -0.2021026611328125, -0.1939697265625, -0.1858367919921875, -0.177703857421875, -0.1695709228515625, -0.16143798828125, -0.1533050537109375, -0.145172119140625, -0.1370391845703125, -0.12890625, -0.1207733154296875, -0.112640380859375, -0.1045074462890625, -0.09637451171875, -0.0882415771484375, -0.080108642578125, -0.0719757080078125, -0.0638427734375, -0.0557098388671875, -0.047576904296875, -0.0394439697265625, -0.03131103515625, -0.0231781005859375, -0.015045166015625, -0.0069122314453125, 0.001220703125, 0.0093536376953125, 0.017486572265625, 0.0256195068359375, 0.03375244140625, 0.0418853759765625, 0.050018310546875, 0.0581512451171875, 0.0662841796875, 0.0744171142578125, 0.082550048828125, 0.0906829833984375, 0.09881591796875, 0.1069488525390625, 0.115081787109375, 0.1232147216796875, 0.13134765625, 0.1394805908203125, 0.147613525390625, 0.1557464599609375, 0.16387939453125, 0.1720123291015625, 0.180145263671875, 0.1882781982421875, 0.1964111328125, 0.2045440673828125, 0.212677001953125, 0.2208099365234375, 0.22894287109375, 0.2370758056640625, 0.245208740234375, 0.2533416748046875, 0.261474609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 11.0, 6.0, 6.0, 8.0, 14.0, 13.0, 9.0, 29.0, 27.0, 39.0, 47.0, 56.0, 73.0, 86.0, 91.0, 99.0, 67.0, 55.0, 54.0, 36.0, 33.0, 22.0, 21.0, 17.0, 12.0, 13.0, 7.0, 9.0, 8.0, 3.0, 6.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005779266357421875, -0.005607903003692627, -0.005436539649963379, -0.005265176296234131, -0.005093812942504883, -0.004922449588775635, -0.004751086235046387, -0.004579722881317139, -0.004408359527587891, -0.004236996173858643, -0.0040656328201293945, -0.0038942694664001465, -0.0037229061126708984, -0.0035515427589416504, -0.0033801794052124023, -0.0032088160514831543, -0.0030374526977539062, -0.002866089344024658, -0.00269472599029541, -0.002523362636566162, -0.002351999282836914, -0.002180635929107666, -0.002009272575378418, -0.00183790922164917, -0.0016665458679199219, -0.0014951825141906738, -0.0013238191604614258, -0.0011524558067321777, -0.0009810924530029297, -0.0008097290992736816, -0.0006383657455444336, -0.00046700239181518555, -0.0002956390380859375, -0.00012427568435668945, 4.7087669372558594e-05, 0.00021845102310180664, 0.0003898143768310547, 0.0005611777305603027, 0.0007325410842895508, 0.0009039044380187988, 0.0010752677917480469, 0.001246631145477295, 0.001417994499206543, 0.001589357852935791, 0.001760721206665039, 0.0019320845603942871, 0.002103447914123535, 0.002274811267852783, 0.0024461746215820312, 0.0026175379753112793, 0.0027889013290405273, 0.0029602646827697754, 0.0031316280364990234, 0.0033029913902282715, 0.0034743547439575195, 0.0036457180976867676, 0.0038170814514160156, 0.003988444805145264, 0.004159808158874512, 0.00433117151260376, 0.004502534866333008, 0.004673898220062256, 0.004845261573791504, 0.005016624927520752, 0.00518798828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 6.0, 4.0, 12.0, 11.0, 15.0, 14.0, 30.0, 37.0, 47.0, 37.0, 80.0, 95.0, 159.0, 253.0, 504.0, 2448.0, 973615.0, 69232.0, 861.0, 365.0, 231.0, 128.0, 100.0, 57.0, 45.0, 25.0, 29.0, 29.0, 10.0, 8.0, 11.0, 14.0, 10.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10546875, -0.10215091705322266, -0.09883308410644531, -0.09551525115966797, -0.09219741821289062, -0.08887958526611328, -0.08556175231933594, -0.0822439193725586, -0.07892608642578125, -0.0756082534790039, -0.07229042053222656, -0.06897258758544922, -0.06565475463867188, -0.06233692169189453, -0.05901908874511719, -0.055701255798339844, -0.0523834228515625, -0.049065589904785156, -0.04574775695800781, -0.04242992401123047, -0.039112091064453125, -0.03579425811767578, -0.03247642517089844, -0.029158592224121094, -0.02584075927734375, -0.022522926330566406, -0.019205093383789062, -0.01588726043701172, -0.012569427490234375, -0.009251594543457031, -0.0059337615966796875, -0.0026159286499023438, 0.000701904296875, 0.004019737243652344, 0.0073375701904296875, 0.010655403137207031, 0.013973236083984375, 0.01729106903076172, 0.020608901977539062, 0.023926734924316406, 0.02724456787109375, 0.030562400817871094, 0.03388023376464844, 0.03719806671142578, 0.040515899658203125, 0.04383373260498047, 0.04715156555175781, 0.050469398498535156, 0.0537872314453125, 0.057105064392089844, 0.06042289733886719, 0.06374073028564453, 0.06705856323242188, 0.07037639617919922, 0.07369422912597656, 0.0770120620727539, 0.08032989501953125, 0.0836477279663086, 0.08696556091308594, 0.09028339385986328, 0.09360122680664062, 0.09691905975341797, 0.10023689270019531, 0.10355472564697266, 0.10687255859375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 44.0, 631.0, 323.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003898837836459279, -0.0030843750573694706, -0.002269912511110306, -0.0014554497320204973, -0.0006409871857613325, 0.0001734753604978323, 0.0009879383724182844, 0.0018024009186774492, 0.002616863464936614, 0.0034313262440264225, 0.004245788790285587, 0.005060251802206039, 0.005874713882803917, 0.006689176894724369, 0.007503639906644821, 0.008318101987242699, 0.00913256499916315, 0.009947028011083603, 0.01076149009168148, 0.011575953103601933, 0.012390416115522385, 0.013204878196120262, 0.014019341208040714, 0.014833804219961166, 0.015648266300559044, 0.01646272838115692, 0.017277192324399948, 0.018091654404997826, 0.018906116485595703, 0.01972058042883873, 0.020535042509436607, 0.021349504590034485, 0.02216396853327751, 0.02297843061387539, 0.023792894557118416, 0.024607356637716293, 0.02542181871831417, 0.02623628079891205, 0.027050744742155075, 0.027865206822752953, 0.02867966890335083, 0.029494130983948708, 0.030308594927191734, 0.031123057007789612, 0.03193752095103264, 0.03275198116898537, 0.033566445112228394, 0.03438090905547142, 0.03519537299871445, 0.036009836941957474, 0.0368242971599102, 0.03763876110315323, 0.038453225046396255, 0.039267685264348984, 0.04008214920759201, 0.04089661315083504, 0.041711073368787766, 0.04252553731203079, 0.04333999752998352, 0.04415446147322655, 0.044968925416469574, 0.0457833856344223, 0.04659784957766533, 0.047412313520908356, 0.048226773738861084]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 10.0, 7.0, 17.0, 11.0, 11.0, 7.0, 12.0, 22.0, 32.0, 35.0, 34.0, 33.0, 44.0, 39.0, 44.0, 57.0, 43.0, 59.0, 46.0, 42.0, 47.0, 48.0, 28.0, 37.0, 47.0, 21.0, 26.0, 39.0, 21.0, 26.0, 13.0, 10.0, 7.0, 8.0, 9.0, 4.0, 2.0, 5.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003369152545928955, -0.0032685473561286926, -0.00316794216632843, -0.0030673369765281677, -0.0029667317867279053, -0.002866126596927643, -0.0027655214071273804, -0.002664916217327118, -0.0025643110275268555, -0.002463705837726593, -0.0023631006479263306, -0.002262495458126068, -0.0021618902683258057, -0.002061285078525543, -0.0019606798887252808, -0.0018600746989250183, -0.0017594695091247559, -0.0016588643193244934, -0.001558259129524231, -0.0014576539397239685, -0.001357048749923706, -0.0012564435601234436, -0.0011558383703231812, -0.0010552331805229187, -0.0009546279907226562, -0.0008540228009223938, -0.0007534176111221313, -0.0006528124213218689, -0.0005522072315216064, -0.000451602041721344, -0.00035099685192108154, -0.0002503916621208191, -0.00014978647232055664, -4.918128252029419e-05, 5.142390727996826e-05, 0.0001520290970802307, 0.00025263428688049316, 0.0003532394766807556, 0.00045384466648101807, 0.0005544498562812805, 0.000655055046081543, 0.0007556602358818054, 0.0008562654256820679, 0.0009568706154823303, 0.0010574758052825928, 0.0011580809950828552, 0.0012586861848831177, 0.0013592913746833801, 0.0014598965644836426, 0.001560501754283905, 0.0016611069440841675, 0.00176171213388443, 0.0018623173236846924, 0.001962922513484955, 0.0020635277032852173, 0.0021641328930854797, 0.002264738082885742, 0.0023653432726860046, 0.002465948462486267, 0.0025665536522865295, 0.002667158842086792, 0.0027677640318870544, 0.002868369221687317, 0.0029689744114875793, 0.003069579601287842]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 7.0, 12.0, 14.0, 8.0, 13.0, 11.0, 27.0, 33.0, 30.0, 33.0, 45.0, 36.0, 47.0, 51.0, 46.0, 44.0, 55.0, 45.0, 41.0, 43.0, 30.0, 37.0, 39.0, 28.0, 31.0, 29.0, 25.0, 19.0, 25.0, 13.0, 14.0, 12.0, 15.0, 7.0, 9.0, 2.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.76788330078125, -4.6021728515625, -4.43646240234375, -4.270751953125, -4.10504150390625, -3.9393310546875, -3.77362060546875, -3.60791015625, -3.44219970703125, -3.2764892578125, -3.11077880859375, -2.945068359375, -2.77935791015625, -2.6136474609375, -2.44793701171875, -2.2822265625, -2.11651611328125, -1.9508056640625, -1.78509521484375, -1.619384765625, -1.45367431640625, -1.2879638671875, -1.12225341796875, -0.95654296875, -0.79083251953125, -0.6251220703125, -0.45941162109375, -0.293701171875, -0.12799072265625, 0.0377197265625, 0.20343017578125, 0.369140625, 0.53485107421875, 0.7005615234375, 0.86627197265625, 1.031982421875, 1.19769287109375, 1.3634033203125, 1.52911376953125, 1.69482421875, 1.86053466796875, 2.0262451171875, 2.19195556640625, 2.357666015625, 2.52337646484375, 2.6890869140625, 2.85479736328125, 3.0205078125, 3.18621826171875, 3.3519287109375, 3.51763916015625, 3.683349609375, 3.84906005859375, 4.0147705078125, 4.18048095703125, 4.34619140625, 4.51190185546875, 4.6776123046875, 4.84332275390625, 5.009033203125, 5.17474365234375, 5.3404541015625, 5.50616455078125, 5.671875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 9.0, 8.0, 13.0, 19.0, 31.0, 26.0, 34.0, 43.0, 64.0, 102.0, 117.0, 189.0, 255.0, 347.0, 484.0, 795.0, 1871.0, 7124.0, 35964.0, 484276.0, 470093.0, 35321.0, 6949.0, 1908.0, 769.0, 456.0, 315.0, 250.0, 165.0, 119.0, 126.0, 78.0, 57.0, 44.0, 35.0, 35.0, 15.0, 15.0, 8.0, 4.0, 8.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2734375, -11.8642578125, -11.455078125, -11.0458984375, -10.63671875, -10.2275390625, -9.818359375, -9.4091796875, -9.0, -8.5908203125, -8.181640625, -7.7724609375, -7.36328125, -6.9541015625, -6.544921875, -6.1357421875, -5.7265625, -5.3173828125, -4.908203125, -4.4990234375, -4.08984375, -3.6806640625, -3.271484375, -2.8623046875, -2.453125, -2.0439453125, -1.634765625, -1.2255859375, -0.81640625, -0.4072265625, 0.001953125, 0.4111328125, 0.8203125, 1.2294921875, 1.638671875, 2.0478515625, 2.45703125, 2.8662109375, 3.275390625, 3.6845703125, 4.09375, 4.5029296875, 4.912109375, 5.3212890625, 5.73046875, 6.1396484375, 6.548828125, 6.9580078125, 7.3671875, 7.7763671875, 8.185546875, 8.5947265625, 9.00390625, 9.4130859375, 9.822265625, 10.2314453125, 10.640625, 11.0498046875, 11.458984375, 11.8681640625, 12.27734375, 12.6865234375, 13.095703125, 13.5048828125, 13.9140625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 14.0, 6.0, 8.0, 19.0, 20.0, 15.0, 20.0, 27.0, 26.0, 18.0, 33.0, 38.0, 47.0, 47.0, 58.0, 92.0, 232.0, 1599.0, 204.0, 78.0, 55.0, 51.0, 38.0, 36.0, 39.0, 37.0, 26.0, 29.0, 18.0, 12.0, 18.0, 11.0, 10.0, 9.0, 14.0, 6.0, 3.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.96875, -14.52099609375, -14.0732421875, -13.62548828125, -13.177734375, -12.72998046875, -12.2822265625, -11.83447265625, -11.38671875, -10.93896484375, -10.4912109375, -10.04345703125, -9.595703125, -9.14794921875, -8.7001953125, -8.25244140625, -7.8046875, -7.35693359375, -6.9091796875, -6.46142578125, -6.013671875, -5.56591796875, -5.1181640625, -4.67041015625, -4.22265625, -3.77490234375, -3.3271484375, -2.87939453125, -2.431640625, -1.98388671875, -1.5361328125, -1.08837890625, -0.640625, -0.19287109375, 0.2548828125, 0.70263671875, 1.150390625, 1.59814453125, 2.0458984375, 2.49365234375, 2.94140625, 3.38916015625, 3.8369140625, 4.28466796875, 4.732421875, 5.18017578125, 5.6279296875, 6.07568359375, 6.5234375, 6.97119140625, 7.4189453125, 7.86669921875, 8.314453125, 8.76220703125, 9.2099609375, 9.65771484375, 10.10546875, 10.55322265625, 11.0009765625, 11.44873046875, 11.896484375, 12.34423828125, 12.7919921875, 13.23974609375, 13.6875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 4.0, 6.0, 10.0, 13.0, 12.0, 13.0, 22.0, 26.0, 20.0, 37.0, 33.0, 55.0, 73.0, 73.0, 131.0, 230.0, 457.0, 1420.0, 16740.0, 3042421.0, 79649.0, 2696.0, 655.0, 290.0, 157.0, 101.0, 69.0, 44.0, 39.0, 38.0, 27.0, 22.0, 27.0, 15.0, 12.0, 14.0, 8.0, 7.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-37.03125, -35.82421875, -34.6171875, -33.41015625, -32.203125, -30.99609375, -29.7890625, -28.58203125, -27.375, -26.16796875, -24.9609375, -23.75390625, -22.546875, -21.33984375, -20.1328125, -18.92578125, -17.71875, -16.51171875, -15.3046875, -14.09765625, -12.890625, -11.68359375, -10.4765625, -9.26953125, -8.0625, -6.85546875, -5.6484375, -4.44140625, -3.234375, -2.02734375, -0.8203125, 0.38671875, 1.59375, 2.80078125, 4.0078125, 5.21484375, 6.421875, 7.62890625, 8.8359375, 10.04296875, 11.25, 12.45703125, 13.6640625, 14.87109375, 16.078125, 17.28515625, 18.4921875, 19.69921875, 20.90625, 22.11328125, 23.3203125, 24.52734375, 25.734375, 26.94140625, 28.1484375, 29.35546875, 30.5625, 31.76953125, 32.9765625, 34.18359375, 35.390625, 36.59765625, 37.8046875, 39.01171875, 40.21875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 77.0, 476.0, 413.0, 45.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.42146301269531, -118.77576446533203, -116.13006591796875, -113.48436737060547, -110.83866882324219, -108.1929702758789, -105.54727172851562, -102.90157318115234, -100.25587463378906, -97.61017608642578, -94.9644775390625, -92.31877899169922, -89.67308044433594, -87.02738189697266, -84.38168334960938, -81.7359848022461, -79.09028625488281, -76.44458770751953, -73.79888916015625, -71.15319061279297, -68.50749206542969, -65.8617935180664, -63.216094970703125, -60.570396423339844, -57.92469787597656, -55.27899932861328, -52.63330078125, -49.98760223388672, -47.34190368652344, -44.696205139160156, -42.050506591796875, -39.404808044433594, -36.759117126464844, -34.11341857910156, -31.46772003173828, -28.822021484375, -26.17632293701172, -23.530624389648438, -20.884925842285156, -18.239227294921875, -15.593528747558594, -12.947830200195312, -10.302131652832031, -7.65643310546875, -5.010734558105469, -2.3650360107421875, 0.28066253662109375, 2.926361083984375, 5.572059631347656, 8.217758178710938, 10.863456726074219, 13.5091552734375, 16.15485382080078, 18.800552368164062, 21.446250915527344, 24.091949462890625, 26.737648010253906, 29.383346557617188, 32.02904510498047, 34.67474365234375, 37.32044219970703, 39.96614074707031, 42.611839294433594, 45.257537841796875, 47.903236389160156]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 7.0, 5.0, 10.0, 14.0, 21.0, 21.0, 21.0, 20.0, 31.0, 26.0, 24.0, 37.0, 21.0, 22.0, 37.0, 34.0, 38.0, 46.0, 38.0, 41.0, 36.0, 43.0, 37.0, 33.0, 38.0, 35.0, 33.0, 29.0, 29.0, 19.0, 17.0, 16.0, 12.0, 14.0, 17.0, 16.0, 11.0, 10.0, 9.0, 9.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-38.20920944213867, -37.112247467041016, -36.015281677246094, -34.91831970214844, -33.82135772705078, -32.724395751953125, -31.627431869506836, -30.530467987060547, -29.43350601196289, -28.336544036865234, -27.239580154418945, -26.142616271972656, -25.045654296875, -23.948692321777344, -22.851728439331055, -21.754764556884766, -20.65780258178711, -19.560840606689453, -18.463876724243164, -17.366912841796875, -16.26995086669922, -15.172987937927246, -14.076025009155273, -12.9790620803833, -11.882099151611328, -10.785136222839355, -9.688173294067383, -8.59121036529541, -7.4942474365234375, -6.397284507751465, -5.300321578979492, -4.2033586502075195, -3.1063919067382812, -2.0094289779663086, -0.9124660491943359, 0.18449687957763672, 1.2814598083496094, 2.378422737121582, 3.4753856658935547, 4.572348594665527, 5.6693115234375, 6.766274452209473, 7.863237380981445, 8.960200309753418, 10.05716323852539, 11.154126167297363, 12.251089096069336, 13.348052024841309, 14.445014953613281, 15.541977882385254, 16.638940811157227, 17.735904693603516, 18.832866668701172, 19.929828643798828, 21.026792526245117, 22.123756408691406, 23.220718383789062, 24.31768035888672, 25.414644241333008, 26.511608123779297, 27.608570098876953, 28.70553207397461, 29.8024959564209, 30.899459838867188, 31.996421813964844]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 6.0, 8.0, 7.0, 8.0, 8.0, 14.0, 11.0, 20.0, 18.0, 14.0, 20.0, 34.0, 28.0, 35.0, 35.0, 42.0, 36.0, 46.0, 44.0, 45.0, 47.0, 39.0, 43.0, 33.0, 34.0, 34.0, 29.0, 29.0, 22.0, 22.0, 16.0, 31.0, 27.0, 17.0, 9.0, 22.0, 11.0, 13.0, 8.0, 4.0, 8.0, 8.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-4.95703125, -4.80584716796875, -4.6546630859375, -4.50347900390625, -4.352294921875, -4.20111083984375, -4.0499267578125, -3.89874267578125, -3.74755859375, -3.59637451171875, -3.4451904296875, -3.29400634765625, -3.142822265625, -2.99163818359375, -2.8404541015625, -2.68927001953125, -2.5380859375, -2.38690185546875, -2.2357177734375, -2.08453369140625, -1.933349609375, -1.78216552734375, -1.6309814453125, -1.47979736328125, -1.32861328125, -1.17742919921875, -1.0262451171875, -0.87506103515625, -0.723876953125, -0.57269287109375, -0.4215087890625, -0.27032470703125, -0.119140625, 0.03204345703125, 0.1832275390625, 0.33441162109375, 0.485595703125, 0.63677978515625, 0.7879638671875, 0.93914794921875, 1.09033203125, 1.24151611328125, 1.3927001953125, 1.54388427734375, 1.695068359375, 1.84625244140625, 1.9974365234375, 2.14862060546875, 2.2998046875, 2.45098876953125, 2.6021728515625, 2.75335693359375, 2.904541015625, 3.05572509765625, 3.2069091796875, 3.35809326171875, 3.50927734375, 3.66046142578125, 3.8116455078125, 3.96282958984375, 4.114013671875, 4.26519775390625, 4.4163818359375, 4.56756591796875, 4.71875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 7.0, 7.0, 10.0, 16.0, 14.0, 19.0, 19.0, 47.0, 59.0, 71.0, 72.0, 120.0, 153.0, 267.0, 323.0, 651.0, 1276.0, 2917.0, 7931.0, 27520.0, 124043.0, 567005.0, 1645661.0, 1339602.0, 368409.0, 78861.0, 18635.0, 5781.0, 2141.0, 1012.0, 519.0, 326.0, 204.0, 159.0, 100.0, 73.0, 49.0, 56.0, 30.0, 25.0, 18.0, 16.0, 12.0, 15.0, 6.0, 9.0, 6.0, 9.0, 2.0, 3.0, 0.0, 2.0], "bins": [-6.890625, -6.69293212890625, -6.4952392578125, -6.29754638671875, -6.099853515625, -5.90216064453125, -5.7044677734375, -5.50677490234375, -5.30908203125, -5.11138916015625, -4.9136962890625, -4.71600341796875, -4.518310546875, -4.32061767578125, -4.1229248046875, -3.92523193359375, -3.7275390625, -3.52984619140625, -3.3321533203125, -3.13446044921875, -2.936767578125, -2.73907470703125, -2.5413818359375, -2.34368896484375, -2.14599609375, -1.94830322265625, -1.7506103515625, -1.55291748046875, -1.355224609375, -1.15753173828125, -0.9598388671875, -0.76214599609375, -0.564453125, -0.36676025390625, -0.1690673828125, 0.02862548828125, 0.226318359375, 0.42401123046875, 0.6217041015625, 0.81939697265625, 1.01708984375, 1.21478271484375, 1.4124755859375, 1.61016845703125, 1.807861328125, 2.00555419921875, 2.2032470703125, 2.40093994140625, 2.5986328125, 2.79632568359375, 2.9940185546875, 3.19171142578125, 3.389404296875, 3.58709716796875, 3.7847900390625, 3.98248291015625, 4.18017578125, 4.37786865234375, 4.5755615234375, 4.77325439453125, 4.970947265625, 5.16864013671875, 5.3663330078125, 5.56402587890625, 5.76171875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 9.0, 4.0, 16.0, 13.0, 20.0, 25.0, 29.0, 35.0, 79.0, 77.0, 112.0, 177.0, 183.0, 292.0, 371.0, 437.0, 439.0, 403.0, 344.0, 276.0, 200.0, 124.0, 108.0, 64.0, 40.0, 52.0, 26.0, 30.0, 22.0, 19.0, 10.0, 9.0, 6.0, 2.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.88671875, -6.6602783203125, -6.433837890625, -6.2073974609375, -5.98095703125, -5.7545166015625, -5.528076171875, -5.3016357421875, -5.0751953125, -4.8487548828125, -4.622314453125, -4.3958740234375, -4.16943359375, -3.9429931640625, -3.716552734375, -3.4901123046875, -3.263671875, -3.0372314453125, -2.810791015625, -2.5843505859375, -2.35791015625, -2.1314697265625, -1.905029296875, -1.6785888671875, -1.4521484375, -1.2257080078125, -0.999267578125, -0.7728271484375, -0.54638671875, -0.3199462890625, -0.093505859375, 0.1329345703125, 0.359375, 0.5858154296875, 0.812255859375, 1.0386962890625, 1.26513671875, 1.4915771484375, 1.718017578125, 1.9444580078125, 2.1708984375, 2.3973388671875, 2.623779296875, 2.8502197265625, 3.07666015625, 3.3031005859375, 3.529541015625, 3.7559814453125, 3.982421875, 4.2088623046875, 4.435302734375, 4.6617431640625, 4.88818359375, 5.1146240234375, 5.341064453125, 5.5675048828125, 5.7939453125, 6.0203857421875, 6.246826171875, 6.4732666015625, 6.69970703125, 6.9261474609375, 7.152587890625, 7.3790283203125, 7.60546875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 2.0, 10.0, 14.0, 16.0, 18.0, 29.0, 42.0, 53.0, 86.0, 118.0, 140.0, 218.0, 405.0, 759.0, 1752.0, 9246.0, 125609.0, 2947060.0, 1056855.0, 44349.0, 4732.0, 1185.0, 582.0, 316.0, 217.0, 133.0, 94.0, 66.0, 38.0, 32.0, 24.0, 22.0, 13.0, 15.0, 3.0, 4.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-19.5, -18.92333984375, -18.3466796875, -17.77001953125, -17.193359375, -16.61669921875, -16.0400390625, -15.46337890625, -14.88671875, -14.31005859375, -13.7333984375, -13.15673828125, -12.580078125, -12.00341796875, -11.4267578125, -10.85009765625, -10.2734375, -9.69677734375, -9.1201171875, -8.54345703125, -7.966796875, -7.39013671875, -6.8134765625, -6.23681640625, -5.66015625, -5.08349609375, -4.5068359375, -3.93017578125, -3.353515625, -2.77685546875, -2.2001953125, -1.62353515625, -1.046875, -0.47021484375, 0.1064453125, 0.68310546875, 1.259765625, 1.83642578125, 2.4130859375, 2.98974609375, 3.56640625, 4.14306640625, 4.7197265625, 5.29638671875, 5.873046875, 6.44970703125, 7.0263671875, 7.60302734375, 8.1796875, 8.75634765625, 9.3330078125, 9.90966796875, 10.486328125, 11.06298828125, 11.6396484375, 12.21630859375, 12.79296875, 13.36962890625, 13.9462890625, 14.52294921875, 15.099609375, 15.67626953125, 16.2529296875, 16.82958984375, 17.40625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 18.0, 72.0, 151.0, 221.0, 228.0, 164.0, 104.0, 38.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.307598114013672, -16.325965881347656, -14.344331741333008, -12.362698554992676, -10.381065368652344, -8.399432182312012, -6.41779899597168, -4.436165809631348, -2.4545326232910156, -0.4728994369506836, 1.5087337493896484, 3.4903669357299805, 5.4720001220703125, 7.4536333084106445, 9.435266494750977, 11.416899681091309, 13.39853286743164, 15.380166053771973, 17.361799240112305, 19.343433380126953, 21.32506561279297, 23.306697845458984, 25.288331985473633, 27.26996612548828, 29.251598358154297, 31.233230590820312, 33.214866638183594, 35.19649887084961, 37.178131103515625, 39.15976333618164, 41.141395568847656, 43.12303161621094, 45.10466003417969, 47.0862922668457, 49.06792449951172, 51.049560546875, 53.031192779541016, 55.01282501220703, 56.99446105957031, 58.97609329223633, 60.957725524902344, 62.93935775756836, 64.92098999023438, 66.90262603759766, 68.88426208496094, 70.86589050292969, 72.84752655029297, 74.82915496826172, 76.810791015625, 78.79242706298828, 80.77405548095703, 82.75569152832031, 84.73731994628906, 86.71895599365234, 88.70059204101562, 90.68222045898438, 92.66385650634766, 94.64549255371094, 96.62712097167969, 98.60875701904297, 100.59039306640625, 102.572021484375, 104.55365753173828, 106.53528594970703, 108.51692199707031]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 4.0, 7.0, 10.0, 12.0, 23.0, 14.0, 14.0, 19.0, 16.0, 32.0, 28.0, 36.0, 36.0, 27.0, 42.0, 38.0, 31.0, 37.0, 37.0, 47.0, 46.0, 36.0, 39.0, 24.0, 38.0, 41.0, 27.0, 26.0, 28.0, 17.0, 23.0, 21.0, 17.0, 12.0, 15.0, 12.0, 8.0, 7.0, 8.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-24.549427032470703, -23.84429168701172, -23.139156341552734, -22.434022903442383, -21.7288875579834, -21.023752212524414, -20.318618774414062, -19.613483428955078, -18.908348083496094, -18.20321273803711, -17.498077392578125, -16.792943954467773, -16.08780860900879, -15.382673263549805, -14.677538871765137, -13.972404479980469, -13.267269134521484, -12.5621337890625, -11.856999397277832, -11.151865005493164, -10.44672966003418, -9.741594314575195, -9.036459922790527, -8.33132553100586, -7.626190185546875, -6.921055316925049, -6.215920448303223, -5.5107855796813965, -4.80565071105957, -4.100515842437744, -3.395380973815918, -2.690246105194092, -1.9851112365722656, -1.2799763679504395, -0.5748414993286133, 0.1302933692932129, 0.8354282379150391, 1.5405631065368652, 2.2456979751586914, 2.9508328437805176, 3.6559677124023438, 4.36110258102417, 5.066237449645996, 5.771372318267822, 6.476507186889648, 7.181642055511475, 7.886776924133301, 8.591911315917969, 9.297046661376953, 10.002182006835938, 10.707316398620605, 11.412450790405273, 12.117586135864258, 12.822721481323242, 13.52785587310791, 14.232990264892578, 14.938125610351562, 15.643260955810547, 16.34839630126953, 17.053529739379883, 17.758665084838867, 18.46380043029785, 19.168933868408203, 19.874069213867188, 20.579204559326172]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 6.0, 6.0, 5.0, 12.0, 7.0, 7.0, 14.0, 13.0, 23.0, 20.0, 14.0, 24.0, 36.0, 27.0, 34.0, 31.0, 36.0, 40.0, 48.0, 42.0, 34.0, 47.0, 39.0, 41.0, 45.0, 36.0, 30.0, 33.0, 27.0, 17.0, 26.0, 25.0, 22.0, 20.0, 19.0, 10.0, 17.0, 11.0, 8.0, 11.0, 8.0, 6.0, 6.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.8828125, -4.73370361328125, -4.5845947265625, -4.43548583984375, -4.286376953125, -4.13726806640625, -3.9881591796875, -3.83905029296875, -3.68994140625, -3.54083251953125, -3.3917236328125, -3.24261474609375, -3.093505859375, -2.94439697265625, -2.7952880859375, -2.64617919921875, -2.4970703125, -2.34796142578125, -2.1988525390625, -2.04974365234375, -1.900634765625, -1.75152587890625, -1.6024169921875, -1.45330810546875, -1.30419921875, -1.15509033203125, -1.0059814453125, -0.85687255859375, -0.707763671875, -0.55865478515625, -0.4095458984375, -0.26043701171875, -0.111328125, 0.03778076171875, 0.1868896484375, 0.33599853515625, 0.485107421875, 0.63421630859375, 0.7833251953125, 0.93243408203125, 1.08154296875, 1.23065185546875, 1.3797607421875, 1.52886962890625, 1.677978515625, 1.82708740234375, 1.9761962890625, 2.12530517578125, 2.2744140625, 2.42352294921875, 2.5726318359375, 2.72174072265625, 2.870849609375, 3.01995849609375, 3.1690673828125, 3.31817626953125, 3.46728515625, 3.61639404296875, 3.7655029296875, 3.91461181640625, 4.063720703125, 4.21282958984375, 4.3619384765625, 4.51104736328125, 4.66015625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 10.0, 4.0, 6.0, 26.0, 30.0, 31.0, 44.0, 89.0, 132.0, 191.0, 252.0, 329.0, 463.0, 681.0, 979.0, 1388.0, 1851.0, 2574.0, 3680.0, 5325.0, 7632.0, 11141.0, 16341.0, 24308.0, 36237.0, 54169.0, 81056.0, 114873.0, 150665.0, 152998.0, 120019.0, 84430.0, 56905.0, 38133.0, 25372.0, 17324.0, 11907.0, 7999.0, 5529.0, 3963.0, 2723.0, 1972.0, 1333.0, 1020.0, 680.0, 548.0, 359.0, 254.0, 194.0, 138.0, 65.0, 60.0, 40.0, 45.0, 19.0, 12.0, 10.0, 8.0, 1.0, 1.0, 2.0], "bins": [-0.36865234375, -0.35715484619140625, -0.3456573486328125, -0.33415985107421875, -0.322662353515625, -0.31116485595703125, -0.2996673583984375, -0.28816986083984375, -0.27667236328125, -0.26517486572265625, -0.2536773681640625, -0.24217987060546875, -0.230682373046875, -0.21918487548828125, -0.2076873779296875, -0.19618988037109375, -0.1846923828125, -0.17319488525390625, -0.1616973876953125, -0.15019989013671875, -0.138702392578125, -0.12720489501953125, -0.1157073974609375, -0.10420989990234375, -0.09271240234375, -0.08121490478515625, -0.0697174072265625, -0.05821990966796875, -0.046722412109375, -0.03522491455078125, -0.0237274169921875, -0.01222991943359375, -0.000732421875, 0.01076507568359375, 0.0222625732421875, 0.03376007080078125, 0.045257568359375, 0.05675506591796875, 0.0682525634765625, 0.07975006103515625, 0.09124755859375, 0.10274505615234375, 0.1142425537109375, 0.12574005126953125, 0.137237548828125, 0.14873504638671875, 0.1602325439453125, 0.17173004150390625, 0.1832275390625, 0.19472503662109375, 0.2062225341796875, 0.21772003173828125, 0.229217529296875, 0.24071502685546875, 0.2522125244140625, 0.26371002197265625, 0.27520751953125, 0.28670501708984375, 0.2982025146484375, 0.30970001220703125, 0.321197509765625, 0.33269500732421875, 0.3441925048828125, 0.35569000244140625, 0.3671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 10.0, 4.0, 4.0, 9.0, 10.0, 14.0, 11.0, 19.0, 20.0, 26.0, 26.0, 27.0, 31.0, 37.0, 35.0, 32.0, 39.0, 34.0, 43.0, 43.0, 1059.0, 41.0, 40.0, 43.0, 29.0, 39.0, 35.0, 34.0, 34.0, 32.0, 32.0, 17.0, 20.0, 22.0, 19.0, 17.0, 6.0, 10.0, 3.0, 4.0, 4.0, 0.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-3.716796875, -3.612701416015625, -3.50860595703125, -3.404510498046875, -3.3004150390625, -3.196319580078125, -3.09222412109375, -2.988128662109375, -2.884033203125, -2.779937744140625, -2.67584228515625, -2.571746826171875, -2.4676513671875, -2.363555908203125, -2.25946044921875, -2.155364990234375, -2.05126953125, -1.947174072265625, -1.84307861328125, -1.738983154296875, -1.6348876953125, -1.530792236328125, -1.42669677734375, -1.322601318359375, -1.218505859375, -1.114410400390625, -1.01031494140625, -0.906219482421875, -0.8021240234375, -0.698028564453125, -0.59393310546875, -0.489837646484375, -0.3857421875, -0.281646728515625, -0.17755126953125, -0.073455810546875, 0.0306396484375, 0.134735107421875, 0.23883056640625, 0.342926025390625, 0.447021484375, 0.551116943359375, 0.65521240234375, 0.759307861328125, 0.8634033203125, 0.967498779296875, 1.07159423828125, 1.175689697265625, 1.27978515625, 1.383880615234375, 1.48797607421875, 1.592071533203125, 1.6961669921875, 1.800262451171875, 1.90435791015625, 2.008453369140625, 2.112548828125, 2.216644287109375, 2.32073974609375, 2.424835205078125, 2.5289306640625, 2.633026123046875, 2.73712158203125, 2.841217041015625, 2.9453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [9.0, 6.0, 11.0, 9.0, 22.0, 26.0, 33.0, 64.0, 82.0, 105.0, 166.0, 223.0, 278.0, 426.0, 608.0, 846.0, 1240.0, 1760.0, 2450.0, 3505.0, 5014.0, 7160.0, 10291.0, 14800.0, 21037.0, 30519.0, 42952.0, 61039.0, 83883.0, 110043.0, 986149.0, 323818.0, 107969.0, 81826.0, 59042.0, 42012.0, 29272.0, 20766.0, 14273.0, 10083.0, 6788.0, 4865.0, 3354.0, 2452.0, 1738.0, 1208.0, 857.0, 596.0, 406.0, 338.0, 221.0, 145.0, 113.0, 88.0, 55.0, 50.0, 20.0, 13.0, 12.0, 6.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.2479248046875, -0.2399158477783203, -0.23190689086914062, -0.22389793395996094, -0.21588897705078125, -0.20788002014160156, -0.19987106323242188, -0.1918621063232422, -0.1838531494140625, -0.1758441925048828, -0.16783523559570312, -0.15982627868652344, -0.15181732177734375, -0.14380836486816406, -0.13579940795898438, -0.1277904510498047, -0.119781494140625, -0.11177253723144531, -0.10376358032226562, -0.09575462341308594, -0.08774566650390625, -0.07973670959472656, -0.07172775268554688, -0.06371879577636719, -0.0557098388671875, -0.04770088195800781, -0.039691925048828125, -0.03168296813964844, -0.02367401123046875, -0.015665054321289062, -0.007656097412109375, 0.0003528594970703125, 0.00836181640625, 0.016370773315429688, 0.024379730224609375, 0.03238868713378906, 0.04039764404296875, 0.04840660095214844, 0.056415557861328125, 0.06442451477050781, 0.0724334716796875, 0.08044242858886719, 0.08845138549804688, 0.09646034240722656, 0.10446929931640625, 0.11247825622558594, 0.12048721313476562, 0.1284961700439453, 0.136505126953125, 0.1445140838623047, 0.15252304077148438, 0.16053199768066406, 0.16854095458984375, 0.17654991149902344, 0.18455886840820312, 0.1925678253173828, 0.2005767822265625, 0.2085857391357422, 0.21659469604492188, 0.22460365295410156, 0.23261260986328125, 0.24062156677246094, 0.24863052368164062, 0.2566394805908203, 0.2646484375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 3.0, 2.0, 11.0, 13.0, 9.0, 11.0, 17.0, 16.0, 20.0, 23.0, 20.0, 28.0, 38.0, 58.0, 58.0, 88.0, 85.0, 86.0, 69.0, 60.0, 60.0, 38.0, 37.0, 28.0, 22.0, 22.0, 11.0, 11.0, 7.0, 10.0, 8.0, 4.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.00467681884765625, -0.004553020000457764, -0.004429221153259277, -0.004305422306060791, -0.004181623458862305, -0.004057824611663818, -0.003934025764465332, -0.0038102269172668457, -0.0036864280700683594, -0.003562629222869873, -0.0034388303756713867, -0.0033150315284729004, -0.003191232681274414, -0.0030674338340759277, -0.0029436349868774414, -0.002819836139678955, -0.0026960372924804688, -0.0025722384452819824, -0.002448439598083496, -0.0023246407508850098, -0.0022008419036865234, -0.002077043056488037, -0.0019532442092895508, -0.0018294453620910645, -0.0017056465148925781, -0.0015818476676940918, -0.0014580488204956055, -0.0013342499732971191, -0.0012104511260986328, -0.0010866522789001465, -0.0009628534317016602, -0.0008390545845031738, -0.0007152557373046875, -0.0005914568901062012, -0.00046765804290771484, -0.0003438591957092285, -0.0002200603485107422, -9.626150131225586e-05, 2.753734588623047e-05, 0.0001513361930847168, 0.0002751350402832031, 0.00039893388748168945, 0.0005227327346801758, 0.0006465315818786621, 0.0007703304290771484, 0.0008941292762756348, 0.001017928123474121, 0.0011417269706726074, 0.0012655258178710938, 0.00138932466506958, 0.0015131235122680664, 0.0016369223594665527, 0.001760721206665039, 0.0018845200538635254, 0.0020083189010620117, 0.002132117748260498, 0.0022559165954589844, 0.0023797154426574707, 0.002503514289855957, 0.0026273131370544434, 0.0027511119842529297, 0.002874910831451416, 0.0029987096786499023, 0.0031225085258483887, 0.003246307373046875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 13.0, 8.0, 9.0, 14.0, 14.0, 23.0, 40.0, 28.0, 69.0, 78.0, 126.0, 201.0, 320.0, 665.0, 11600.0, 998411.0, 34953.0, 939.0, 356.0, 203.0, 127.0, 65.0, 60.0, 39.0, 51.0, 23.0, 27.0, 20.0, 16.0, 7.0, 8.0, 8.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06787109375, -0.06541252136230469, -0.06295394897460938, -0.06049537658691406, -0.05803680419921875, -0.05557823181152344, -0.053119659423828125, -0.05066108703613281, -0.0482025146484375, -0.04574394226074219, -0.043285369873046875, -0.04082679748535156, -0.03836822509765625, -0.03590965270996094, -0.033451080322265625, -0.030992507934570312, -0.028533935546875, -0.026075363159179688, -0.023616790771484375, -0.021158218383789062, -0.01869964599609375, -0.016241073608398438, -0.013782501220703125, -0.011323928833007812, -0.0088653564453125, -0.0064067840576171875, -0.003948211669921875, -0.0014896392822265625, 0.00096893310546875, 0.0034275054931640625, 0.005886077880859375, 0.008344650268554688, 0.01080322265625, 0.013261795043945312, 0.015720367431640625, 0.018178939819335938, 0.02063751220703125, 0.023096084594726562, 0.025554656982421875, 0.028013229370117188, 0.0304718017578125, 0.03293037414550781, 0.035388946533203125, 0.03784751892089844, 0.04030609130859375, 0.04276466369628906, 0.045223236083984375, 0.04768180847167969, 0.050140380859375, 0.05259895324707031, 0.055057525634765625, 0.05751609802246094, 0.05997467041015625, 0.06243324279785156, 0.06489181518554688, 0.06735038757324219, 0.0698089599609375, 0.07226753234863281, 0.07472610473632812, 0.07718467712402344, 0.07964324951171875, 0.08210182189941406, 0.08456039428710938, 0.08701896667480469, 0.0894775390625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 153.0, 796.0, 57.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01752881519496441, -0.0166240893304348, -0.01571936532855034, -0.014814639464020729, -0.01390991359949112, -0.013005188666284084, -0.01210046373307705, -0.01119573786854744, -0.010291012935340405, -0.00938628800213337, -0.00848156213760376, -0.007576837204396725, -0.006672111805528402, -0.00576738640666008, -0.004862661473453045, -0.0039579360745847225, -0.0030532106757164, -0.0021484852768480778, -0.001243760110810399, -0.00033903494477272034, 0.000565690454095602, 0.0014704158529639244, 0.0023751407861709595, 0.003279866185039282, 0.004184591583907604, 0.005089316982775927, 0.005994042381644249, 0.006898767314851284, 0.007803492713719606, 0.008708218112587929, 0.009612943045794964, 0.010517667979001999, 0.011422395706176758, 0.012327120639383793, 0.013231846503913403, 0.014136571437120438, 0.015041297301650047, 0.015946023166179657, 0.016850747168064117, 0.017755473032593727, 0.018660198897123337, 0.019564924761652946, 0.020469648763537407, 0.021374374628067017, 0.022279100492596626, 0.023183826357126236, 0.024088550359010696, 0.024993276223540306, 0.025898000225424767, 0.026802726089954376, 0.027707450091838837, 0.028612175956368446, 0.029516901820898056, 0.030421625822782516, 0.031326353549957275, 0.032231077551841736, 0.033135801553726196, 0.03404052555561066, 0.034945253282785416, 0.035849977284669876, 0.03675470128655434, 0.037659429013729095, 0.038564153015613556, 0.039468877017498016, 0.040373604744672775]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 11.0, 7.0, 12.0, 8.0, 14.0, 23.0, 25.0, 36.0, 28.0, 43.0, 42.0, 37.0, 32.0, 46.0, 35.0, 44.0, 45.0, 56.0, 53.0, 45.0, 37.0, 37.0, 40.0, 41.0, 29.0, 26.0, 21.0, 13.0, 14.0, 13.0, 16.0, 10.0, 9.0, 15.0, 7.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002440512180328369, -0.0023599201813340187, -0.0022793281823396683, -0.002198736183345318, -0.0021181441843509674, -0.002037552185356617, -0.0019569601863622665, -0.001876368187367916, -0.0017957761883735657, -0.0017151841893792152, -0.0016345921903848648, -0.0015540001913905144, -0.001473408192396164, -0.0013928161934018135, -0.001312224194407463, -0.0012316321954131126, -0.0011510401964187622, -0.0010704481974244118, -0.0009898561984300613, -0.0009092641994357109, -0.0008286722004413605, -0.00074808020144701, -0.0006674882024526596, -0.0005868962034583092, -0.0005063042044639587, -0.0004257122054696083, -0.0003451202064752579, -0.00026452820748090744, -0.000183936208486557, -0.00010334420949220657, -2.275221049785614e-05, 5.783978849649429e-05, 0.00013843178749084473, 0.00021902378648519516, 0.0002996157854795456, 0.000380207784473896, 0.00046079978346824646, 0.0005413917824625969, 0.0006219837814569473, 0.0007025757804512978, 0.0007831677794456482, 0.0008637597784399986, 0.0009443517774343491, 0.0010249437764286995, 0.00110553577542305, 0.0011861277744174004, 0.0012667197734117508, 0.0013473117724061012, 0.0014279037714004517, 0.001508495770394802, 0.0015890877693891525, 0.001669679768383503, 0.0017502717673778534, 0.0018308637663722038, 0.0019114557653665543, 0.0019920477643609047, 0.002072639763355255, 0.0021532317623496056, 0.002233823761343956, 0.0023144157603383064, 0.002395007759332657, 0.0024755997583270073, 0.0025561917573213577, 0.002636783756315708, 0.0027173757553100586]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 6.0, 6.0, 5.0, 12.0, 7.0, 7.0, 14.0, 13.0, 23.0, 20.0, 14.0, 24.0, 36.0, 28.0, 34.0, 30.0, 36.0, 40.0, 48.0, 42.0, 34.0, 47.0, 39.0, 41.0, 45.0, 36.0, 31.0, 32.0, 27.0, 17.0, 26.0, 25.0, 22.0, 20.0, 19.0, 10.0, 17.0, 11.0, 8.0, 11.0, 8.0, 5.0, 7.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.8828125, -4.73370361328125, -4.5845947265625, -4.43548583984375, -4.286376953125, -4.13726806640625, -3.9881591796875, -3.83905029296875, -3.68994140625, -3.54083251953125, -3.3917236328125, -3.24261474609375, -3.093505859375, -2.94439697265625, -2.7952880859375, -2.64617919921875, -2.4970703125, -2.34796142578125, -2.1988525390625, -2.04974365234375, -1.900634765625, -1.75152587890625, -1.6024169921875, -1.45330810546875, -1.30419921875, -1.15509033203125, -1.0059814453125, -0.85687255859375, -0.707763671875, -0.55865478515625, -0.4095458984375, -0.26043701171875, -0.111328125, 0.03778076171875, 0.1868896484375, 0.33599853515625, 0.485107421875, 0.63421630859375, 0.7833251953125, 0.93243408203125, 1.08154296875, 1.23065185546875, 1.3797607421875, 1.52886962890625, 1.677978515625, 1.82708740234375, 1.9761962890625, 2.12530517578125, 2.2744140625, 2.42352294921875, 2.5726318359375, 2.72174072265625, 2.870849609375, 3.01995849609375, 3.1690673828125, 3.31817626953125, 3.46728515625, 3.61639404296875, 3.7655029296875, 3.91461181640625, 4.063720703125, 4.21282958984375, 4.3619384765625, 4.51104736328125, 4.66015625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 9.0, 17.0, 8.0, 21.0, 22.0, 39.0, 52.0, 55.0, 93.0, 104.0, 150.0, 252.0, 370.0, 633.0, 1114.0, 2025.0, 4450.0, 10601.0, 26732.0, 69419.0, 185369.0, 401048.0, 213954.0, 79116.0, 30504.0, 11967.0, 4980.0, 2292.0, 1172.0, 695.0, 400.0, 234.0, 165.0, 99.0, 93.0, 55.0, 56.0, 38.0, 38.0, 30.0, 15.0, 22.0, 12.0, 12.0, 6.0, 3.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.1484375, -5.95965576171875, -5.7708740234375, -5.58209228515625, -5.393310546875, -5.20452880859375, -5.0157470703125, -4.82696533203125, -4.63818359375, -4.44940185546875, -4.2606201171875, -4.07183837890625, -3.883056640625, -3.69427490234375, -3.5054931640625, -3.31671142578125, -3.1279296875, -2.93914794921875, -2.7503662109375, -2.56158447265625, -2.372802734375, -2.18402099609375, -1.9952392578125, -1.80645751953125, -1.61767578125, -1.42889404296875, -1.2401123046875, -1.05133056640625, -0.862548828125, -0.67376708984375, -0.4849853515625, -0.29620361328125, -0.107421875, 0.08135986328125, 0.2701416015625, 0.45892333984375, 0.647705078125, 0.83648681640625, 1.0252685546875, 1.21405029296875, 1.40283203125, 1.59161376953125, 1.7803955078125, 1.96917724609375, 2.157958984375, 2.34674072265625, 2.5355224609375, 2.72430419921875, 2.9130859375, 3.10186767578125, 3.2906494140625, 3.47943115234375, 3.668212890625, 3.85699462890625, 4.0457763671875, 4.23455810546875, 4.42333984375, 4.61212158203125, 4.8009033203125, 4.98968505859375, 5.178466796875, 5.36724853515625, 5.5560302734375, 5.74481201171875, 5.93359375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 8.0, 3.0, 5.0, 3.0, 12.0, 10.0, 16.0, 25.0, 24.0, 23.0, 30.0, 38.0, 37.0, 39.0, 40.0, 63.0, 94.0, 185.0, 1440.0, 354.0, 149.0, 82.0, 47.0, 40.0, 40.0, 42.0, 40.0, 33.0, 23.0, 19.0, 20.0, 15.0, 7.0, 9.0, 12.0, 6.0, 5.0, 8.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8125, -15.315185546875, -14.81787109375, -14.320556640625, -13.8232421875, -13.325927734375, -12.82861328125, -12.331298828125, -11.833984375, -11.336669921875, -10.83935546875, -10.342041015625, -9.8447265625, -9.347412109375, -8.85009765625, -8.352783203125, -7.85546875, -7.358154296875, -6.86083984375, -6.363525390625, -5.8662109375, -5.368896484375, -4.87158203125, -4.374267578125, -3.876953125, -3.379638671875, -2.88232421875, -2.385009765625, -1.8876953125, -1.390380859375, -0.89306640625, -0.395751953125, 0.1015625, 0.598876953125, 1.09619140625, 1.593505859375, 2.0908203125, 2.588134765625, 3.08544921875, 3.582763671875, 4.080078125, 4.577392578125, 5.07470703125, 5.572021484375, 6.0693359375, 6.566650390625, 7.06396484375, 7.561279296875, 8.05859375, 8.555908203125, 9.05322265625, 9.550537109375, 10.0478515625, 10.545166015625, 11.04248046875, 11.539794921875, 12.037109375, 12.534423828125, 13.03173828125, 13.529052734375, 14.0263671875, 14.523681640625, 15.02099609375, 15.518310546875, 16.015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 10.0, 16.0, 10.0, 18.0, 24.0, 21.0, 42.0, 51.0, 59.0, 80.0, 140.0, 175.0, 291.0, 424.0, 821.0, 3620.0, 76529.0, 2807404.0, 245559.0, 7814.0, 1091.0, 485.0, 313.0, 167.0, 158.0, 94.0, 82.0, 59.0, 36.0, 26.0, 16.0, 15.0, 6.0, 10.0, 4.0, 16.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.828125, -21.138427734375, -20.44873046875, -19.759033203125, -19.0693359375, -18.379638671875, -17.68994140625, -17.000244140625, -16.310546875, -15.620849609375, -14.93115234375, -14.241455078125, -13.5517578125, -12.862060546875, -12.17236328125, -11.482666015625, -10.79296875, -10.103271484375, -9.41357421875, -8.723876953125, -8.0341796875, -7.344482421875, -6.65478515625, -5.965087890625, -5.275390625, -4.585693359375, -3.89599609375, -3.206298828125, -2.5166015625, -1.826904296875, -1.13720703125, -0.447509765625, 0.2421875, 0.931884765625, 1.62158203125, 2.311279296875, 3.0009765625, 3.690673828125, 4.38037109375, 5.070068359375, 5.759765625, 6.449462890625, 7.13916015625, 7.828857421875, 8.5185546875, 9.208251953125, 9.89794921875, 10.587646484375, 11.27734375, 11.967041015625, 12.65673828125, 13.346435546875, 14.0361328125, 14.725830078125, 15.41552734375, 16.105224609375, 16.794921875, 17.484619140625, 18.17431640625, 18.864013671875, 19.5537109375, 20.243408203125, 20.93310546875, 21.622802734375, 22.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 450.0, 555.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-298.1723937988281, -292.32733154296875, -286.48223876953125, -280.6371765136719, -274.7921142578125, -268.947021484375, -263.1019592285156, -257.2568664550781, -251.41180419921875, -245.5667266845703, -239.72164916992188, -233.8765869140625, -228.03150939941406, -222.18643188476562, -216.34136962890625, -210.4962921142578, -204.65121459960938, -198.80613708496094, -192.9610595703125, -187.11599731445312, -181.2709197998047, -175.42584228515625, -169.58078002929688, -163.73570251464844, -157.890625, -152.04554748535156, -146.20046997070312, -140.35540771484375, -134.5103302001953, -128.66525268554688, -122.82018280029297, -116.97511291503906, -111.1300277709961, -105.28495788574219, -99.43988037109375, -93.59480285644531, -87.7497329711914, -81.9046630859375, -76.05958557128906, -70.21450805664062, -64.36943817138672, -58.52436447143555, -52.679290771484375, -46.8342170715332, -40.98914337158203, -35.14406967163086, -29.298995971679688, -23.453922271728516, -17.608848571777344, -11.763774871826172, -5.918701171875, -0.07362747192382812, 5.771446228027344, 11.616519927978516, 17.461593627929688, 23.30666732788086, 29.15174102783203, 34.9968147277832, 40.841888427734375, 46.68696212768555, 52.53203582763672, 58.37710952758789, 64.22218322753906, 70.0672607421875, 75.9123306274414]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 13.0, 7.0, 7.0, 10.0, 17.0, 14.0, 21.0, 19.0, 25.0, 22.0, 19.0, 29.0, 25.0, 37.0, 36.0, 43.0, 33.0, 46.0, 40.0, 53.0, 37.0, 37.0, 36.0, 40.0, 39.0, 29.0, 38.0, 36.0, 17.0, 33.0, 19.0, 19.0, 25.0, 8.0, 18.0, 15.0, 7.0, 8.0, 7.0, 3.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.2372989654541, -28.192447662353516, -27.14759635925293, -26.102745056152344, -25.057891845703125, -24.013042449951172, -22.968189239501953, -21.923337936401367, -20.87848663330078, -19.833635330200195, -18.78878402709961, -17.743932723999023, -16.699081420898438, -15.654229164123535, -14.609376907348633, -13.564525604248047, -12.519674301147461, -11.474822998046875, -10.429971694946289, -9.385119438171387, -8.3402681350708, -7.295416831970215, -6.250565052032471, -5.205713272094727, -4.160861968994141, -3.1160104274749756, -2.0711588859558105, -1.0263073444366455, 0.01854419708251953, 1.0633955001831055, 2.1082472801208496, 3.1530990600585938, 4.197948455810547, 5.242799758911133, 6.287651538848877, 7.332503318786621, 8.377354621887207, 9.422205924987793, 10.467058181762695, 11.511909484863281, 12.556760787963867, 13.601612091064453, 14.646463394165039, 15.691315650939941, 16.736167907714844, 17.781017303466797, 18.825870513916016, 19.8707218170166, 20.915573120117188, 21.960424423217773, 23.00527572631836, 24.050127029418945, 25.09497833251953, 26.13983154296875, 27.184682846069336, 28.229534149169922, 29.274385452270508, 30.319236755371094, 31.36408805847168, 32.408939361572266, 33.453792572021484, 34.49864196777344, 35.543495178222656, 36.588348388671875, 37.63319778442383]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 9.0, 6.0, 5.0, 6.0, 19.0, 11.0, 22.0, 31.0, 28.0, 27.0, 41.0, 47.0, 32.0, 39.0, 50.0, 34.0, 52.0, 46.0, 47.0, 48.0, 38.0, 43.0, 37.0, 24.0, 23.0, 40.0, 32.0, 26.0, 19.0, 22.0, 18.0, 20.0, 11.0, 6.0, 9.0, 4.0, 4.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0, -5.82373046875, -5.6474609375, -5.47119140625, -5.294921875, -5.11865234375, -4.9423828125, -4.76611328125, -4.58984375, -4.41357421875, -4.2373046875, -4.06103515625, -3.884765625, -3.70849609375, -3.5322265625, -3.35595703125, -3.1796875, -3.00341796875, -2.8271484375, -2.65087890625, -2.474609375, -2.29833984375, -2.1220703125, -1.94580078125, -1.76953125, -1.59326171875, -1.4169921875, -1.24072265625, -1.064453125, -0.88818359375, -0.7119140625, -0.53564453125, -0.359375, -0.18310546875, -0.0068359375, 0.16943359375, 0.345703125, 0.52197265625, 0.6982421875, 0.87451171875, 1.05078125, 1.22705078125, 1.4033203125, 1.57958984375, 1.755859375, 1.93212890625, 2.1083984375, 2.28466796875, 2.4609375, 2.63720703125, 2.8134765625, 2.98974609375, 3.166015625, 3.34228515625, 3.5185546875, 3.69482421875, 3.87109375, 4.04736328125, 4.2236328125, 4.39990234375, 4.576171875, 4.75244140625, 4.9287109375, 5.10498046875, 5.28125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 7.0, 7.0, 8.0, 14.0, 13.0, 20.0, 23.0, 28.0, 42.0, 80.0, 121.0, 165.0, 320.0, 546.0, 1086.0, 2170.0, 5333.0, 14209.0, 45197.0, 161318.0, 546158.0, 1367435.0, 1337546.0, 507188.0, 142168.0, 40470.0, 13141.0, 4903.0, 2160.0, 1015.0, 543.0, 304.0, 183.0, 97.0, 67.0, 54.0, 31.0, 26.0, 16.0, 18.0, 8.0, 12.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.46875, -5.3028564453125, -5.136962890625, -4.9710693359375, -4.80517578125, -4.6392822265625, -4.473388671875, -4.3074951171875, -4.1416015625, -3.9757080078125, -3.809814453125, -3.6439208984375, -3.47802734375, -3.3121337890625, -3.146240234375, -2.9803466796875, -2.814453125, -2.6485595703125, -2.482666015625, -2.3167724609375, -2.15087890625, -1.9849853515625, -1.819091796875, -1.6531982421875, -1.4873046875, -1.3214111328125, -1.155517578125, -0.9896240234375, -0.82373046875, -0.6578369140625, -0.491943359375, -0.3260498046875, -0.16015625, 0.0057373046875, 0.171630859375, 0.3375244140625, 0.50341796875, 0.6693115234375, 0.835205078125, 1.0010986328125, 1.1669921875, 1.3328857421875, 1.498779296875, 1.6646728515625, 1.83056640625, 1.9964599609375, 2.162353515625, 2.3282470703125, 2.494140625, 2.6600341796875, 2.825927734375, 2.9918212890625, 3.15771484375, 3.3236083984375, 3.489501953125, 3.6553955078125, 3.8212890625, 3.9871826171875, 4.153076171875, 4.3189697265625, 4.48486328125, 4.6507568359375, 4.816650390625, 4.9825439453125, 5.1484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 4.0, 4.0, 7.0, 13.0, 18.0, 19.0, 22.0, 24.0, 32.0, 55.0, 68.0, 102.0, 121.0, 171.0, 212.0, 294.0, 368.0, 434.0, 460.0, 377.0, 358.0, 216.0, 174.0, 120.0, 93.0, 77.0, 50.0, 38.0, 32.0, 26.0, 18.0, 12.0, 12.0, 7.0, 6.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.390625, -7.18597412109375, -6.9813232421875, -6.77667236328125, -6.572021484375, -6.36737060546875, -6.1627197265625, -5.95806884765625, -5.75341796875, -5.54876708984375, -5.3441162109375, -5.13946533203125, -4.934814453125, -4.73016357421875, -4.5255126953125, -4.32086181640625, -4.1162109375, -3.91156005859375, -3.7069091796875, -3.50225830078125, -3.297607421875, -3.09295654296875, -2.8883056640625, -2.68365478515625, -2.47900390625, -2.27435302734375, -2.0697021484375, -1.86505126953125, -1.660400390625, -1.45574951171875, -1.2510986328125, -1.04644775390625, -0.841796875, -0.63714599609375, -0.4324951171875, -0.22784423828125, -0.023193359375, 0.18145751953125, 0.3861083984375, 0.59075927734375, 0.79541015625, 1.00006103515625, 1.2047119140625, 1.40936279296875, 1.614013671875, 1.81866455078125, 2.0233154296875, 2.22796630859375, 2.4326171875, 2.63726806640625, 2.8419189453125, 3.04656982421875, 3.251220703125, 3.45587158203125, 3.6605224609375, 3.86517333984375, 4.06982421875, 4.27447509765625, 4.4791259765625, 4.68377685546875, 4.888427734375, 5.09307861328125, 5.2977294921875, 5.50238037109375, 5.70703125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 5.0, 11.0, 9.0, 18.0, 18.0, 32.0, 34.0, 49.0, 63.0, 102.0, 150.0, 260.0, 525.0, 1061.0, 2850.0, 8786.0, 33567.0, 157382.0, 1066187.0, 2408479.0, 414665.0, 73641.0, 17826.0, 5004.0, 1767.0, 748.0, 344.0, 207.0, 142.0, 89.0, 59.0, 51.0, 42.0, 24.0, 26.0, 9.0, 21.0, 13.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.34375, -9.044921875, -8.74609375, -8.447265625, -8.1484375, -7.849609375, -7.55078125, -7.251953125, -6.953125, -6.654296875, -6.35546875, -6.056640625, -5.7578125, -5.458984375, -5.16015625, -4.861328125, -4.5625, -4.263671875, -3.96484375, -3.666015625, -3.3671875, -3.068359375, -2.76953125, -2.470703125, -2.171875, -1.873046875, -1.57421875, -1.275390625, -0.9765625, -0.677734375, -0.37890625, -0.080078125, 0.21875, 0.517578125, 0.81640625, 1.115234375, 1.4140625, 1.712890625, 2.01171875, 2.310546875, 2.609375, 2.908203125, 3.20703125, 3.505859375, 3.8046875, 4.103515625, 4.40234375, 4.701171875, 5.0, 5.298828125, 5.59765625, 5.896484375, 6.1953125, 6.494140625, 6.79296875, 7.091796875, 7.390625, 7.689453125, 7.98828125, 8.287109375, 8.5859375, 8.884765625, 9.18359375, 9.482421875, 9.78125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 22.0, 47.0, 97.0, 150.0, 175.0, 176.0, 140.0, 98.0, 64.0, 21.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.483957290649414, -21.083271026611328, -19.68258285522461, -18.281896591186523, -16.881210327148438, -15.480523109436035, -14.079835891723633, -12.679149627685547, -11.278462409973145, -9.877775192260742, -8.477088928222656, -7.076401710510254, -5.67571496963501, -4.275028228759766, -2.8743410110473633, -1.4736547470092773, -0.072967529296875, 1.3277193307876587, 2.7284061908721924, 4.129093170166016, 5.52977991104126, 6.930466651916504, 8.331153869628906, 9.731840133666992, 11.132527351379395, 12.533214569091797, 13.933900833129883, 15.334588050842285, 16.735275268554688, 18.135961532592773, 19.53664779663086, 20.937335968017578, 22.338024139404297, 23.738710403442383, 25.1393985748291, 26.540084838867188, 27.940771102905273, 29.34145736694336, 30.742145538330078, 32.14282989501953, 33.54351806640625, 34.94420623779297, 36.34489059448242, 37.74557876586914, 39.14626693725586, 40.54695129394531, 41.94763946533203, 43.34832763671875, 44.74901580810547, 46.14970397949219, 47.55038833618164, 48.95107650756836, 50.35176467895508, 51.75244903564453, 53.15313720703125, 54.55382537841797, 55.95450973510742, 57.35519790649414, 58.755882263183594, 60.15657043457031, 61.55725860595703, 62.957942962646484, 64.35862731933594, 65.75931549072266, 67.16000366210938]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 3.0, 3.0, 7.0, 13.0, 8.0, 7.0, 22.0, 10.0, 20.0, 31.0, 27.0, 32.0, 29.0, 44.0, 35.0, 32.0, 35.0, 45.0, 39.0, 40.0, 54.0, 47.0, 51.0, 30.0, 40.0, 43.0, 39.0, 29.0, 29.0, 26.0, 21.0, 21.0, 20.0, 22.0, 11.0, 4.0, 10.0, 6.0, 4.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.14306640625, -23.337657928466797, -22.532249450683594, -21.72684097290039, -20.921430587768555, -20.11602210998535, -19.31061363220215, -18.505205154418945, -17.699796676635742, -16.89438819885254, -16.088979721069336, -15.283570289611816, -14.478161811828613, -13.672752380371094, -12.86734390258789, -12.061935424804688, -11.256525993347168, -10.451117515563965, -9.645708084106445, -8.840299606323242, -8.034891128540039, -7.229482173919678, -6.424073219299316, -5.618664741516113, -4.813255786895752, -4.007846832275391, -3.2024383544921875, -2.397029399871826, -1.591620683670044, -0.7862119674682617, 0.01919698715209961, 0.8246054649353027, 1.630014419555664, 2.4354231357574463, 3.2408318519592285, 4.04624080657959, 4.851649284362793, 5.657058238983154, 6.462467193603516, 7.267875671386719, 8.073284149169922, 8.878692626953125, 9.684102058410645, 10.489510536193848, 11.29491901397705, 12.10032844543457, 12.905736923217773, 13.711145401000977, 14.516554832458496, 15.3219633102417, 16.12737274169922, 16.932781219482422, 17.738189697265625, 18.543598175048828, 19.34900665283203, 20.154415130615234, 20.95982551574707, 21.765233993530273, 22.570642471313477, 23.376052856445312, 24.181461334228516, 24.98686981201172, 25.792278289794922, 26.597686767578125, 27.403095245361328]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 7.0, 6.0, 12.0, 15.0, 13.0, 10.0, 24.0, 41.0, 22.0, 26.0, 29.0, 45.0, 43.0, 28.0, 43.0, 41.0, 43.0, 44.0, 41.0, 40.0, 52.0, 44.0, 34.0, 35.0, 25.0, 30.0, 23.0, 28.0, 22.0, 27.0, 22.0, 22.0, 6.0, 8.0, 5.0, 3.0, 5.0, 8.0, 5.0, 0.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4453125, -5.2796630859375, -5.114013671875, -4.9483642578125, -4.78271484375, -4.6170654296875, -4.451416015625, -4.2857666015625, -4.1201171875, -3.9544677734375, -3.788818359375, -3.6231689453125, -3.45751953125, -3.2918701171875, -3.126220703125, -2.9605712890625, -2.794921875, -2.6292724609375, -2.463623046875, -2.2979736328125, -2.13232421875, -1.9666748046875, -1.801025390625, -1.6353759765625, -1.4697265625, -1.3040771484375, -1.138427734375, -0.9727783203125, -0.80712890625, -0.6414794921875, -0.475830078125, -0.3101806640625, -0.14453125, 0.0211181640625, 0.186767578125, 0.3524169921875, 0.51806640625, 0.6837158203125, 0.849365234375, 1.0150146484375, 1.1806640625, 1.3463134765625, 1.511962890625, 1.6776123046875, 1.84326171875, 2.0089111328125, 2.174560546875, 2.3402099609375, 2.505859375, 2.6715087890625, 2.837158203125, 3.0028076171875, 3.16845703125, 3.3341064453125, 3.499755859375, 3.6654052734375, 3.8310546875, 3.9967041015625, 4.162353515625, 4.3280029296875, 4.49365234375, 4.6593017578125, 4.824951171875, 4.9906005859375, 5.15625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 12.0, 17.0, 30.0, 44.0, 82.0, 92.0, 153.0, 198.0, 253.0, 415.0, 595.0, 834.0, 1262.0, 1845.0, 2717.0, 4155.0, 6419.0, 10109.0, 15758.0, 25307.0, 41876.0, 67661.0, 109760.0, 164801.0, 192905.0, 148457.0, 96006.0, 58628.0, 36178.0, 22049.0, 13788.0, 8770.0, 5822.0, 3793.0, 2409.0, 1703.0, 1165.0, 792.0, 514.0, 346.0, 270.0, 196.0, 125.0, 77.0, 52.0, 36.0, 18.0, 16.0, 21.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.464599609375, -0.4502410888671875, -0.435882568359375, -0.4215240478515625, -0.40716552734375, -0.3928070068359375, -0.378448486328125, -0.3640899658203125, -0.3497314453125, -0.3353729248046875, -0.321014404296875, -0.3066558837890625, -0.29229736328125, -0.2779388427734375, -0.263580322265625, -0.2492218017578125, -0.23486328125, -0.2205047607421875, -0.206146240234375, -0.1917877197265625, -0.17742919921875, -0.1630706787109375, -0.148712158203125, -0.1343536376953125, -0.1199951171875, -0.1056365966796875, -0.091278076171875, -0.0769195556640625, -0.06256103515625, -0.0482025146484375, -0.033843994140625, -0.0194854736328125, -0.005126953125, 0.0092315673828125, 0.023590087890625, 0.0379486083984375, 0.05230712890625, 0.0666656494140625, 0.081024169921875, 0.0953826904296875, 0.1097412109375, 0.1240997314453125, 0.138458251953125, 0.1528167724609375, 0.16717529296875, 0.1815338134765625, 0.195892333984375, 0.2102508544921875, 0.224609375, 0.2389678955078125, 0.253326416015625, 0.2676849365234375, 0.28204345703125, 0.2964019775390625, 0.310760498046875, 0.3251190185546875, 0.3394775390625, 0.3538360595703125, 0.368194580078125, 0.3825531005859375, 0.39691162109375, 0.4112701416015625, 0.425628662109375, 0.4399871826171875, 0.454345703125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 7.0, 14.0, 12.0, 19.0, 12.0, 16.0, 22.0, 22.0, 32.0, 43.0, 42.0, 34.0, 29.0, 53.0, 52.0, 38.0, 1059.0, 45.0, 43.0, 36.0, 44.0, 36.0, 49.0, 27.0, 30.0, 36.0, 25.0, 22.0, 19.0, 14.0, 20.0, 10.0, 10.0, 7.0, 8.0, 5.0, 5.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34765625, -3.23602294921875, -3.1243896484375, -3.01275634765625, -2.901123046875, -2.78948974609375, -2.6778564453125, -2.56622314453125, -2.45458984375, -2.34295654296875, -2.2313232421875, -2.11968994140625, -2.008056640625, -1.89642333984375, -1.7847900390625, -1.67315673828125, -1.5615234375, -1.44989013671875, -1.3382568359375, -1.22662353515625, -1.114990234375, -1.00335693359375, -0.8917236328125, -0.78009033203125, -0.66845703125, -0.55682373046875, -0.4451904296875, -0.33355712890625, -0.221923828125, -0.11029052734375, 0.0013427734375, 0.11297607421875, 0.224609375, 0.33624267578125, 0.4478759765625, 0.55950927734375, 0.671142578125, 0.78277587890625, 0.8944091796875, 1.00604248046875, 1.11767578125, 1.22930908203125, 1.3409423828125, 1.45257568359375, 1.564208984375, 1.67584228515625, 1.7874755859375, 1.89910888671875, 2.0107421875, 2.12237548828125, 2.2340087890625, 2.34564208984375, 2.457275390625, 2.56890869140625, 2.6805419921875, 2.79217529296875, 2.90380859375, 3.01544189453125, 3.1270751953125, 3.23870849609375, 3.350341796875, 3.46197509765625, 3.5736083984375, 3.68524169921875, 3.796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 5.0, 5.0, 11.0, 20.0, 39.0, 49.0, 90.0, 125.0, 167.0, 272.0, 367.0, 528.0, 775.0, 1109.0, 1614.0, 2397.0, 3528.0, 5231.0, 7978.0, 11929.0, 17874.0, 26136.0, 39201.0, 58110.0, 83427.0, 114928.0, 370263.0, 966440.0, 117183.0, 85076.0, 59572.0, 40443.0, 27327.0, 18127.0, 12000.0, 8014.0, 5386.0, 3719.0, 2483.0, 1572.0, 1113.0, 776.0, 562.0, 400.0, 260.0, 152.0, 117.0, 90.0, 49.0, 39.0, 19.0, 16.0, 13.0, 5.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.308837890625, -0.2994880676269531, -0.29013824462890625, -0.2807884216308594, -0.2714385986328125, -0.2620887756347656, -0.25273895263671875, -0.24338912963867188, -0.234039306640625, -0.22468948364257812, -0.21533966064453125, -0.20598983764648438, -0.1966400146484375, -0.18729019165039062, -0.17794036865234375, -0.16859054565429688, -0.15924072265625, -0.14989089965820312, -0.14054107666015625, -0.13119125366210938, -0.1218414306640625, -0.11249160766601562, -0.10314178466796875, -0.09379196166992188, -0.084442138671875, -0.07509231567382812, -0.06574249267578125, -0.056392669677734375, -0.0470428466796875, -0.037693023681640625, -0.02834320068359375, -0.018993377685546875, -0.0096435546875, -0.000293731689453125, 0.00905609130859375, 0.018405914306640625, 0.0277557373046875, 0.037105560302734375, 0.04645538330078125, 0.055805206298828125, 0.065155029296875, 0.07450485229492188, 0.08385467529296875, 0.09320449829101562, 0.1025543212890625, 0.11190414428710938, 0.12125396728515625, 0.13060379028320312, 0.13995361328125, 0.14930343627929688, 0.15865325927734375, 0.16800308227539062, 0.1773529052734375, 0.18670272827148438, 0.19605255126953125, 0.20540237426757812, 0.214752197265625, 0.22410202026367188, 0.23345184326171875, 0.24280166625976562, 0.2521514892578125, 0.2615013122558594, 0.27085113525390625, 0.2802009582519531, 0.28955078125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 5.0, 3.0, 10.0, 6.0, 14.0, 18.0, 20.0, 25.0, 34.0, 61.0, 66.0, 83.0, 104.0, 99.0, 97.0, 92.0, 76.0, 41.0, 36.0, 35.0, 16.0, 13.0, 11.0, 9.0, 9.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.005168914794921875, -0.005014479160308838, -0.004860043525695801, -0.004705607891082764, -0.0045511722564697266, -0.0043967366218566895, -0.004242300987243652, -0.004087865352630615, -0.003933429718017578, -0.003778994083404541, -0.003624558448791504, -0.003470122814178467, -0.0033156871795654297, -0.0031612515449523926, -0.0030068159103393555, -0.0028523802757263184, -0.0026979446411132812, -0.002543509006500244, -0.002389073371887207, -0.00223463773727417, -0.002080202102661133, -0.0019257664680480957, -0.0017713308334350586, -0.0016168951988220215, -0.0014624595642089844, -0.0013080239295959473, -0.0011535882949829102, -0.000999152660369873, -0.0008447170257568359, -0.0006902813911437988, -0.0005358457565307617, -0.0003814101219177246, -0.0002269744873046875, -7.253885269165039e-05, 8.189678192138672e-05, 0.00023633241653442383, 0.00039076805114746094, 0.000545203685760498, 0.0006996393203735352, 0.0008540749549865723, 0.0010085105895996094, 0.0011629462242126465, 0.0013173818588256836, 0.0014718174934387207, 0.0016262531280517578, 0.001780688762664795, 0.001935124397277832, 0.002089560031890869, 0.0022439956665039062, 0.0023984313011169434, 0.0025528669357299805, 0.0027073025703430176, 0.0028617382049560547, 0.003016173839569092, 0.003170609474182129, 0.003325045108795166, 0.003479480743408203, 0.0036339163780212402, 0.0037883520126342773, 0.0039427876472473145, 0.0040972232818603516, 0.004251658916473389, 0.004406094551086426, 0.004560530185699463, 0.0047149658203125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 3.0, 4.0, 12.0, 13.0, 20.0, 32.0, 39.0, 59.0, 95.0, 132.0, 228.0, 506.0, 4306.0, 991960.0, 49394.0, 889.0, 303.0, 195.0, 90.0, 65.0, 56.0, 30.0, 30.0, 17.0, 12.0, 11.0, 8.0, 5.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0928955078125, -0.08987140655517578, -0.08684730529785156, -0.08382320404052734, -0.08079910278320312, -0.0777750015258789, -0.07475090026855469, -0.07172679901123047, -0.06870269775390625, -0.06567859649658203, -0.06265449523925781, -0.059630393981933594, -0.056606292724609375, -0.053582191467285156, -0.05055809020996094, -0.04753398895263672, -0.0445098876953125, -0.04148578643798828, -0.03846168518066406, -0.035437583923339844, -0.032413482666015625, -0.029389381408691406, -0.026365280151367188, -0.02334117889404297, -0.02031707763671875, -0.01729297637939453, -0.014268875122070312, -0.011244773864746094, -0.008220672607421875, -0.005196571350097656, -0.0021724700927734375, 0.0008516311645507812, 0.003875732421875, 0.006899833679199219, 0.009923934936523438, 0.012948036193847656, 0.015972137451171875, 0.018996238708496094, 0.022020339965820312, 0.02504444122314453, 0.02806854248046875, 0.03109264373779297, 0.03411674499511719, 0.037140846252441406, 0.040164947509765625, 0.043189048767089844, 0.04621315002441406, 0.04923725128173828, 0.0522613525390625, 0.05528545379638672, 0.05830955505371094, 0.061333656311035156, 0.06435775756835938, 0.0673818588256836, 0.07040596008300781, 0.07343006134033203, 0.07645416259765625, 0.07947826385498047, 0.08250236511230469, 0.0855264663696289, 0.08855056762695312, 0.09157466888427734, 0.09459877014160156, 0.09762287139892578, 0.10064697265625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 202.0, 775.0, 34.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053008273243904114, -0.05195494741201401, -0.0509016178548336, -0.0498482920229435, -0.04879496246576309, -0.047741636633872986, -0.04668830707669258, -0.045634981244802475, -0.04458165168762207, -0.043528325855731964, -0.04247499629855156, -0.04142167046666145, -0.04036834090948105, -0.03931501507759094, -0.03826168552041054, -0.03720835968852043, -0.03615503013134003, -0.03510170429944992, -0.034048374742269516, -0.03299504891037941, -0.031941719353199005, -0.03088839165866375, -0.029835063964128494, -0.028781738132238388, -0.027728412300348282, -0.026675084605813026, -0.02562175691127777, -0.024568429216742516, -0.02351510152220726, -0.022461773827672005, -0.02140844613313675, -0.020355120301246643, -0.01930179074406624, -0.018248463049530983, -0.017195135354995728, -0.016141807660460472, -0.015088479965925217, -0.014035152271389961, -0.01298182550817728, -0.011928497813642025, -0.01087517011910677, -0.009821842424571514, -0.008768514730036259, -0.007715187501162291, -0.006661859806627035, -0.00560853211209178, -0.004555204883217812, -0.003501877188682556, -0.0024485494941473007, -0.0013952219160273671, -0.0003418943379074335, 0.0007114331237971783, 0.0017647608183324337, 0.002818088512867689, 0.0038714157417416573, 0.004924743436276913, 0.005978071130812168, 0.0070313988253474236, 0.008084726519882679, 0.00913805328309536, 0.010191380977630615, 0.01124470867216587, 0.012298036366701126, 0.013351364061236382, 0.014404691755771637]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 9.0, 16.0, 23.0, 27.0, 29.0, 28.0, 34.0, 42.0, 54.0, 62.0, 66.0, 56.0, 61.0, 76.0, 68.0, 59.0, 58.0, 26.0, 37.0, 30.0, 31.0, 22.0, 22.0, 19.0, 11.0, 8.0, 8.0, 3.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002965986728668213, -0.002864253707230091, -0.0027625206857919693, -0.0026607876643538475, -0.0025590546429157257, -0.002457321621477604, -0.002355588600039482, -0.0022538555786013603, -0.0021521225571632385, -0.0020503895357251167, -0.001948656514286995, -0.0018469234928488731, -0.0017451904714107513, -0.0016434574499726295, -0.0015417244285345078, -0.001439991407096386, -0.0013382583856582642, -0.0012365253642201424, -0.0011347923427820206, -0.0010330593213438988, -0.000931326299905777, -0.0008295932784676552, -0.0007278602570295334, -0.0006261272355914116, -0.0005243942141532898, -0.000422661192715168, -0.0003209281712770462, -0.0002191951498389244, -0.00011746212840080261, -1.5729106962680817e-05, 8.600391447544098e-05, 0.00018773693591356277, 0.00028946995735168457, 0.00039120297878980637, 0.0004929360002279282, 0.00059466902166605, 0.0006964020431041718, 0.0007981350645422935, 0.0008998680859804153, 0.0010016011074185371, 0.001103334128856659, 0.0012050671502947807, 0.0013068001717329025, 0.0014085331931710243, 0.0015102662146091461, 0.001611999236047268, 0.0017137322574853897, 0.0018154652789235115, 0.0019171983003616333, 0.002018931321799755, 0.002120664343237877, 0.0022223973646759987, 0.0023241303861141205, 0.0024258634075522423, 0.002527596428990364, 0.002629329450428486, 0.0027310624718666077, 0.0028327954933047295, 0.0029345285147428513, 0.003036261536180973, 0.003137994557619095, 0.0032397275790572166, 0.0033414606004953384, 0.0034431936219334602, 0.003544926643371582]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 7.0, 6.0, 12.0, 15.0, 13.0, 10.0, 24.0, 41.0, 22.0, 26.0, 29.0, 45.0, 43.0, 28.0, 43.0, 41.0, 43.0, 45.0, 40.0, 40.0, 52.0, 44.0, 34.0, 35.0, 25.0, 30.0, 23.0, 28.0, 22.0, 27.0, 22.0, 22.0, 6.0, 8.0, 5.0, 3.0, 5.0, 8.0, 5.0, 0.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4453125, -5.2796630859375, -5.114013671875, -4.9483642578125, -4.78271484375, -4.6170654296875, -4.451416015625, -4.2857666015625, -4.1201171875, -3.9544677734375, -3.788818359375, -3.6231689453125, -3.45751953125, -3.2918701171875, -3.126220703125, -2.9605712890625, -2.794921875, -2.6292724609375, -2.463623046875, -2.2979736328125, -2.13232421875, -1.9666748046875, -1.801025390625, -1.6353759765625, -1.4697265625, -1.3040771484375, -1.138427734375, -0.9727783203125, -0.80712890625, -0.6414794921875, -0.475830078125, -0.3101806640625, -0.14453125, 0.0211181640625, 0.186767578125, 0.3524169921875, 0.51806640625, 0.6837158203125, 0.849365234375, 1.0150146484375, 1.1806640625, 1.3463134765625, 1.511962890625, 1.6776123046875, 1.84326171875, 2.0089111328125, 2.174560546875, 2.3402099609375, 2.505859375, 2.6715087890625, 2.837158203125, 3.0028076171875, 3.16845703125, 3.3341064453125, 3.499755859375, 3.6654052734375, 3.8310546875, 3.9967041015625, 4.162353515625, 4.3280029296875, 4.49365234375, 4.6593017578125, 4.824951171875, 4.9906005859375, 5.15625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 11.0, 14.0, 15.0, 23.0, 38.0, 47.0, 75.0, 77.0, 131.0, 151.0, 200.0, 299.0, 479.0, 788.0, 1453.0, 3274.0, 8122.0, 24166.0, 72535.0, 220896.0, 425893.0, 191663.0, 63438.0, 21142.0, 7160.0, 2808.0, 1350.0, 737.0, 464.0, 286.0, 228.0, 145.0, 98.0, 84.0, 66.0, 52.0, 29.0, 26.0, 22.0, 11.0, 14.0, 9.0, 8.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0], "bins": [-7.5390625, -7.3135986328125, -7.088134765625, -6.8626708984375, -6.63720703125, -6.4117431640625, -6.186279296875, -5.9608154296875, -5.7353515625, -5.5098876953125, -5.284423828125, -5.0589599609375, -4.83349609375, -4.6080322265625, -4.382568359375, -4.1571044921875, -3.931640625, -3.7061767578125, -3.480712890625, -3.2552490234375, -3.02978515625, -2.8043212890625, -2.578857421875, -2.3533935546875, -2.1279296875, -1.9024658203125, -1.677001953125, -1.4515380859375, -1.22607421875, -1.0006103515625, -0.775146484375, -0.5496826171875, -0.32421875, -0.0987548828125, 0.126708984375, 0.3521728515625, 0.57763671875, 0.8031005859375, 1.028564453125, 1.2540283203125, 1.4794921875, 1.7049560546875, 1.930419921875, 2.1558837890625, 2.38134765625, 2.6068115234375, 2.832275390625, 3.0577392578125, 3.283203125, 3.5086669921875, 3.734130859375, 3.9595947265625, 4.18505859375, 4.4105224609375, 4.635986328125, 4.8614501953125, 5.0869140625, 5.3123779296875, 5.537841796875, 5.7633056640625, 5.98876953125, 6.2142333984375, 6.439697265625, 6.6651611328125, 6.890625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 6.0, 2.0, 11.0, 8.0, 11.0, 16.0, 23.0, 27.0, 32.0, 28.0, 33.0, 44.0, 48.0, 57.0, 73.0, 104.0, 150.0, 276.0, 1383.0, 174.0, 119.0, 64.0, 57.0, 44.0, 41.0, 30.0, 32.0, 24.0, 24.0, 32.0, 11.0, 14.0, 14.0, 10.0, 9.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.3157958984375, -12.858154296875, -12.4005126953125, -11.94287109375, -11.4852294921875, -11.027587890625, -10.5699462890625, -10.1123046875, -9.6546630859375, -9.197021484375, -8.7393798828125, -8.28173828125, -7.8240966796875, -7.366455078125, -6.9088134765625, -6.451171875, -5.9935302734375, -5.535888671875, -5.0782470703125, -4.62060546875, -4.1629638671875, -3.705322265625, -3.2476806640625, -2.7900390625, -2.3323974609375, -1.874755859375, -1.4171142578125, -0.95947265625, -0.5018310546875, -0.044189453125, 0.4134521484375, 0.87109375, 1.3287353515625, 1.786376953125, 2.2440185546875, 2.70166015625, 3.1593017578125, 3.616943359375, 4.0745849609375, 4.5322265625, 4.9898681640625, 5.447509765625, 5.9051513671875, 6.36279296875, 6.8204345703125, 7.278076171875, 7.7357177734375, 8.193359375, 8.6510009765625, 9.108642578125, 9.5662841796875, 10.02392578125, 10.4815673828125, 10.939208984375, 11.3968505859375, 11.8544921875, 12.3121337890625, 12.769775390625, 13.2274169921875, 13.68505859375, 14.1427001953125, 14.600341796875, 15.0579833984375, 15.515625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 1.0, 6.0, 8.0, 5.0, 20.0, 21.0, 17.0, 37.0, 44.0, 51.0, 84.0, 100.0, 167.0, 260.0, 374.0, 682.0, 1721.0, 23032.0, 2649683.0, 459673.0, 6984.0, 1085.0, 561.0, 316.0, 200.0, 164.0, 112.0, 74.0, 48.0, 55.0, 35.0, 15.0, 19.0, 19.0, 10.0, 9.0, 4.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -28.2734375, -27.4375, -26.6015625, -25.765625, -24.9296875, -24.09375, -23.2578125, -22.421875, -21.5859375, -20.75, -19.9140625, -19.078125, -18.2421875, -17.40625, -16.5703125, -15.734375, -14.8984375, -14.0625, -13.2265625, -12.390625, -11.5546875, -10.71875, -9.8828125, -9.046875, -8.2109375, -7.375, -6.5390625, -5.703125, -4.8671875, -4.03125, -3.1953125, -2.359375, -1.5234375, -0.6875, 0.1484375, 0.984375, 1.8203125, 2.65625, 3.4921875, 4.328125, 5.1640625, 6.0, 6.8359375, 7.671875, 8.5078125, 9.34375, 10.1796875, 11.015625, 11.8515625, 12.6875, 13.5234375, 14.359375, 15.1953125, 16.03125, 16.8671875, 17.703125, 18.5390625, 19.375, 20.2109375, 21.046875, 21.8828125, 22.71875, 23.5546875, 24.390625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 44.0, 897.0, 76.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.91563415527344, -197.97793579101562, -191.04025268554688, -184.10255432128906, -177.1648712158203, -170.2271728515625, -163.28948974609375, -156.35179138183594, -149.41409301757812, -142.4763946533203, -135.53871154785156, -128.60101318359375, -121.663330078125, -114.72563171386719, -107.7879409790039, -100.85025024414062, -93.91256713867188, -86.9748764038086, -80.03718566894531, -73.0994873046875, -66.16180419921875, -59.2241096496582, -52.286415100097656, -45.348724365234375, -38.411033630371094, -31.473342895507812, -24.5356502532959, -17.597957611083984, -10.660266876220703, -3.722576141357422, 3.215118408203125, 10.152809143066406, 17.090484619140625, 24.028175354003906, 30.96586799621582, 37.903560638427734, 44.841251373291016, 51.7789421081543, 58.716636657714844, 65.65432739257812, 72.5920181274414, 79.52970886230469, 86.46739959716797, 93.40509033203125, 100.34278869628906, 107.28047180175781, 114.21817016601562, 121.1558609008789, 128.0935516357422, 135.03125, 141.96893310546875, 148.90663146972656, 155.8443145751953, 162.78201293945312, 169.71969604492188, 176.6573944091797, 183.5950927734375, 190.5327911376953, 197.47047424316406, 204.40817260742188, 211.34585571289062, 218.28355407714844, 225.22125244140625, 232.158935546875, 239.09661865234375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 1.0, 4.0, 4.0, 10.0, 11.0, 12.0, 11.0, 17.0, 20.0, 24.0, 23.0, 28.0, 35.0, 26.0, 32.0, 37.0, 40.0, 42.0, 46.0, 45.0, 39.0, 51.0, 48.0, 51.0, 36.0, 34.0, 25.0, 32.0, 24.0, 21.0, 21.0, 30.0, 22.0, 21.0, 15.0, 8.0, 13.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-33.521141052246094, -32.4847297668457, -31.448320388793945, -30.411911010742188, -29.375499725341797, -28.33909034729004, -27.30268096923828, -26.26626968383789, -25.229860305786133, -24.193450927734375, -23.157039642333984, -22.120630264282227, -21.08422088623047, -20.047809600830078, -19.01140022277832, -17.974990844726562, -16.938579559326172, -15.902169227600098, -14.865758895874023, -13.829349517822266, -12.792939186096191, -11.756528854370117, -10.72011947631836, -9.683709144592285, -8.647298812866211, -7.610888481140137, -6.574478626251221, -5.538068771362305, -4.5016584396362305, -3.4652481079101562, -2.4288382530212402, -1.3924283981323242, -0.35601806640625, 0.6803920269012451, 1.7168021202087402, 2.7532122135162354, 3.7896223068237305, 4.826032638549805, 5.862442493438721, 6.898852348327637, 7.935262680053711, 8.971673011779785, 10.00808334350586, 11.044492721557617, 12.080903053283691, 13.117313385009766, 14.153722763061523, 15.190133094787598, 16.226543426513672, 17.26295280456543, 18.29936408996582, 19.335773468017578, 20.37218475341797, 21.408594131469727, 22.445003509521484, 23.481414794921875, 24.517824172973633, 25.55423355102539, 26.59064483642578, 27.62705421447754, 28.663463592529297, 29.699874877929688, 30.736284255981445, 31.772693634033203, 32.809104919433594]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 8.0, 10.0, 14.0, 14.0, 20.0, 20.0, 36.0, 30.0, 34.0, 29.0, 40.0, 52.0, 42.0, 48.0, 49.0, 52.0, 50.0, 44.0, 32.0, 42.0, 37.0, 40.0, 39.0, 25.0, 38.0, 15.0, 27.0, 19.0, 14.0, 16.0, 11.0, 11.0, 8.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.49493408203125, -5.3062744140625, -5.11761474609375, -4.928955078125, -4.74029541015625, -4.5516357421875, -4.36297607421875, -4.17431640625, -3.98565673828125, -3.7969970703125, -3.60833740234375, -3.419677734375, -3.23101806640625, -3.0423583984375, -2.85369873046875, -2.6650390625, -2.47637939453125, -2.2877197265625, -2.09906005859375, -1.910400390625, -1.72174072265625, -1.5330810546875, -1.34442138671875, -1.15576171875, -0.96710205078125, -0.7784423828125, -0.58978271484375, -0.401123046875, -0.21246337890625, -0.0238037109375, 0.16485595703125, 0.353515625, 0.54217529296875, 0.7308349609375, 0.91949462890625, 1.108154296875, 1.29681396484375, 1.4854736328125, 1.67413330078125, 1.86279296875, 2.05145263671875, 2.2401123046875, 2.42877197265625, 2.617431640625, 2.80609130859375, 2.9947509765625, 3.18341064453125, 3.3720703125, 3.56072998046875, 3.7493896484375, 3.93804931640625, 4.126708984375, 4.31536865234375, 4.5040283203125, 4.69268798828125, 4.88134765625, 5.07000732421875, 5.2586669921875, 5.44732666015625, 5.635986328125, 5.82464599609375, 6.0133056640625, 6.20196533203125, 6.390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 6.0, 12.0, 7.0, 9.0, 15.0, 15.0, 21.0, 23.0, 29.0, 35.0, 33.0, 55.0, 67.0, 96.0, 122.0, 151.0, 214.0, 246.0, 351.0, 659.0, 22471.0, 4105454.0, 61639.0, 903.0, 384.0, 301.0, 196.0, 149.0, 148.0, 104.0, 61.0, 58.0, 48.0, 31.0, 35.0, 17.0, 15.0, 19.0, 15.0, 14.0, 6.0, 5.0, 10.0, 8.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-44.03125, -42.6796875, -41.328125, -39.9765625, -38.625, -37.2734375, -35.921875, -34.5703125, -33.21875, -31.8671875, -30.515625, -29.1640625, -27.8125, -26.4609375, -25.109375, -23.7578125, -22.40625, -21.0546875, -19.703125, -18.3515625, -17.0, -15.6484375, -14.296875, -12.9453125, -11.59375, -10.2421875, -8.890625, -7.5390625, -6.1875, -4.8359375, -3.484375, -2.1328125, -0.78125, 0.5703125, 1.921875, 3.2734375, 4.625, 5.9765625, 7.328125, 8.6796875, 10.03125, 11.3828125, 12.734375, 14.0859375, 15.4375, 16.7890625, 18.140625, 19.4921875, 20.84375, 22.1953125, 23.546875, 24.8984375, 26.25, 27.6015625, 28.953125, 30.3046875, 31.65625, 33.0078125, 34.359375, 35.7109375, 37.0625, 38.4140625, 39.765625, 41.1171875, 42.46875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 7.0, 4.0, 11.0, 18.0, 19.0, 27.0, 19.0, 33.0, 53.0, 61.0, 92.0, 111.0, 183.0, 307.0, 489.0, 613.0, 601.0, 462.0, 289.0, 214.0, 111.0, 92.0, 63.0, 51.0, 32.0, 16.0, 19.0, 15.0, 15.0, 15.0, 4.0, 4.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.4609375, -8.1790771484375, -7.897216796875, -7.6153564453125, -7.33349609375, -7.0516357421875, -6.769775390625, -6.4879150390625, -6.2060546875, -5.9241943359375, -5.642333984375, -5.3604736328125, -5.07861328125, -4.7967529296875, -4.514892578125, -4.2330322265625, -3.951171875, -3.6693115234375, -3.387451171875, -3.1055908203125, -2.82373046875, -2.5418701171875, -2.260009765625, -1.9781494140625, -1.6962890625, -1.4144287109375, -1.132568359375, -0.8507080078125, -0.56884765625, -0.2869873046875, -0.005126953125, 0.2767333984375, 0.55859375, 0.8404541015625, 1.122314453125, 1.4041748046875, 1.68603515625, 1.9678955078125, 2.249755859375, 2.5316162109375, 2.8134765625, 3.0953369140625, 3.377197265625, 3.6590576171875, 3.94091796875, 4.2227783203125, 4.504638671875, 4.7864990234375, 5.068359375, 5.3502197265625, 5.632080078125, 5.9139404296875, 6.19580078125, 6.4776611328125, 6.759521484375, 7.0413818359375, 7.3232421875, 7.6051025390625, 7.886962890625, 8.1688232421875, 8.45068359375, 8.7325439453125, 9.014404296875, 9.2962646484375, 9.578125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 11.0, 11.0, 25.0, 19.0, 28.0, 44.0, 58.0, 108.0, 251.0, 711.0, 6705.0, 1068312.0, 3104273.0, 12103.0, 936.0, 312.0, 126.0, 62.0, 47.0, 35.0, 24.0, 13.0, 21.0, 14.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.46875, -32.27685546875, -31.0849609375, -29.89306640625, -28.701171875, -27.50927734375, -26.3173828125, -25.12548828125, -23.93359375, -22.74169921875, -21.5498046875, -20.35791015625, -19.166015625, -17.97412109375, -16.7822265625, -15.59033203125, -14.3984375, -13.20654296875, -12.0146484375, -10.82275390625, -9.630859375, -8.43896484375, -7.2470703125, -6.05517578125, -4.86328125, -3.67138671875, -2.4794921875, -1.28759765625, -0.095703125, 1.09619140625, 2.2880859375, 3.47998046875, 4.671875, 5.86376953125, 7.0556640625, 8.24755859375, 9.439453125, 10.63134765625, 11.8232421875, 13.01513671875, 14.20703125, 15.39892578125, 16.5908203125, 17.78271484375, 18.974609375, 20.16650390625, 21.3583984375, 22.55029296875, 23.7421875, 24.93408203125, 26.1259765625, 27.31787109375, 28.509765625, 29.70166015625, 30.8935546875, 32.08544921875, 33.27734375, 34.46923828125, 35.6611328125, 36.85302734375, 38.044921875, 39.23681640625, 40.4287109375, 41.62060546875, 42.8125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 13.0, 22.0, 120.0, 216.0, 278.0, 207.0, 96.0, 42.0, 15.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.4635238647461, -78.320556640625, -76.17758178710938, -74.03461456298828, -71.89164733886719, -69.74867248535156, -67.60570526123047, -65.46273803710938, -63.319766998291016, -61.176795959472656, -59.03382873535156, -56.8908576965332, -54.747886657714844, -52.60491943359375, -50.46194839477539, -48.31897735595703, -46.17601013183594, -44.03303909301758, -41.890071868896484, -39.747100830078125, -37.60413360595703, -35.46116256713867, -33.31819152832031, -31.175222396850586, -29.03225326538086, -26.889284133911133, -24.746315002441406, -22.603343963623047, -20.46037483215332, -18.317405700683594, -16.174434661865234, -14.031465530395508, -11.888500213623047, -9.74553108215332, -7.602560997009277, -5.459591388702393, -3.316621780395508, -1.1736526489257812, 0.9693174362182617, 3.1122875213623047, 5.255256652832031, 7.398226261138916, 9.5411958694458, 11.684165954589844, 13.82713508605957, 15.970104217529297, 18.113075256347656, 20.256044387817383, 22.39901351928711, 24.541982650756836, 26.684951782226562, 28.827922821044922, 30.97089195251465, 33.113861083984375, 35.256832122802734, 37.399803161621094, 39.54277038574219, 41.68574142456055, 43.82870864868164, 45.9716796875, 48.114646911621094, 50.25761795043945, 52.40058898925781, 54.543556213378906, 56.686527252197266]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 3.0, 10.0, 10.0, 7.0, 10.0, 13.0, 11.0, 21.0, 14.0, 28.0, 22.0, 27.0, 26.0, 21.0, 35.0, 27.0, 28.0, 36.0, 39.0, 39.0, 33.0, 29.0, 49.0, 33.0, 33.0, 35.0, 36.0, 42.0, 29.0, 27.0, 25.0, 30.0, 20.0, 32.0, 23.0, 13.0, 11.0, 12.0, 12.0, 7.0, 11.0, 8.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-28.293987274169922, -27.503644943237305, -26.713300704956055, -25.922958374023438, -25.13261604309082, -24.34227180480957, -23.551929473876953, -22.761585235595703, -21.971242904663086, -21.18090057373047, -20.39055633544922, -19.6002140045166, -18.809871673583984, -18.019527435302734, -17.229185104370117, -16.4388427734375, -15.648499488830566, -14.858156204223633, -14.067813873291016, -13.277470588684082, -12.487127304077148, -11.696784973144531, -10.906441688537598, -10.116098403930664, -9.325756072998047, -8.535412788391113, -7.745069980621338, -6.9547271728515625, -6.164383888244629, -5.3740410804748535, -4.583698272705078, -3.7933549880981445, -3.003011703491211, -2.2126686573028564, -1.4223257303237915, -0.6319828033447266, 0.15836024284362793, 0.9487032890319824, 1.7390460968017578, 2.5293893814086914, 3.319732189178467, 4.110074996948242, 4.900418281555176, 5.690761089324951, 6.481103897094727, 7.27144718170166, 8.061790466308594, 8.852132797241211, 9.642476081848145, 10.432819366455078, 11.223161697387695, 12.013504981994629, 12.803848266601562, 13.59419059753418, 14.384533882141113, 15.174877166748047, 15.965219497680664, 16.75556182861328, 17.54590606689453, 18.33624839782715, 19.126590728759766, 19.916934967041016, 20.707277297973633, 21.49761962890625, 22.2879638671875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 6.0, 12.0, 8.0, 12.0, 16.0, 21.0, 21.0, 24.0, 25.0, 29.0, 26.0, 27.0, 42.0, 36.0, 39.0, 32.0, 31.0, 38.0, 37.0, 43.0, 40.0, 34.0, 33.0, 29.0, 32.0, 33.0, 31.0, 22.0, 28.0, 27.0, 25.0, 13.0, 17.0, 16.0, 8.0, 11.0, 11.0, 12.0, 8.0, 2.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.8125, -4.66558837890625, -4.5186767578125, -4.37176513671875, -4.224853515625, -4.07794189453125, -3.9310302734375, -3.78411865234375, -3.63720703125, -3.49029541015625, -3.3433837890625, -3.19647216796875, -3.049560546875, -2.90264892578125, -2.7557373046875, -2.60882568359375, -2.4619140625, -2.31500244140625, -2.1680908203125, -2.02117919921875, -1.874267578125, -1.72735595703125, -1.5804443359375, -1.43353271484375, -1.28662109375, -1.13970947265625, -0.9927978515625, -0.84588623046875, -0.698974609375, -0.55206298828125, -0.4051513671875, -0.25823974609375, -0.111328125, 0.03558349609375, 0.1824951171875, 0.32940673828125, 0.476318359375, 0.62322998046875, 0.7701416015625, 0.91705322265625, 1.06396484375, 1.21087646484375, 1.3577880859375, 1.50469970703125, 1.651611328125, 1.79852294921875, 1.9454345703125, 2.09234619140625, 2.2392578125, 2.38616943359375, 2.5330810546875, 2.67999267578125, 2.826904296875, 2.97381591796875, 3.1207275390625, 3.26763916015625, 3.41455078125, 3.56146240234375, 3.7083740234375, 3.85528564453125, 4.002197265625, 4.14910888671875, 4.2960205078125, 4.44293212890625, 4.58984375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 16.0, 16.0, 30.0, 37.0, 54.0, 85.0, 120.0, 202.0, 306.0, 417.0, 746.0, 1058.0, 1677.0, 2677.0, 4441.0, 7027.0, 11598.0, 18864.0, 30980.0, 51803.0, 87186.0, 145139.0, 207290.0, 183758.0, 117105.0, 69732.0, 41598.0, 25020.0, 15047.0, 9143.0, 5766.0, 3441.0, 2221.0, 1343.0, 895.0, 572.0, 376.0, 270.0, 163.0, 109.0, 65.0, 46.0, 36.0, 28.0, 12.0, 11.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5, -0.48262786865234375, -0.4652557373046875, -0.44788360595703125, -0.430511474609375, -0.41313934326171875, -0.3957672119140625, -0.37839508056640625, -0.36102294921875, -0.34365081787109375, -0.3262786865234375, -0.30890655517578125, -0.291534423828125, -0.27416229248046875, -0.2567901611328125, -0.23941802978515625, -0.2220458984375, -0.20467376708984375, -0.1873016357421875, -0.16992950439453125, -0.152557373046875, -0.13518524169921875, -0.1178131103515625, -0.10044097900390625, -0.08306884765625, -0.06569671630859375, -0.0483245849609375, -0.03095245361328125, -0.013580322265625, 0.00379180908203125, 0.0211639404296875, 0.03853607177734375, 0.055908203125, 0.07328033447265625, 0.0906524658203125, 0.10802459716796875, 0.125396728515625, 0.14276885986328125, 0.1601409912109375, 0.17751312255859375, 0.19488525390625, 0.21225738525390625, 0.2296295166015625, 0.24700164794921875, 0.264373779296875, 0.28174591064453125, 0.2991180419921875, 0.31649017333984375, 0.3338623046875, 0.35123443603515625, 0.3686065673828125, 0.38597869873046875, 0.403350830078125, 0.42072296142578125, 0.4380950927734375, 0.45546722412109375, 0.47283935546875, 0.49021148681640625, 0.5075836181640625, 0.5249557495117188, 0.542327880859375, 0.5597000122070312, 0.5770721435546875, 0.5944442749023438, 0.61181640625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 10.0, 10.0, 10.0, 14.0, 11.0, 15.0, 27.0, 22.0, 36.0, 25.0, 29.0, 38.0, 36.0, 31.0, 48.0, 30.0, 38.0, 38.0, 1074.0, 45.0, 63.0, 33.0, 36.0, 38.0, 45.0, 29.0, 18.0, 21.0, 20.0, 19.0, 24.0, 17.0, 14.0, 12.0, 13.0, 5.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.703125, -3.59765625, -3.4921875, -3.38671875, -3.28125, -3.17578125, -3.0703125, -2.96484375, -2.859375, -2.75390625, -2.6484375, -2.54296875, -2.4375, -2.33203125, -2.2265625, -2.12109375, -2.015625, -1.91015625, -1.8046875, -1.69921875, -1.59375, -1.48828125, -1.3828125, -1.27734375, -1.171875, -1.06640625, -0.9609375, -0.85546875, -0.75, -0.64453125, -0.5390625, -0.43359375, -0.328125, -0.22265625, -0.1171875, -0.01171875, 0.09375, 0.19921875, 0.3046875, 0.41015625, 0.515625, 0.62109375, 0.7265625, 0.83203125, 0.9375, 1.04296875, 1.1484375, 1.25390625, 1.359375, 1.46484375, 1.5703125, 1.67578125, 1.78125, 1.88671875, 1.9921875, 2.09765625, 2.203125, 2.30859375, 2.4140625, 2.51953125, 2.625, 2.73046875, 2.8359375, 2.94140625, 3.046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 11.0, 9.0, 18.0, 18.0, 28.0, 51.0, 77.0, 105.0, 147.0, 183.0, 282.0, 424.0, 617.0, 938.0, 1406.0, 2074.0, 3115.0, 4703.0, 7198.0, 10773.0, 16309.0, 24464.0, 36473.0, 54621.0, 80096.0, 114811.0, 235153.0, 1113356.0, 122663.0, 87252.0, 59554.0, 39981.0, 26921.0, 17926.0, 11813.0, 7924.0, 5216.0, 3413.0, 2253.0, 1575.0, 1053.0, 681.0, 473.0, 313.0, 231.0, 145.0, 94.0, 62.0, 35.0, 36.0, 18.0, 13.0, 8.0, 8.0, 6.0, 8.0, 3.0, 1.0], "bins": [-0.32763671875, -0.31774139404296875, -0.3078460693359375, -0.29795074462890625, -0.288055419921875, -0.27816009521484375, -0.2682647705078125, -0.25836944580078125, -0.24847412109375, -0.23857879638671875, -0.2286834716796875, -0.21878814697265625, -0.208892822265625, -0.19899749755859375, -0.1891021728515625, -0.17920684814453125, -0.1693115234375, -0.15941619873046875, -0.1495208740234375, -0.13962554931640625, -0.129730224609375, -0.11983489990234375, -0.1099395751953125, -0.10004425048828125, -0.09014892578125, -0.08025360107421875, -0.0703582763671875, -0.06046295166015625, -0.050567626953125, -0.04067230224609375, -0.0307769775390625, -0.02088165283203125, -0.010986328125, -0.00109100341796875, 0.0088043212890625, 0.01869964599609375, 0.028594970703125, 0.03849029541015625, 0.0483856201171875, 0.05828094482421875, 0.06817626953125, 0.07807159423828125, 0.0879669189453125, 0.09786224365234375, 0.107757568359375, 0.11765289306640625, 0.1275482177734375, 0.13744354248046875, 0.1473388671875, 0.15723419189453125, 0.1671295166015625, 0.17702484130859375, 0.186920166015625, 0.19681549072265625, 0.2067108154296875, 0.21660614013671875, 0.22650146484375, 0.23639678955078125, 0.2462921142578125, 0.25618743896484375, 0.266082763671875, 0.27597808837890625, 0.2858734130859375, 0.29576873779296875, 0.3056640625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 5.0, 12.0, 9.0, 12.0, 15.0, 24.0, 25.0, 33.0, 34.0, 45.0, 80.0, 74.0, 100.0, 105.0, 99.0, 61.0, 40.0, 37.0, 44.0, 21.0, 19.0, 13.0, 9.0, 10.0, 9.0, 9.0, 10.0, 3.0, 5.0, 5.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0106201171875, -0.01029050350189209, -0.00996088981628418, -0.00963127613067627, -0.00930166244506836, -0.00897204875946045, -0.008642435073852539, -0.008312821388244629, -0.007983207702636719, -0.007653594017028809, -0.0073239803314208984, -0.006994366645812988, -0.006664752960205078, -0.006335139274597168, -0.006005525588989258, -0.005675911903381348, -0.0053462982177734375, -0.005016684532165527, -0.004687070846557617, -0.004357457160949707, -0.004027843475341797, -0.0036982297897338867, -0.0033686161041259766, -0.0030390024185180664, -0.0027093887329101562, -0.002379775047302246, -0.002050161361694336, -0.0017205476760864258, -0.0013909339904785156, -0.0010613203048706055, -0.0007317066192626953, -0.00040209293365478516, -7.2479248046875e-05, 0.00025713443756103516, 0.0005867481231689453, 0.0009163618087768555, 0.0012459754943847656, 0.0015755891799926758, 0.001905202865600586, 0.002234816551208496, 0.0025644302368164062, 0.0028940439224243164, 0.0032236576080322266, 0.0035532712936401367, 0.003882884979248047, 0.004212498664855957, 0.004542112350463867, 0.004871726036071777, 0.0052013397216796875, 0.005530953407287598, 0.005860567092895508, 0.006190180778503418, 0.006519794464111328, 0.006849408149719238, 0.0071790218353271484, 0.007508635520935059, 0.007838249206542969, 0.008167862892150879, 0.008497476577758789, 0.0088270902633667, 0.00915670394897461, 0.00948631763458252, 0.00981593132019043, 0.01014554500579834, 0.01047515869140625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 7.0, 6.0, 7.0, 10.0, 13.0, 16.0, 23.0, 29.0, 23.0, 30.0, 34.0, 67.0, 88.0, 143.0, 176.0, 283.0, 543.0, 2707.0, 983789.0, 58184.0, 1042.0, 462.0, 240.0, 133.0, 123.0, 78.0, 67.0, 43.0, 44.0, 27.0, 19.0, 14.0, 7.0, 10.0, 3.0, 7.0, 12.0, 5.0, 3.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1812744140625, -0.17557334899902344, -0.16987228393554688, -0.1641712188720703, -0.15847015380859375, -0.1527690887451172, -0.14706802368164062, -0.14136695861816406, -0.1356658935546875, -0.12996482849121094, -0.12426376342773438, -0.11856269836425781, -0.11286163330078125, -0.10716056823730469, -0.10145950317382812, -0.09575843811035156, -0.090057373046875, -0.08435630798339844, -0.07865524291992188, -0.07295417785644531, -0.06725311279296875, -0.06155204772949219, -0.055850982666015625, -0.05014991760253906, -0.0444488525390625, -0.03874778747558594, -0.033046722412109375, -0.027345657348632812, -0.02164459228515625, -0.015943527221679688, -0.010242462158203125, -0.0045413970947265625, 0.00115966796875, 0.0068607330322265625, 0.012561798095703125, 0.018262863159179688, 0.02396392822265625, 0.029664993286132812, 0.035366058349609375, 0.04106712341308594, 0.0467681884765625, 0.05246925354003906, 0.058170318603515625, 0.06387138366699219, 0.06957244873046875, 0.07527351379394531, 0.08097457885742188, 0.08667564392089844, 0.092376708984375, 0.09807777404785156, 0.10377883911132812, 0.10947990417480469, 0.11518096923828125, 0.12088203430175781, 0.12658309936523438, 0.13228416442871094, 0.1379852294921875, 0.14368629455566406, 0.14938735961914062, 0.1550884246826172, 0.16078948974609375, 0.1664905548095703, 0.17219161987304688, 0.17789268493652344, 0.18359375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 149.0, 851.0, 17.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022697191685438156, -0.0202452652156353, -0.017793338745832443, -0.015341412276029587, -0.01288948580622673, -0.010437559336423874, -0.007985632866621017, -0.005533706396818161, -0.0030817799270153046, -0.0006298534572124481, 0.0018220730125904083, 0.004273999482393265, 0.006725925952196121, 0.009177852421998978, 0.011629778891801834, 0.01408170536160469, 0.016533631831407547, 0.018985558301210403, 0.02143748477101326, 0.023889411240816116, 0.026341337710618973, 0.02879326418042183, 0.031245190650224686, 0.03369711712002754, 0.0361490435898304, 0.038600970059633255, 0.04105289652943611, 0.04350482299923897, 0.045956749469041824, 0.04840867593884468, 0.05086060240864754, 0.053312528878450394, 0.05576445162296295, 0.05821637809276581, 0.060668304562568665, 0.06312023103237152, 0.06557215750217438, 0.06802408397197723, 0.07047601044178009, 0.07292793691158295, 0.0753798633813858, 0.07783178985118866, 0.08028371632099152, 0.08273564279079437, 0.08518756926059723, 0.08763949573040009, 0.09009142220020294, 0.0925433486700058, 0.09499527513980865, 0.09744720160961151, 0.09989912807941437, 0.10235105454921722, 0.10480298101902008, 0.10725490748882294, 0.1097068339586258, 0.11215876042842865, 0.1146106868982315, 0.11706261336803436, 0.11951453983783722, 0.12196646630764008, 0.12441839277744293, 0.1268703192472458, 0.12932224571704865, 0.1317741721868515, 0.13422609865665436]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 6.0, 2.0, 7.0, 13.0, 9.0, 16.0, 21.0, 25.0, 27.0, 31.0, 36.0, 25.0, 42.0, 55.0, 45.0, 48.0, 53.0, 59.0, 42.0, 49.0, 44.0, 46.0, 39.0, 39.0, 28.0, 30.0, 32.0, 26.0, 27.0, 20.0, 15.0, 10.0, 5.0, 10.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.008723914623260498, -0.008495654910802841, -0.008267395198345184, -0.008039135485887527, -0.007810875773429871, -0.007582616060972214, -0.007354356348514557, -0.0071260966360569, -0.006897836923599243, -0.006669577211141586, -0.0064413174986839294, -0.006213057786226273, -0.005984798073768616, -0.005756538361310959, -0.005528278648853302, -0.005300018936395645, -0.005071759223937988, -0.004843499511480331, -0.0046152397990226746, -0.004386980086565018, -0.004158720374107361, -0.003930460661649704, -0.003702200949192047, -0.0034739412367343903, -0.0032456815242767334, -0.0030174218118190765, -0.0027891620993614197, -0.002560902386903763, -0.002332642674446106, -0.002104382961988449, -0.0018761232495307922, -0.0016478635370731354, -0.0014196038246154785, -0.0011913441121578217, -0.0009630843997001648, -0.0007348246872425079, -0.0005065649747848511, -0.0002783052623271942, -5.0045549869537354e-05, 0.0001782141625881195, 0.00040647387504577637, 0.0006347335875034332, 0.0008629932999610901, 0.001091253012418747, 0.0013195127248764038, 0.0015477724373340607, 0.0017760321497917175, 0.0020042918622493744, 0.0022325515747070312, 0.002460811287164688, 0.002689070999622345, 0.002917330712080002, 0.0031455904245376587, 0.0033738501369953156, 0.0036021098494529724, 0.0038303695619106293, 0.004058629274368286, 0.004286888986825943, 0.0045151486992836, 0.004743408411741257, 0.004971668124198914, 0.0051999278366565704, 0.005428187549114227, 0.005656447261571884, 0.005884706974029541]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 6.0, 13.0, 7.0, 12.0, 16.0, 21.0, 21.0, 25.0, 24.0, 29.0, 27.0, 26.0, 43.0, 35.0, 40.0, 32.0, 30.0, 38.0, 37.0, 44.0, 40.0, 33.0, 33.0, 29.0, 32.0, 33.0, 33.0, 20.0, 29.0, 27.0, 24.0, 14.0, 17.0, 15.0, 8.0, 11.0, 12.0, 11.0, 8.0, 2.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.80859375, -4.66168212890625, -4.5147705078125, -4.36785888671875, -4.220947265625, -4.07403564453125, -3.9271240234375, -3.78021240234375, -3.63330078125, -3.48638916015625, -3.3394775390625, -3.19256591796875, -3.045654296875, -2.89874267578125, -2.7518310546875, -2.60491943359375, -2.4580078125, -2.31109619140625, -2.1641845703125, -2.01727294921875, -1.870361328125, -1.72344970703125, -1.5765380859375, -1.42962646484375, -1.28271484375, -1.13580322265625, -0.9888916015625, -0.84197998046875, -0.695068359375, -0.54815673828125, -0.4012451171875, -0.25433349609375, -0.107421875, 0.03948974609375, 0.1864013671875, 0.33331298828125, 0.480224609375, 0.62713623046875, 0.7740478515625, 0.92095947265625, 1.06787109375, 1.21478271484375, 1.3616943359375, 1.50860595703125, 1.655517578125, 1.80242919921875, 1.9493408203125, 2.09625244140625, 2.2431640625, 2.39007568359375, 2.5369873046875, 2.68389892578125, 2.830810546875, 2.97772216796875, 3.1246337890625, 3.27154541015625, 3.41845703125, 3.56536865234375, 3.7122802734375, 3.85919189453125, 4.006103515625, 4.15301513671875, 4.2999267578125, 4.44683837890625, 4.59375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 6.0, 6.0, 5.0, 10.0, 17.0, 12.0, 20.0, 23.0, 30.0, 44.0, 71.0, 92.0, 104.0, 127.0, 163.0, 218.0, 278.0, 383.0, 486.0, 621.0, 825.0, 1197.0, 1887.0, 4153.0, 14596.0, 63164.0, 250795.0, 471102.0, 176484.0, 42376.0, 10042.0, 3233.0, 1629.0, 1083.0, 756.0, 605.0, 424.0, 343.0, 265.0, 197.0, 180.0, 109.0, 96.0, 70.0, 57.0, 48.0, 27.0, 24.0, 20.0, 16.0, 17.0, 10.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8671875, -8.58447265625, -8.3017578125, -8.01904296875, -7.736328125, -7.45361328125, -7.1708984375, -6.88818359375, -6.60546875, -6.32275390625, -6.0400390625, -5.75732421875, -5.474609375, -5.19189453125, -4.9091796875, -4.62646484375, -4.34375, -4.06103515625, -3.7783203125, -3.49560546875, -3.212890625, -2.93017578125, -2.6474609375, -2.36474609375, -2.08203125, -1.79931640625, -1.5166015625, -1.23388671875, -0.951171875, -0.66845703125, -0.3857421875, -0.10302734375, 0.1796875, 0.46240234375, 0.7451171875, 1.02783203125, 1.310546875, 1.59326171875, 1.8759765625, 2.15869140625, 2.44140625, 2.72412109375, 3.0068359375, 3.28955078125, 3.572265625, 3.85498046875, 4.1376953125, 4.42041015625, 4.703125, 4.98583984375, 5.2685546875, 5.55126953125, 5.833984375, 6.11669921875, 6.3994140625, 6.68212890625, 6.96484375, 7.24755859375, 7.5302734375, 7.81298828125, 8.095703125, 8.37841796875, 8.6611328125, 8.94384765625, 9.2265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 10.0, 10.0, 17.0, 20.0, 19.0, 17.0, 22.0, 28.0, 39.0, 48.0, 46.0, 82.0, 107.0, 161.0, 327.0, 1368.0, 179.0, 116.0, 71.0, 60.0, 45.0, 41.0, 28.0, 33.0, 30.0, 22.0, 23.0, 8.0, 9.0, 6.0, 5.0, 8.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.1015625, -13.67529296875, -13.2490234375, -12.82275390625, -12.396484375, -11.97021484375, -11.5439453125, -11.11767578125, -10.69140625, -10.26513671875, -9.8388671875, -9.41259765625, -8.986328125, -8.56005859375, -8.1337890625, -7.70751953125, -7.28125, -6.85498046875, -6.4287109375, -6.00244140625, -5.576171875, -5.14990234375, -4.7236328125, -4.29736328125, -3.87109375, -3.44482421875, -3.0185546875, -2.59228515625, -2.166015625, -1.73974609375, -1.3134765625, -0.88720703125, -0.4609375, -0.03466796875, 0.3916015625, 0.81787109375, 1.244140625, 1.67041015625, 2.0966796875, 2.52294921875, 2.94921875, 3.37548828125, 3.8017578125, 4.22802734375, 4.654296875, 5.08056640625, 5.5068359375, 5.93310546875, 6.359375, 6.78564453125, 7.2119140625, 7.63818359375, 8.064453125, 8.49072265625, 8.9169921875, 9.34326171875, 9.76953125, 10.19580078125, 10.6220703125, 11.04833984375, 11.474609375, 11.90087890625, 12.3271484375, 12.75341796875, 13.1796875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 9.0, 10.0, 19.0, 22.0, 14.0, 40.0, 38.0, 41.0, 78.0, 109.0, 153.0, 260.0, 370.0, 636.0, 1355.0, 6242.0, 3124873.0, 8155.0, 1397.0, 682.0, 359.0, 244.0, 168.0, 103.0, 77.0, 61.0, 41.0, 29.0, 18.0, 17.0, 15.0, 10.0, 8.0, 7.0, 7.0, 5.0, 2.0, 6.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.28125, -46.64599609375, -45.0107421875, -43.37548828125, -41.740234375, -40.10498046875, -38.4697265625, -36.83447265625, -35.19921875, -33.56396484375, -31.9287109375, -30.29345703125, -28.658203125, -27.02294921875, -25.3876953125, -23.75244140625, -22.1171875, -20.48193359375, -18.8466796875, -17.21142578125, -15.576171875, -13.94091796875, -12.3056640625, -10.67041015625, -9.03515625, -7.39990234375, -5.7646484375, -4.12939453125, -2.494140625, -0.85888671875, 0.7763671875, 2.41162109375, 4.046875, 5.68212890625, 7.3173828125, 8.95263671875, 10.587890625, 12.22314453125, 13.8583984375, 15.49365234375, 17.12890625, 18.76416015625, 20.3994140625, 22.03466796875, 23.669921875, 25.30517578125, 26.9404296875, 28.57568359375, 30.2109375, 31.84619140625, 33.4814453125, 35.11669921875, 36.751953125, 38.38720703125, 40.0224609375, 41.65771484375, 43.29296875, 44.92822265625, 46.5634765625, 48.19873046875, 49.833984375, 51.46923828125, 53.1044921875, 54.73974609375, 56.375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 42.0, 146.0, 272.0, 298.0, 165.0, 50.0, 23.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.94337463378906, -49.07318115234375, -47.2029914855957, -45.33279800415039, -43.462608337402344, -41.59241485595703, -39.722225189208984, -37.85203170776367, -35.981842041015625, -34.11164855957031, -32.241458892822266, -30.371267318725586, -28.501075744628906, -26.630882263183594, -24.760692596435547, -22.890499114990234, -21.020307540893555, -19.150115966796875, -17.279924392700195, -15.409732818603516, -13.539541244506836, -11.66934871673584, -9.79915714263916, -7.9289655685424805, -6.058773994445801, -4.188582420349121, -2.3183906078338623, -0.4481987953186035, 1.4219927787780762, 3.292184829711914, 5.162376403808594, 7.032567977905273, 8.902759552001953, 10.772951126098633, 12.643142700195312, 14.513334274291992, 16.383525848388672, 18.253719329833984, 20.12390899658203, 21.994102478027344, 23.86429214477539, 25.73448371887207, 27.60467529296875, 29.47486686706543, 31.34505844116211, 33.21525192260742, 35.08544158935547, 36.95563507080078, 38.825828552246094, 40.696022033691406, 42.56621170043945, 44.436405181884766, 46.30659484863281, 48.176788330078125, 50.04697799682617, 51.917171478271484, 53.78736114501953, 55.657554626464844, 57.52774429321289, 59.3979377746582, 61.26812744140625, 63.13832092285156, 65.00851440429688, 66.87870025634766, 68.74889373779297]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 7.0, 12.0, 14.0, 7.0, 12.0, 12.0, 20.0, 26.0, 22.0, 22.0, 39.0, 35.0, 38.0, 44.0, 38.0, 43.0, 53.0, 45.0, 44.0, 34.0, 37.0, 41.0, 30.0, 33.0, 40.0, 39.0, 43.0, 31.0, 24.0, 19.0, 24.0, 15.0, 16.0, 9.0, 6.0, 10.0, 5.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-41.3906364440918, -40.25326919555664, -39.115901947021484, -37.97853469848633, -36.84116744995117, -35.703800201416016, -34.56643295288086, -33.42906188964844, -32.29169464111328, -31.154327392578125, -30.01696014404297, -28.879592895507812, -27.742225646972656, -26.6048583984375, -25.46748924255371, -24.330121994018555, -23.19275665283203, -22.055389404296875, -20.91802215576172, -19.780654907226562, -18.643287658691406, -17.50592041015625, -16.36855125427246, -15.231184005737305, -14.093816757202148, -12.956449508666992, -11.819082260131836, -10.681714057922363, -9.544346809387207, -8.40697956085205, -7.269611835479736, -6.132244110107422, -4.994876861572266, -3.8575093746185303, -2.720141887664795, -1.5827744007110596, -0.4454069137573242, 0.691960334777832, 1.8293280601501465, 2.966695785522461, 4.104063034057617, 5.241430282592773, 6.378798007965088, 7.516165733337402, 8.653532981872559, 9.790900230407715, 10.928268432617188, 12.065635681152344, 13.2030029296875, 14.340370178222656, 15.477737426757812, 16.61510467529297, 17.752471923828125, 18.88983917236328, 20.02720832824707, 21.164575576782227, 22.301942825317383, 23.43931007385254, 24.576677322387695, 25.71404457092285, 26.85141372680664, 27.988780975341797, 29.126148223876953, 30.26351547241211, 31.400882720947266]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 7.0, 11.0, 7.0, 15.0, 8.0, 11.0, 15.0, 17.0, 22.0, 26.0, 30.0, 31.0, 32.0, 39.0, 40.0, 36.0, 32.0, 43.0, 35.0, 38.0, 38.0, 40.0, 39.0, 30.0, 39.0, 36.0, 24.0, 35.0, 31.0, 24.0, 22.0, 21.0, 22.0, 18.0, 11.0, 21.0, 11.0, 6.0, 5.0, 5.0, 6.0, 5.0, 9.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.15234375, -4.9964599609375, -4.840576171875, -4.6846923828125, -4.52880859375, -4.3729248046875, -4.217041015625, -4.0611572265625, -3.9052734375, -3.7493896484375, -3.593505859375, -3.4376220703125, -3.28173828125, -3.1258544921875, -2.969970703125, -2.8140869140625, -2.658203125, -2.5023193359375, -2.346435546875, -2.1905517578125, -2.03466796875, -1.8787841796875, -1.722900390625, -1.5670166015625, -1.4111328125, -1.2552490234375, -1.099365234375, -0.9434814453125, -0.78759765625, -0.6317138671875, -0.475830078125, -0.3199462890625, -0.1640625, -0.0081787109375, 0.147705078125, 0.3035888671875, 0.45947265625, 0.6153564453125, 0.771240234375, 0.9271240234375, 1.0830078125, 1.2388916015625, 1.394775390625, 1.5506591796875, 1.70654296875, 1.8624267578125, 2.018310546875, 2.1741943359375, 2.330078125, 2.4859619140625, 2.641845703125, 2.7977294921875, 2.95361328125, 3.1094970703125, 3.265380859375, 3.4212646484375, 3.5771484375, 3.7330322265625, 3.888916015625, 4.0447998046875, 4.20068359375, 4.3565673828125, 4.512451171875, 4.6683349609375, 4.82421875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 15.0, 11.0, 28.0, 37.0, 43.0, 64.0, 112.0, 199.0, 302.0, 594.0, 1087.0, 2038.0, 4186.0, 10357.0, 30976.0, 152383.0, 839023.0, 2063722.0, 879344.0, 157613.0, 32730.0, 10672.0, 4291.0, 1926.0, 1076.0, 580.0, 328.0, 205.0, 123.0, 71.0, 44.0, 30.0, 18.0, 19.0, 9.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.515625, -8.26153564453125, -8.0074462890625, -7.75335693359375, -7.499267578125, -7.24517822265625, -6.9910888671875, -6.73699951171875, -6.48291015625, -6.22882080078125, -5.9747314453125, -5.72064208984375, -5.466552734375, -5.21246337890625, -4.9583740234375, -4.70428466796875, -4.4501953125, -4.19610595703125, -3.9420166015625, -3.68792724609375, -3.433837890625, -3.17974853515625, -2.9256591796875, -2.67156982421875, -2.41748046875, -2.16339111328125, -1.9093017578125, -1.65521240234375, -1.401123046875, -1.14703369140625, -0.8929443359375, -0.63885498046875, -0.384765625, -0.13067626953125, 0.1234130859375, 0.37750244140625, 0.631591796875, 0.88568115234375, 1.1397705078125, 1.39385986328125, 1.64794921875, 1.90203857421875, 2.1561279296875, 2.41021728515625, 2.664306640625, 2.91839599609375, 3.1724853515625, 3.42657470703125, 3.6806640625, 3.93475341796875, 4.1888427734375, 4.44293212890625, 4.697021484375, 4.95111083984375, 5.2052001953125, 5.45928955078125, 5.71337890625, 5.96746826171875, 6.2215576171875, 6.47564697265625, 6.729736328125, 6.98382568359375, 7.2379150390625, 7.49200439453125, 7.74609375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 5.0, 9.0, 16.0, 24.0, 26.0, 39.0, 46.0, 55.0, 80.0, 103.0, 129.0, 191.0, 240.0, 297.0, 448.0, 519.0, 459.0, 336.0, 254.0, 159.0, 158.0, 116.0, 85.0, 65.0, 50.0, 39.0, 31.0, 28.0, 16.0, 10.0, 14.0, 7.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.421875, -7.142822265625, -6.86376953125, -6.584716796875, -6.3056640625, -6.026611328125, -5.74755859375, -5.468505859375, -5.189453125, -4.910400390625, -4.63134765625, -4.352294921875, -4.0732421875, -3.794189453125, -3.51513671875, -3.236083984375, -2.95703125, -2.677978515625, -2.39892578125, -2.119873046875, -1.8408203125, -1.561767578125, -1.28271484375, -1.003662109375, -0.724609375, -0.445556640625, -0.16650390625, 0.112548828125, 0.3916015625, 0.670654296875, 0.94970703125, 1.228759765625, 1.5078125, 1.786865234375, 2.06591796875, 2.344970703125, 2.6240234375, 2.903076171875, 3.18212890625, 3.461181640625, 3.740234375, 4.019287109375, 4.29833984375, 4.577392578125, 4.8564453125, 5.135498046875, 5.41455078125, 5.693603515625, 5.97265625, 6.251708984375, 6.53076171875, 6.809814453125, 7.0888671875, 7.367919921875, 7.64697265625, 7.926025390625, 8.205078125, 8.484130859375, 8.76318359375, 9.042236328125, 9.3212890625, 9.600341796875, 9.87939453125, 10.158447265625, 10.4375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 3.0, 3.0, 12.0, 6.0, 19.0, 21.0, 41.0, 56.0, 60.0, 112.0, 178.0, 281.0, 486.0, 805.0, 1669.0, 4903.0, 35532.0, 613371.0, 3251050.0, 261274.0, 18031.0, 3319.0, 1325.0, 645.0, 365.0, 230.0, 156.0, 113.0, 81.0, 55.0, 28.0, 15.0, 11.0, 10.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140625, -16.6417236328125, -16.142822265625, -15.6439208984375, -15.14501953125, -14.6461181640625, -14.147216796875, -13.6483154296875, -13.1494140625, -12.6505126953125, -12.151611328125, -11.6527099609375, -11.15380859375, -10.6549072265625, -10.156005859375, -9.6571044921875, -9.158203125, -8.6593017578125, -8.160400390625, -7.6614990234375, -7.16259765625, -6.6636962890625, -6.164794921875, -5.6658935546875, -5.1669921875, -4.6680908203125, -4.169189453125, -3.6702880859375, -3.17138671875, -2.6724853515625, -2.173583984375, -1.6746826171875, -1.17578125, -0.6768798828125, -0.177978515625, 0.3209228515625, 0.81982421875, 1.3187255859375, 1.817626953125, 2.3165283203125, 2.8154296875, 3.3143310546875, 3.813232421875, 4.3121337890625, 4.81103515625, 5.3099365234375, 5.808837890625, 6.3077392578125, 6.806640625, 7.3055419921875, 7.804443359375, 8.3033447265625, 8.80224609375, 9.3011474609375, 9.800048828125, 10.2989501953125, 10.7978515625, 11.2967529296875, 11.795654296875, 12.2945556640625, 12.79345703125, 13.2923583984375, 13.791259765625, 14.2901611328125, 14.7890625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 213.0, 772.0, 27.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-502.45086669921875, -492.8404541015625, -483.23004150390625, -473.6195983886719, -464.0091857910156, -454.3987731933594, -444.7883605957031, -435.17791748046875, -425.5675048828125, -415.95709228515625, -406.3466796875, -396.7362365722656, -387.1258239746094, -377.5154113769531, -367.9049987792969, -358.2945556640625, -348.68414306640625, -339.07373046875, -329.46331787109375, -319.8528747558594, -310.2424621582031, -300.6320495605469, -291.0216369628906, -281.41119384765625, -271.8008117675781, -262.1903991699219, -252.57997131347656, -242.9695587158203, -233.359130859375, -223.74871826171875, -214.1383056640625, -204.5278778076172, -194.91744995117188, -185.30703735351562, -175.6966094970703, -166.08619689941406, -156.47576904296875, -146.8653564453125, -137.25494384765625, -127.64451599121094, -118.03410339355469, -108.4236831665039, -98.81326293945312, -89.20285034179688, -79.59242248535156, -69.98200988769531, -60.37158966064453, -50.76116943359375, -41.15074920654297, -31.540328979492188, -21.92991065979004, -12.31949234008789, -2.7090721130371094, 6.901348114013672, 16.511764526367188, 26.12218475341797, 35.73260498046875, 45.34302520751953, 54.95344543457031, 64.56385803222656, 74.17428588867188, 83.78469848632812, 93.3951187133789, 103.00553894042969, 112.61595916748047]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 11.0, 4.0, 2.0, 18.0, 12.0, 18.0, 21.0, 19.0, 22.0, 16.0, 28.0, 27.0, 32.0, 32.0, 37.0, 38.0, 45.0, 42.0, 32.0, 42.0, 44.0, 26.0, 25.0, 33.0, 24.0, 42.0, 27.0, 32.0, 40.0, 24.0, 22.0, 22.0, 27.0, 20.0, 15.0, 15.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-30.332887649536133, -29.39901351928711, -28.465139389038086, -27.531265258789062, -26.59739112854004, -25.663516998291016, -24.729644775390625, -23.79576873779297, -22.861896514892578, -21.928022384643555, -20.99414825439453, -20.060274124145508, -19.126399993896484, -18.19252586364746, -17.258651733398438, -16.324779510498047, -15.39090347290039, -14.457029342651367, -13.523155212402344, -12.58928108215332, -11.655406951904297, -10.721532821655273, -9.787659645080566, -8.853785514831543, -7.9199113845825195, -6.986037254333496, -6.052163124084473, -5.118289470672607, -4.184415340423584, -3.2505412101745605, -2.3166675567626953, -1.3827934265136719, -0.4489173889160156, 0.48495662212371826, 1.4188306331634521, 2.3527045249938965, 3.28657865524292, 4.220452785491943, 5.154326438903809, 6.088200569152832, 7.0220746994018555, 7.955948829650879, 8.889822959899902, 9.82369613647461, 10.757570266723633, 11.691444396972656, 12.62531852722168, 13.559192657470703, 14.493066787719727, 15.42694091796875, 16.360815048217773, 17.294689178466797, 18.22856330871582, 19.162437438964844, 20.096309661865234, 21.03018569946289, 21.96405792236328, 22.897932052612305, 23.831806182861328, 24.76568031311035, 25.699554443359375, 26.6334285736084, 27.567302703857422, 28.501174926757812, 29.43505096435547]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 21.0, 15.0, 15.0, 25.0, 23.0, 22.0, 32.0, 36.0, 42.0, 51.0, 36.0, 52.0, 48.0, 60.0, 56.0, 46.0, 31.0, 50.0, 47.0, 40.0, 34.0, 35.0, 35.0, 19.0, 30.0, 11.0, 17.0, 12.0, 9.0, 6.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.1796875, -5.02783203125, -4.8759765625, -4.72412109375, -4.572265625, -4.42041015625, -4.2685546875, -4.11669921875, -3.96484375, -3.81298828125, -3.6611328125, -3.50927734375, -3.357421875, -3.20556640625, -3.0537109375, -2.90185546875, -2.75, -2.59814453125, -2.4462890625, -2.29443359375, -2.142578125, -1.99072265625, -1.8388671875, -1.68701171875, -1.53515625, -1.38330078125, -1.2314453125, -1.07958984375, -0.927734375, -0.77587890625, -0.6240234375, -0.47216796875, -0.3203125, -0.16845703125, -0.0166015625, 0.13525390625, 0.287109375, 0.43896484375, 0.5908203125, 0.74267578125, 0.89453125, 1.04638671875, 1.1982421875, 1.35009765625, 1.501953125, 1.65380859375, 1.8056640625, 1.95751953125, 2.109375, 2.26123046875, 2.4130859375, 2.56494140625, 2.716796875, 2.86865234375, 3.0205078125, 3.17236328125, 3.32421875, 3.47607421875, 3.6279296875, 3.77978515625, 3.931640625, 4.08349609375, 4.2353515625, 4.38720703125, 4.5390625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 6.0, 15.0, 24.0, 33.0, 40.0, 59.0, 86.0, 123.0, 196.0, 269.0, 426.0, 623.0, 1019.0, 1513.0, 2324.0, 3890.0, 6016.0, 9648.0, 15784.0, 26389.0, 44503.0, 76195.0, 130555.0, 199063.0, 201225.0, 133936.0, 78531.0, 45755.0, 27100.0, 16118.0, 10025.0, 6124.0, 3849.0, 2486.0, 1530.0, 1037.0, 664.0, 430.0, 301.0, 173.0, 166.0, 105.0, 58.0, 50.0, 23.0, 15.0, 14.0, 16.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.43359375, -0.4200553894042969, -0.40651702880859375, -0.3929786682128906, -0.3794403076171875, -0.3659019470214844, -0.35236358642578125, -0.3388252258300781, -0.325286865234375, -0.3117485046386719, -0.29821014404296875, -0.2846717834472656, -0.2711334228515625, -0.2575950622558594, -0.24405670166015625, -0.23051834106445312, -0.21697998046875, -0.20344161987304688, -0.18990325927734375, -0.17636489868164062, -0.1628265380859375, -0.14928817749023438, -0.13574981689453125, -0.12221145629882812, -0.108673095703125, -0.09513473510742188, -0.08159637451171875, -0.06805801391601562, -0.0545196533203125, -0.040981292724609375, -0.02744293212890625, -0.013904571533203125, -0.0003662109375, 0.013172149658203125, 0.02671051025390625, 0.040248870849609375, 0.0537872314453125, 0.06732559204101562, 0.08086395263671875, 0.09440231323242188, 0.107940673828125, 0.12147903442382812, 0.13501739501953125, 0.14855575561523438, 0.1620941162109375, 0.17563247680664062, 0.18917083740234375, 0.20270919799804688, 0.21624755859375, 0.22978591918945312, 0.24332427978515625, 0.2568626403808594, 0.2704010009765625, 0.2839393615722656, 0.29747772216796875, 0.3110160827636719, 0.324554443359375, 0.3380928039550781, 0.35163116455078125, 0.3651695251464844, 0.3787078857421875, 0.3922462463378906, 0.40578460693359375, 0.4193229675292969, 0.432861328125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 9.0, 6.0, 10.0, 14.0, 17.0, 25.0, 16.0, 27.0, 30.0, 23.0, 35.0, 35.0, 35.0, 53.0, 44.0, 52.0, 46.0, 1060.0, 37.0, 50.0, 44.0, 60.0, 38.0, 34.0, 25.0, 41.0, 25.0, 27.0, 16.0, 26.0, 14.0, 8.0, 9.0, 6.0, 7.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.55078125, -3.451629638671875, -3.35247802734375, -3.253326416015625, -3.1541748046875, -3.055023193359375, -2.95587158203125, -2.856719970703125, -2.757568359375, -2.658416748046875, -2.55926513671875, -2.460113525390625, -2.3609619140625, -2.261810302734375, -2.16265869140625, -2.063507080078125, -1.96435546875, -1.865203857421875, -1.76605224609375, -1.666900634765625, -1.5677490234375, -1.468597412109375, -1.36944580078125, -1.270294189453125, -1.171142578125, -1.071990966796875, -0.97283935546875, -0.873687744140625, -0.7745361328125, -0.675384521484375, -0.57623291015625, -0.477081298828125, -0.3779296875, -0.278778076171875, -0.17962646484375, -0.080474853515625, 0.0186767578125, 0.117828369140625, 0.21697998046875, 0.316131591796875, 0.415283203125, 0.514434814453125, 0.61358642578125, 0.712738037109375, 0.8118896484375, 0.911041259765625, 1.01019287109375, 1.109344482421875, 1.20849609375, 1.307647705078125, 1.40679931640625, 1.505950927734375, 1.6051025390625, 1.704254150390625, 1.80340576171875, 1.902557373046875, 2.001708984375, 2.100860595703125, 2.20001220703125, 2.299163818359375, 2.3983154296875, 2.497467041015625, 2.59661865234375, 2.695770263671875, 2.794921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 7.0, 6.0, 18.0, 20.0, 26.0, 44.0, 60.0, 74.0, 114.0, 191.0, 274.0, 410.0, 561.0, 805.0, 1161.0, 1691.0, 2413.0, 3517.0, 5120.0, 7295.0, 10727.0, 15748.0, 22775.0, 32962.0, 46819.0, 65056.0, 88727.0, 116395.0, 1172310.0, 142427.0, 101853.0, 75621.0, 55439.0, 38931.0, 27412.0, 18811.0, 12774.0, 8946.0, 6080.0, 4108.0, 2907.0, 1954.0, 1408.0, 932.0, 714.0, 460.0, 330.0, 226.0, 148.0, 106.0, 71.0, 51.0, 30.0, 28.0, 17.0, 14.0, 3.0, 10.0, 4.0, 2.0, 1.0], "bins": [-0.228759765625, -0.22155380249023438, -0.21434783935546875, -0.20714187622070312, -0.1999359130859375, -0.19272994995117188, -0.18552398681640625, -0.17831802368164062, -0.171112060546875, -0.16390609741210938, -0.15670013427734375, -0.14949417114257812, -0.1422882080078125, -0.13508224487304688, -0.12787628173828125, -0.12067031860351562, -0.11346435546875, -0.10625839233398438, -0.09905242919921875, -0.09184646606445312, -0.0846405029296875, -0.07743453979492188, -0.07022857666015625, -0.06302261352539062, -0.055816650390625, -0.048610687255859375, -0.04140472412109375, -0.034198760986328125, -0.0269927978515625, -0.019786834716796875, -0.01258087158203125, -0.005374908447265625, 0.0018310546875, 0.009037017822265625, 0.01624298095703125, 0.023448944091796875, 0.0306549072265625, 0.037860870361328125, 0.04506683349609375, 0.052272796630859375, 0.059478759765625, 0.06668472290039062, 0.07389068603515625, 0.08109664916992188, 0.0883026123046875, 0.09550857543945312, 0.10271453857421875, 0.10992050170898438, 0.11712646484375, 0.12433242797851562, 0.13153839111328125, 0.13874435424804688, 0.1459503173828125, 0.15315628051757812, 0.16036224365234375, 0.16756820678710938, 0.174774169921875, 0.18198013305664062, 0.18918609619140625, 0.19639205932617188, 0.2035980224609375, 0.21080398559570312, 0.21800994873046875, 0.22521591186523438, 0.232421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 6.0, 5.0, 6.0, 7.0, 9.0, 9.0, 7.0, 15.0, 16.0, 28.0, 34.0, 36.0, 53.0, 75.0, 83.0, 104.0, 110.0, 78.0, 76.0, 44.0, 34.0, 29.0, 29.0, 29.0, 16.0, 15.0, 10.0, 12.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00537109375, -0.0051937103271484375, -0.005016326904296875, -0.0048389434814453125, -0.00466156005859375, -0.0044841766357421875, -0.004306793212890625, -0.0041294097900390625, -0.0039520263671875, -0.0037746429443359375, -0.003597259521484375, -0.0034198760986328125, -0.00324249267578125, -0.0030651092529296875, -0.002887725830078125, -0.0027103424072265625, -0.002532958984375, -0.0023555755615234375, -0.002178192138671875, -0.0020008087158203125, -0.00182342529296875, -0.0016460418701171875, -0.001468658447265625, -0.0012912750244140625, -0.0011138916015625, -0.0009365081787109375, -0.000759124755859375, -0.0005817413330078125, -0.00040435791015625, -0.0002269744873046875, -4.9591064453125e-05, 0.0001277923583984375, 0.00030517578125, 0.0004825592041015625, 0.000659942626953125, 0.0008373260498046875, 0.00101470947265625, 0.0011920928955078125, 0.001369476318359375, 0.0015468597412109375, 0.0017242431640625, 0.0019016265869140625, 0.002079010009765625, 0.0022563934326171875, 0.00243377685546875, 0.0026111602783203125, 0.002788543701171875, 0.0029659271240234375, 0.003143310546875, 0.0033206939697265625, 0.003498077392578125, 0.0036754608154296875, 0.00385284423828125, 0.0040302276611328125, 0.004207611083984375, 0.0043849945068359375, 0.0045623779296875, 0.0047397613525390625, 0.004917144775390625, 0.0050945281982421875, 0.00527191162109375, 0.0054492950439453125, 0.005626678466796875, 0.0058040618896484375, 0.0059814453125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 11.0, 11.0, 12.0, 21.0, 25.0, 27.0, 57.0, 67.0, 84.0, 111.0, 141.0, 282.0, 606.0, 4394.0, 977582.0, 62715.0, 1167.0, 436.0, 246.0, 148.0, 106.0, 53.0, 52.0, 38.0, 27.0, 19.0, 22.0, 11.0, 17.0, 10.0, 9.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1065673828125, -0.10341072082519531, -0.10025405883789062, -0.09709739685058594, -0.09394073486328125, -0.09078407287597656, -0.08762741088867188, -0.08447074890136719, -0.0813140869140625, -0.07815742492675781, -0.07500076293945312, -0.07184410095214844, -0.06868743896484375, -0.06553077697753906, -0.062374114990234375, -0.05921745300292969, -0.056060791015625, -0.05290412902832031, -0.049747467041015625, -0.04659080505371094, -0.04343414306640625, -0.04027748107910156, -0.037120819091796875, -0.03396415710449219, -0.0308074951171875, -0.027650833129882812, -0.024494171142578125, -0.021337509155273438, -0.01818084716796875, -0.015024185180664062, -0.011867523193359375, -0.008710861206054688, -0.00555419921875, -0.0023975372314453125, 0.000759124755859375, 0.0039157867431640625, 0.00707244873046875, 0.010229110717773438, 0.013385772705078125, 0.016542434692382812, 0.0196990966796875, 0.022855758666992188, 0.026012420654296875, 0.029169082641601562, 0.03232574462890625, 0.03548240661621094, 0.038639068603515625, 0.04179573059082031, 0.044952392578125, 0.04810905456542969, 0.051265716552734375, 0.05442237854003906, 0.05757904052734375, 0.06073570251464844, 0.06389236450195312, 0.06704902648925781, 0.0702056884765625, 0.07336235046386719, 0.07651901245117188, 0.07967567443847656, 0.08283233642578125, 0.08598899841308594, 0.08914566040039062, 0.09230232238769531, 0.095458984375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 113.0, 895.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015621923841536045, -0.013453865423798561, -0.011285806074738503, -0.009117746725678444, -0.00694968830794096, -0.004781628958880901, -0.0026135705411434174, -0.0004455121234059334, 0.0017225472256541252, 0.0038906061090528965, 0.006058664992451668, 0.008226724341511726, 0.01039478275924921, 0.012562842108309269, 0.014730900526046753, 0.01689895987510681, 0.01906701922416687, 0.02123507857322693, 0.023403137922286987, 0.025571195408701897, 0.027739254757761955, 0.029907314106822014, 0.03207537159323692, 0.03424343094229698, 0.03641149029135704, 0.0385795496404171, 0.04074760898947716, 0.042915668338537216, 0.045083723962306976, 0.047251783311367035, 0.049419842660427094, 0.05158790200948715, 0.05375596135854721, 0.05592402070760727, 0.05809208005666733, 0.060260139405727386, 0.062428198754787445, 0.0645962581038475, 0.06676431745290756, 0.06893236935138702, 0.07110042870044708, 0.07326848804950714, 0.0754365473985672, 0.07760460674762726, 0.07977266609668732, 0.08194072544574738, 0.08410878479480743, 0.08627684414386749, 0.08844490349292755, 0.09061296284198761, 0.09278102219104767, 0.09494908154010773, 0.09711714088916779, 0.09928520023822784, 0.1014532595872879, 0.10362131893634796, 0.10578937828540802, 0.10795743763446808, 0.11012549698352814, 0.1122935563325882, 0.11446161568164825, 0.11662967503070831, 0.11879773437976837, 0.12096579372882843, 0.12313384562730789]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 8.0, 11.0, 21.0, 20.0, 19.0, 54.0, 58.0, 54.0, 65.0, 68.0, 79.0, 68.0, 97.0, 87.0, 64.0, 44.0, 52.0, 38.0, 32.0, 17.0, 12.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007954180240631104, -0.007755565457046032, -0.00755695067346096, -0.007358335889875889, -0.007159721106290817, -0.006961106322705746, -0.006762491539120674, -0.006563876755535603, -0.006365261971950531, -0.0061666471883654594, -0.005968032404780388, -0.005769417621195316, -0.005570802837610245, -0.005372188054025173, -0.005173573270440102, -0.00497495848685503, -0.0047763437032699585, -0.004577728919684887, -0.004379114136099815, -0.004180499352514744, -0.003981884568929672, -0.0037832697853446007, -0.003584655001759529, -0.0033860402181744576, -0.003187425434589386, -0.0029888106510043144, -0.002790195867419243, -0.0025915810838341713, -0.0023929663002490997, -0.002194351516664028, -0.0019957367330789566, -0.001797121949493885, -0.0015985071659088135, -0.001399892382323742, -0.0012012775987386703, -0.0010026628151535988, -0.0008040480315685272, -0.0006054332479834557, -0.0004068184643983841, -0.00020820368081331253, -9.588897228240967e-06, 0.0001890258863568306, 0.00038764066994190216, 0.0005862554535269737, 0.0007848702371120453, 0.0009834850206971169, 0.0011820998042821884, 0.00138071458786726, 0.0015793293714523315, 0.001777944155037403, 0.0019765589386224747, 0.0021751737222075462, 0.002373788505792618, 0.0025724032893776894, 0.002771018072962761, 0.0029696328565478325, 0.003168247640132904, 0.0033668624237179756, 0.003565477207303047, 0.0037640919908881187, 0.00396270677447319, 0.004161321558058262, 0.0043599363416433334, 0.004558551125228405, 0.0047571659088134766]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 21.0, 15.0, 15.0, 25.0, 23.0, 22.0, 32.0, 36.0, 42.0, 51.0, 36.0, 52.0, 48.0, 60.0, 56.0, 46.0, 31.0, 50.0, 48.0, 39.0, 34.0, 35.0, 34.0, 20.0, 30.0, 11.0, 17.0, 12.0, 9.0, 6.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.1796875, -5.02783203125, -4.8759765625, -4.72412109375, -4.572265625, -4.42041015625, -4.2685546875, -4.11669921875, -3.96484375, -3.81298828125, -3.6611328125, -3.50927734375, -3.357421875, -3.20556640625, -3.0537109375, -2.90185546875, -2.75, -2.59814453125, -2.4462890625, -2.29443359375, -2.142578125, -1.99072265625, -1.8388671875, -1.68701171875, -1.53515625, -1.38330078125, -1.2314453125, -1.07958984375, -0.927734375, -0.77587890625, -0.6240234375, -0.47216796875, -0.3203125, -0.16845703125, -0.0166015625, 0.13525390625, 0.287109375, 0.43896484375, 0.5908203125, 0.74267578125, 0.89453125, 1.04638671875, 1.1982421875, 1.35009765625, 1.501953125, 1.65380859375, 1.8056640625, 1.95751953125, 2.109375, 2.26123046875, 2.4130859375, 2.56494140625, 2.716796875, 2.86865234375, 3.0205078125, 3.17236328125, 3.32421875, 3.47607421875, 3.6279296875, 3.77978515625, 3.931640625, 4.08349609375, 4.2353515625, 4.38720703125, 4.5390625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 14.0, 13.0, 24.0, 25.0, 25.0, 49.0, 67.0, 96.0, 136.0, 162.0, 246.0, 363.0, 542.0, 817.0, 1134.0, 1657.0, 2459.0, 4586.0, 16460.0, 177026.0, 734871.0, 86537.0, 10402.0, 3809.0, 2188.0, 1507.0, 993.0, 686.0, 474.0, 311.0, 244.0, 182.0, 122.0, 100.0, 66.0, 46.0, 30.0, 26.0, 17.0, 10.0, 5.0, 6.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.491455078125, -11.10009765625, -10.708740234375, -10.3173828125, -9.926025390625, -9.53466796875, -9.143310546875, -8.751953125, -8.360595703125, -7.96923828125, -7.577880859375, -7.1865234375, -6.795166015625, -6.40380859375, -6.012451171875, -5.62109375, -5.229736328125, -4.83837890625, -4.447021484375, -4.0556640625, -3.664306640625, -3.27294921875, -2.881591796875, -2.490234375, -2.098876953125, -1.70751953125, -1.316162109375, -0.9248046875, -0.533447265625, -0.14208984375, 0.249267578125, 0.640625, 1.031982421875, 1.42333984375, 1.814697265625, 2.2060546875, 2.597412109375, 2.98876953125, 3.380126953125, 3.771484375, 4.162841796875, 4.55419921875, 4.945556640625, 5.3369140625, 5.728271484375, 6.11962890625, 6.510986328125, 6.90234375, 7.293701171875, 7.68505859375, 8.076416015625, 8.4677734375, 8.859130859375, 9.25048828125, 9.641845703125, 10.033203125, 10.424560546875, 10.81591796875, 11.207275390625, 11.5986328125, 11.989990234375, 12.38134765625, 12.772705078125, 13.1640625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 11.0, 4.0, 10.0, 10.0, 4.0, 9.0, 7.0, 16.0, 19.0, 20.0, 21.0, 25.0, 28.0, 33.0, 33.0, 38.0, 71.0, 72.0, 134.0, 238.0, 1468.0, 202.0, 104.0, 71.0, 66.0, 45.0, 36.0, 37.0, 29.0, 26.0, 20.0, 18.0, 17.0, 12.0, 19.0, 8.0, 11.0, 9.0, 8.0, 3.0, 7.0, 5.0, 5.0, 2.0, 2.0, 6.0, 2.0, 2.0, 1.0], "bins": [-10.71875, -10.415283203125, -10.11181640625, -9.808349609375, -9.5048828125, -9.201416015625, -8.89794921875, -8.594482421875, -8.291015625, -7.987548828125, -7.68408203125, -7.380615234375, -7.0771484375, -6.773681640625, -6.47021484375, -6.166748046875, -5.86328125, -5.559814453125, -5.25634765625, -4.952880859375, -4.6494140625, -4.345947265625, -4.04248046875, -3.739013671875, -3.435546875, -3.132080078125, -2.82861328125, -2.525146484375, -2.2216796875, -1.918212890625, -1.61474609375, -1.311279296875, -1.0078125, -0.704345703125, -0.40087890625, -0.097412109375, 0.2060546875, 0.509521484375, 0.81298828125, 1.116455078125, 1.419921875, 1.723388671875, 2.02685546875, 2.330322265625, 2.6337890625, 2.937255859375, 3.24072265625, 3.544189453125, 3.84765625, 4.151123046875, 4.45458984375, 4.758056640625, 5.0615234375, 5.364990234375, 5.66845703125, 5.971923828125, 6.275390625, 6.578857421875, 6.88232421875, 7.185791015625, 7.4892578125, 7.792724609375, 8.09619140625, 8.399658203125, 8.703125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 0.0, 7.0, 9.0, 12.0, 12.0, 19.0, 20.0, 18.0, 29.0, 32.0, 42.0, 63.0, 87.0, 120.0, 168.0, 273.0, 439.0, 749.0, 1740.0, 12778.0, 3117465.0, 8122.0, 1553.0, 676.0, 383.0, 227.0, 179.0, 115.0, 76.0, 70.0, 43.0, 31.0, 35.0, 19.0, 16.0, 11.0, 14.0, 5.0, 8.0, 13.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.125, -32.96630859375, -31.8076171875, -30.64892578125, -29.490234375, -28.33154296875, -27.1728515625, -26.01416015625, -24.85546875, -23.69677734375, -22.5380859375, -21.37939453125, -20.220703125, -19.06201171875, -17.9033203125, -16.74462890625, -15.5859375, -14.42724609375, -13.2685546875, -12.10986328125, -10.951171875, -9.79248046875, -8.6337890625, -7.47509765625, -6.31640625, -5.15771484375, -3.9990234375, -2.84033203125, -1.681640625, -0.52294921875, 0.6357421875, 1.79443359375, 2.953125, 4.11181640625, 5.2705078125, 6.42919921875, 7.587890625, 8.74658203125, 9.9052734375, 11.06396484375, 12.22265625, 13.38134765625, 14.5400390625, 15.69873046875, 16.857421875, 18.01611328125, 19.1748046875, 20.33349609375, 21.4921875, 22.65087890625, 23.8095703125, 24.96826171875, 26.126953125, 27.28564453125, 28.4443359375, 29.60302734375, 30.76171875, 31.92041015625, 33.0791015625, 34.23779296875, 35.396484375, 36.55517578125, 37.7138671875, 38.87255859375, 40.03125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 25.0, 69.0, 133.0, 257.0, 254.0, 158.0, 70.0, 21.0, 8.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.35519790649414, -40.84904861450195, -39.34290313720703, -37.836753845214844, -36.33060836791992, -34.824459075927734, -33.31831359863281, -31.812164306640625, -30.30601692199707, -28.799869537353516, -27.29372215270996, -25.787574768066406, -24.28142547607422, -22.775279998779297, -21.26913070678711, -19.762983322143555, -18.2568359375, -16.750688552856445, -15.24454116821289, -13.73839282989502, -12.232245445251465, -10.72609806060791, -9.219949722290039, -7.713802337646484, -6.20765495300293, -4.701507568359375, -3.195359706878662, -1.6892118453979492, -0.18306446075439453, 1.3230829238891602, 2.8292312622070312, 4.335378646850586, 5.841522216796875, 7.34766960144043, 8.853816986083984, 10.359965324401855, 11.86611270904541, 13.372260093688965, 14.878408432006836, 16.38455581665039, 17.890703201293945, 19.3968505859375, 20.902997970581055, 22.40914535522461, 23.915294647216797, 25.42144012451172, 26.927589416503906, 28.43373680114746, 29.939884185791016, 31.44603157043457, 32.952178955078125, 34.45832824707031, 35.964473724365234, 37.47062301635742, 38.976768493652344, 40.48291778564453, 41.98906707763672, 43.495216369628906, 45.00136184692383, 46.507511138916016, 48.01365661621094, 49.519805908203125, 51.02595520019531, 52.532100677490234, 54.038246154785156]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 1.0, 4.0, 11.0, 14.0, 13.0, 12.0, 9.0, 20.0, 20.0, 21.0, 25.0, 21.0, 28.0, 26.0, 34.0, 34.0, 35.0, 41.0, 39.0, 37.0, 35.0, 38.0, 44.0, 43.0, 40.0, 32.0, 31.0, 30.0, 26.0, 25.0, 27.0, 30.0, 26.0, 11.0, 14.0, 21.0, 11.0, 9.0, 12.0, 7.0, 11.0, 7.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.226558685302734, -24.397172927856445, -23.567785263061523, -22.738399505615234, -21.909011840820312, -21.079626083374023, -20.250240325927734, -19.420852661132812, -18.591466903686523, -17.762081146240234, -16.932693481445312, -16.103307723999023, -15.273921012878418, -14.444534301757812, -13.615147590637207, -12.785760879516602, -11.956374168395996, -11.12698745727539, -10.297600746154785, -9.46821403503418, -8.63882827758789, -7.809441566467285, -6.98005485534668, -6.150668621063232, -5.321281909942627, -4.4918951988220215, -3.662508964538574, -2.8331222534179688, -2.0037357807159424, -1.174349308013916, -0.34496259689331055, 0.4844236373901367, 1.3138103485107422, 2.1431968212127686, 2.972583293914795, 3.8019700050354004, 4.631356239318848, 5.460742950439453, 6.290129661560059, 7.119515895843506, 7.948902606964111, 8.778288841247559, 9.607675552368164, 10.43706226348877, 11.266448974609375, 12.095834732055664, 12.925222396850586, 13.754608154296875, 14.58399486541748, 15.413381576538086, 16.242767333984375, 17.072154998779297, 17.901540756225586, 18.730926513671875, 19.560314178466797, 20.389699935913086, 21.219087600708008, 22.048473358154297, 22.87786102294922, 23.707246780395508, 24.53663444519043, 25.36602020263672, 26.19540786743164, 27.02479362487793, 27.85417938232422]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 14.0, 8.0, 11.0, 16.0, 14.0, 22.0, 17.0, 15.0, 21.0, 36.0, 28.0, 28.0, 30.0, 53.0, 40.0, 46.0, 58.0, 45.0, 33.0, 51.0, 39.0, 40.0, 38.0, 37.0, 31.0, 29.0, 38.0, 22.0, 25.0, 19.0, 18.0, 13.0, 10.0, 15.0, 4.0, 8.0, 6.0, 5.0, 6.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3359375, -4.19158935546875, -4.0472412109375, -3.90289306640625, -3.758544921875, -3.61419677734375, -3.4698486328125, -3.32550048828125, -3.18115234375, -3.03680419921875, -2.8924560546875, -2.74810791015625, -2.603759765625, -2.45941162109375, -2.3150634765625, -2.17071533203125, -2.0263671875, -1.88201904296875, -1.7376708984375, -1.59332275390625, -1.448974609375, -1.30462646484375, -1.1602783203125, -1.01593017578125, -0.87158203125, -0.72723388671875, -0.5828857421875, -0.43853759765625, -0.294189453125, -0.14984130859375, -0.0054931640625, 0.13885498046875, 0.283203125, 0.42755126953125, 0.5718994140625, 0.71624755859375, 0.860595703125, 1.00494384765625, 1.1492919921875, 1.29364013671875, 1.43798828125, 1.58233642578125, 1.7266845703125, 1.87103271484375, 2.015380859375, 2.15972900390625, 2.3040771484375, 2.44842529296875, 2.5927734375, 2.73712158203125, 2.8814697265625, 3.02581787109375, 3.170166015625, 3.31451416015625, 3.4588623046875, 3.60321044921875, 3.74755859375, 3.89190673828125, 4.0362548828125, 4.18060302734375, 4.324951171875, 4.46929931640625, 4.6136474609375, 4.75799560546875, 4.90234375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 14.0, 15.0, 21.0, 23.0, 35.0, 58.0, 80.0, 108.0, 143.0, 203.0, 282.0, 427.0, 670.0, 1195.0, 1931.0, 3801.0, 7845.0, 20786.0, 79997.0, 421921.0, 1553060.0, 1561153.0, 424944.0, 78751.0, 20019.0, 7743.0, 3774.0, 2042.0, 1127.0, 701.0, 456.0, 308.0, 176.0, 130.0, 102.0, 66.0, 54.0, 33.0, 20.0, 13.0, 12.0, 9.0, 9.0, 4.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.80859375, -5.6270751953125, -5.445556640625, -5.2640380859375, -5.08251953125, -4.9010009765625, -4.719482421875, -4.5379638671875, -4.3564453125, -4.1749267578125, -3.993408203125, -3.8118896484375, -3.63037109375, -3.4488525390625, -3.267333984375, -3.0858154296875, -2.904296875, -2.7227783203125, -2.541259765625, -2.3597412109375, -2.17822265625, -1.9967041015625, -1.815185546875, -1.6336669921875, -1.4521484375, -1.2706298828125, -1.089111328125, -0.9075927734375, -0.72607421875, -0.5445556640625, -0.363037109375, -0.1815185546875, 0.0, 0.1815185546875, 0.363037109375, 0.5445556640625, 0.72607421875, 0.9075927734375, 1.089111328125, 1.2706298828125, 1.4521484375, 1.6336669921875, 1.815185546875, 1.9967041015625, 2.17822265625, 2.3597412109375, 2.541259765625, 2.7227783203125, 2.904296875, 3.0858154296875, 3.267333984375, 3.4488525390625, 3.63037109375, 3.8118896484375, 3.993408203125, 4.1749267578125, 4.3564453125, 4.5379638671875, 4.719482421875, 4.9010009765625, 5.08251953125, 5.2640380859375, 5.445556640625, 5.6270751953125, 5.80859375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 7.0, 12.0, 36.0, 65.0, 131.0, 244.0, 418.0, 694.0, 851.0, 703.0, 429.0, 217.0, 127.0, 62.0, 26.0, 26.0, 13.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.688720703125, -17.25244140625, -16.816162109375, -16.3798828125, -15.943603515625, -15.50732421875, -15.071044921875, -14.634765625, -14.198486328125, -13.76220703125, -13.325927734375, -12.8896484375, -12.453369140625, -12.01708984375, -11.580810546875, -11.14453125, -10.708251953125, -10.27197265625, -9.835693359375, -9.3994140625, -8.963134765625, -8.52685546875, -8.090576171875, -7.654296875, -7.218017578125, -6.78173828125, -6.345458984375, -5.9091796875, -5.472900390625, -5.03662109375, -4.600341796875, -4.1640625, -3.727783203125, -3.29150390625, -2.855224609375, -2.4189453125, -1.982666015625, -1.54638671875, -1.110107421875, -0.673828125, -0.237548828125, 0.19873046875, 0.635009765625, 1.0712890625, 1.507568359375, 1.94384765625, 2.380126953125, 2.81640625, 3.252685546875, 3.68896484375, 4.125244140625, 4.5615234375, 4.997802734375, 5.43408203125, 5.870361328125, 6.306640625, 6.742919921875, 7.17919921875, 7.615478515625, 8.0517578125, 8.488037109375, 8.92431640625, 9.360595703125, 9.796875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 11.0, 11.0, 21.0, 31.0, 50.0, 173.0, 349.0, 877.0, 3366.0, 223381.0, 3951946.0, 11464.0, 1662.0, 536.0, 208.0, 103.0, 43.0, 26.0, 9.0, 6.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.21875, -20.26513671875, -19.3115234375, -18.35791015625, -17.404296875, -16.45068359375, -15.4970703125, -14.54345703125, -13.58984375, -12.63623046875, -11.6826171875, -10.72900390625, -9.775390625, -8.82177734375, -7.8681640625, -6.91455078125, -5.9609375, -5.00732421875, -4.0537109375, -3.10009765625, -2.146484375, -1.19287109375, -0.2392578125, 0.71435546875, 1.66796875, 2.62158203125, 3.5751953125, 4.52880859375, 5.482421875, 6.43603515625, 7.3896484375, 8.34326171875, 9.296875, 10.25048828125, 11.2041015625, 12.15771484375, 13.111328125, 14.06494140625, 15.0185546875, 15.97216796875, 16.92578125, 17.87939453125, 18.8330078125, 19.78662109375, 20.740234375, 21.69384765625, 22.6474609375, 23.60107421875, 24.5546875, 25.50830078125, 26.4619140625, 27.41552734375, 28.369140625, 29.32275390625, 30.2763671875, 31.22998046875, 32.18359375, 33.13720703125, 34.0908203125, 35.04443359375, 35.998046875, 36.95166015625, 37.9052734375, 38.85888671875, 39.8125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 132.0, 676.0, 193.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.4481506347656, -297.6725769042969, -291.89703369140625, -286.1214599609375, -280.34588623046875, -274.5703430175781, -268.7947692871094, -263.01922607421875, -257.24365234375, -251.4680938720703, -245.69252014160156, -239.91696166992188, -234.1414031982422, -228.3658447265625, -222.59027099609375, -216.81471252441406, -211.03915405273438, -205.2635955810547, -199.48802185058594, -193.71246337890625, -187.93690490722656, -182.16134643554688, -176.38577270507812, -170.61021423339844, -164.8346405029297, -159.05908203125, -153.28350830078125, -147.50794982910156, -141.73239135742188, -135.9568328857422, -130.18125915527344, -124.40570068359375, -118.63013458251953, -112.85456848144531, -107.07901000976562, -101.3034439086914, -95.52788543701172, -89.7523193359375, -83.97676086425781, -78.2011947631836, -72.42562866210938, -66.65006256103516, -60.87450408935547, -55.09893798828125, -49.32337951660156, -43.547813415527344, -37.77225112915039, -31.996688842773438, -26.22113037109375, -20.445568084716797, -14.670004844665527, -8.894441604614258, -3.1188793182373047, 2.6566829681396484, 8.432247161865234, 14.207809448242188, 19.98337173461914, 25.758934020996094, 31.534496307373047, 37.31005859375, 43.08562469482422, 48.861183166503906, 54.636749267578125, 60.41231155395508, 66.18787384033203]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 5.0, 4.0, 9.0, 12.0, 12.0, 15.0, 15.0, 15.0, 20.0, 24.0, 19.0, 29.0, 34.0, 40.0, 29.0, 30.0, 30.0, 47.0, 34.0, 37.0, 45.0, 48.0, 45.0, 46.0, 31.0, 43.0, 32.0, 30.0, 32.0, 21.0, 18.0, 19.0, 20.0, 20.0, 15.0, 14.0, 9.0, 4.0, 9.0, 10.0, 5.0, 6.0, 3.0, 0.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-26.45172119140625, -25.59737205505371, -24.743022918701172, -23.888675689697266, -23.034326553344727, -22.179977416992188, -21.32562828063965, -20.47127914428711, -19.616931915283203, -18.762582778930664, -17.908233642578125, -17.05388641357422, -16.19953727722168, -15.34518814086914, -14.490839004516602, -13.636490821838379, -12.78214168548584, -11.9277925491333, -11.073444366455078, -10.219095230102539, -9.364747047424316, -8.510397911071777, -7.6560492515563965, -6.801700592041016, -5.947351932525635, -5.093003273010254, -4.238654613494873, -3.384305715560913, -2.5299570560455322, -1.6756081581115723, -0.8212594985961914, 0.03308916091918945, 0.8874378204345703, 1.7417864799499512, 2.596135139465332, 3.450484037399292, 4.304832458496094, 5.159181594848633, 6.013530254364014, 6.8678789138793945, 7.722227573394775, 8.576576232910156, 9.430925369262695, 10.285273551940918, 11.139622688293457, 11.99397087097168, 12.848320007324219, 13.702669143676758, 14.55701732635498, 15.41136646270752, 16.265714645385742, 17.12006378173828, 17.97441291809082, 18.82876205444336, 19.683109283447266, 20.537458419799805, 21.391807556152344, 22.246156692504883, 23.100505828857422, 23.954853057861328, 24.809202194213867, 25.663551330566406, 26.517900466918945, 27.372249603271484, 28.22659683227539]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 12.0, 17.0, 10.0, 13.0, 26.0, 22.0, 24.0, 26.0, 32.0, 37.0, 31.0, 34.0, 35.0, 51.0, 46.0, 47.0, 46.0, 45.0, 39.0, 34.0, 39.0, 47.0, 23.0, 27.0, 26.0, 24.0, 24.0, 22.0, 20.0, 21.0, 11.0, 15.0, 15.0, 7.0, 4.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.234375, -3.13543701171875, -3.0364990234375, -2.93756103515625, -2.838623046875, -2.73968505859375, -2.6407470703125, -2.54180908203125, -2.44287109375, -2.34393310546875, -2.2449951171875, -2.14605712890625, -2.047119140625, -1.94818115234375, -1.8492431640625, -1.75030517578125, -1.6513671875, -1.55242919921875, -1.4534912109375, -1.35455322265625, -1.255615234375, -1.15667724609375, -1.0577392578125, -0.95880126953125, -0.85986328125, -0.76092529296875, -0.6619873046875, -0.56304931640625, -0.464111328125, -0.36517333984375, -0.2662353515625, -0.16729736328125, -0.068359375, 0.03057861328125, 0.1295166015625, 0.22845458984375, 0.327392578125, 0.42633056640625, 0.5252685546875, 0.62420654296875, 0.72314453125, 0.82208251953125, 0.9210205078125, 1.01995849609375, 1.118896484375, 1.21783447265625, 1.3167724609375, 1.41571044921875, 1.5146484375, 1.61358642578125, 1.7125244140625, 1.81146240234375, 1.910400390625, 2.00933837890625, 2.1082763671875, 2.20721435546875, 2.30615234375, 2.40509033203125, 2.5040283203125, 2.60296630859375, 2.701904296875, 2.80084228515625, 2.8997802734375, 2.99871826171875, 3.09765625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 6.0, 8.0, 16.0, 15.0, 32.0, 40.0, 45.0, 68.0, 136.0, 188.0, 253.0, 367.0, 553.0, 761.0, 1139.0, 1696.0, 2635.0, 3884.0, 5912.0, 9072.0, 14099.0, 22936.0, 36674.0, 59473.0, 95825.0, 148497.0, 198556.0, 162032.0, 106156.0, 66356.0, 40753.0, 25299.0, 15711.0, 10089.0, 6401.0, 4219.0, 2826.0, 1872.0, 1198.0, 907.0, 607.0, 391.0, 272.0, 176.0, 113.0, 90.0, 64.0, 48.0, 29.0, 25.0, 8.0, 12.0, 6.0, 8.0, 6.0, 4.0, 1.0, 3.0], "bins": [-0.306640625, -0.2972373962402344, -0.28783416748046875, -0.2784309387207031, -0.2690277099609375, -0.2596244812011719, -0.25022125244140625, -0.24081802368164062, -0.231414794921875, -0.22201156616210938, -0.21260833740234375, -0.20320510864257812, -0.1938018798828125, -0.18439865112304688, -0.17499542236328125, -0.16559219360351562, -0.15618896484375, -0.14678573608398438, -0.13738250732421875, -0.12797927856445312, -0.1185760498046875, -0.10917282104492188, -0.09976959228515625, -0.09036636352539062, -0.080963134765625, -0.07155990600585938, -0.06215667724609375, -0.052753448486328125, -0.0433502197265625, -0.033946990966796875, -0.02454376220703125, -0.015140533447265625, -0.0057373046875, 0.003665924072265625, 0.01306915283203125, 0.022472381591796875, 0.0318756103515625, 0.041278839111328125, 0.05068206787109375, 0.060085296630859375, 0.069488525390625, 0.07889175415039062, 0.08829498291015625, 0.09769821166992188, 0.1071014404296875, 0.11650466918945312, 0.12590789794921875, 0.13531112670898438, 0.14471435546875, 0.15411758422851562, 0.16352081298828125, 0.17292404174804688, 0.1823272705078125, 0.19173049926757812, 0.20113372802734375, 0.21053695678710938, 0.219940185546875, 0.22934341430664062, 0.23874664306640625, 0.24814987182617188, 0.2575531005859375, 0.2669563293457031, 0.27635955810546875, 0.2857627868652344, 0.295166015625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 16.0, 21.0, 18.0, 14.0, 18.0, 18.0, 27.0, 29.0, 27.0, 23.0, 36.0, 42.0, 44.0, 39.0, 39.0, 48.0, 1064.0, 39.0, 39.0, 38.0, 39.0, 45.0, 35.0, 30.0, 23.0, 27.0, 23.0, 20.0, 18.0, 16.0, 15.0, 16.0, 23.0, 9.0, 4.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.931640625, -1.867034912109375, -1.80242919921875, -1.737823486328125, -1.6732177734375, -1.608612060546875, -1.54400634765625, -1.479400634765625, -1.414794921875, -1.350189208984375, -1.28558349609375, -1.220977783203125, -1.1563720703125, -1.091766357421875, -1.02716064453125, -0.962554931640625, -0.89794921875, -0.833343505859375, -0.76873779296875, -0.704132080078125, -0.6395263671875, -0.574920654296875, -0.51031494140625, -0.445709228515625, -0.381103515625, -0.316497802734375, -0.25189208984375, -0.187286376953125, -0.1226806640625, -0.058074951171875, 0.00653076171875, 0.071136474609375, 0.1357421875, 0.200347900390625, 0.26495361328125, 0.329559326171875, 0.3941650390625, 0.458770751953125, 0.52337646484375, 0.587982177734375, 0.652587890625, 0.717193603515625, 0.78179931640625, 0.846405029296875, 0.9110107421875, 0.975616455078125, 1.04022216796875, 1.104827880859375, 1.16943359375, 1.234039306640625, 1.29864501953125, 1.363250732421875, 1.4278564453125, 1.492462158203125, 1.55706787109375, 1.621673583984375, 1.686279296875, 1.750885009765625, 1.81549072265625, 1.880096435546875, 1.9447021484375, 2.009307861328125, 2.07391357421875, 2.138519287109375, 2.203125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 4.0, 9.0, 14.0, 7.0, 25.0, 23.0, 31.0, 60.0, 117.0, 153.0, 230.0, 332.0, 471.0, 687.0, 961.0, 1397.0, 2031.0, 2916.0, 4265.0, 6215.0, 8884.0, 13221.0, 19171.0, 28317.0, 40882.0, 59233.0, 85300.0, 115815.0, 1100169.0, 233393.0, 111683.0, 81455.0, 56372.0, 38594.0, 26492.0, 18263.0, 12519.0, 8538.0, 5881.0, 3982.0, 2750.0, 1954.0, 1332.0, 903.0, 651.0, 484.0, 307.0, 228.0, 135.0, 98.0, 70.0, 37.0, 31.0, 20.0, 11.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0], "bins": [-0.1951904296875, -0.18907737731933594, -0.18296432495117188, -0.1768512725830078, -0.17073822021484375, -0.1646251678466797, -0.15851211547851562, -0.15239906311035156, -0.1462860107421875, -0.14017295837402344, -0.13405990600585938, -0.1279468536376953, -0.12183380126953125, -0.11572074890136719, -0.10960769653320312, -0.10349464416503906, -0.097381591796875, -0.09126853942871094, -0.08515548706054688, -0.07904243469238281, -0.07292938232421875, -0.06681632995605469, -0.060703277587890625, -0.05459022521972656, -0.0484771728515625, -0.04236412048339844, -0.036251068115234375, -0.030138015747070312, -0.02402496337890625, -0.017911911010742188, -0.011798858642578125, -0.0056858062744140625, 0.00042724609375, 0.0065402984619140625, 0.012653350830078125, 0.018766403198242188, 0.02487945556640625, 0.030992507934570312, 0.037105560302734375, 0.04321861267089844, 0.0493316650390625, 0.05544471740722656, 0.061557769775390625, 0.06767082214355469, 0.07378387451171875, 0.07989692687988281, 0.08600997924804688, 0.09212303161621094, 0.098236083984375, 0.10434913635253906, 0.11046218872070312, 0.11657524108886719, 0.12268829345703125, 0.1288013458251953, 0.13491439819335938, 0.14102745056152344, 0.1471405029296875, 0.15325355529785156, 0.15936660766601562, 0.1654796600341797, 0.17159271240234375, 0.1777057647705078, 0.18381881713867188, 0.18993186950683594, 0.196044921875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 11.0, 11.0, 6.0, 14.0, 22.0, 20.0, 26.0, 47.0, 63.0, 90.0, 92.0, 124.0, 119.0, 93.0, 62.0, 42.0, 29.0, 20.0, 21.0, 11.0, 13.0, 9.0, 10.0, 3.0, 7.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00463104248046875, -0.004510730504989624, -0.004390418529510498, -0.004270106554031372, -0.004149794578552246, -0.00402948260307312, -0.003909170627593994, -0.003788858652114868, -0.003668546676635742, -0.003548234701156616, -0.0034279227256774902, -0.0033076107501983643, -0.0031872987747192383, -0.0030669867992401123, -0.0029466748237609863, -0.0028263628482818604, -0.0027060508728027344, -0.0025857388973236084, -0.0024654269218444824, -0.0023451149463653564, -0.0022248029708862305, -0.0021044909954071045, -0.0019841790199279785, -0.0018638670444488525, -0.0017435550689697266, -0.0016232430934906006, -0.0015029311180114746, -0.0013826191425323486, -0.0012623071670532227, -0.0011419951915740967, -0.0010216832160949707, -0.0009013712406158447, -0.0007810592651367188, -0.0006607472896575928, -0.0005404353141784668, -0.0004201233386993408, -0.00029981136322021484, -0.00017949938774108887, -5.918741226196289e-05, 6.112456321716309e-05, 0.00018143653869628906, 0.00030174851417541504, 0.000422060489654541, 0.000542372465133667, 0.000662684440612793, 0.0007829964160919189, 0.0009033083915710449, 0.001023620367050171, 0.0011439323425292969, 0.0012642443180084229, 0.0013845562934875488, 0.0015048682689666748, 0.0016251802444458008, 0.0017454922199249268, 0.0018658041954040527, 0.0019861161708831787, 0.0021064281463623047, 0.0022267401218414307, 0.0023470520973205566, 0.0024673640727996826, 0.0025876760482788086, 0.0027079880237579346, 0.0028282999992370605, 0.0029486119747161865, 0.0030689239501953125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 24.0, 25.0, 28.0, 33.0, 52.0, 75.0, 113.0, 212.0, 340.0, 805.0, 9883.0, 1026974.0, 8176.0, 776.0, 383.0, 204.0, 115.0, 75.0, 65.0, 29.0, 25.0, 23.0, 25.0, 9.0, 10.0, 12.0, 5.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.05401611328125, -0.05189704895019531, -0.049777984619140625, -0.04765892028808594, -0.04553985595703125, -0.04342079162597656, -0.041301727294921875, -0.03918266296386719, -0.0370635986328125, -0.03494453430175781, -0.032825469970703125, -0.030706405639648438, -0.02858734130859375, -0.026468276977539062, -0.024349212646484375, -0.022230148315429688, -0.020111083984375, -0.017992019653320312, -0.015872955322265625, -0.013753890991210938, -0.01163482666015625, -0.009515762329101562, -0.007396697998046875, -0.0052776336669921875, -0.0031585693359375, -0.0010395050048828125, 0.001079559326171875, 0.0031986236572265625, 0.00531768798828125, 0.0074367523193359375, 0.009555816650390625, 0.011674880981445312, 0.0137939453125, 0.015913009643554688, 0.018032073974609375, 0.020151138305664062, 0.02227020263671875, 0.024389266967773438, 0.026508331298828125, 0.028627395629882812, 0.0307464599609375, 0.03286552429199219, 0.034984588623046875, 0.03710365295410156, 0.03922271728515625, 0.04134178161621094, 0.043460845947265625, 0.04557991027832031, 0.047698974609375, 0.04981803894042969, 0.051937103271484375, 0.05405616760253906, 0.05617523193359375, 0.05829429626464844, 0.060413360595703125, 0.06253242492675781, 0.0646514892578125, 0.06677055358886719, 0.06888961791992188, 0.07100868225097656, 0.07312774658203125, 0.07524681091308594, 0.07736587524414062, 0.07948493957519531, 0.08160400390625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 67.0, 863.0, 81.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01530770305544138, -0.014657065272331238, -0.014006426557898521, -0.01335578877478838, -0.012705150991678238, -0.012054513208568096, -0.011403875425457954, -0.010753236711025238, -0.010102598927915096, -0.009451961144804955, -0.008801322430372238, -0.008150684647262096, -0.007500046864151955, -0.006849409081041813, -0.006198770832270384, -0.005548132583498955, -0.004897494800388813, -0.004246857017278671, -0.003596218768507242, -0.002945580752566457, -0.0022949427366256714, -0.001644304720684886, -0.0009936667047441006, -0.0003430284559726715, 0.00030760932713747025, 0.0009582473430782557, 0.001608885359019041, 0.0022595233749598265, 0.002910161390900612, 0.0035607994068413973, 0.004211437422782183, 0.004862075671553612, 0.005512714385986328, 0.00616335216909647, 0.006813990417867899, 0.007464628666639328, 0.00811526644974947, 0.008765904232859612, 0.009416542947292328, 0.01006718073040247, 0.010717818513512611, 0.011368456296622753, 0.012019094079732895, 0.012669732794165611, 0.013320370577275753, 0.013971008360385895, 0.014621647074818611, 0.015272284857928753, 0.015922922641038895, 0.01657356135547161, 0.017224198207259178, 0.017874836921691895, 0.01852547377347946, 0.019176112487912178, 0.019826751202344894, 0.02047738805413246, 0.021128026768565178, 0.021778665482997894, 0.02242930233478546, 0.023079941049218178, 0.023730579763650894, 0.02438121661543846, 0.025031855329871178, 0.025682494044303894, 0.02633313089609146]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 6.0, 9.0, 9.0, 23.0, 18.0, 26.0, 34.0, 38.0, 34.0, 44.0, 41.0, 59.0, 56.0, 55.0, 62.0, 60.0, 57.0, 50.0, 51.0, 53.0, 49.0, 37.0, 23.0, 20.0, 24.0, 19.0, 14.0, 12.0, 3.0, 9.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0030756592750549316, -0.0029958300292491913, -0.002916000783443451, -0.0028361715376377106, -0.00275634229183197, -0.00267651304602623, -0.0025966838002204895, -0.002516854554414749, -0.002437025308609009, -0.0023571960628032684, -0.002277366816997528, -0.0021975375711917877, -0.0021177083253860474, -0.002037879079580307, -0.0019580498337745667, -0.0018782205879688263, -0.001798391342163086, -0.0017185620963573456, -0.0016387328505516052, -0.0015589036047458649, -0.0014790743589401245, -0.0013992451131343842, -0.0013194158673286438, -0.0012395866215229034, -0.001159757375717163, -0.0010799281299114227, -0.0010000988841056824, -0.000920269638299942, -0.0008404403924942017, -0.0007606111466884613, -0.000680781900882721, -0.0006009526550769806, -0.0005211234092712402, -0.0004412941634654999, -0.0003614649176597595, -0.00028163567185401917, -0.0002018064260482788, -0.00012197718024253845, -4.2147934436798096e-05, 3.768131136894226e-05, 0.00011751055717468262, 0.00019733980298042297, 0.00027716904878616333, 0.0003569982945919037, 0.00043682754039764404, 0.0005166567862033844, 0.0005964860320091248, 0.0006763152778148651, 0.0007561445236206055, 0.0008359737694263458, 0.0009158030152320862, 0.0009956322610378265, 0.001075461506843567, 0.0011552907526493073, 0.0012351199984550476, 0.001314949244260788, 0.0013947784900665283, 0.0014746077358722687, 0.001554436981678009, 0.0016342662274837494, 0.0017140954732894897, 0.00179392471909523, 0.0018737539649009705, 0.001953583210706711, 0.002033412456512451]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 12.0, 17.0, 10.0, 13.0, 26.0, 22.0, 24.0, 26.0, 32.0, 37.0, 31.0, 34.0, 35.0, 50.0, 47.0, 47.0, 46.0, 45.0, 39.0, 34.0, 39.0, 47.0, 23.0, 27.0, 26.0, 24.0, 24.0, 22.0, 20.0, 21.0, 11.0, 15.0, 15.0, 7.0, 4.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.234375, -3.13543701171875, -3.0364990234375, -2.93756103515625, -2.838623046875, -2.73968505859375, -2.6407470703125, -2.54180908203125, -2.44287109375, -2.34393310546875, -2.2449951171875, -2.14605712890625, -2.047119140625, -1.94818115234375, -1.8492431640625, -1.75030517578125, -1.6513671875, -1.55242919921875, -1.4534912109375, -1.35455322265625, -1.255615234375, -1.15667724609375, -1.0577392578125, -0.95880126953125, -0.85986328125, -0.76092529296875, -0.6619873046875, -0.56304931640625, -0.464111328125, -0.36517333984375, -0.2662353515625, -0.16729736328125, -0.068359375, 0.03057861328125, 0.1295166015625, 0.22845458984375, 0.327392578125, 0.42633056640625, 0.5252685546875, 0.62420654296875, 0.72314453125, 0.82208251953125, 0.9210205078125, 1.01995849609375, 1.118896484375, 1.21783447265625, 1.3167724609375, 1.41571044921875, 1.5146484375, 1.61358642578125, 1.7125244140625, 1.81146240234375, 1.910400390625, 2.00933837890625, 2.1082763671875, 2.20721435546875, 2.30615234375, 2.40509033203125, 2.5040283203125, 2.60296630859375, 2.701904296875, 2.80084228515625, 2.8997802734375, 2.99871826171875, 3.09765625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 9.0, 11.0, 20.0, 23.0, 35.0, 50.0, 60.0, 85.0, 139.0, 153.0, 209.0, 285.0, 370.0, 604.0, 954.0, 1658.0, 2998.0, 6954.0, 23355.0, 144343.0, 648618.0, 175293.0, 26558.0, 7602.0, 3276.0, 1709.0, 1014.0, 619.0, 418.0, 289.0, 220.0, 141.0, 105.0, 84.0, 72.0, 54.0, 31.0, 31.0, 31.0, 15.0, 10.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.99359130859375, -5.8035888671875, -5.61358642578125, -5.423583984375, -5.23358154296875, -5.0435791015625, -4.85357666015625, -4.66357421875, -4.47357177734375, -4.2835693359375, -4.09356689453125, -3.903564453125, -3.71356201171875, -3.5235595703125, -3.33355712890625, -3.1435546875, -2.95355224609375, -2.7635498046875, -2.57354736328125, -2.383544921875, -2.19354248046875, -2.0035400390625, -1.81353759765625, -1.62353515625, -1.43353271484375, -1.2435302734375, -1.05352783203125, -0.863525390625, -0.67352294921875, -0.4835205078125, -0.29351806640625, -0.103515625, 0.08648681640625, 0.2764892578125, 0.46649169921875, 0.656494140625, 0.84649658203125, 1.0364990234375, 1.22650146484375, 1.41650390625, 1.60650634765625, 1.7965087890625, 1.98651123046875, 2.176513671875, 2.36651611328125, 2.5565185546875, 2.74652099609375, 2.9365234375, 3.12652587890625, 3.3165283203125, 3.50653076171875, 3.696533203125, 3.88653564453125, 4.0765380859375, 4.26654052734375, 4.45654296875, 4.64654541015625, 4.8365478515625, 5.02655029296875, 5.216552734375, 5.40655517578125, 5.5965576171875, 5.78656005859375, 5.9765625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 5.0, 8.0, 7.0, 6.0, 10.0, 9.0, 20.0, 18.0, 27.0, 28.0, 30.0, 43.0, 36.0, 37.0, 54.0, 61.0, 159.0, 279.0, 1468.0, 237.0, 111.0, 74.0, 51.0, 47.0, 41.0, 28.0, 27.0, 17.0, 17.0, 18.0, 7.0, 16.0, 6.0, 6.0, 7.0, 7.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.8046875, -9.52789306640625, -9.2510986328125, -8.97430419921875, -8.697509765625, -8.42071533203125, -8.1439208984375, -7.86712646484375, -7.59033203125, -7.31353759765625, -7.0367431640625, -6.75994873046875, -6.483154296875, -6.20635986328125, -5.9295654296875, -5.65277099609375, -5.3759765625, -5.09918212890625, -4.8223876953125, -4.54559326171875, -4.268798828125, -3.99200439453125, -3.7152099609375, -3.43841552734375, -3.16162109375, -2.88482666015625, -2.6080322265625, -2.33123779296875, -2.054443359375, -1.77764892578125, -1.5008544921875, -1.22406005859375, -0.947265625, -0.67047119140625, -0.3936767578125, -0.11688232421875, 0.159912109375, 0.43670654296875, 0.7135009765625, 0.99029541015625, 1.26708984375, 1.54388427734375, 1.8206787109375, 2.09747314453125, 2.374267578125, 2.65106201171875, 2.9278564453125, 3.20465087890625, 3.4814453125, 3.75823974609375, 4.0350341796875, 4.31182861328125, 4.588623046875, 4.86541748046875, 5.1422119140625, 5.41900634765625, 5.69580078125, 5.97259521484375, 6.2493896484375, 6.52618408203125, 6.802978515625, 7.07977294921875, 7.3565673828125, 7.63336181640625, 7.91015625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 10.0, 13.0, 14.0, 23.0, 44.0, 73.0, 95.0, 139.0, 213.0, 354.0, 890.0, 5458.0, 3119621.0, 16307.0, 1208.0, 484.0, 231.0, 170.0, 120.0, 80.0, 42.0, 29.0, 17.0, 11.0, 11.0, 11.0, 5.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78125, -20.992431640625, -20.20361328125, -19.414794921875, -18.6259765625, -17.837158203125, -17.04833984375, -16.259521484375, -15.470703125, -14.681884765625, -13.89306640625, -13.104248046875, -12.3154296875, -11.526611328125, -10.73779296875, -9.948974609375, -9.16015625, -8.371337890625, -7.58251953125, -6.793701171875, -6.0048828125, -5.216064453125, -4.42724609375, -3.638427734375, -2.849609375, -2.060791015625, -1.27197265625, -0.483154296875, 0.3056640625, 1.094482421875, 1.88330078125, 2.672119140625, 3.4609375, 4.249755859375, 5.03857421875, 5.827392578125, 6.6162109375, 7.405029296875, 8.19384765625, 8.982666015625, 9.771484375, 10.560302734375, 11.34912109375, 12.137939453125, 12.9267578125, 13.715576171875, 14.50439453125, 15.293212890625, 16.08203125, 16.870849609375, 17.65966796875, 18.448486328125, 19.2373046875, 20.026123046875, 20.81494140625, 21.603759765625, 22.392578125, 23.181396484375, 23.97021484375, 24.759033203125, 25.5478515625, 26.336669921875, 27.12548828125, 27.914306640625, 28.703125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 11.0, 293.0, 645.0, 63.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.00791931152344, -103.30741882324219, -100.6069107055664, -97.90641021728516, -95.2059097290039, -92.50540161132812, -89.80490112304688, -87.10440063476562, -84.40390014648438, -81.70339965820312, -79.00289154052734, -76.3023910522461, -73.60189056396484, -70.90138244628906, -68.20088195800781, -65.50038146972656, -62.79987335205078, -60.099369049072266, -57.398868560791016, -54.6983642578125, -51.99786376953125, -49.297359466552734, -46.59685516357422, -43.89635467529297, -41.19585037231445, -38.49534606933594, -35.79484558105469, -33.09434127807617, -30.39383888244629, -27.693336486816406, -24.99283218383789, -22.292329788208008, -19.591827392578125, -16.891324996948242, -14.190821647644043, -11.490318298339844, -8.789815902709961, -6.089313507080078, -3.3888092041015625, -0.6883068084716797, 2.012195587158203, 4.712698459625244, 7.413201332092285, 10.113704681396484, 12.814207077026367, 15.51470947265625, 18.215213775634766, 20.91571617126465, 23.61621856689453, 26.316720962524414, 29.017223358154297, 31.717727661132812, 34.41822814941406, 37.11873245239258, 39.819236755371094, 42.519737243652344, 45.22024154663086, 47.920745849609375, 50.621246337890625, 53.32175064086914, 56.022254943847656, 58.722755432128906, 61.42325973510742, 64.12376403808594, 66.82426452636719]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 5.0, 4.0, 9.0, 13.0, 11.0, 21.0, 10.0, 23.0, 26.0, 25.0, 29.0, 24.0, 31.0, 33.0, 30.0, 35.0, 51.0, 44.0, 38.0, 43.0, 28.0, 27.0, 36.0, 39.0, 34.0, 32.0, 33.0, 39.0, 24.0, 31.0, 18.0, 28.0, 17.0, 20.0, 15.0, 10.0, 19.0, 7.0, 5.0, 4.0, 7.0, 7.0, 9.0, 2.0, 1.0, 5.0], "bins": [-24.096588134765625, -23.508955001831055, -22.921323776245117, -22.333690643310547, -21.746057510375977, -21.15842628479004, -20.57079315185547, -19.98316192626953, -19.39552879333496, -18.80789566040039, -18.220264434814453, -17.632631301879883, -17.044998168945312, -16.457366943359375, -15.869733810424805, -15.28210163116455, -14.69446849822998, -14.106836318969727, -13.519203186035156, -12.931571006774902, -12.343938827514648, -11.756305694580078, -11.168673515319824, -10.58104133605957, -9.993408203125, -9.405776023864746, -8.818142890930176, -8.230510711669922, -7.642878532409668, -7.055245876312256, -6.467613220214844, -5.87998104095459, -5.292348861694336, -4.704716205596924, -4.11708402633667, -3.529451370239258, -2.941818952560425, -2.354186534881592, -1.7665538787841797, -1.1789216995239258, -0.5912890434265137, -0.0036565661430358887, 0.5839759111404419, 1.1716084480285645, 1.7592408657073975, 2.3468732833862305, 2.9345059394836426, 3.5221381187438965, 4.109770774841309, 4.697403430938721, 5.285035610198975, 5.872668266296387, 6.460300445556641, 7.047933101654053, 7.635565757751465, 8.223197937011719, 8.810831069946289, 9.398463249206543, 9.986096382141113, 10.573728561401367, 11.161360740661621, 11.748992919921875, 12.336626052856445, 12.9242582321167, 13.511890411376953]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 3.0, 6.0, 2.0, 7.0, 10.0, 6.0, 14.0, 18.0, 20.0, 26.0, 27.0, 28.0, 32.0, 33.0, 31.0, 29.0, 36.0, 43.0, 39.0, 44.0, 43.0, 45.0, 41.0, 39.0, 33.0, 39.0, 31.0, 24.0, 32.0, 26.0, 43.0, 23.0, 21.0, 17.0, 19.0, 18.0, 8.0, 9.0, 11.0, 4.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.487945556640625, -3.37237548828125, -3.256805419921875, -3.1412353515625, -3.025665283203125, -2.91009521484375, -2.794525146484375, -2.678955078125, -2.563385009765625, -2.44781494140625, -2.332244873046875, -2.2166748046875, -2.101104736328125, -1.98553466796875, -1.869964599609375, -1.75439453125, -1.638824462890625, -1.52325439453125, -1.407684326171875, -1.2921142578125, -1.176544189453125, -1.06097412109375, -0.945404052734375, -0.829833984375, -0.714263916015625, -0.59869384765625, -0.483123779296875, -0.3675537109375, -0.251983642578125, -0.13641357421875, -0.020843505859375, 0.0947265625, 0.210296630859375, 0.32586669921875, 0.441436767578125, 0.5570068359375, 0.672576904296875, 0.78814697265625, 0.903717041015625, 1.019287109375, 1.134857177734375, 1.25042724609375, 1.365997314453125, 1.4815673828125, 1.597137451171875, 1.71270751953125, 1.828277587890625, 1.94384765625, 2.059417724609375, 2.17498779296875, 2.290557861328125, 2.4061279296875, 2.521697998046875, 2.63726806640625, 2.752838134765625, 2.868408203125, 2.983978271484375, 3.09954833984375, 3.215118408203125, 3.3306884765625, 3.446258544921875, 3.56182861328125, 3.677398681640625, 3.79296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 16.0, 16.0, 12.0, 30.0, 33.0, 35.0, 61.0, 77.0, 97.0, 145.0, 187.0, 280.0, 395.0, 538.0, 808.0, 1625.0, 5724.0, 115048.0, 3516468.0, 535385.0, 11990.0, 2130.0, 953.0, 615.0, 423.0, 307.0, 224.0, 161.0, 123.0, 95.0, 74.0, 40.0, 35.0, 23.0, 22.0, 23.0, 10.0, 7.0, 11.0, 6.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.953125, -17.36767578125, -16.7822265625, -16.19677734375, -15.611328125, -15.02587890625, -14.4404296875, -13.85498046875, -13.26953125, -12.68408203125, -12.0986328125, -11.51318359375, -10.927734375, -10.34228515625, -9.7568359375, -9.17138671875, -8.5859375, -8.00048828125, -7.4150390625, -6.82958984375, -6.244140625, -5.65869140625, -5.0732421875, -4.48779296875, -3.90234375, -3.31689453125, -2.7314453125, -2.14599609375, -1.560546875, -0.97509765625, -0.3896484375, 0.19580078125, 0.78125, 1.36669921875, 1.9521484375, 2.53759765625, 3.123046875, 3.70849609375, 4.2939453125, 4.87939453125, 5.46484375, 6.05029296875, 6.6357421875, 7.22119140625, 7.806640625, 8.39208984375, 8.9775390625, 9.56298828125, 10.1484375, 10.73388671875, 11.3193359375, 11.90478515625, 12.490234375, 13.07568359375, 13.6611328125, 14.24658203125, 14.83203125, 15.41748046875, 16.0029296875, 16.58837890625, 17.173828125, 17.75927734375, 18.3447265625, 18.93017578125, 19.515625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 5.0, 13.0, 18.0, 32.0, 43.0, 63.0, 98.0, 163.0, 235.0, 296.0, 422.0, 546.0, 587.0, 453.0, 330.0, 234.0, 172.0, 103.0, 84.0, 51.0, 37.0, 24.0, 15.0, 9.0, 11.0, 2.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.921875, -7.6905517578125, -7.459228515625, -7.2279052734375, -6.99658203125, -6.7652587890625, -6.533935546875, -6.3026123046875, -6.0712890625, -5.8399658203125, -5.608642578125, -5.3773193359375, -5.14599609375, -4.9146728515625, -4.683349609375, -4.4520263671875, -4.220703125, -3.9893798828125, -3.758056640625, -3.5267333984375, -3.29541015625, -3.0640869140625, -2.832763671875, -2.6014404296875, -2.3701171875, -2.1387939453125, -1.907470703125, -1.6761474609375, -1.44482421875, -1.2135009765625, -0.982177734375, -0.7508544921875, -0.51953125, -0.2882080078125, -0.056884765625, 0.1744384765625, 0.40576171875, 0.6370849609375, 0.868408203125, 1.0997314453125, 1.3310546875, 1.5623779296875, 1.793701171875, 2.0250244140625, 2.25634765625, 2.4876708984375, 2.718994140625, 2.9503173828125, 3.181640625, 3.4129638671875, 3.644287109375, 3.8756103515625, 4.10693359375, 4.3382568359375, 4.569580078125, 4.8009033203125, 5.0322265625, 5.2635498046875, 5.494873046875, 5.7261962890625, 5.95751953125, 6.1888427734375, 6.420166015625, 6.6514892578125, 6.8828125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 4.0, 12.0, 17.0, 23.0, 37.0, 85.0, 155.0, 366.0, 725.0, 1804.0, 5776.0, 27013.0, 266580.0, 2668384.0, 1119628.0, 85902.0, 12340.0, 3295.0, 1173.0, 498.0, 212.0, 137.0, 39.0, 27.0, 11.0, 5.0, 10.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.1171875, -8.85498046875, -8.5927734375, -8.33056640625, -8.068359375, -7.80615234375, -7.5439453125, -7.28173828125, -7.01953125, -6.75732421875, -6.4951171875, -6.23291015625, -5.970703125, -5.70849609375, -5.4462890625, -5.18408203125, -4.921875, -4.65966796875, -4.3974609375, -4.13525390625, -3.873046875, -3.61083984375, -3.3486328125, -3.08642578125, -2.82421875, -2.56201171875, -2.2998046875, -2.03759765625, -1.775390625, -1.51318359375, -1.2509765625, -0.98876953125, -0.7265625, -0.46435546875, -0.2021484375, 0.06005859375, 0.322265625, 0.58447265625, 0.8466796875, 1.10888671875, 1.37109375, 1.63330078125, 1.8955078125, 2.15771484375, 2.419921875, 2.68212890625, 2.9443359375, 3.20654296875, 3.46875, 3.73095703125, 3.9931640625, 4.25537109375, 4.517578125, 4.77978515625, 5.0419921875, 5.30419921875, 5.56640625, 5.82861328125, 6.0908203125, 6.35302734375, 6.615234375, 6.87744140625, 7.1396484375, 7.40185546875, 7.6640625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 6.0, 10.0, 25.0, 27.0, 61.0, 64.0, 78.0, 107.0, 111.0, 105.0, 104.0, 86.0, 60.0, 61.0, 38.0, 24.0, 17.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.49061393737793, -21.953781127929688, -20.416948318481445, -18.880115509033203, -17.343280792236328, -15.806448936462402, -14.269615173339844, -12.732782363891602, -11.19594955444336, -9.659116744995117, -8.122283935546875, -6.585450172424316, -5.048617362976074, -3.511784553527832, -1.9749507904052734, -0.43811798095703125, 1.098714828491211, 2.6355478763580322, 4.1723809242248535, 5.709214210510254, 7.246047019958496, 8.782879829406738, 10.319713592529297, 11.856546401977539, 13.393379211425781, 14.930212020874023, 16.467044830322266, 18.00387954711914, 19.54071044921875, 21.077545166015625, 22.614377975463867, 24.15121078491211, 25.68804168701172, 27.22487449645996, 28.761707305908203, 30.298542022705078, 31.835372924804688, 33.37220764160156, 34.90904235839844, 36.44587326049805, 37.982704162597656, 39.51953887939453, 41.05636978149414, 42.593204498291016, 44.130035400390625, 45.6668701171875, 47.203704833984375, 48.740535736083984, 50.27737045288086, 51.814205169677734, 53.351036071777344, 54.88787078857422, 56.42470169067383, 57.9615364074707, 59.49836730957031, 61.03520202636719, 62.57203674316406, 64.10887145996094, 65.64570617675781, 67.18253326416016, 68.71936798095703, 70.2562026977539, 71.79303741455078, 73.32986450195312, 74.86669921875]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 10.0, 5.0, 12.0, 9.0, 8.0, 11.0, 16.0, 14.0, 23.0, 23.0, 20.0, 22.0, 31.0, 34.0, 36.0, 32.0, 26.0, 33.0, 38.0, 34.0, 37.0, 40.0, 41.0, 33.0, 35.0, 40.0, 39.0, 31.0, 29.0, 30.0, 24.0, 26.0, 23.0, 16.0, 23.0, 15.0, 11.0, 15.0, 10.0, 6.0, 9.0, 2.0, 3.0, 6.0, 3.0, 7.0, 2.0, 6.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.584197998046875, -19.88762855529785, -19.191059112548828, -18.494491577148438, -17.797922134399414, -17.10135269165039, -16.404783248901367, -15.708213806152344, -15.011645317077637, -14.315075874328613, -13.618507385253906, -12.921937942504883, -12.22536849975586, -11.528800010681152, -10.832230567932129, -10.135662078857422, -9.439092636108398, -8.742523193359375, -8.045954704284668, -7.3493852615356445, -6.652816295623779, -5.956247329711914, -5.259677886962891, -4.563108921051025, -3.86653995513916, -3.169970989227295, -2.4734017848968506, -1.7768325805664062, -1.080263614654541, -0.3836946487426758, 0.31287479400634766, 1.009443759918213, 1.706014633178711, 2.402583599090576, 3.0991528034210205, 3.795722007751465, 4.49229097366333, 5.188859939575195, 5.885429382324219, 6.581998348236084, 7.278567314147949, 7.9751362800598145, 8.67170524597168, 9.368274688720703, 10.064844131469727, 10.761412620544434, 11.457982063293457, 12.154550552368164, 12.851119995117188, 13.547689437866211, 14.244257926940918, 14.940827369689941, 15.637395858764648, 16.333965301513672, 17.030534744262695, 17.72710418701172, 18.42367172241211, 19.120241165161133, 19.816810607910156, 20.513378143310547, 21.20994758605957, 21.906517028808594, 22.603086471557617, 23.29965591430664, 23.996225357055664]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 11.0, 11.0, 7.0, 23.0, 16.0, 24.0, 18.0, 20.0, 22.0, 38.0, 28.0, 32.0, 49.0, 31.0, 32.0, 29.0, 42.0, 32.0, 44.0, 54.0, 32.0, 46.0, 36.0, 31.0, 36.0, 39.0, 13.0, 23.0, 22.0, 17.0, 16.0, 11.0, 12.0, 15.0, 8.0, 13.0, 4.0, 4.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.09375, -37.77099609375, -36.4482421875, -35.12548828125, -33.802734375, -32.47998046875, -31.1572265625, -29.83447265625, -28.51171875, -27.18896484375, -25.8662109375, -24.54345703125, -23.220703125, -21.89794921875, -20.5751953125, -19.25244140625, -17.9296875, -16.60693359375, -15.2841796875, -13.96142578125, -12.638671875, -11.31591796875, -9.9931640625, -8.67041015625, -7.34765625, -6.02490234375, -4.7021484375, -3.37939453125, -2.056640625, -0.73388671875, 0.5888671875, 1.91162109375, 3.234375, 4.55712890625, 5.8798828125, 7.20263671875, 8.525390625, 9.84814453125, 11.1708984375, 12.49365234375, 13.81640625, 15.13916015625, 16.4619140625, 17.78466796875, 19.107421875, 20.43017578125, 21.7529296875, 23.07568359375, 24.3984375, 25.72119140625, 27.0439453125, 28.36669921875, 29.689453125, 31.01220703125, 32.3349609375, 33.65771484375, 34.98046875, 36.30322265625, 37.6259765625, 38.94873046875, 40.271484375, 41.59423828125, 42.9169921875, 44.23974609375, 45.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 8.0, 16.0, 11.0, 16.0, 39.0, 54.0, 96.0, 171.0, 268.0, 481.0, 814.0, 1532.0, 2869.0, 5160.0, 9510.0, 17232.0, 32337.0, 60639.0, 112853.0, 196248.0, 241178.0, 167531.0, 92166.0, 49199.0, 26476.0, 14361.0, 7806.0, 4131.0, 2388.0, 1225.0, 737.0, 412.0, 224.0, 131.0, 81.0, 53.0, 33.0, 19.0, 11.0, 10.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.67578125, -4.53118896484375, -4.3865966796875, -4.24200439453125, -4.097412109375, -3.95281982421875, -3.8082275390625, -3.66363525390625, -3.51904296875, -3.37445068359375, -3.2298583984375, -3.08526611328125, -2.940673828125, -2.79608154296875, -2.6514892578125, -2.50689697265625, -2.3623046875, -2.21771240234375, -2.0731201171875, -1.92852783203125, -1.783935546875, -1.63934326171875, -1.4947509765625, -1.35015869140625, -1.20556640625, -1.06097412109375, -0.9163818359375, -0.77178955078125, -0.627197265625, -0.48260498046875, -0.3380126953125, -0.19342041015625, -0.048828125, 0.09576416015625, 0.2403564453125, 0.38494873046875, 0.529541015625, 0.67413330078125, 0.8187255859375, 0.96331787109375, 1.10791015625, 1.25250244140625, 1.3970947265625, 1.54168701171875, 1.686279296875, 1.83087158203125, 1.9754638671875, 2.12005615234375, 2.2646484375, 2.40924072265625, 2.5538330078125, 2.69842529296875, 2.843017578125, 2.98760986328125, 3.1322021484375, 3.27679443359375, 3.42138671875, 3.56597900390625, 3.7105712890625, 3.85516357421875, 3.999755859375, 4.14434814453125, 4.2889404296875, 4.43353271484375, 4.578125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 11.0, 14.0, 11.0, 9.0, 28.0, 14.0, 21.0, 20.0, 24.0, 25.0, 22.0, 23.0, 29.0, 23.0, 39.0, 26.0, 41.0, 40.0, 34.0, 1069.0, 36.0, 47.0, 38.0, 40.0, 31.0, 34.0, 27.0, 33.0, 24.0, 28.0, 20.0, 21.0, 17.0, 18.0, 13.0, 12.0, 11.0, 11.0, 7.0, 8.0, 5.0, 9.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.84375, -23.04052734375, -22.2373046875, -21.43408203125, -20.630859375, -19.82763671875, -19.0244140625, -18.22119140625, -17.41796875, -16.61474609375, -15.8115234375, -15.00830078125, -14.205078125, -13.40185546875, -12.5986328125, -11.79541015625, -10.9921875, -10.18896484375, -9.3857421875, -8.58251953125, -7.779296875, -6.97607421875, -6.1728515625, -5.36962890625, -4.56640625, -3.76318359375, -2.9599609375, -2.15673828125, -1.353515625, -0.55029296875, 0.2529296875, 1.05615234375, 1.859375, 2.66259765625, 3.4658203125, 4.26904296875, 5.072265625, 5.87548828125, 6.6787109375, 7.48193359375, 8.28515625, 9.08837890625, 9.8916015625, 10.69482421875, 11.498046875, 12.30126953125, 13.1044921875, 13.90771484375, 14.7109375, 15.51416015625, 16.3173828125, 17.12060546875, 17.923828125, 18.72705078125, 19.5302734375, 20.33349609375, 21.13671875, 21.93994140625, 22.7431640625, 23.54638671875, 24.349609375, 25.15283203125, 25.9560546875, 26.75927734375, 27.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 8.0, 8.0, 13.0, 17.0, 38.0, 45.0, 90.0, 119.0, 167.0, 204.0, 331.0, 510.0, 739.0, 1108.0, 1520.0, 2259.0, 3394.0, 4848.0, 7160.0, 10200.0, 14749.0, 21386.0, 31250.0, 44939.0, 65710.0, 95184.0, 128621.0, 1195652.0, 135511.0, 102049.0, 71631.0, 49300.0, 33685.0, 23248.0, 16190.0, 10930.0, 7661.0, 5272.0, 3658.0, 2475.0, 1722.0, 1100.0, 768.0, 523.0, 387.0, 259.0, 167.0, 109.0, 67.0, 54.0, 33.0, 22.0, 22.0, 15.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.341796875, -2.265289306640625, -2.18878173828125, -2.112274169921875, -2.0357666015625, -1.959259033203125, -1.88275146484375, -1.806243896484375, -1.729736328125, -1.653228759765625, -1.57672119140625, -1.500213623046875, -1.4237060546875, -1.347198486328125, -1.27069091796875, -1.194183349609375, -1.11767578125, -1.041168212890625, -0.96466064453125, -0.888153076171875, -0.8116455078125, -0.735137939453125, -0.65863037109375, -0.582122802734375, -0.505615234375, -0.429107666015625, -0.35260009765625, -0.276092529296875, -0.1995849609375, -0.123077392578125, -0.04656982421875, 0.029937744140625, 0.1064453125, 0.182952880859375, 0.25946044921875, 0.335968017578125, 0.4124755859375, 0.488983154296875, 0.56549072265625, 0.641998291015625, 0.718505859375, 0.795013427734375, 0.87152099609375, 0.948028564453125, 1.0245361328125, 1.101043701171875, 1.17755126953125, 1.254058837890625, 1.33056640625, 1.407073974609375, 1.48358154296875, 1.560089111328125, 1.6365966796875, 1.713104248046875, 1.78961181640625, 1.866119384765625, 1.942626953125, 2.019134521484375, 2.09564208984375, 2.172149658203125, 2.2486572265625, 2.325164794921875, 2.40167236328125, 2.478179931640625, 2.5546875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 7.0, 5.0, 8.0, 10.0, 11.0, 10.0, 15.0, 26.0, 29.0, 39.0, 44.0, 58.0, 69.0, 80.0, 71.0, 67.0, 72.0, 64.0, 56.0, 43.0, 28.0, 26.0, 17.0, 25.0, 18.0, 9.0, 7.0, 17.0, 1.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.050872802734375, -0.049353599548339844, -0.04783439636230469, -0.04631519317626953, -0.044795989990234375, -0.04327678680419922, -0.04175758361816406, -0.040238380432128906, -0.03871917724609375, -0.037199974060058594, -0.03568077087402344, -0.03416156768798828, -0.032642364501953125, -0.03112316131591797, -0.029603958129882812, -0.028084754943847656, -0.0265655517578125, -0.025046348571777344, -0.023527145385742188, -0.02200794219970703, -0.020488739013671875, -0.01896953582763672, -0.017450332641601562, -0.015931129455566406, -0.01441192626953125, -0.012892723083496094, -0.011373519897460938, -0.009854316711425781, -0.008335113525390625, -0.006815910339355469, -0.0052967071533203125, -0.0037775039672851562, -0.00225830078125, -0.0007390975952148438, 0.0007801055908203125, 0.0022993087768554688, 0.003818511962890625, 0.005337715148925781, 0.0068569183349609375, 0.008376121520996094, 0.00989532470703125, 0.011414527893066406, 0.012933731079101562, 0.014452934265136719, 0.015972137451171875, 0.01749134063720703, 0.019010543823242188, 0.020529747009277344, 0.0220489501953125, 0.023568153381347656, 0.025087356567382812, 0.02660655975341797, 0.028125762939453125, 0.02964496612548828, 0.031164169311523438, 0.032683372497558594, 0.03420257568359375, 0.035721778869628906, 0.03724098205566406, 0.03876018524169922, 0.040279388427734375, 0.04179859161376953, 0.04331779479980469, 0.044836997985839844, 0.046356201171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 2.0, 1.0, 11.0, 6.0, 18.0, 21.0, 27.0, 36.0, 40.0, 38.0, 76.0, 97.0, 124.0, 165.0, 284.0, 406.0, 679.0, 1273.0, 2739.0, 6623.0, 19371.0, 66218.0, 238722.0, 461205.0, 175671.0, 49705.0, 14599.0, 5248.0, 2248.0, 1116.0, 575.0, 361.0, 234.0, 120.0, 106.0, 91.0, 79.0, 48.0, 36.0, 31.0, 18.0, 17.0, 19.0, 10.0, 17.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.23150062561035156, -0.22362136840820312, -0.2157421112060547, -0.20786285400390625, -0.1999835968017578, -0.19210433959960938, -0.18422508239746094, -0.1763458251953125, -0.16846656799316406, -0.16058731079101562, -0.1527080535888672, -0.14482879638671875, -0.1369495391845703, -0.12907028198242188, -0.12119102478027344, -0.113311767578125, -0.10543251037597656, -0.09755325317382812, -0.08967399597167969, -0.08179473876953125, -0.07391548156738281, -0.06603622436523438, -0.05815696716308594, -0.0502777099609375, -0.04239845275878906, -0.034519195556640625, -0.026639938354492188, -0.01876068115234375, -0.010881423950195312, -0.003002166748046875, 0.0048770904541015625, 0.01275634765625, 0.020635604858398438, 0.028514862060546875, 0.03639411926269531, 0.04427337646484375, 0.05215263366699219, 0.060031890869140625, 0.06791114807128906, 0.0757904052734375, 0.08366966247558594, 0.09154891967773438, 0.09942817687988281, 0.10730743408203125, 0.11518669128417969, 0.12306594848632812, 0.13094520568847656, 0.138824462890625, 0.14670372009277344, 0.15458297729492188, 0.1624622344970703, 0.17034149169921875, 0.1782207489013672, 0.18610000610351562, 0.19397926330566406, 0.2018585205078125, 0.20973777770996094, 0.21761703491210938, 0.2254962921142578, 0.23337554931640625, 0.2412548065185547, 0.24913406372070312, 0.25701332092285156, 0.264892578125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 18.0, 44.0, 155.0, 248.0, 228.0, 129.0, 68.0, 35.0, 29.0, 12.0, 10.0, 3.0, 5.0, 9.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05374011769890785, -0.04865960776805878, -0.0435790978372097, -0.038498587906360626, -0.03341807797551155, -0.028337568044662476, -0.0232570581138134, -0.018176548182964325, -0.01309603825211525, -0.008015528321266174, -0.002935018390417099, 0.0021454915404319763, 0.007226001471281052, 0.012306511402130127, 0.017387021332979202, 0.022467531263828278, 0.027548041194677353, 0.03262855112552643, 0.037709061056375504, 0.04278957098722458, 0.047870080918073654, 0.05295059084892273, 0.058031100779771805, 0.06311161071062088, 0.06819212436676025, 0.07327263057231903, 0.0783531442284584, 0.08343365788459778, 0.08851416409015656, 0.09359467029571533, 0.0986751839518547, 0.10375569760799408, 0.10883620381355286, 0.11391671001911163, 0.11899722367525101, 0.12407773733139038, 0.12915824353694916, 0.13423874974250793, 0.1393192708492279, 0.14439977705478668, 0.14948028326034546, 0.15456078946590424, 0.159641295671463, 0.16472181677818298, 0.16980232298374176, 0.17488282918930054, 0.1799633502960205, 0.18504385650157928, 0.19012436270713806, 0.19520486891269684, 0.20028537511825562, 0.20536589622497559, 0.21044640243053436, 0.21552690863609314, 0.2206074297428131, 0.2256879359483719, 0.23076844215393066, 0.23584894835948944, 0.24092945456504822, 0.2460099756717682, 0.25109046697616577, 0.25617098808288574, 0.2612515091896057, 0.2663320004940033, 0.27141252160072327]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 6.0, 10.0, 14.0, 19.0, 10.0, 9.0, 22.0, 21.0, 23.0, 28.0, 34.0, 31.0, 38.0, 38.0, 36.0, 31.0, 50.0, 39.0, 49.0, 40.0, 37.0, 40.0, 40.0, 29.0, 31.0, 37.0, 35.0, 28.0, 22.0, 15.0, 29.0, 17.0, 17.0, 19.0, 8.0, 8.0, 9.0, 2.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.06254440546035767, -0.06078276038169861, -0.05902111902832985, -0.05725947767496109, -0.05549783259630203, -0.053736187517642975, -0.051974546164274216, -0.05021290481090546, -0.0484512597322464, -0.04668961465358734, -0.04492797330021858, -0.04316633194684982, -0.041404686868190765, -0.03964304178953171, -0.03788140043616295, -0.03611975908279419, -0.03435811400413513, -0.032596468925476074, -0.030834827572107315, -0.029073184356093407, -0.0273115411400795, -0.02554989792406559, -0.02378825470805168, -0.022026611492037773, -0.020264968276023865, -0.018503325060009956, -0.016741681843996048, -0.01498003862798214, -0.013218395411968231, -0.011456752195954323, -0.009695108979940414, -0.007933465763926506, -0.006171822547912598, -0.004410179331898689, -0.002648536115884781, -0.0008868928998708725, 0.0008747503161430359, 0.0026363935321569443, 0.004398036748170853, 0.006159679964184761, 0.00792132318019867, 0.009682966396212578, 0.011444609612226486, 0.013206252828240395, 0.014967896044254303, 0.01672953926026821, 0.01849118247628212, 0.020252825692296028, 0.022014468908309937, 0.023776112124323845, 0.025537755340337753, 0.02729939855635166, 0.02906104177236557, 0.03082268498837948, 0.03258432820439339, 0.034345969557762146, 0.036107614636421204, 0.03786925971508026, 0.03963090106844902, 0.04139254242181778, 0.04315418750047684, 0.044915832579135895, 0.046677473932504654, 0.04843911528587341, 0.05020076036453247]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 2.0, 7.0, 4.0, 9.0, 12.0, 9.0, 13.0, 8.0, 19.0, 19.0, 23.0, 20.0, 17.0, 24.0, 40.0, 25.0, 31.0, 51.0, 29.0, 35.0, 30.0, 41.0, 29.0, 46.0, 56.0, 33.0, 45.0, 31.0, 31.0, 40.0, 39.0, 13.0, 22.0, 19.0, 21.0, 15.0, 12.0, 9.0, 18.0, 7.0, 13.0, 4.0, 6.0, 5.0, 7.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.09375, -37.771484375, -36.44921875, -35.126953125, -33.8046875, -32.482421875, -31.16015625, -29.837890625, -28.515625, -27.193359375, -25.87109375, -24.548828125, -23.2265625, -21.904296875, -20.58203125, -19.259765625, -17.9375, -16.615234375, -15.29296875, -13.970703125, -12.6484375, -11.326171875, -10.00390625, -8.681640625, -7.359375, -6.037109375, -4.71484375, -3.392578125, -2.0703125, -0.748046875, 0.57421875, 1.896484375, 3.21875, 4.541015625, 5.86328125, 7.185546875, 8.5078125, 9.830078125, 11.15234375, 12.474609375, 13.796875, 15.119140625, 16.44140625, 17.763671875, 19.0859375, 20.408203125, 21.73046875, 23.052734375, 24.375, 25.697265625, 27.01953125, 28.341796875, 29.6640625, 30.986328125, 32.30859375, 33.630859375, 34.953125, 36.275390625, 37.59765625, 38.919921875, 40.2421875, 41.564453125, 42.88671875, 44.208984375, 45.53125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 2.0, 5.0, 2.0, 4.0, 8.0, 9.0, 7.0, 18.0, 11.0, 28.0, 32.0, 48.0, 59.0, 68.0, 105.0, 119.0, 190.0, 252.0, 378.0, 582.0, 886.0, 1392.0, 2632.0, 5519.0, 13063.0, 36342.0, 113747.0, 337116.0, 350781.0, 120586.0, 38402.0, 13480.0, 5702.0, 2680.0, 1501.0, 882.0, 551.0, 374.0, 251.0, 194.0, 138.0, 104.0, 63.0, 47.0, 43.0, 34.0, 33.0, 24.0, 14.0, 10.0, 10.0, 7.0, 8.0, 8.0, 6.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.66796875, -5.47918701171875, -5.2904052734375, -5.10162353515625, -4.912841796875, -4.72406005859375, -4.5352783203125, -4.34649658203125, -4.15771484375, -3.96893310546875, -3.7801513671875, -3.59136962890625, -3.402587890625, -3.21380615234375, -3.0250244140625, -2.83624267578125, -2.6474609375, -2.45867919921875, -2.2698974609375, -2.08111572265625, -1.892333984375, -1.70355224609375, -1.5147705078125, -1.32598876953125, -1.13720703125, -0.94842529296875, -0.7596435546875, -0.57086181640625, -0.382080078125, -0.19329833984375, -0.0045166015625, 0.18426513671875, 0.373046875, 0.56182861328125, 0.7506103515625, 0.93939208984375, 1.128173828125, 1.31695556640625, 1.5057373046875, 1.69451904296875, 1.88330078125, 2.07208251953125, 2.2608642578125, 2.44964599609375, 2.638427734375, 2.82720947265625, 3.0159912109375, 3.20477294921875, 3.3935546875, 3.58233642578125, 3.7711181640625, 3.95989990234375, 4.148681640625, 4.33746337890625, 4.5262451171875, 4.71502685546875, 4.90380859375, 5.09259033203125, 5.2813720703125, 5.47015380859375, 5.658935546875, 5.84771728515625, 6.0364990234375, 6.22528076171875, 6.4140625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 12.0, 13.0, 18.0, 27.0, 34.0, 46.0, 58.0, 54.0, 61.0, 71.0, 535.0, 1688.0, 79.0, 75.0, 60.0, 46.0, 46.0, 41.0, 18.0, 17.0, 13.0, 10.0, 10.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.25, -85.818359375, -82.38671875, -78.955078125, -75.5234375, -72.091796875, -68.66015625, -65.228515625, -61.796875, -58.365234375, -54.93359375, -51.501953125, -48.0703125, -44.638671875, -41.20703125, -37.775390625, -34.34375, -30.912109375, -27.48046875, -24.048828125, -20.6171875, -17.185546875, -13.75390625, -10.322265625, -6.890625, -3.458984375, -0.02734375, 3.404296875, 6.8359375, 10.267578125, 13.69921875, 17.130859375, 20.5625, 23.994140625, 27.42578125, 30.857421875, 34.2890625, 37.720703125, 41.15234375, 44.583984375, 48.015625, 51.447265625, 54.87890625, 58.310546875, 61.7421875, 65.173828125, 68.60546875, 72.037109375, 75.46875, 78.900390625, 82.33203125, 85.763671875, 89.1953125, 92.626953125, 96.05859375, 99.490234375, 102.921875, 106.353515625, 109.78515625, 113.216796875, 116.6484375, 120.080078125, 123.51171875, 126.943359375, 130.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 11.0, 8.0, 12.0, 21.0, 30.0, 42.0, 66.0, 110.0, 157.0, 239.0, 427.0, 796.0, 1726.0, 5848.0, 72782.0, 2939283.0, 112798.0, 7253.0, 1954.0, 947.0, 458.0, 267.0, 172.0, 104.0, 68.0, 36.0, 26.0, 19.0, 15.0, 15.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.58349609375, -17.0263671875, -16.46923828125, -15.912109375, -15.35498046875, -14.7978515625, -14.24072265625, -13.68359375, -13.12646484375, -12.5693359375, -12.01220703125, -11.455078125, -10.89794921875, -10.3408203125, -9.78369140625, -9.2265625, -8.66943359375, -8.1123046875, -7.55517578125, -6.998046875, -6.44091796875, -5.8837890625, -5.32666015625, -4.76953125, -4.21240234375, -3.6552734375, -3.09814453125, -2.541015625, -1.98388671875, -1.4267578125, -0.86962890625, -0.3125, 0.24462890625, 0.8017578125, 1.35888671875, 1.916015625, 2.47314453125, 3.0302734375, 3.58740234375, 4.14453125, 4.70166015625, 5.2587890625, 5.81591796875, 6.373046875, 6.93017578125, 7.4873046875, 8.04443359375, 8.6015625, 9.15869140625, 9.7158203125, 10.27294921875, 10.830078125, 11.38720703125, 11.9443359375, 12.50146484375, 13.05859375, 13.61572265625, 14.1728515625, 14.72998046875, 15.287109375, 15.84423828125, 16.4013671875, 16.95849609375, 17.515625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 12.0, 16.0, 35.0, 137.0, 249.0, 261.0, 159.0, 63.0, 33.0, 11.0, 7.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.87174987792969, -111.63179779052734, -105.391845703125, -99.15188598632812, -92.91193389892578, -86.67198181152344, -80.43202209472656, -74.19207000732422, -67.95211791992188, -61.71216583251953, -55.47220993041992, -49.23225402832031, -42.99230194091797, -36.752349853515625, -30.512393951416016, -24.272438049316406, -18.032485961914062, -11.792531967163086, -5.552577972412109, 0.6873760223388672, 6.927330017089844, 13.16728401184082, 19.407238006591797, 25.647193908691406, 31.88714599609375, 38.127098083496094, 44.3670539855957, 50.60700988769531, 56.846961975097656, 63.0869140625, 69.32687377929688, 75.56682586669922, 81.8067626953125, 88.04671478271484, 94.28666687011719, 100.52662658691406, 106.7665786743164, 113.00653076171875, 119.24649047851562, 125.48644256591797, 131.7263946533203, 137.9663543701172, 144.206298828125, 150.44625854492188, 156.68621826171875, 162.92616271972656, 169.16612243652344, 175.40606689453125, 181.64602661132812, 187.885986328125, 194.1259307861328, 200.3658905029297, 206.6058349609375, 212.84579467773438, 219.08575439453125, 225.32571411132812, 231.56565856933594, 237.8056182861328, 244.04556274414062, 250.2855224609375, 256.5254821777344, 262.76544189453125, 269.00537109375, 275.2453308105469, 281.48529052734375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 9.0, 21.0, 20.0, 19.0, 18.0, 27.0, 26.0, 32.0, 46.0, 53.0, 35.0, 50.0, 45.0, 53.0, 54.0, 42.0, 55.0, 42.0, 53.0, 41.0, 37.0, 35.0, 29.0, 31.0, 24.0, 10.0, 14.0, 11.0, 15.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.05052947998047, -83.86641693115234, -80.68231201171875, -77.49819946289062, -74.3140869140625, -71.12997436523438, -67.94586944580078, -64.76175689697266, -61.5776481628418, -58.39353942871094, -55.20942687988281, -52.02531814575195, -48.841209411621094, -45.65709686279297, -42.47298812866211, -39.28887939453125, -36.104766845703125, -32.920658111572266, -29.73654556274414, -26.55243682861328, -23.36832618713379, -20.184215545654297, -17.000106811523438, -13.815996170043945, -10.631885528564453, -7.447775363922119, -4.263665199279785, -1.0795555114746094, 2.104555130004883, 5.288665771484375, 8.472774505615234, 11.656885147094727, 14.84100341796875, 18.025114059448242, 21.209224700927734, 24.393333435058594, 27.577444076538086, 30.761554718017578, 33.94566345214844, 37.12977600097656, 40.31388473510742, 43.49799346923828, 46.682106018066406, 49.866214752197266, 53.050323486328125, 56.23443603515625, 59.41854476928711, 62.60265350341797, 65.7867660522461, 68.97087860107422, 72.15498352050781, 75.33909606933594, 78.52320861816406, 81.70732116699219, 84.89142608642578, 88.0755386352539, 91.2596435546875, 94.44375610351562, 97.62786102294922, 100.81197357177734, 103.99608612060547, 107.18019104003906, 110.36430358886719, 113.54841613769531, 116.73252868652344]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 6.0, 6.0, 13.0, 9.0, 17.0, 32.0, 37.0, 52.0, 89.0, 107.0, 186.0, 231.0, 335.0, 446.0, 578.0, 860.0, 1168.0, 1648.0, 2166.0, 3041.0, 3792.0, 1018168.0, 4059.0, 3133.0, 2297.0, 1674.0, 1190.0, 872.0, 652.0, 502.0, 346.0, 232.0, 169.0, 132.0, 85.0, 74.0, 51.0, 28.0, 22.0, 14.0, 10.0, 6.0, 9.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.715913772583008, -16.202951431274414, -15.68998908996582, -15.177027702331543, -14.66406536102295, -14.151103019714355, -13.638141632080078, -13.125179290771484, -12.61221694946289, -12.099254608154297, -11.586292266845703, -11.073330879211426, -10.560368537902832, -10.047406196594238, -9.534444808959961, -9.021482467651367, -8.508520126342773, -7.99555778503418, -7.482595920562744, -6.969634056091309, -6.456671714782715, -5.943709373474121, -5.4307475090026855, -4.91778564453125, -4.404823303222656, -3.8918612003326416, -3.378899097442627, -2.8659369945526123, -2.3529748916625977, -1.840012788772583, -1.3270506858825684, -0.8140885829925537, -0.30112457275390625, 0.2118375301361084, 0.724799633026123, 1.2377617359161377, 1.7507238388061523, 2.263685941696167, 2.7766480445861816, 3.2896101474761963, 3.802572250366211, 4.315534591674805, 4.82849645614624, 5.341458320617676, 5.8544206619262695, 6.367383003234863, 6.880344867706299, 7.393306732177734, 7.906269073486328, 8.419231414794922, 8.932193756103516, 9.445155143737793, 9.958117485046387, 10.47107982635498, 10.984041213989258, 11.497003555297852, 12.009965896606445, 12.522928237915039, 13.035890579223633, 13.54885196685791, 14.061814308166504, 14.574776649475098, 15.087738037109375, 15.600700378417969, 16.113662719726562]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 13.0, 13.0, 42.0, 45.0, 79.0, 220.0, 51462328.0, 279.0, 37.0, 23.0, 15.0, 10.0, 9.0, 14.0, 4.0, 6.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3950.024169921875, -3832.3740234375, -3714.723876953125, -3597.07373046875, -3479.423583984375, -3361.7734375, -3244.123291015625, -3126.47314453125, -3008.822998046875, -2891.1728515625, -2773.522705078125, -2655.87255859375, -2538.222412109375, -2420.572265625, -2302.922119140625, -2185.27197265625, -2067.621826171875, -1949.9716796875, -1832.321533203125, -1714.67138671875, -1597.021240234375, -1479.37109375, -1361.720947265625, -1244.07080078125, -1126.420654296875, -1008.7705078125, -891.120361328125, -773.47021484375, -655.820068359375, -538.169921875, -420.519775390625, -302.86962890625, -185.21923828125, -67.569091796875, 50.0810546875, 167.731201171875, 285.38134765625, 403.031494140625, 520.681640625, 638.331787109375, 755.98193359375, 873.632080078125, 991.2822265625, 1108.932373046875, 1226.58251953125, 1344.232666015625, 1461.8828125, 1579.532958984375, 1697.18310546875, 1814.833251953125, 1932.4833984375, 2050.133544921875, 2167.78369140625, 2285.433837890625, 2403.083984375, 2520.734130859375, 2638.38427734375, 2756.034423828125, 2873.6845703125, 2991.334716796875, 3108.98486328125, 3226.635009765625, 3344.28515625, 3461.935302734375, 3579.58544921875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [5.0, 2.0, 10.0, 13.0, 19.0, 20.0, 48.0, 44.0, 98.0, 102.0, 156.0, 250.0, 384.0, 635.0, 873.0, 1407.0, 1975.0, 2891.0, 4386.0, 6686.0, 10199.0, 15661.0, 24655.0, 37671.0, 57893.0, 89095.0, 135667.0, 203810.0, 294215.0, 415767.0, 3460216.0, 530213.0, 326457.0, 227738.0, 153931.0, 101321.0, 65161.0, 42226.0, 27323.0, 17923.0, 11706.0, 7735.0, 4873.0, 3273.0, 2217.0, 1495.0, 1012.0, 636.0, 456.0, 311.0, 179.0, 140.0, 114.0, 61.0, 40.0, 23.0, 10.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 4.0], "bins": [-0.98876953125, -0.9565048217773438, -0.9242401123046875, -0.8919754028320312, -0.859710693359375, -0.8274459838867188, -0.7951812744140625, -0.7629165649414062, -0.73065185546875, -0.6983871459960938, -0.6661224365234375, -0.6338577270507812, -0.601593017578125, -0.5693283081054688, -0.5370635986328125, -0.5047988891601562, -0.4725341796875, -0.44026947021484375, -0.4080047607421875, -0.37574005126953125, -0.343475341796875, -0.31121063232421875, -0.2789459228515625, -0.24668121337890625, -0.21441650390625, -0.18215179443359375, -0.1498870849609375, -0.11762237548828125, -0.085357666015625, -0.05309295654296875, -0.0208282470703125, 0.01143646240234375, 0.043701171875, 0.07596588134765625, 0.1082305908203125, 0.14049530029296875, 0.172760009765625, 0.20502471923828125, 0.2372894287109375, 0.26955413818359375, 0.30181884765625, 0.33408355712890625, 0.3663482666015625, 0.39861297607421875, 0.430877685546875, 0.46314239501953125, 0.4954071044921875, 0.5276718139648438, 0.5599365234375, 0.5922012329101562, 0.6244659423828125, 0.6567306518554688, 0.688995361328125, 0.7212600708007812, 0.7535247802734375, 0.7857894897460938, 0.81805419921875, 0.8503189086914062, 0.8825836181640625, 0.9148483276367188, 0.947113037109375, 0.9793777465820312, 1.0116424560546875, 1.0439071655273438, 1.076171875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 1.0, 5.0, 9.0, 7.0, 10.0, 8.0, 17.0, 16.0, 19.0, 22.0, 33.0, 32.0, 32.0, 31.0, 28.0, 37.0, 33.0, 43.0, 50.0, 235.0, 854.0, 58.0, 32.0, 33.0, 25.0, 38.0, 42.0, 37.0, 33.0, 30.0, 22.0, 26.0, 21.0, 18.0, 19.0, 13.0, 11.0, 7.0, 9.0, 4.0, 3.0, 3.0, 7.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8046875, -10.4908447265625, -10.177001953125, -9.8631591796875, -9.54931640625, -9.2354736328125, -8.921630859375, -8.6077880859375, -8.2939453125, -7.9801025390625, -7.666259765625, -7.3524169921875, -7.03857421875, -6.7247314453125, -6.410888671875, -6.0970458984375, -5.783203125, -5.4693603515625, -5.155517578125, -4.8416748046875, -4.52783203125, -4.2139892578125, -3.900146484375, -3.5863037109375, -3.2724609375, -2.9586181640625, -2.644775390625, -2.3309326171875, -2.01708984375, -1.7032470703125, -1.389404296875, -1.0755615234375, -0.76171875, -0.4478759765625, -0.134033203125, 0.1798095703125, 0.49365234375, 0.8074951171875, 1.121337890625, 1.4351806640625, 1.7490234375, 2.0628662109375, 2.376708984375, 2.6905517578125, 3.00439453125, 3.3182373046875, 3.632080078125, 3.9459228515625, 4.259765625, 4.5736083984375, 4.887451171875, 5.2012939453125, 5.51513671875, 5.8289794921875, 6.142822265625, 6.4566650390625, 6.7705078125, 7.0843505859375, 7.398193359375, 7.7120361328125, 8.02587890625, 8.3397216796875, 8.653564453125, 8.9674072265625, 9.28125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 11.0, 13.0, 18.0, 30.0, 45.0, 55.0, 77.0, 132.0, 171.0, 234.0, 333.0, 531.0, 756.0, 1176.0, 1654.0, 2509.0, 3712.0, 5889.0, 9277.0, 14619.0, 23564.0, 40509.0, 71329.0, 127116.0, 230793.0, 412105.0, 1726458.0, 2624920.0, 430468.0, 241871.0, 133743.0, 74929.0, 43402.0, 25458.0, 15925.0, 9797.0, 6101.0, 3845.0, 2541.0, 1684.0, 1180.0, 799.0, 539.0, 373.0, 242.0, 135.0, 119.0, 80.0, 62.0, 39.0, 26.0, 20.0, 16.0, 4.0, 6.0, 1.0, 1.0, 3.0], "bins": [-1.58203125, -1.534149169921875, -1.48626708984375, -1.438385009765625, -1.3905029296875, -1.342620849609375, -1.29473876953125, -1.246856689453125, -1.198974609375, -1.151092529296875, -1.10321044921875, -1.055328369140625, -1.0074462890625, -0.959564208984375, -0.91168212890625, -0.863800048828125, -0.81591796875, -0.768035888671875, -0.72015380859375, -0.672271728515625, -0.6243896484375, -0.576507568359375, -0.52862548828125, -0.480743408203125, -0.432861328125, -0.384979248046875, -0.33709716796875, -0.289215087890625, -0.2413330078125, -0.193450927734375, -0.14556884765625, -0.097686767578125, -0.0498046875, -0.001922607421875, 0.04595947265625, 0.093841552734375, 0.1417236328125, 0.189605712890625, 0.23748779296875, 0.285369873046875, 0.333251953125, 0.381134033203125, 0.42901611328125, 0.476898193359375, 0.5247802734375, 0.572662353515625, 0.62054443359375, 0.668426513671875, 0.71630859375, 0.764190673828125, 0.81207275390625, 0.859954833984375, 0.9078369140625, 0.955718994140625, 1.00360107421875, 1.051483154296875, 1.099365234375, 1.147247314453125, 1.19512939453125, 1.243011474609375, 1.2908935546875, 1.338775634765625, 1.38665771484375, 1.434539794921875, 1.482421875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 12.0, 15.0, 12.0, 22.0, 18.0, 23.0, 30.0, 27.0, 33.0, 27.0, 43.0, 43.0, 33.0, 64.0, 139.0, 915.0, 94.0, 38.0, 39.0, 43.0, 39.0, 44.0, 40.0, 45.0, 29.0, 35.0, 28.0, 22.0, 17.0, 10.0, 6.0, 4.0, 4.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5546875, -8.266845703125, -7.97900390625, -7.691162109375, -7.4033203125, -7.115478515625, -6.82763671875, -6.539794921875, -6.251953125, -5.964111328125, -5.67626953125, -5.388427734375, -5.1005859375, -4.812744140625, -4.52490234375, -4.237060546875, -3.94921875, -3.661376953125, -3.37353515625, -3.085693359375, -2.7978515625, -2.510009765625, -2.22216796875, -1.934326171875, -1.646484375, -1.358642578125, -1.07080078125, -0.782958984375, -0.4951171875, -0.207275390625, 0.08056640625, 0.368408203125, 0.65625, 0.944091796875, 1.23193359375, 1.519775390625, 1.8076171875, 2.095458984375, 2.38330078125, 2.671142578125, 2.958984375, 3.246826171875, 3.53466796875, 3.822509765625, 4.1103515625, 4.398193359375, 4.68603515625, 4.973876953125, 5.26171875, 5.549560546875, 5.83740234375, 6.125244140625, 6.4130859375, 6.700927734375, 6.98876953125, 7.276611328125, 7.564453125, 7.852294921875, 8.14013671875, 8.427978515625, 8.7158203125, 9.003662109375, 9.29150390625, 9.579345703125, 9.8671875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 13.0, 18.0, 31.0, 48.0, 56.0, 119.0, 170.0, 297.0, 503.0, 852.0, 1556.0, 3234.0, 7772.0, 27150.0, 209948.0, 5960213.0, 57262.0, 12772.0, 4666.0, 2126.0, 1102.0, 557.0, 366.0, 191.0, 160.0, 92.0, 56.0, 35.0, 24.0, 12.0, 8.0, 7.0, 1.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.390625, -12.961669921875, -12.53271484375, -12.103759765625, -11.6748046875, -11.245849609375, -10.81689453125, -10.387939453125, -9.958984375, -9.530029296875, -9.10107421875, -8.672119140625, -8.2431640625, -7.814208984375, -7.38525390625, -6.956298828125, -6.52734375, -6.098388671875, -5.66943359375, -5.240478515625, -4.8115234375, -4.382568359375, -3.95361328125, -3.524658203125, -3.095703125, -2.666748046875, -2.23779296875, -1.808837890625, -1.3798828125, -0.950927734375, -0.52197265625, -0.093017578125, 0.3359375, 0.764892578125, 1.19384765625, 1.622802734375, 2.0517578125, 2.480712890625, 2.90966796875, 3.338623046875, 3.767578125, 4.196533203125, 4.62548828125, 5.054443359375, 5.4833984375, 5.912353515625, 6.34130859375, 6.770263671875, 7.19921875, 7.628173828125, 8.05712890625, 8.486083984375, 8.9150390625, 9.343994140625, 9.77294921875, 10.201904296875, 10.630859375, 11.059814453125, 11.48876953125, 11.917724609375, 12.3466796875, 12.775634765625, 13.20458984375, 13.633544921875, 14.0625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 8.0, 5.0, 9.0, 14.0, 17.0, 16.0, 26.0, 32.0, 34.0, 40.0, 36.0, 41.0, 37.0, 46.0, 62.0, 238.0, 856.0, 74.0, 41.0, 41.0, 52.0, 38.0, 45.0, 31.0, 33.0, 24.0, 19.0, 18.0, 15.0, 10.0, 11.0, 8.0, 7.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.8125, -8.55670166015625, -8.3009033203125, -8.04510498046875, -7.789306640625, -7.53350830078125, -7.2777099609375, -7.02191162109375, -6.76611328125, -6.51031494140625, -6.2545166015625, -5.99871826171875, -5.742919921875, -5.48712158203125, -5.2313232421875, -4.97552490234375, -4.7197265625, -4.46392822265625, -4.2081298828125, -3.95233154296875, -3.696533203125, -3.44073486328125, -3.1849365234375, -2.92913818359375, -2.67333984375, -2.41754150390625, -2.1617431640625, -1.90594482421875, -1.650146484375, -1.39434814453125, -1.1385498046875, -0.88275146484375, -0.626953125, -0.37115478515625, -0.1153564453125, 0.14044189453125, 0.396240234375, 0.65203857421875, 0.9078369140625, 1.16363525390625, 1.41943359375, 1.67523193359375, 1.9310302734375, 2.18682861328125, 2.442626953125, 2.69842529296875, 2.9542236328125, 3.21002197265625, 3.4658203125, 3.72161865234375, 3.9774169921875, 4.23321533203125, 4.489013671875, 4.74481201171875, 5.0006103515625, 5.25640869140625, 5.51220703125, 5.76800537109375, 6.0238037109375, 6.27960205078125, 6.535400390625, 6.79119873046875, 7.0469970703125, 7.30279541015625, 7.55859375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 15.0, 27.0, 105.0, 505.0, 295.0, 45.0, 10.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.380470275878906, -35.396690368652344, -33.41291046142578, -31.429128646850586, -29.44534683227539, -27.461566925048828, -25.477787017822266, -23.494007110595703, -21.510225296020508, -19.526445388793945, -17.54266357421875, -15.558883666992188, -13.575102806091309, -11.59132194519043, -9.607542037963867, -7.623761177062988, -5.639980316162109, -3.6561996936798096, -1.6724190711975098, 0.31136131286621094, 2.29514217376709, 4.278923034667969, 6.262702941894531, 8.24648380279541, 10.230264663696289, 12.214045524597168, 14.197826385498047, 16.18160629272461, 18.165386199951172, 20.149168014526367, 22.13294792175293, 24.116729736328125, 26.100509643554688, 28.08428955078125, 30.068071365356445, 32.051849365234375, 34.0356330871582, 36.019412994384766, 38.00319290161133, 39.98697280883789, 41.97075653076172, 43.95453643798828, 45.938316345214844, 47.922096252441406, 49.905879974365234, 51.8896598815918, 53.87343978881836, 55.85721969604492, 57.840999603271484, 59.82477951049805, 61.80855941772461, 63.79234313964844, 65.776123046875, 67.75990295410156, 69.74368286132812, 71.72746276855469, 73.71124267578125, 75.69502258300781, 77.67880249023438, 79.66258239746094, 81.6463623046875, 83.63014221191406, 85.61392211914062, 87.59770965576172, 89.58148956298828]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 5.0, 7.0, 10.0, 12.0, 17.0, 14.0, 39.0, 37.0, 54.0, 76.0, 76.0, 109.0, 89.0, 86.0, 68.0, 86.0, 54.0, 44.0, 21.0, 29.0, 15.0, 12.0, 14.0, 5.0, 6.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.823284149169922, -26.987491607666016, -26.151697158813477, -25.31590461730957, -24.48011016845703, -23.644317626953125, -22.80852508544922, -21.972732543945312, -21.136938095092773, -20.301145553588867, -19.465351104736328, -18.629558563232422, -17.793766021728516, -16.957971572875977, -16.12217903137207, -15.286385536193848, -14.450592041015625, -13.614798545837402, -12.77900505065918, -11.943212509155273, -11.10741901397705, -10.271625518798828, -9.435832977294922, -8.6000394821167, -7.764245986938477, -6.928452491760254, -6.0926594734191895, -5.256866455078125, -4.421072959899902, -3.5852794647216797, -2.7494864463806152, -1.9136934280395508, -1.0778999328613281, -0.24210667610168457, 0.593686580657959, 1.4294798374176025, 2.265273094177246, 3.1010665893554688, 3.936859607696533, 4.772652626037598, 5.60844612121582, 6.444239616394043, 7.280032634735107, 8.115825653076172, 8.951619148254395, 9.787412643432617, 10.623205184936523, 11.458998680114746, 12.294792175292969, 13.130585670471191, 13.966379165649414, 14.80217170715332, 15.637965202331543, 16.473758697509766, 17.309551239013672, 18.145343780517578, 18.981138229370117, 19.816930770874023, 20.652725219726562, 21.48851776123047, 22.324310302734375, 23.160104751586914, 23.99589729309082, 24.83169174194336, 25.667484283447266]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 8.0, 21.0, 15.0, 30.0, 36.0, 48.0, 85.0, 107.0, 160.0, 226.0, 334.0, 488.0, 843.0, 1529.0, 2899.0, 6189.0, 19250.0, 267553.0, 3848261.0, 28294.0, 8487.0, 3791.0, 1978.0, 1137.0, 755.0, 526.0, 341.0, 227.0, 165.0, 132.0, 86.0, 74.0, 46.0, 47.0, 25.0, 18.0, 14.0, 10.0, 11.0, 4.0, 6.0, 9.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.36572265625, -0.3527069091796875, -0.339691162109375, -0.3266754150390625, -0.31365966796875, -0.3006439208984375, -0.287628173828125, -0.2746124267578125, -0.2615966796875, -0.2485809326171875, -0.235565185546875, -0.2225494384765625, -0.20953369140625, -0.1965179443359375, -0.183502197265625, -0.1704864501953125, -0.157470703125, -0.1444549560546875, -0.131439208984375, -0.1184234619140625, -0.10540771484375, -0.0923919677734375, -0.079376220703125, -0.0663604736328125, -0.0533447265625, -0.0403289794921875, -0.027313232421875, -0.0142974853515625, -0.00128173828125, 0.0117340087890625, 0.024749755859375, 0.0377655029296875, 0.05078125, 0.0637969970703125, 0.076812744140625, 0.0898284912109375, 0.10284423828125, 0.1158599853515625, 0.128875732421875, 0.1418914794921875, 0.1549072265625, 0.1679229736328125, 0.180938720703125, 0.1939544677734375, 0.20697021484375, 0.2199859619140625, 0.233001708984375, 0.2460174560546875, 0.259033203125, 0.2720489501953125, 0.285064697265625, 0.2980804443359375, 0.31109619140625, 0.3241119384765625, 0.337127685546875, 0.3501434326171875, 0.3631591796875, 0.3761749267578125, 0.389190673828125, 0.4022064208984375, 0.41522216796875, 0.4282379150390625, 0.441253662109375, 0.4542694091796875, 0.46728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 9.0, 10.0, 7.0, 10.0, 19.0, 19.0, 215.0, 586.0, 15.0, 15.0, 10.0, 12.0, 12.0, 7.0, 2.0, 5.0, 4.0, 4.0, 2.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08587646484375, -0.08260536193847656, -0.07933425903320312, -0.07606315612792969, -0.07279205322265625, -0.06952095031738281, -0.06624984741210938, -0.06297874450683594, -0.0597076416015625, -0.05643653869628906, -0.053165435791015625, -0.04989433288574219, -0.04662322998046875, -0.04335212707519531, -0.040081024169921875, -0.03680992126464844, -0.033538818359375, -0.030267715454101562, -0.026996612548828125, -0.023725509643554688, -0.02045440673828125, -0.017183303833007812, -0.013912200927734375, -0.010641098022460938, -0.0073699951171875, -0.0040988922119140625, -0.000827789306640625, 0.0024433135986328125, 0.00571441650390625, 0.008985519409179688, 0.012256622314453125, 0.015527725219726562, 0.018798828125, 0.022069931030273438, 0.025341033935546875, 0.028612136840820312, 0.03188323974609375, 0.03515434265136719, 0.038425445556640625, 0.04169654846191406, 0.0449676513671875, 0.04823875427246094, 0.051509857177734375, 0.05478096008300781, 0.05805206298828125, 0.06132316589355469, 0.06459426879882812, 0.06786537170410156, 0.071136474609375, 0.07440757751464844, 0.07767868041992188, 0.08094978332519531, 0.08422088623046875, 0.08749198913574219, 0.09076309204101562, 0.09403419494628906, 0.0973052978515625, 0.10057640075683594, 0.10384750366210938, 0.10711860656738281, 0.11038970947265625, 0.11366081237792969, 0.11693191528320312, 0.12020301818847656, 0.12347412109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 7.0, 9.0, 16.0, 23.0, 22.0, 39.0, 54.0, 85.0, 118.0, 218.0, 338.0, 621.0, 1319.0, 2945.0, 7330.0, 22733.0, 113413.0, 3676197.0, 315887.0, 34448.0, 10277.0, 4192.0, 1839.0, 882.0, 539.0, 277.0, 165.0, 97.0, 47.0, 39.0, 33.0, 16.0, 9.0, 7.0, 8.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.32373046875, -0.31317901611328125, -0.3026275634765625, -0.29207611083984375, -0.281524658203125, -0.27097320556640625, -0.2604217529296875, -0.24987030029296875, -0.23931884765625, -0.22876739501953125, -0.2182159423828125, -0.20766448974609375, -0.197113037109375, -0.18656158447265625, -0.1760101318359375, -0.16545867919921875, -0.1549072265625, -0.14435577392578125, -0.1338043212890625, -0.12325286865234375, -0.112701416015625, -0.10214996337890625, -0.0915985107421875, -0.08104705810546875, -0.07049560546875, -0.05994415283203125, -0.0493927001953125, -0.03884124755859375, -0.028289794921875, -0.01773834228515625, -0.0071868896484375, 0.00336456298828125, 0.013916015625, 0.02446746826171875, 0.0350189208984375, 0.04557037353515625, 0.056121826171875, 0.06667327880859375, 0.0772247314453125, 0.08777618408203125, 0.09832763671875, 0.10887908935546875, 0.1194305419921875, 0.12998199462890625, 0.140533447265625, 0.15108489990234375, 0.1616363525390625, 0.17218780517578125, 0.1827392578125, 0.19329071044921875, 0.2038421630859375, 0.21439361572265625, 0.224945068359375, 0.23549652099609375, 0.2460479736328125, 0.25659942626953125, 0.26715087890625, 0.27770233154296875, 0.2882537841796875, 0.29880523681640625, 0.309356689453125, 0.31990814208984375, 0.3304595947265625, 0.34101104736328125, 0.3515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 11.0, 16.0, 20.0, 23.0, 23.0, 34.0, 68.0, 145.0, 320.0, 1486.0, 1294.0, 295.0, 136.0, 60.0, 35.0, 22.0, 20.0, 7.0, 4.0, 7.0, 4.0, 6.0, 3.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.161865234375, -0.15723419189453125, -0.1526031494140625, -0.14797210693359375, -0.143341064453125, -0.13871002197265625, -0.1340789794921875, -0.12944793701171875, -0.12481689453125, -0.12018585205078125, -0.1155548095703125, -0.11092376708984375, -0.106292724609375, -0.10166168212890625, -0.0970306396484375, -0.09239959716796875, -0.0877685546875, -0.08313751220703125, -0.0785064697265625, -0.07387542724609375, -0.069244384765625, -0.06461334228515625, -0.0599822998046875, -0.05535125732421875, -0.05072021484375, -0.04608917236328125, -0.0414581298828125, -0.03682708740234375, -0.032196044921875, -0.02756500244140625, -0.0229339599609375, -0.01830291748046875, -0.013671875, -0.00904083251953125, -0.0044097900390625, 0.00022125244140625, 0.004852294921875, 0.00948333740234375, 0.0141143798828125, 0.01874542236328125, 0.02337646484375, 0.02800750732421875, 0.0326385498046875, 0.03726959228515625, 0.041900634765625, 0.04653167724609375, 0.0511627197265625, 0.05579376220703125, 0.0604248046875, 0.06505584716796875, 0.0696868896484375, 0.07431793212890625, 0.078948974609375, 0.08358001708984375, 0.0882110595703125, 0.09284210205078125, 0.09747314453125, 0.10210418701171875, 0.1067352294921875, 0.11136627197265625, 0.115997314453125, 0.12062835693359375, 0.1252593994140625, 0.12989044189453125, 0.134521484375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 13.0, 40.0, 212.0, 568.0, 139.0, 26.0, 7.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4585137367248535, -2.405585527420044, -2.3526575565338135, -2.299729347229004, -2.2468013763427734, -2.193873167037964, -2.1409449577331543, -2.088016986846924, -2.0350887775421143, -1.9821606874465942, -1.9292325973510742, -1.8763043880462646, -1.8233762979507446, -1.7704482078552246, -1.7175201177597046, -1.6645920276641846, -1.6116639375686646, -1.5587358474731445, -1.5058077573776245, -1.4528796672821045, -1.399951457977295, -1.347023367881775, -1.2940952777862549, -1.2411671876907349, -1.1882390975952148, -1.1353110074996948, -1.0823829174041748, -1.0294547080993652, -0.9765266180038452, -0.9235985279083252, -0.8706704378128052, -0.8177423477172852, -0.764814019203186, -0.711885929107666, -0.6589577794075012, -0.6060296893119812, -0.5531015396118164, -0.5001734495162964, -0.44724535942077637, -0.39431723952293396, -0.34138911962509155, -0.28846099972724915, -0.23553289473056793, -0.18260478973388672, -0.1296766698360443, -0.0767485499382019, -0.023820459842681885, 0.029107660055160522, 0.08203577995300293, 0.13496389985084534, 0.18789200484752655, 0.24082010984420776, 0.29374822974205017, 0.3466763496398926, 0.3996044397354126, 0.452532559633255, 0.5054606795310974, 0.5583887696266174, 0.6113169193267822, 0.6642450094223022, 0.7171730995178223, 0.7701012492179871, 0.8230293393135071, 0.8759574890136719, 0.9288855791091919]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 2.0, 4.0, 7.0, 6.0, 7.0, 9.0, 8.0, 22.0, 15.0, 28.0, 28.0, 48.0, 33.0, 43.0, 63.0, 66.0, 67.0, 62.0, 60.0, 72.0, 61.0, 61.0, 56.0, 33.0, 25.0, 21.0, 21.0, 16.0, 14.0, 6.0, 9.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4421434998512268, -0.42885932326316833, -0.41557517647743225, -0.4022909998893738, -0.3890068233013153, -0.37572264671325684, -0.36243849992752075, -0.3491543233394623, -0.3358701467514038, -0.32258597016334534, -0.30930182337760925, -0.2960176467895508, -0.2827334702014923, -0.26944929361343384, -0.25616514682769775, -0.24288097023963928, -0.2295968234539032, -0.21631266176700592, -0.20302848517894745, -0.18974432349205017, -0.1764601469039917, -0.16317598521709442, -0.14989182353019714, -0.13660764694213867, -0.1233234852552414, -0.11003931611776352, -0.09675514698028564, -0.08347098529338837, -0.07018681615591049, -0.05690264701843262, -0.04361848533153534, -0.030334316194057465, -0.01705014705657959, -0.0037659797817468643, 0.009518187493085861, 0.022802352905273438, 0.03608652204275131, 0.04937069118022919, 0.06265485286712646, 0.07593902200460434, 0.08922319114208221, 0.10250736027956009, 0.11579152941703796, 0.12907569110393524, 0.14235985279083252, 0.155644029378891, 0.16892819106578827, 0.18221235275268555, 0.19549652934074402, 0.2087806910276413, 0.22206486761569977, 0.23534902930259705, 0.24863320589065552, 0.2619173526763916, 0.2752015292644501, 0.28848570585250854, 0.30176985263824463, 0.3150540292263031, 0.3283381760120392, 0.34162235260009766, 0.35490652918815613, 0.3681907057762146, 0.3814748525619507, 0.39475902915000916, 0.4080432057380676]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 12.0, 22.0, 39.0, 49.0, 79.0, 113.0, 171.0, 259.0, 457.0, 786.0, 1318.0, 2156.0, 3820.0, 7611.0, 15885.0, 41856.0, 888592.0, 49255.0, 17633.0, 8203.0, 4316.0, 2347.0, 1320.0, 809.0, 510.0, 330.0, 220.0, 126.0, 77.0, 42.0, 37.0, 21.0, 25.0, 14.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61962890625, -0.6016998291015625, -0.583770751953125, -0.5658416748046875, -0.54791259765625, -0.5299835205078125, -0.512054443359375, -0.4941253662109375, -0.4761962890625, -0.4582672119140625, -0.440338134765625, -0.4224090576171875, -0.40447998046875, -0.3865509033203125, -0.368621826171875, -0.3506927490234375, -0.332763671875, -0.3148345947265625, -0.296905517578125, -0.2789764404296875, -0.26104736328125, -0.2431182861328125, -0.225189208984375, -0.2072601318359375, -0.1893310546875, -0.1714019775390625, -0.153472900390625, -0.1355438232421875, -0.11761474609375, -0.0996856689453125, -0.081756591796875, -0.0638275146484375, -0.0458984375, -0.0279693603515625, -0.010040283203125, 0.0078887939453125, 0.02581787109375, 0.0437469482421875, 0.061676025390625, 0.0796051025390625, 0.0975341796875, 0.1154632568359375, 0.133392333984375, 0.1513214111328125, 0.16925048828125, 0.1871795654296875, 0.205108642578125, 0.2230377197265625, 0.240966796875, 0.2588958740234375, 0.276824951171875, 0.2947540283203125, 0.31268310546875, 0.3306121826171875, 0.348541259765625, 0.3664703369140625, 0.3843994140625, 0.4023284912109375, 0.420257568359375, 0.4381866455078125, 0.45611572265625, 0.4740447998046875, 0.491973876953125, 0.5099029541015625, 0.52783203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 6.0, 5.0, 9.0, 11.0, 14.0, 14.0, 15.0, 106.0, 572.0, 140.0, 16.0, 18.0, 7.0, 6.0, 11.0, 6.0, 5.0, 9.0, 2.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.07566452026367188, -0.07247161865234375, -0.06927871704101562, -0.0660858154296875, -0.06289291381835938, -0.05970001220703125, -0.056507110595703125, -0.053314208984375, -0.050121307373046875, -0.04692840576171875, -0.043735504150390625, -0.0405426025390625, -0.037349700927734375, -0.03415679931640625, -0.030963897705078125, -0.02777099609375, -0.024578094482421875, -0.02138519287109375, -0.018192291259765625, -0.0149993896484375, -0.011806488037109375, -0.00861358642578125, -0.005420684814453125, -0.002227783203125, 0.000965118408203125, 0.00415802001953125, 0.007350921630859375, 0.0105438232421875, 0.013736724853515625, 0.01692962646484375, 0.020122528076171875, 0.0233154296875, 0.026508331298828125, 0.02970123291015625, 0.032894134521484375, 0.0360870361328125, 0.039279937744140625, 0.04247283935546875, 0.045665740966796875, 0.048858642578125, 0.052051544189453125, 0.05524444580078125, 0.058437347412109375, 0.0616302490234375, 0.06482315063476562, 0.06801605224609375, 0.07120895385742188, 0.07440185546875, 0.07759475708007812, 0.08078765869140625, 0.08398056030273438, 0.0871734619140625, 0.09036636352539062, 0.09355926513671875, 0.09675216674804688, 0.099945068359375, 0.10313796997070312, 0.10633087158203125, 0.10952377319335938, 0.1127166748046875, 0.11590957641601562, 0.11910247802734375, 0.12229537963867188, 0.12548828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 12.0, 22.0, 21.0, 50.0, 62.0, 124.0, 173.0, 348.0, 554.0, 1234.0, 3098.0, 9634.0, 43561.0, 313602.0, 570693.0, 82133.0, 15344.0, 4404.0, 1670.0, 772.0, 386.0, 217.0, 160.0, 93.0, 46.0, 37.0, 24.0, 17.0, 11.0, 13.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43603515625, -0.42108917236328125, -0.4061431884765625, -0.39119720458984375, -0.376251220703125, -0.36130523681640625, -0.3463592529296875, -0.33141326904296875, -0.31646728515625, -0.30152130126953125, -0.2865753173828125, -0.27162933349609375, -0.256683349609375, -0.24173736572265625, -0.2267913818359375, -0.21184539794921875, -0.1968994140625, -0.18195343017578125, -0.1670074462890625, -0.15206146240234375, -0.137115478515625, -0.12216949462890625, -0.1072235107421875, -0.09227752685546875, -0.07733154296875, -0.06238555908203125, -0.0474395751953125, -0.03249359130859375, -0.017547607421875, -0.00260162353515625, 0.0123443603515625, 0.02729034423828125, 0.042236328125, 0.05718231201171875, 0.0721282958984375, 0.08707427978515625, 0.102020263671875, 0.11696624755859375, 0.1319122314453125, 0.14685821533203125, 0.16180419921875, 0.17675018310546875, 0.1916961669921875, 0.20664215087890625, 0.221588134765625, 0.23653411865234375, 0.2514801025390625, 0.26642608642578125, 0.2813720703125, 0.29631805419921875, 0.3112640380859375, 0.32621002197265625, 0.341156005859375, 0.35610198974609375, 0.3710479736328125, 0.38599395751953125, 0.40093994140625, 0.41588592529296875, 0.4308319091796875, 0.44577789306640625, 0.460723876953125, 0.47566986083984375, 0.4906158447265625, 0.5055618286132812, 0.5205078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 8.0, 3.0, 6.0, 6.0, 9.0, 11.0, 11.0, 19.0, 18.0, 27.0, 16.0, 28.0, 30.0, 28.0, 36.0, 25.0, 35.0, 29.0, 38.0, 36.0, 46.0, 35.0, 64.0, 36.0, 54.0, 34.0, 32.0, 38.0, 26.0, 45.0, 31.0, 20.0, 14.0, 21.0, 17.0, 11.0, 6.0, 14.0, 16.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298583984375, -0.28871917724609375, -0.2788543701171875, -0.26898956298828125, -0.259124755859375, -0.24925994873046875, -0.2393951416015625, -0.22953033447265625, -0.21966552734375, -0.20980072021484375, -0.1999359130859375, -0.19007110595703125, -0.180206298828125, -0.17034149169921875, -0.1604766845703125, -0.15061187744140625, -0.1407470703125, -0.13088226318359375, -0.1210174560546875, -0.11115264892578125, -0.101287841796875, -0.09142303466796875, -0.0815582275390625, -0.07169342041015625, -0.06182861328125, -0.05196380615234375, -0.0420989990234375, -0.03223419189453125, -0.022369384765625, -0.01250457763671875, -0.0026397705078125, 0.00722503662109375, 0.01708984375, 0.02695465087890625, 0.0368194580078125, 0.04668426513671875, 0.056549072265625, 0.06641387939453125, 0.0762786865234375, 0.08614349365234375, 0.09600830078125, 0.10587310791015625, 0.1157379150390625, 0.12560272216796875, 0.135467529296875, 0.14533233642578125, 0.1551971435546875, 0.16506195068359375, 0.1749267578125, 0.18479156494140625, 0.1946563720703125, 0.20452117919921875, 0.214385986328125, 0.22425079345703125, 0.2341156005859375, 0.24398040771484375, 0.25384521484375, 0.26371002197265625, 0.2735748291015625, 0.28343963623046875, 0.293304443359375, 0.30316925048828125, 0.3130340576171875, 0.32289886474609375, 0.332763671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 10.0, 13.0, 25.0, 28.0, 50.0, 95.0, 141.0, 270.0, 535.0, 1328.0, 4437.0, 30374.0, 951660.0, 50990.0, 5679.0, 1549.0, 604.0, 318.0, 168.0, 92.0, 50.0, 35.0, 29.0, 11.0, 13.0, 5.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.618682861328125, -0.59625244140625, -0.573822021484375, -0.5513916015625, -0.528961181640625, -0.50653076171875, -0.484100341796875, -0.461669921875, -0.439239501953125, -0.41680908203125, -0.394378662109375, -0.3719482421875, -0.349517822265625, -0.32708740234375, -0.304656982421875, -0.2822265625, -0.259796142578125, -0.23736572265625, -0.214935302734375, -0.1925048828125, -0.170074462890625, -0.14764404296875, -0.125213623046875, -0.102783203125, -0.080352783203125, -0.05792236328125, -0.035491943359375, -0.0130615234375, 0.009368896484375, 0.03179931640625, 0.054229736328125, 0.07666015625, 0.099090576171875, 0.12152099609375, 0.143951416015625, 0.1663818359375, 0.188812255859375, 0.21124267578125, 0.233673095703125, 0.256103515625, 0.278533935546875, 0.30096435546875, 0.323394775390625, 0.3458251953125, 0.368255615234375, 0.39068603515625, 0.413116455078125, 0.435546875, 0.457977294921875, 0.48040771484375, 0.502838134765625, 0.5252685546875, 0.547698974609375, 0.57012939453125, 0.592559814453125, 0.614990234375, 0.637420654296875, 0.65985107421875, 0.682281494140625, 0.7047119140625, 0.727142333984375, 0.74957275390625, 0.772003173828125, 0.79443359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 15.0, 26.0, 43.0, 135.0, 469.0, 161.0, 62.0, 33.0, 15.0, 10.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001132965087890625, -0.0011035650968551636, -0.0010741651058197021, -0.0010447651147842407, -0.0010153651237487793, -0.0009859651327133179, -0.0009565651416778564, -0.000927165150642395, -0.0008977651596069336, -0.0008683651685714722, -0.0008389651775360107, -0.0008095651865005493, -0.0007801651954650879, -0.0007507652044296265, -0.000721365213394165, -0.0006919652223587036, -0.0006625652313232422, -0.0006331652402877808, -0.0006037652492523193, -0.0005743652582168579, -0.0005449652671813965, -0.0005155652761459351, -0.00048616528511047363, -0.0004567652940750122, -0.0004273653030395508, -0.00039796531200408936, -0.00036856532096862793, -0.0003391653299331665, -0.0003097653388977051, -0.00028036534786224365, -0.0002509653568267822, -0.0002215653657913208, -0.00019216537475585938, -0.00016276538372039795, -0.00013336539268493652, -0.0001039654016494751, -7.456541061401367e-05, -4.5165419578552246e-05, -1.576542854309082e-05, 1.3634562492370605e-05, 4.303455352783203e-05, 7.243454456329346e-05, 0.00010183453559875488, 0.0001312345266342163, 0.00016063451766967773, 0.00019003450870513916, 0.00021943449974060059, 0.000248834490776062, 0.00027823448181152344, 0.00030763447284698486, 0.0003370344638824463, 0.0003664344549179077, 0.00039583444595336914, 0.00042523443698883057, 0.000454634428024292, 0.0004840344190597534, 0.0005134344100952148, 0.0005428344011306763, 0.0005722343921661377, 0.0006016343832015991, 0.0006310343742370605, 0.000660434365272522, 0.0006898343563079834, 0.0007192343473434448, 0.0007486343383789062]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 4.0, 9.0, 14.0, 18.0, 22.0, 29.0, 66.0, 75.0, 146.0, 264.0, 457.0, 942.0, 2222.0, 6227.0, 26643.0, 298306.0, 651915.0, 46450.0, 9327.0, 2943.0, 1123.0, 588.0, 310.0, 139.0, 111.0, 65.0, 45.0, 34.0, 20.0, 7.0, 13.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.425048828125, -0.4126014709472656, -0.40015411376953125, -0.3877067565917969, -0.3752593994140625, -0.3628120422363281, -0.35036468505859375, -0.3379173278808594, -0.325469970703125, -0.3130226135253906, -0.30057525634765625, -0.2881278991699219, -0.2756805419921875, -0.2632331848144531, -0.25078582763671875, -0.23833847045898438, -0.22589111328125, -0.21344375610351562, -0.20099639892578125, -0.18854904174804688, -0.1761016845703125, -0.16365432739257812, -0.15120697021484375, -0.13875961303710938, -0.126312255859375, -0.11386489868164062, -0.10141754150390625, -0.08897018432617188, -0.0765228271484375, -0.06407546997070312, -0.05162811279296875, -0.039180755615234375, -0.0267333984375, -0.014286041259765625, -0.00183868408203125, 0.010608673095703125, 0.0230560302734375, 0.035503387451171875, 0.04795074462890625, 0.060398101806640625, 0.072845458984375, 0.08529281616210938, 0.09774017333984375, 0.11018753051757812, 0.1226348876953125, 0.13508224487304688, 0.14752960205078125, 0.15997695922851562, 0.17242431640625, 0.18487167358398438, 0.19731903076171875, 0.20976638793945312, 0.2222137451171875, 0.23466110229492188, 0.24710845947265625, 0.2595558166503906, 0.272003173828125, 0.2844505310058594, 0.29689788818359375, 0.3093452453613281, 0.3217926025390625, 0.3342399597167969, 0.34668731689453125, 0.3591346740722656, 0.37158203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 6.0, 7.0, 14.0, 16.0, 29.0, 36.0, 43.0, 82.0, 112.0, 118.0, 96.0, 86.0, 87.0, 77.0, 46.0, 33.0, 32.0, 19.0, 22.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.44921875, -0.43688201904296875, -0.4245452880859375, -0.41220855712890625, -0.399871826171875, -0.38753509521484375, -0.3751983642578125, -0.36286163330078125, -0.35052490234375, -0.33818817138671875, -0.3258514404296875, -0.31351470947265625, -0.301177978515625, -0.28884124755859375, -0.2765045166015625, -0.26416778564453125, -0.2518310546875, -0.23949432373046875, -0.2271575927734375, -0.21482086181640625, -0.202484130859375, -0.19014739990234375, -0.1778106689453125, -0.16547393798828125, -0.15313720703125, -0.14080047607421875, -0.1284637451171875, -0.11612701416015625, -0.103790283203125, -0.09145355224609375, -0.0791168212890625, -0.06678009033203125, -0.054443359375, -0.04210662841796875, -0.0297698974609375, -0.01743316650390625, -0.005096435546875, 0.00724029541015625, 0.0195770263671875, 0.03191375732421875, 0.04425048828125, 0.05658721923828125, 0.0689239501953125, 0.08126068115234375, 0.093597412109375, 0.10593414306640625, 0.1182708740234375, 0.13060760498046875, 0.1429443359375, 0.15528106689453125, 0.1676177978515625, 0.17995452880859375, 0.192291259765625, 0.20462799072265625, 0.2169647216796875, 0.22930145263671875, 0.24163818359375, 0.25397491455078125, 0.2663116455078125, 0.27864837646484375, 0.290985107421875, 0.30332183837890625, 0.3156585693359375, 0.32799530029296875, 0.34033203125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 11.0, 17.0, 37.0, 69.0, 215.0, 369.0, 175.0, 48.0, 24.0, 10.0, 3.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.021965980529785, -5.831284999847412, -5.640604496002197, -5.449923515319824, -5.259242534637451, -5.068561553955078, -4.877881050109863, -4.68720006942749, -4.496519088745117, -4.305838108062744, -4.115157604217529, -3.9244766235351562, -3.733795642852783, -3.5431149005889893, -3.3524341583251953, -3.1617531776428223, -2.9710726737976074, -2.7803919315338135, -2.5897109508514404, -2.3990302085876465, -2.2083492279052734, -2.0176684856414795, -1.8269877433776855, -1.636306881904602, -1.4456260204315186, -1.254945158958435, -1.0642642974853516, -0.8735835552215576, -0.6829026937484741, -0.4922218322753906, -0.3015410900115967, -0.11086022853851318, 0.07982110977172852, 0.2705019414424896, 0.46118277311325073, 0.6518635749816895, 0.842544436454773, 1.0332252979278564, 1.2239060401916504, 1.4145869016647339, 1.6052677631378174, 1.7959486246109009, 1.9866294860839844, 2.1773102283477783, 2.3679909706115723, 2.5586719512939453, 2.7493526935577393, 2.940033435821533, 3.1307144165039062, 3.3213951587677, 3.5120761394500732, 3.702756881713867, 3.8934378623962402, 4.084118843078613, 4.274799346923828, 4.465480327606201, 4.656161308288574, 4.846842288970947, 5.037522792816162, 5.228203773498535, 5.418884754180908, 5.609565734863281, 5.800246238708496, 5.990927219390869, 6.181607723236084]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 11.0, 1.0, 1.0, 1.0, 7.0, 4.0, 15.0, 10.0, 20.0, 36.0, 55.0, 91.0, 120.0, 126.0, 124.0, 135.0, 82.0, 51.0, 32.0, 11.0, 21.0, 7.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 0.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.942081451416016, -6.730679512023926, -6.519277095794678, -6.307875156402588, -6.09647274017334, -5.88507080078125, -5.673668384552002, -5.462266445159912, -5.250864028930664, -5.039462089538574, -4.828059673309326, -4.616657733917236, -4.405255317687988, -4.193853378295898, -3.9824509620666504, -3.7710490226745605, -3.5596468448638916, -3.3482446670532227, -3.1368424892425537, -2.9254403114318848, -2.714038133621216, -2.502635955810547, -2.291234016418457, -2.079831600189209, -1.8684295415878296, -1.6570273637771606, -1.4456251859664917, -1.2342231273651123, -1.0228209495544434, -0.8114187717437744, -0.6000165939331055, -0.3886144161224365, -0.17721223831176758, 0.03418992459774017, 0.24559208750724792, 0.4569942355155945, 0.6683964133262634, 0.8797985315322876, 1.0912007093429565, 1.3026028871536255, 1.5140050649642944, 1.7254072427749634, 1.9368094205856323, 2.1482114791870117, 2.3596136569976807, 2.5710158348083496, 2.7824180126190186, 2.9938201904296875, 3.2052223682403564, 3.4166245460510254, 3.6280267238616943, 3.8394289016723633, 4.050830841064453, 4.262233257293701, 4.473635196685791, 4.685037612915039, 4.896439552307129, 5.107841491699219, 5.319243907928467, 5.530645847320557, 5.742048263549805, 5.9534502029418945, 6.164852619171143, 6.376254558563232, 6.5876569747924805]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 22.0, 47.0, 95.0, 328.0, 1278.0, 7537.0, 318178.0, 3851336.0, 12527.0, 2172.0, 467.0, 152.0, 42.0, 27.0, 18.0, 11.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0703125, -1.976531982421875, -1.88275146484375, -1.788970947265625, -1.6951904296875, -1.601409912109375, -1.50762939453125, -1.413848876953125, -1.320068359375, -1.226287841796875, -1.13250732421875, -1.038726806640625, -0.9449462890625, -0.851165771484375, -0.75738525390625, -0.663604736328125, -0.56982421875, -0.476043701171875, -0.38226318359375, -0.288482666015625, -0.1947021484375, -0.100921630859375, -0.00714111328125, 0.086639404296875, 0.180419921875, 0.274200439453125, 0.36798095703125, 0.461761474609375, 0.5555419921875, 0.649322509765625, 0.74310302734375, 0.836883544921875, 0.9306640625, 1.024444580078125, 1.11822509765625, 1.212005615234375, 1.3057861328125, 1.399566650390625, 1.49334716796875, 1.587127685546875, 1.680908203125, 1.774688720703125, 1.86846923828125, 1.962249755859375, 2.0560302734375, 2.149810791015625, 2.24359130859375, 2.337371826171875, 2.43115234375, 2.524932861328125, 2.61871337890625, 2.712493896484375, 2.8062744140625, 2.900054931640625, 2.99383544921875, 3.087615966796875, 3.181396484375, 3.275177001953125, 3.36895751953125, 3.462738037109375, 3.5565185546875, 3.650299072265625, 3.74407958984375, 3.837860107421875, 3.931640625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 11.0, 6.0, 5.0, 8.0, 4.0, 11.0, 16.0, 37.0, 74.0, 190.0, 257.0, 179.0, 80.0, 23.0, 16.0, 7.0, 6.0, 8.0, 7.0, 4.0, 7.0, 3.0, 6.0, 9.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0732421875, -0.07091999053955078, -0.06859779357910156, -0.06627559661865234, -0.06395339965820312, -0.061631202697753906, -0.05930900573730469, -0.05698680877685547, -0.05466461181640625, -0.05234241485595703, -0.05002021789550781, -0.047698020935058594, -0.045375823974609375, -0.043053627014160156, -0.04073143005371094, -0.03840923309326172, -0.0360870361328125, -0.03376483917236328, -0.03144264221191406, -0.029120445251464844, -0.026798248291015625, -0.024476051330566406, -0.022153854370117188, -0.01983165740966797, -0.01750946044921875, -0.015187263488769531, -0.012865066528320312, -0.010542869567871094, -0.008220672607421875, -0.005898475646972656, -0.0035762786865234375, -0.0012540817260742188, 0.001068115234375, 0.0033903121948242188, 0.0057125091552734375, 0.008034706115722656, 0.010356903076171875, 0.012679100036621094, 0.015001296997070312, 0.01732349395751953, 0.01964569091796875, 0.02196788787841797, 0.024290084838867188, 0.026612281799316406, 0.028934478759765625, 0.031256675720214844, 0.03357887268066406, 0.03590106964111328, 0.0382232666015625, 0.04054546356201172, 0.04286766052246094, 0.045189857482910156, 0.047512054443359375, 0.049834251403808594, 0.05215644836425781, 0.05447864532470703, 0.05680084228515625, 0.05912303924560547, 0.06144523620605469, 0.0637674331665039, 0.06608963012695312, 0.06841182708740234, 0.07073402404785156, 0.07305622100830078, 0.07537841796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 8.0, 15.0, 17.0, 18.0, 42.0, 73.0, 82.0, 191.0, 315.0, 543.0, 1137.0, 2507.0, 5992.0, 17145.0, 65612.0, 2041670.0, 1966500.0, 65371.0, 16707.0, 5747.0, 2317.0, 1069.0, 518.0, 275.0, 138.0, 87.0, 79.0, 31.0, 23.0, 22.0, 15.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6688766479492188, -0.6497650146484375, -0.6306533813476562, -0.611541748046875, -0.5924301147460938, -0.5733184814453125, -0.5542068481445312, -0.53509521484375, -0.5159835815429688, -0.4968719482421875, -0.47776031494140625, -0.458648681640625, -0.43953704833984375, -0.4204254150390625, -0.40131378173828125, -0.3822021484375, -0.36309051513671875, -0.3439788818359375, -0.32486724853515625, -0.305755615234375, -0.28664398193359375, -0.2675323486328125, -0.24842071533203125, -0.22930908203125, -0.21019744873046875, -0.1910858154296875, -0.17197418212890625, -0.152862548828125, -0.13375091552734375, -0.1146392822265625, -0.09552764892578125, -0.076416015625, -0.05730438232421875, -0.0381927490234375, -0.01908111572265625, 3.0517578125e-05, 0.01914215087890625, 0.0382537841796875, 0.05736541748046875, 0.07647705078125, 0.09558868408203125, 0.1147003173828125, 0.13381195068359375, 0.152923583984375, 0.17203521728515625, 0.1911468505859375, 0.21025848388671875, 0.2293701171875, 0.24848175048828125, 0.2675933837890625, 0.28670501708984375, 0.305816650390625, 0.32492828369140625, 0.3440399169921875, 0.36315155029296875, 0.38226318359375, 0.40137481689453125, 0.4204864501953125, 0.43959808349609375, 0.458709716796875, 0.47782135009765625, 0.4969329833984375, 0.5160446166992188, 0.53515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 2.0, 4.0, 4.0, 7.0, 8.0, 10.0, 7.0, 12.0, 10.0, 18.0, 18.0, 24.0, 23.0, 22.0, 51.0, 68.0, 87.0, 184.0, 469.0, 1526.0, 721.0, 276.0, 150.0, 93.0, 56.0, 33.0, 39.0, 23.0, 17.0, 22.0, 10.0, 19.0, 4.0, 7.0, 7.0, 3.0, 2.0, 3.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0762939453125, -0.07402801513671875, -0.0717620849609375, -0.06949615478515625, -0.067230224609375, -0.06496429443359375, -0.0626983642578125, -0.06043243408203125, -0.05816650390625, -0.05590057373046875, -0.0536346435546875, -0.05136871337890625, -0.049102783203125, -0.04683685302734375, -0.0445709228515625, -0.04230499267578125, -0.0400390625, -0.03777313232421875, -0.0355072021484375, -0.03324127197265625, -0.030975341796875, -0.02870941162109375, -0.0264434814453125, -0.02417755126953125, -0.02191162109375, -0.01964569091796875, -0.0173797607421875, -0.01511383056640625, -0.012847900390625, -0.01058197021484375, -0.0083160400390625, -0.00605010986328125, -0.0037841796875, -0.00151824951171875, 0.0007476806640625, 0.00301361083984375, 0.005279541015625, 0.00754547119140625, 0.0098114013671875, 0.01207733154296875, 0.01434326171875, 0.01660919189453125, 0.0188751220703125, 0.02114105224609375, 0.023406982421875, 0.02567291259765625, 0.0279388427734375, 0.03020477294921875, 0.032470703125, 0.03473663330078125, 0.0370025634765625, 0.03926849365234375, 0.041534423828125, 0.04380035400390625, 0.0460662841796875, 0.04833221435546875, 0.05059814453125, 0.05286407470703125, 0.0551300048828125, 0.05739593505859375, 0.059661865234375, 0.06192779541015625, 0.0641937255859375, 0.06645965576171875, 0.0687255859375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 16.0, 102.0, 750.0, 105.0, 19.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8531599044799805, -3.7578370571136475, -3.6625144481658936, -3.5671916007995605, -3.4718689918518066, -3.3765461444854736, -3.2812232971191406, -3.1859006881713867, -3.0905778408050537, -2.9952549934387207, -2.899932384490967, -2.804609537124634, -2.70928692817688, -2.613964080810547, -2.518641471862793, -2.42331862449646, -2.327995777130127, -2.232672929763794, -2.13735032081604, -2.042027473449707, -1.9467047452926636, -1.8513820171356201, -1.7560592889785767, -1.6607365608215332, -1.5654139518737793, -1.4700912237167358, -1.3747684955596924, -1.2794456481933594, -1.184122920036316, -1.0888001918792725, -0.993477463722229, -0.8981546759605408, -0.8028318881988525, -0.7075091600418091, -0.6121863722801208, -0.5168636441230774, -0.42154088616371155, -0.3262181282043457, -0.23089540004730225, -0.135572612285614, -0.04024988412857056, 0.05507286638021469, 0.15039561688899994, 0.2457183599472046, 0.34104111790657043, 0.4363638758659363, 0.5316866040229797, 0.627009391784668, 0.7223321199417114, 0.8176548480987549, 0.9129776358604431, 1.0083003044128418, 1.1036231517791748, 1.1989458799362183, 1.2942686080932617, 1.3895914554595947, 1.4849140644073486, 1.580236792564392, 1.6755595207214355, 1.7708823680877686, 1.866205096244812, 1.9615278244018555, 2.0568504333496094, 2.1521732807159424, 2.2474961280822754]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 2.0, 10.0, 8.0, 12.0, 17.0, 13.0, 16.0, 41.0, 47.0, 50.0, 69.0, 76.0, 92.0, 64.0, 72.0, 83.0, 71.0, 51.0, 42.0, 37.0, 27.0, 18.0, 7.0, 12.0, 9.0, 8.0, 9.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5329259634017944, -0.5160823464393616, -0.4992387890815735, -0.4823951721191406, -0.46555158495903015, -0.4487079977989197, -0.4318644106388092, -0.41502082347869873, -0.39817720651626587, -0.3813336193561554, -0.3644900321960449, -0.34764641523361206, -0.3308028280735016, -0.3139592409133911, -0.29711565375328064, -0.28027206659317017, -0.2634284794330597, -0.24658489227294922, -0.22974129021167755, -0.21289770305156708, -0.1960541009902954, -0.17921051383018494, -0.16236692667007446, -0.145523339509964, -0.12867973744869232, -0.11183614283800125, -0.09499254822731018, -0.07814896106719971, -0.061305366456508636, -0.044461771845817566, -0.027618184685707092, -0.010774590075016022, 0.006069004535675049, 0.02291259728372097, 0.03975619003176689, 0.056599780917167664, 0.07344337552785873, 0.0902869701385498, 0.10713055729866028, 0.12397415190935135, 0.14081774652004242, 0.1576613336801529, 0.17450493574142456, 0.19134852290153503, 0.2081921100616455, 0.22503571212291718, 0.24187929928302765, 0.2587229013442993, 0.2755664885044098, 0.29241007566452026, 0.30925366282463074, 0.3260972499847412, 0.3429408669471741, 0.35978445410728455, 0.376628041267395, 0.3934716284275055, 0.41031521558761597, 0.42715880274772644, 0.4440023899078369, 0.4608460068702698, 0.47768959403038025, 0.4945331811904907, 0.5113767385482788, 0.5282203555107117, 0.5450639724731445]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 22.0, 27.0, 20.0, 38.0, 62.0, 83.0, 104.0, 182.0, 253.0, 429.0, 703.0, 1139.0, 1981.0, 3648.0, 7079.0, 15528.0, 49139.0, 546014.0, 356170.0, 38317.0, 13246.0, 6421.0, 3240.0, 1817.0, 1041.0, 677.0, 402.0, 257.0, 153.0, 111.0, 71.0, 52.0, 34.0, 18.0, 19.0, 17.0, 9.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5126953125, -0.4971199035644531, -0.48154449462890625, -0.4659690856933594, -0.4503936767578125, -0.4348182678222656, -0.41924285888671875, -0.4036674499511719, -0.388092041015625, -0.3725166320800781, -0.35694122314453125, -0.3413658142089844, -0.3257904052734375, -0.3102149963378906, -0.29463958740234375, -0.2790641784667969, -0.26348876953125, -0.24791336059570312, -0.23233795166015625, -0.21676254272460938, -0.2011871337890625, -0.18561172485351562, -0.17003631591796875, -0.15446090698242188, -0.138885498046875, -0.12331008911132812, -0.10773468017578125, -0.09215927124023438, -0.0765838623046875, -0.061008453369140625, -0.04543304443359375, -0.029857635498046875, -0.0142822265625, 0.001293182373046875, 0.01686859130859375, 0.032444000244140625, 0.0480194091796875, 0.06359481811523438, 0.07917022705078125, 0.09474563598632812, 0.110321044921875, 0.12589645385742188, 0.14147186279296875, 0.15704727172851562, 0.1726226806640625, 0.18819808959960938, 0.20377349853515625, 0.21934890747070312, 0.23492431640625, 0.2504997253417969, 0.26607513427734375, 0.2816505432128906, 0.2972259521484375, 0.3128013610839844, 0.32837677001953125, 0.3439521789550781, 0.359527587890625, 0.3751029968261719, 0.39067840576171875, 0.4062538146972656, 0.4218292236328125, 0.4374046325683594, 0.45298004150390625, 0.4685554504394531, 0.484130859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 8.0, 5.0, 8.0, 13.0, 14.0, 41.0, 74.0, 113.0, 163.0, 167.0, 139.0, 88.0, 50.0, 23.0, 16.0, 7.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.066650390625, -0.06465578079223633, -0.06266117095947266, -0.060666561126708984, -0.05867195129394531, -0.05667734146118164, -0.05468273162841797, -0.0526881217956543, -0.050693511962890625, -0.04869890213012695, -0.04670429229736328, -0.04470968246459961, -0.04271507263183594, -0.040720462799072266, -0.038725852966308594, -0.03673124313354492, -0.03473663330078125, -0.03274202346801758, -0.030747413635253906, -0.028752803802490234, -0.026758193969726562, -0.02476358413696289, -0.02276897430419922, -0.020774364471435547, -0.018779754638671875, -0.016785144805908203, -0.014790534973144531, -0.01279592514038086, -0.010801315307617188, -0.008806705474853516, -0.006812095642089844, -0.004817485809326172, -0.0028228759765625, -0.0008282661437988281, 0.0011663436889648438, 0.0031609535217285156, 0.0051555633544921875, 0.007150173187255859, 0.009144783020019531, 0.011139392852783203, 0.013134002685546875, 0.015128612518310547, 0.01712322235107422, 0.01911783218383789, 0.021112442016601562, 0.023107051849365234, 0.025101661682128906, 0.027096271514892578, 0.02909088134765625, 0.031085491180419922, 0.033080101013183594, 0.035074710845947266, 0.03706932067871094, 0.03906393051147461, 0.04105854034423828, 0.04305315017700195, 0.045047760009765625, 0.0470423698425293, 0.04903697967529297, 0.05103158950805664, 0.05302619934082031, 0.055020809173583984, 0.057015419006347656, 0.05901002883911133, 0.061004638671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 4.0, 3.0, 5.0, 14.0, 26.0, 108.0, 386.0, 4096.0, 747898.0, 293398.0, 2182.0, 283.0, 76.0, 22.0, 9.0, 8.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.4762725830078125, -1.425201416015625, -1.3741302490234375, -1.32305908203125, -1.2719879150390625, -1.220916748046875, -1.1698455810546875, -1.1187744140625, -1.0677032470703125, -1.016632080078125, -0.9655609130859375, -0.91448974609375, -0.8634185791015625, -0.812347412109375, -0.7612762451171875, -0.710205078125, -0.6591339111328125, -0.608062744140625, -0.5569915771484375, -0.50592041015625, -0.4548492431640625, -0.403778076171875, -0.3527069091796875, -0.3016357421875, -0.2505645751953125, -0.199493408203125, -0.1484222412109375, -0.09735107421875, -0.0462799072265625, 0.004791259765625, 0.0558624267578125, 0.10693359375, 0.1580047607421875, 0.209075927734375, 0.2601470947265625, 0.31121826171875, 0.3622894287109375, 0.413360595703125, 0.4644317626953125, 0.5155029296875, 0.5665740966796875, 0.617645263671875, 0.6687164306640625, 0.71978759765625, 0.7708587646484375, 0.821929931640625, 0.8730010986328125, 0.924072265625, 0.9751434326171875, 1.026214599609375, 1.0772857666015625, 1.12835693359375, 1.1794281005859375, 1.230499267578125, 1.2815704345703125, 1.3326416015625, 1.3837127685546875, 1.434783935546875, 1.4858551025390625, 1.53692626953125, 1.5879974365234375, 1.639068603515625, 1.6901397705078125, 1.7412109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 5.0, 5.0, 7.0, 4.0, 11.0, 17.0, 22.0, 12.0, 23.0, 25.0, 26.0, 31.0, 34.0, 47.0, 58.0, 50.0, 41.0, 49.0, 45.0, 40.0, 49.0, 45.0, 35.0, 28.0, 46.0, 36.0, 21.0, 26.0, 29.0, 20.0, 24.0, 13.0, 15.0, 7.0, 9.0, 9.0, 10.0, 4.0, 9.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2237548828125, -0.21648025512695312, -0.20920562744140625, -0.20193099975585938, -0.1946563720703125, -0.18738174438476562, -0.18010711669921875, -0.17283248901367188, -0.165557861328125, -0.15828323364257812, -0.15100860595703125, -0.14373397827148438, -0.1364593505859375, -0.12918472290039062, -0.12191009521484375, -0.11463546752929688, -0.10736083984375, -0.10008621215820312, -0.09281158447265625, -0.08553695678710938, -0.0782623291015625, -0.07098770141601562, -0.06371307373046875, -0.056438446044921875, -0.049163818359375, -0.041889190673828125, -0.03461456298828125, -0.027339935302734375, -0.0200653076171875, -0.012790679931640625, -0.00551605224609375, 0.001758575439453125, 0.009033203125, 0.016307830810546875, 0.02358245849609375, 0.030857086181640625, 0.0381317138671875, 0.045406341552734375, 0.05268096923828125, 0.059955596923828125, 0.067230224609375, 0.07450485229492188, 0.08177947998046875, 0.08905410766601562, 0.0963287353515625, 0.10360336303710938, 0.11087799072265625, 0.11815261840820312, 0.12542724609375, 0.13270187377929688, 0.13997650146484375, 0.14725112915039062, 0.1545257568359375, 0.16180038452148438, 0.16907501220703125, 0.17634963989257812, 0.183624267578125, 0.19089889526367188, 0.19817352294921875, 0.20544815063476562, 0.2127227783203125, 0.21999740600585938, 0.22727203369140625, 0.23454666137695312, 0.2418212890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 5.0, 10.0, 21.0, 48.0, 133.0, 1137.0, 1024972.0, 21632.0, 426.0, 97.0, 31.0, 17.0, 12.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.421875, -4.29840087890625, -4.1749267578125, -4.05145263671875, -3.927978515625, -3.80450439453125, -3.6810302734375, -3.55755615234375, -3.43408203125, -3.31060791015625, -3.1871337890625, -3.06365966796875, -2.940185546875, -2.81671142578125, -2.6932373046875, -2.56976318359375, -2.4462890625, -2.32281494140625, -2.1993408203125, -2.07586669921875, -1.952392578125, -1.82891845703125, -1.7054443359375, -1.58197021484375, -1.45849609375, -1.33502197265625, -1.2115478515625, -1.08807373046875, -0.964599609375, -0.84112548828125, -0.7176513671875, -0.59417724609375, -0.470703125, -0.34722900390625, -0.2237548828125, -0.10028076171875, 0.023193359375, 0.14666748046875, 0.2701416015625, 0.39361572265625, 0.51708984375, 0.64056396484375, 0.7640380859375, 0.88751220703125, 1.010986328125, 1.13446044921875, 1.2579345703125, 1.38140869140625, 1.5048828125, 1.62835693359375, 1.7518310546875, 1.87530517578125, 1.998779296875, 2.12225341796875, 2.2457275390625, 2.36920166015625, 2.49267578125, 2.61614990234375, 2.7396240234375, 2.86309814453125, 2.986572265625, 3.11004638671875, 3.2335205078125, 3.35699462890625, 3.48046875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 3.0, 5.0, 9.0, 5.0, 9.0, 23.0, 31.0, 40.0, 78.0, 108.0, 265.0, 177.0, 72.0, 54.0, 30.0, 23.0, 15.0, 14.0, 6.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007991790771484375, -0.0007747560739517212, -0.0007503330707550049, -0.0007259100675582886, -0.0007014870643615723, -0.000677064061164856, -0.0006526410579681396, -0.0006282180547714233, -0.000603795051574707, -0.0005793720483779907, -0.0005549490451812744, -0.0005305260419845581, -0.0005061030387878418, -0.0004816800355911255, -0.0004572570323944092, -0.00043283402919769287, -0.00040841102600097656, -0.00038398802280426025, -0.00035956501960754395, -0.00033514201641082764, -0.00031071901321411133, -0.000286296010017395, -0.0002618730068206787, -0.0002374500036239624, -0.0002130270004272461, -0.00018860399723052979, -0.00016418099403381348, -0.00013975799083709717, -0.00011533498764038086, -9.091198444366455e-05, -6.648898124694824e-05, -4.2065978050231934e-05, -1.7642974853515625e-05, 6.780028343200684e-06, 3.120303153991699e-05, 5.56260347366333e-05, 8.004903793334961e-05, 0.00010447204113006592, 0.00012889504432678223, 0.00015331804752349854, 0.00017774105072021484, 0.00020216405391693115, 0.00022658705711364746, 0.00025101006031036377, 0.0002754330635070801, 0.0002998560667037964, 0.0003242790699005127, 0.000348702073097229, 0.0003731250762939453, 0.0003975480794906616, 0.00042197108268737793, 0.00044639408588409424, 0.00047081708908081055, 0.0004952400922775269, 0.0005196630954742432, 0.0005440860986709595, 0.0005685091018676758, 0.0005929321050643921, 0.0006173551082611084, 0.0006417781114578247, 0.000666201114654541, 0.0006906241178512573, 0.0007150471210479736, 0.0007394701242446899, 0.0007638931274414062]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 6.0, 8.0, 11.0, 23.0, 37.0, 87.0, 190.0, 469.0, 1317.0, 4749.0, 38002.0, 821872.0, 166783.0, 11270.0, 2365.0, 757.0, 301.0, 133.0, 69.0, 33.0, 23.0, 15.0, 8.0, 6.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.5026168823242188, -0.4822845458984375, -0.46195220947265625, -0.441619873046875, -0.42128753662109375, -0.4009552001953125, -0.38062286376953125, -0.36029052734375, -0.33995819091796875, -0.3196258544921875, -0.29929351806640625, -0.278961181640625, -0.25862884521484375, -0.2382965087890625, -0.21796417236328125, -0.1976318359375, -0.17729949951171875, -0.1569671630859375, -0.13663482666015625, -0.116302490234375, -0.09597015380859375, -0.0756378173828125, -0.05530548095703125, -0.03497314453125, -0.01464080810546875, 0.0056915283203125, 0.02602386474609375, 0.046356201171875, 0.06668853759765625, 0.0870208740234375, 0.10735321044921875, 0.127685546875, 0.14801788330078125, 0.1683502197265625, 0.18868255615234375, 0.209014892578125, 0.22934722900390625, 0.2496795654296875, 0.27001190185546875, 0.29034423828125, 0.31067657470703125, 0.3310089111328125, 0.35134124755859375, 0.371673583984375, 0.39200592041015625, 0.4123382568359375, 0.43267059326171875, 0.4530029296875, 0.47333526611328125, 0.4936676025390625, 0.5139999389648438, 0.534332275390625, 0.5546646118164062, 0.5749969482421875, 0.5953292846679688, 0.61566162109375, 0.6359939575195312, 0.6563262939453125, 0.6766586303710938, 0.696990966796875, 0.7173233032226562, 0.7376556396484375, 0.7579879760742188, 0.7783203125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 8.0, 10.0, 15.0, 21.0, 35.0, 47.0, 86.0, 127.0, 152.0, 144.0, 96.0, 86.0, 54.0, 33.0, 25.0, 13.0, 11.0, 8.0, 10.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32568359375, -0.3136024475097656, -0.30152130126953125, -0.2894401550292969, -0.2773590087890625, -0.2652778625488281, -0.25319671630859375, -0.24111557006835938, -0.229034423828125, -0.21695327758789062, -0.20487213134765625, -0.19279098510742188, -0.1807098388671875, -0.16862869262695312, -0.15654754638671875, -0.14446640014648438, -0.13238525390625, -0.12030410766601562, -0.10822296142578125, -0.09614181518554688, -0.0840606689453125, -0.07197952270507812, -0.05989837646484375, -0.047817230224609375, -0.035736083984375, -0.023654937744140625, -0.01157379150390625, 0.000507354736328125, 0.0125885009765625, 0.024669647216796875, 0.03675079345703125, 0.048831939697265625, 0.0609130859375, 0.07299423217773438, 0.08507537841796875, 0.09715652465820312, 0.1092376708984375, 0.12131881713867188, 0.13339996337890625, 0.14548110961914062, 0.157562255859375, 0.16964340209960938, 0.18172454833984375, 0.19380569458007812, 0.2058868408203125, 0.21796798706054688, 0.23004913330078125, 0.24213027954101562, 0.25421142578125, 0.2662925720214844, 0.27837371826171875, 0.2904548645019531, 0.3025360107421875, 0.3146171569824219, 0.32669830322265625, 0.3387794494628906, 0.350860595703125, 0.3629417419433594, 0.37502288818359375, 0.3871040344238281, 0.3991851806640625, 0.4112663269042969, 0.42334747314453125, 0.4354286193847656, 0.447509765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 8.0, 10.0, 22.0, 90.0, 266.0, 371.0, 147.0, 59.0, 16.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.099022388458252, -4.949929237365723, -4.800836563110352, -4.651743412017822, -4.502650260925293, -4.353557586669922, -4.204464435577393, -4.055371284484863, -3.906278610229492, -3.757185697555542, -3.608092784881592, -3.4589996337890625, -3.3099067211151123, -3.160813808441162, -3.011720657348633, -2.8626277446746826, -2.7135348320007324, -2.5644419193267822, -2.415349006652832, -2.2662558555603027, -2.1171629428863525, -1.9680700302124023, -1.8189769983291626, -1.6698839664459229, -1.5207910537719727, -1.3716981410980225, -1.2226051092147827, -1.073512077331543, -0.9244191646575928, -0.7753261923789978, -0.6262332201004028, -0.4771401882171631, -0.3280477523803711, -0.17895478010177612, -0.029861807823181152, 0.11923116445541382, 0.2683241367340088, 0.41741710901260376, 0.5665100812911987, 0.7156031131744385, 0.8646960258483887, 1.0137889385223389, 1.1628819704055786, 1.3119750022888184, 1.4610679149627686, 1.6101608276367188, 1.7592538595199585, 1.9083468914031982, 2.0574398040771484, 2.2065327167510986, 2.355625629425049, 2.504718780517578, 2.6538116931915283, 2.8029046058654785, 2.951997756958008, 3.101090669631958, 3.250183582305908, 3.3992764949798584, 3.5483694076538086, 3.697462558746338, 3.846555471420288, 3.9956483840942383, 4.144741535186768, 4.293834686279297, 4.442927360534668]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 6.0, 9.0, 9.0, 15.0, 31.0, 45.0, 67.0, 96.0, 119.0, 134.0, 115.0, 111.0, 73.0, 60.0, 37.0, 22.0, 11.0, 8.0, 3.0, 1.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.652742624282837, -3.521327018737793, -3.38991117477417, -3.258495569229126, -3.127079963684082, -2.995664358139038, -2.864248752593994, -2.732832908630371, -2.601417303085327, -2.470001697540283, -2.33858585357666, -2.207170248031616, -2.0757546424865723, -1.9443390369415283, -1.8129233121871948, -1.6815075874328613, -1.5500919818878174, -1.4186763763427734, -1.28726065158844, -1.1558449268341064, -1.0244293212890625, -0.8930136561393738, -0.7615979909896851, -0.6301823258399963, -0.4987666606903076, -0.3673509955406189, -0.23593533039093018, -0.10451966524124146, 0.026895999908447266, 0.158311665058136, 0.2897273302078247, 0.4211429953575134, 0.5525588989257812, 0.68397456407547, 0.8153902292251587, 0.9468058943748474, 1.0782215595245361, 1.20963716506958, 1.3410528898239136, 1.472468614578247, 1.603884220123291, 1.735299825668335, 1.8667155504226685, 1.998131275177002, 2.129546880722046, 2.26096248626709, 2.392378330230713, 2.523793935775757, 2.655209541320801, 2.7866251468658447, 2.9180407524108887, 3.0494565963745117, 3.1808722019195557, 3.3122878074645996, 3.4437036514282227, 3.5751192569732666, 3.7065348625183105, 3.8379504680633545, 3.9693660736083984, 4.1007819175720215, 4.2321977615356445, 4.363613128662109, 4.495028972625732, 4.626444339752197, 4.75786018371582]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 11.0, 8.0, 8.0, 10.0, 16.0, 23.0, 18.0, 40.0, 40.0, 54.0, 100.0, 124.0, 210.0, 298.0, 483.0, 792.0, 1421.0, 3765.0, 13737.0, 187080.0, 3943100.0, 31578.0, 6501.0, 2298.0, 1042.0, 559.0, 336.0, 190.0, 123.0, 86.0, 63.0, 45.0, 23.0, 32.0, 19.0, 12.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.5275726318359375, -1.477020263671875, -1.4264678955078125, -1.37591552734375, -1.3253631591796875, -1.274810791015625, -1.2242584228515625, -1.1737060546875, -1.1231536865234375, -1.072601318359375, -1.0220489501953125, -0.97149658203125, -0.9209442138671875, -0.870391845703125, -0.8198394775390625, -0.769287109375, -0.7187347412109375, -0.668182373046875, -0.6176300048828125, -0.56707763671875, -0.5165252685546875, -0.465972900390625, -0.4154205322265625, -0.3648681640625, -0.3143157958984375, -0.263763427734375, -0.2132110595703125, -0.16265869140625, -0.1121063232421875, -0.061553955078125, -0.0110015869140625, 0.03955078125, 0.0901031494140625, 0.140655517578125, 0.1912078857421875, 0.24176025390625, 0.2923126220703125, 0.342864990234375, 0.3934173583984375, 0.4439697265625, 0.4945220947265625, 0.545074462890625, 0.5956268310546875, 0.64617919921875, 0.6967315673828125, 0.747283935546875, 0.7978363037109375, 0.848388671875, 0.8989410400390625, 0.949493408203125, 1.0000457763671875, 1.05059814453125, 1.1011505126953125, 1.151702880859375, 1.2022552490234375, 1.2528076171875, 1.3033599853515625, 1.353912353515625, 1.4044647216796875, 1.45501708984375, 1.5055694580078125, 1.556121826171875, 1.6066741943359375, 1.6572265625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 5.0, 8.0, 7.0, 11.0, 29.0, 47.0, 111.0, 143.0, 177.0, 170.0, 111.0, 75.0, 28.0, 26.0, 11.0, 10.0, 12.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09283447265625, -0.09023857116699219, -0.08764266967773438, -0.08504676818847656, -0.08245086669921875, -0.07985496520996094, -0.07725906372070312, -0.07466316223144531, -0.0720672607421875, -0.06947135925292969, -0.06687545776367188, -0.06427955627441406, -0.06168365478515625, -0.05908775329589844, -0.056491851806640625, -0.05389595031738281, -0.051300048828125, -0.04870414733886719, -0.046108245849609375, -0.04351234436035156, -0.04091644287109375, -0.03832054138183594, -0.035724639892578125, -0.03312873840332031, -0.0305328369140625, -0.027936935424804688, -0.025341033935546875, -0.022745132446289062, -0.02014923095703125, -0.017553329467773438, -0.014957427978515625, -0.012361526489257812, -0.009765625, -0.0071697235107421875, -0.004573822021484375, -0.0019779205322265625, 0.00061798095703125, 0.0032138824462890625, 0.005809783935546875, 0.008405685424804688, 0.0110015869140625, 0.013597488403320312, 0.016193389892578125, 0.018789291381835938, 0.02138519287109375, 0.023981094360351562, 0.026576995849609375, 0.029172897338867188, 0.031768798828125, 0.03436470031738281, 0.036960601806640625, 0.03955650329589844, 0.04215240478515625, 0.04474830627441406, 0.047344207763671875, 0.04994010925292969, 0.0525360107421875, 0.05513191223144531, 0.057727813720703125, 0.06032371520996094, 0.06291961669921875, 0.06551551818847656, 0.06811141967773438, 0.07070732116699219, 0.07330322265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 9.0, 13.0, 9.0, 9.0, 28.0, 27.0, 51.0, 62.0, 135.0, 381.0, 2274.0, 27232.0, 4049153.0, 109291.0, 4463.0, 653.0, 190.0, 94.0, 56.0, 35.0, 24.0, 20.0, 11.0, 8.0, 4.0, 4.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.650390625, -1.596588134765625, -1.54278564453125, -1.488983154296875, -1.4351806640625, -1.381378173828125, -1.32757568359375, -1.273773193359375, -1.219970703125, -1.166168212890625, -1.11236572265625, -1.058563232421875, -1.0047607421875, -0.950958251953125, -0.89715576171875, -0.843353271484375, -0.78955078125, -0.735748291015625, -0.68194580078125, -0.628143310546875, -0.5743408203125, -0.520538330078125, -0.46673583984375, -0.412933349609375, -0.359130859375, -0.305328369140625, -0.25152587890625, -0.197723388671875, -0.1439208984375, -0.090118408203125, -0.03631591796875, 0.017486572265625, 0.0712890625, 0.125091552734375, 0.17889404296875, 0.232696533203125, 0.2864990234375, 0.340301513671875, 0.39410400390625, 0.447906494140625, 0.501708984375, 0.555511474609375, 0.60931396484375, 0.663116455078125, 0.7169189453125, 0.770721435546875, 0.82452392578125, 0.878326416015625, 0.93212890625, 0.985931396484375, 1.03973388671875, 1.093536376953125, 1.1473388671875, 1.201141357421875, 1.25494384765625, 1.308746337890625, 1.362548828125, 1.416351318359375, 1.47015380859375, 1.523956298828125, 1.5777587890625, 1.631561279296875, 1.68536376953125, 1.739166259765625, 1.79296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 10.0, 6.0, 6.0, 7.0, 9.0, 24.0, 17.0, 18.0, 37.0, 52.0, 68.0, 90.0, 187.0, 358.0, 746.0, 1261.0, 515.0, 217.0, 134.0, 87.0, 46.0, 46.0, 34.0, 12.0, 13.0, 14.0, 14.0, 7.0, 6.0, 8.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0870361328125, -0.08434200286865234, -0.08164787292480469, -0.07895374298095703, -0.07625961303710938, -0.07356548309326172, -0.07087135314941406, -0.0681772232055664, -0.06548309326171875, -0.0627889633178711, -0.06009483337402344, -0.05740070343017578, -0.054706573486328125, -0.05201244354248047, -0.04931831359863281, -0.046624183654785156, -0.0439300537109375, -0.041235923767089844, -0.03854179382324219, -0.03584766387939453, -0.033153533935546875, -0.03045940399169922, -0.027765274047851562, -0.025071144104003906, -0.02237701416015625, -0.019682884216308594, -0.016988754272460938, -0.014294624328613281, -0.011600494384765625, -0.008906364440917969, -0.0062122344970703125, -0.0035181045532226562, -0.000823974609375, 0.0018701553344726562, 0.0045642852783203125, 0.007258415222167969, 0.009952545166015625, 0.012646675109863281, 0.015340805053710938, 0.018034934997558594, 0.02072906494140625, 0.023423194885253906, 0.026117324829101562, 0.02881145477294922, 0.031505584716796875, 0.03419971466064453, 0.03689384460449219, 0.039587974548339844, 0.0422821044921875, 0.044976234436035156, 0.04767036437988281, 0.05036449432373047, 0.053058624267578125, 0.05575275421142578, 0.05844688415527344, 0.061141014099121094, 0.06383514404296875, 0.0665292739868164, 0.06922340393066406, 0.07191753387451172, 0.07461166381835938, 0.07730579376220703, 0.07999992370605469, 0.08269405364990234, 0.08538818359375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 35.0, 552.0, 381.0, 26.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9804832935333252, -1.8810842037200928, -1.7816851139068604, -1.682286024093628, -1.5828869342803955, -1.483487844467163, -1.3840886354446411, -1.2846895456314087, -1.1852904558181763, -1.0858913660049438, -0.9864922761917114, -0.8870931267738342, -0.7876940369606018, -0.6882949471473694, -0.5888957977294922, -0.48949670791625977, -0.39009761810302734, -0.2906985282897949, -0.1912994086742401, -0.0919002890586853, 0.007498800754547119, 0.10689789056777954, 0.20629703998565674, 0.30569612979888916, 0.4050952196121216, 0.504494309425354, 0.6038933992385864, 0.7032925486564636, 0.802691638469696, 0.9020907282829285, 1.0014898777008057, 1.100888967514038, 1.2002878189086914, 1.2996869087219238, 1.3990859985351562, 1.4984850883483887, 1.597884178161621, 1.6972832679748535, 1.7966824769973755, 1.896081566810608, 1.9954806566238403, 2.0948798656463623, 2.1942789554595947, 2.293678045272827, 2.3930771350860596, 2.492476224899292, 2.5918753147125244, 2.691274404525757, 2.7906734943389893, 2.8900725841522217, 2.989471673965454, 3.0888707637786865, 3.188269853591919, 3.2876689434051514, 3.387068271636963, 3.4864673614501953, 3.5858664512634277, 3.68526554107666, 3.7846646308898926, 3.884063720703125, 3.9834628105163574, 4.08286190032959, 4.182260990142822, 4.281660079956055, 4.381059169769287]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 10.0, 10.0, 14.0, 18.0, 18.0, 31.0, 42.0, 47.0, 57.0, 68.0, 75.0, 61.0, 94.0, 69.0, 60.0, 70.0, 43.0, 48.0, 33.0, 27.0, 23.0, 12.0, 14.0, 12.0, 8.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4672037363052368, -0.45223161578178406, -0.4372595250606537, -0.4222874045372009, -0.40731531381607056, -0.3923431932926178, -0.37737107276916504, -0.36239898204803467, -0.3474268615245819, -0.33245474100112915, -0.3174826502799988, -0.302510529756546, -0.28753840923309326, -0.2725663185119629, -0.25759419798851013, -0.24262209236621857, -0.227649986743927, -0.21267788112163544, -0.19770577549934387, -0.1827336549758911, -0.16776154935359955, -0.15278944373130798, -0.13781732320785522, -0.12284521758556366, -0.1078731119632721, -0.09290100634098053, -0.07792889326810837, -0.0629567801952362, -0.04798467457294464, -0.033012568950653076, -0.018040455877780914, -0.0030683428049087524, 0.011903762817382812, 0.026875872164964676, 0.04184798151254654, 0.0568200908601284, 0.07179220020771027, 0.08676430583000183, 0.10173641890287399, 0.11670853197574615, 0.13168063759803772, 0.14665274322032928, 0.16162484884262085, 0.1765969693660736, 0.19156907498836517, 0.20654118061065674, 0.2215133011341095, 0.23648540675640106, 0.2514575123786926, 0.2664296329021454, 0.28140172362327576, 0.2963738441467285, 0.3113459348678589, 0.32631805539131165, 0.3412901759147644, 0.3562622666358948, 0.37123438715934753, 0.3862065076828003, 0.40117859840393066, 0.4161507189273834, 0.4311228394508362, 0.44609493017196655, 0.4610670506954193, 0.47603917121887207, 0.49101126194000244]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 1.0, 4.0, 8.0, 5.0, 6.0, 14.0, 23.0, 22.0, 25.0, 48.0, 60.0, 73.0, 129.0, 207.0, 336.0, 701.0, 1604.0, 5694.0, 46333.0, 824743.0, 153594.0, 10429.0, 2396.0, 906.0, 477.0, 240.0, 132.0, 103.0, 63.0, 44.0, 35.0, 20.0, 14.0, 13.0, 18.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74365234375, -0.7167892456054688, -0.6899261474609375, -0.6630630493164062, -0.636199951171875, -0.6093368530273438, -0.5824737548828125, -0.5556106567382812, -0.52874755859375, -0.5018844604492188, -0.4750213623046875, -0.44815826416015625, -0.421295166015625, -0.39443206787109375, -0.3675689697265625, -0.34070587158203125, -0.3138427734375, -0.28697967529296875, -0.2601165771484375, -0.23325347900390625, -0.206390380859375, -0.17952728271484375, -0.1526641845703125, -0.12580108642578125, -0.09893798828125, -0.07207489013671875, -0.0452117919921875, -0.01834869384765625, 0.008514404296875, 0.03537750244140625, 0.0622406005859375, 0.08910369873046875, 0.115966796875, 0.14282989501953125, 0.1696929931640625, 0.19655609130859375, 0.223419189453125, 0.25028228759765625, 0.2771453857421875, 0.30400848388671875, 0.33087158203125, 0.35773468017578125, 0.3845977783203125, 0.41146087646484375, 0.438323974609375, 0.46518707275390625, 0.4920501708984375, 0.5189132690429688, 0.5457763671875, 0.5726394653320312, 0.5995025634765625, 0.6263656616210938, 0.653228759765625, 0.6800918579101562, 0.7069549560546875, 0.7338180541992188, 0.76068115234375, 0.7875442504882812, 0.8144073486328125, 0.8412704467773438, 0.868133544921875, 0.8949966430664062, 0.9218597412109375, 0.9487228393554688, 0.9755859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 0.0, 4.0, 10.0, 18.0, 33.0, 47.0, 90.0, 130.0, 153.0, 156.0, 114.0, 94.0, 54.0, 38.0, 28.0, 11.0, 3.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.07951641082763672, -0.07718467712402344, -0.07485294342041016, -0.07252120971679688, -0.0701894760131836, -0.06785774230957031, -0.06552600860595703, -0.06319427490234375, -0.06086254119873047, -0.05853080749511719, -0.056199073791503906, -0.053867340087890625, -0.051535606384277344, -0.04920387268066406, -0.04687213897705078, -0.0445404052734375, -0.04220867156982422, -0.03987693786621094, -0.037545204162597656, -0.035213470458984375, -0.032881736755371094, -0.030550003051757812, -0.02821826934814453, -0.02588653564453125, -0.02355480194091797, -0.021223068237304688, -0.018891334533691406, -0.016559600830078125, -0.014227867126464844, -0.011896133422851562, -0.009564399719238281, -0.007232666015625, -0.004900932312011719, -0.0025691986083984375, -0.00023746490478515625, 0.002094268798828125, 0.004426002502441406, 0.0067577362060546875, 0.009089469909667969, 0.01142120361328125, 0.013752937316894531, 0.016084671020507812, 0.018416404724121094, 0.020748138427734375, 0.023079872131347656, 0.025411605834960938, 0.02774333953857422, 0.0300750732421875, 0.03240680694580078, 0.03473854064941406, 0.037070274353027344, 0.039402008056640625, 0.041733741760253906, 0.04406547546386719, 0.04639720916748047, 0.04872894287109375, 0.05106067657470703, 0.05339241027832031, 0.055724143981933594, 0.058055877685546875, 0.060387611389160156, 0.06271934509277344, 0.06505107879638672, 0.0673828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 14.0, 18.0, 21.0, 28.0, 37.0, 54.0, 86.0, 146.0, 238.0, 510.0, 1176.0, 3659.0, 15731.0, 95059.0, 565886.0, 310837.0, 42876.0, 8059.0, 2309.0, 868.0, 383.0, 197.0, 110.0, 63.0, 54.0, 33.0, 22.0, 26.0, 16.0, 11.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62646484375, -0.60845947265625, -0.5904541015625, -0.57244873046875, -0.554443359375, -0.53643798828125, -0.5184326171875, -0.50042724609375, -0.482421875, -0.46441650390625, -0.4464111328125, -0.42840576171875, -0.410400390625, -0.39239501953125, -0.3743896484375, -0.35638427734375, -0.33837890625, -0.32037353515625, -0.3023681640625, -0.28436279296875, -0.266357421875, -0.24835205078125, -0.2303466796875, -0.21234130859375, -0.1943359375, -0.17633056640625, -0.1583251953125, -0.14031982421875, -0.122314453125, -0.10430908203125, -0.0863037109375, -0.06829833984375, -0.05029296875, -0.03228759765625, -0.0142822265625, 0.00372314453125, 0.021728515625, 0.03973388671875, 0.0577392578125, 0.07574462890625, 0.09375, 0.11175537109375, 0.1297607421875, 0.14776611328125, 0.165771484375, 0.18377685546875, 0.2017822265625, 0.21978759765625, 0.23779296875, 0.25579833984375, 0.2738037109375, 0.29180908203125, 0.309814453125, 0.32781982421875, 0.3458251953125, 0.36383056640625, 0.3818359375, 0.39984130859375, 0.4178466796875, 0.43585205078125, 0.453857421875, 0.47186279296875, 0.4898681640625, 0.50787353515625, 0.52587890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 14.0, 8.0, 11.0, 13.0, 9.0, 11.0, 19.0, 19.0, 24.0, 35.0, 30.0, 36.0, 39.0, 39.0, 46.0, 38.0, 55.0, 44.0, 37.0, 49.0, 44.0, 53.0, 27.0, 28.0, 33.0, 28.0, 33.0, 24.0, 23.0, 17.0, 23.0, 12.0, 13.0, 8.0, 7.0, 8.0, 9.0, 5.0, 0.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2354736328125, -0.2281360626220703, -0.22079849243164062, -0.21346092224121094, -0.20612335205078125, -0.19878578186035156, -0.19144821166992188, -0.1841106414794922, -0.1767730712890625, -0.1694355010986328, -0.16209793090820312, -0.15476036071777344, -0.14742279052734375, -0.14008522033691406, -0.13274765014648438, -0.1254100799560547, -0.118072509765625, -0.11073493957519531, -0.10339736938476562, -0.09605979919433594, -0.08872222900390625, -0.08138465881347656, -0.07404708862304688, -0.06670951843261719, -0.0593719482421875, -0.05203437805175781, -0.044696807861328125, -0.03735923767089844, -0.03002166748046875, -0.022684097290039062, -0.015346527099609375, -0.008008956909179688, -0.00067138671875, 0.0066661834716796875, 0.014003753662109375, 0.021341323852539062, 0.02867889404296875, 0.03601646423339844, 0.043354034423828125, 0.05069160461425781, 0.0580291748046875, 0.06536674499511719, 0.07270431518554688, 0.08004188537597656, 0.08737945556640625, 0.09471702575683594, 0.10205459594726562, 0.10939216613769531, 0.116729736328125, 0.12406730651855469, 0.13140487670898438, 0.13874244689941406, 0.14608001708984375, 0.15341758728027344, 0.16075515747070312, 0.1680927276611328, 0.1754302978515625, 0.1827678680419922, 0.19010543823242188, 0.19744300842285156, 0.20478057861328125, 0.21211814880371094, 0.21945571899414062, 0.2267932891845703, 0.234130859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 11.0, 24.0, 26.0, 69.0, 193.0, 613.0, 2899.0, 487333.0, 553173.0, 3214.0, 629.0, 206.0, 63.0, 37.0, 20.0, 15.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.642852783203125, -1.59722900390625, -1.551605224609375, -1.5059814453125, -1.460357666015625, -1.41473388671875, -1.369110107421875, -1.323486328125, -1.277862548828125, -1.23223876953125, -1.186614990234375, -1.1409912109375, -1.095367431640625, -1.04974365234375, -1.004119873046875, -0.95849609375, -0.912872314453125, -0.86724853515625, -0.821624755859375, -0.7760009765625, -0.730377197265625, -0.68475341796875, -0.639129638671875, -0.593505859375, -0.547882080078125, -0.50225830078125, -0.456634521484375, -0.4110107421875, -0.365386962890625, -0.31976318359375, -0.274139404296875, -0.228515625, -0.182891845703125, -0.13726806640625, -0.091644287109375, -0.0460205078125, -0.000396728515625, 0.04522705078125, 0.090850830078125, 0.136474609375, 0.182098388671875, 0.22772216796875, 0.273345947265625, 0.3189697265625, 0.364593505859375, 0.41021728515625, 0.455841064453125, 0.50146484375, 0.547088623046875, 0.59271240234375, 0.638336181640625, 0.6839599609375, 0.729583740234375, 0.77520751953125, 0.820831298828125, 0.866455078125, 0.912078857421875, 0.95770263671875, 1.003326416015625, 1.0489501953125, 1.094573974609375, 1.14019775390625, 1.185821533203125, 1.2314453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 10.0, 13.0, 10.0, 27.0, 23.0, 23.0, 34.0, 61.0, 62.0, 72.0, 99.0, 112.0, 109.0, 56.0, 56.0, 40.0, 46.0, 21.0, 19.0, 19.0, 16.0, 11.0, 13.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012993812561035156, -0.00012536346912384033, -0.0001207888126373291, -0.00011621415615081787, -0.00011163949966430664, -0.00010706484317779541, -0.00010249018669128418, -9.791553020477295e-05, -9.334087371826172e-05, -8.876621723175049e-05, -8.419156074523926e-05, -7.961690425872803e-05, -7.50422477722168e-05, -7.046759128570557e-05, -6.589293479919434e-05, -6.13182783126831e-05, -5.6743621826171875e-05, -5.2168965339660645e-05, -4.7594308853149414e-05, -4.3019652366638184e-05, -3.844499588012695e-05, -3.387033939361572e-05, -2.9295682907104492e-05, -2.4721026420593262e-05, -2.014636993408203e-05, -1.55717134475708e-05, -1.099705696105957e-05, -6.42240047454834e-06, -1.8477439880371094e-06, 2.726912498474121e-06, 7.3015689849853516e-06, 1.1876225471496582e-05, 1.6450881958007812e-05, 2.1025538444519043e-05, 2.5600194931030273e-05, 3.0174851417541504e-05, 3.4749507904052734e-05, 3.9324164390563965e-05, 4.3898820877075195e-05, 4.8473477363586426e-05, 5.3048133850097656e-05, 5.762279033660889e-05, 6.219744682312012e-05, 6.677210330963135e-05, 7.134675979614258e-05, 7.592141628265381e-05, 8.049607276916504e-05, 8.507072925567627e-05, 8.96453857421875e-05, 9.422004222869873e-05, 9.879469871520996e-05, 0.00010336935520172119, 0.00010794401168823242, 0.00011251866817474365, 0.00011709332466125488, 0.00012166798114776611, 0.00012624263763427734, 0.00013081729412078857, 0.0001353919506072998, 0.00013996660709381104, 0.00014454126358032227, 0.0001491159200668335, 0.00015369057655334473, 0.00015826523303985596, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 12.0, 14.0, 27.0, 40.0, 87.0, 179.0, 445.0, 1241.0, 6435.0, 559971.0, 471827.0, 6111.0, 1263.0, 416.0, 198.0, 99.0, 78.0, 35.0, 29.0, 13.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92724609375, -0.8915634155273438, -0.8558807373046875, -0.8201980590820312, -0.784515380859375, -0.7488327026367188, -0.7131500244140625, -0.6774673461914062, -0.64178466796875, -0.6061019897460938, -0.5704193115234375, -0.5347366333007812, -0.499053955078125, -0.46337127685546875, -0.4276885986328125, -0.39200592041015625, -0.3563232421875, -0.32064056396484375, -0.2849578857421875, -0.24927520751953125, -0.213592529296875, -0.17790985107421875, -0.1422271728515625, -0.10654449462890625, -0.07086181640625, -0.03517913818359375, 0.0005035400390625, 0.03618621826171875, 0.071868896484375, 0.10755157470703125, 0.1432342529296875, 0.17891693115234375, 0.214599609375, 0.25028228759765625, 0.2859649658203125, 0.32164764404296875, 0.357330322265625, 0.39301300048828125, 0.4286956787109375, 0.46437835693359375, 0.50006103515625, 0.5357437133789062, 0.5714263916015625, 0.6071090698242188, 0.642791748046875, 0.6784744262695312, 0.7141571044921875, 0.7498397827148438, 0.7855224609375, 0.8212051391601562, 0.8568878173828125, 0.8925704956054688, 0.928253173828125, 0.9639358520507812, 0.9996185302734375, 1.0353012084960938, 1.07098388671875, 1.1066665649414062, 1.1423492431640625, 1.1780319213867188, 1.213714599609375, 1.2493972778320312, 1.2850799560546875, 1.3207626342773438, 1.3564453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 12.0, 6.0, 22.0, 47.0, 112.0, 305.0, 287.0, 123.0, 49.0, 18.0, 7.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4099082946777344, -0.39037322998046875, -0.3708381652832031, -0.3513031005859375, -0.3317680358886719, -0.31223297119140625, -0.2926979064941406, -0.273162841796875, -0.2536277770996094, -0.23409271240234375, -0.21455764770507812, -0.1950225830078125, -0.17548751831054688, -0.15595245361328125, -0.13641738891601562, -0.11688232421875, -0.09734725952148438, -0.07781219482421875, -0.058277130126953125, -0.0387420654296875, -0.019207000732421875, 0.00032806396484375, 0.019863128662109375, 0.039398193359375, 0.058933258056640625, 0.07846832275390625, 0.09800338745117188, 0.1175384521484375, 0.13707351684570312, 0.15660858154296875, 0.17614364624023438, 0.1956787109375, 0.21521377563476562, 0.23474884033203125, 0.2542839050292969, 0.2738189697265625, 0.2933540344238281, 0.31288909912109375, 0.3324241638183594, 0.351959228515625, 0.3714942932128906, 0.39102935791015625, 0.4105644226074219, 0.4300994873046875, 0.4496345520019531, 0.46916961669921875, 0.4887046813964844, 0.50823974609375, 0.5277748107910156, 0.5473098754882812, 0.5668449401855469, 0.5863800048828125, 0.6059150695800781, 0.6254501342773438, 0.6449851989746094, 0.664520263671875, 0.6840553283691406, 0.7035903930664062, 0.7231254577636719, 0.7426605224609375, 0.7621955871582031, 0.7817306518554688, 0.8012657165527344, 0.82080078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 11.0, 53.0, 684.0, 227.0, 29.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.582576274871826, -2.1321871280670166, -1.6817981004714966, -1.2314090728759766, -0.781019926071167, -0.3306307792663574, 0.11975812911987305, 0.5701472759246826, 1.0205364227294922, 1.4709255695343018, 1.9213145971298218, 2.371703624725342, 2.8220927715301514, 3.272481918334961, 3.7228708267211914, 4.173259735107422, 4.6236491203308105, 5.074038028717041, 5.52442741394043, 5.97481632232666, 6.425205230712891, 6.875594615936279, 7.32598352432251, 7.776372909545898, 8.226761817932129, 8.67715072631836, 9.12753963470459, 9.57792854309082, 10.028318405151367, 10.478707313537598, 10.929096221923828, 11.379485130310059, 11.829874038696289, 12.28026294708252, 12.73065185546875, 13.181041717529297, 13.631430625915527, 14.081819534301758, 14.532208442687988, 14.982597351074219, 15.432987213134766, 15.883376121520996, 16.333765029907227, 16.784154891967773, 17.234542846679688, 17.684932708740234, 18.13532257080078, 18.585710525512695, 19.03609848022461, 19.486488342285156, 19.93687629699707, 20.387266159057617, 20.83765411376953, 21.288043975830078, 21.738433837890625, 22.18882179260254, 22.639211654663086, 23.089601516723633, 23.539989471435547, 23.990379333496094, 24.440767288208008, 24.891157150268555, 25.34154510498047, 25.791934967041016, 26.242324829101562]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 5.0, 12.0, 17.0, 18.0, 21.0, 24.0, 41.0, 46.0, 46.0, 46.0, 53.0, 61.0, 71.0, 59.0, 66.0, 77.0, 53.0, 45.0, 52.0, 42.0, 25.0, 32.0, 23.0, 11.0, 13.0, 14.0, 3.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.796495199203491, -2.7146565914154053, -2.6328182220458984, -2.5509796142578125, -2.4691410064697266, -2.3873026371002197, -2.305464029312134, -2.223625659942627, -2.141787052154541, -2.059948444366455, -1.9781100749969482, -1.8962714672088623, -1.814432978630066, -1.7325944900512695, -1.6507558822631836, -1.5689173936843872, -1.4870789051055908, -1.4052404165267944, -1.323401927947998, -1.241563320159912, -1.1597248315811157, -1.0778863430023193, -0.9960477948188782, -0.914209246635437, -0.8323707580566406, -0.7505322694778442, -0.6686937212944031, -0.5868551731109619, -0.5050166845321655, -0.42317816615104675, -0.341339647769928, -0.2595010995864868, -0.17766261100769043, -0.09582409262657166, -0.01398557424545288, 0.0678529441356659, 0.14969146251678467, 0.23152998089790344, 0.3133684992790222, 0.3952070474624634, 0.47704553604125977, 0.5588840246200562, 0.6407225728034973, 0.7225611209869385, 0.8043996095657349, 0.8862380981445312, 0.9680766463279724, 1.0499151945114136, 1.13175368309021, 1.2135921716690063, 1.2954306602478027, 1.3772692680358887, 1.459107756614685, 1.5409462451934814, 1.6227848529815674, 1.7046233415603638, 1.7864618301391602, 1.8683003187179565, 1.950138807296753, 2.031977415084839, 2.1138157844543457, 2.1956543922424316, 2.2774930000305176, 2.3593316078186035, 2.4411699771881104]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 7.0, 5.0, 19.0, 34.0, 81.0, 171.0, 392.0, 1083.0, 10233.0, 4158523.0, 22225.0, 1044.0, 262.0, 96.0, 41.0, 25.0, 17.0, 11.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4140625, -5.25750732421875, -5.1009521484375, -4.94439697265625, -4.787841796875, -4.63128662109375, -4.4747314453125, -4.31817626953125, -4.16162109375, -4.00506591796875, -3.8485107421875, -3.69195556640625, -3.535400390625, -3.37884521484375, -3.2222900390625, -3.06573486328125, -2.9091796875, -2.75262451171875, -2.5960693359375, -2.43951416015625, -2.282958984375, -2.12640380859375, -1.9698486328125, -1.81329345703125, -1.65673828125, -1.50018310546875, -1.3436279296875, -1.18707275390625, -1.030517578125, -0.87396240234375, -0.7174072265625, -0.56085205078125, -0.404296875, -0.24774169921875, -0.0911865234375, 0.06536865234375, 0.221923828125, 0.37847900390625, 0.5350341796875, 0.69158935546875, 0.84814453125, 1.00469970703125, 1.1612548828125, 1.31781005859375, 1.474365234375, 1.63092041015625, 1.7874755859375, 1.94403076171875, 2.1005859375, 2.25714111328125, 2.4136962890625, 2.57025146484375, 2.726806640625, 2.88336181640625, 3.0399169921875, 3.19647216796875, 3.35302734375, 3.50958251953125, 3.6661376953125, 3.82269287109375, 3.979248046875, 4.13580322265625, 4.2923583984375, 4.44891357421875, 4.60546875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 14.0, 10.0, 27.0, 58.0, 83.0, 114.0, 137.0, 134.0, 133.0, 98.0, 72.0, 44.0, 23.0, 15.0, 13.0, 9.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.1221761703491211, -0.11861991882324219, -0.11506366729736328, -0.11150741577148438, -0.10795116424560547, -0.10439491271972656, -0.10083866119384766, -0.09728240966796875, -0.09372615814208984, -0.09016990661621094, -0.08661365509033203, -0.08305740356445312, -0.07950115203857422, -0.07594490051269531, -0.0723886489868164, -0.0688323974609375, -0.0652761459350586, -0.06171989440917969, -0.05816364288330078, -0.054607391357421875, -0.05105113983154297, -0.04749488830566406, -0.043938636779785156, -0.04038238525390625, -0.036826133728027344, -0.03326988220214844, -0.02971363067626953, -0.026157379150390625, -0.02260112762451172, -0.019044876098632812, -0.015488624572753906, -0.011932373046875, -0.008376121520996094, -0.0048198699951171875, -0.0012636184692382812, 0.002292633056640625, 0.005848884582519531, 0.009405136108398438, 0.012961387634277344, 0.01651763916015625, 0.020073890686035156, 0.023630142211914062, 0.02718639373779297, 0.030742645263671875, 0.03429889678955078, 0.03785514831542969, 0.041411399841308594, 0.0449676513671875, 0.048523902893066406, 0.05208015441894531, 0.05563640594482422, 0.059192657470703125, 0.06274890899658203, 0.06630516052246094, 0.06986141204833984, 0.07341766357421875, 0.07697391510009766, 0.08053016662597656, 0.08408641815185547, 0.08764266967773438, 0.09119892120361328, 0.09475517272949219, 0.0983114242553711, 0.10186767578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 13.0, 10.0, 16.0, 12.0, 27.0, 32.0, 28.0, 45.0, 51.0, 66.0, 91.0, 128.0, 158.0, 251.0, 619.0, 5357.0, 2198501.0, 1979961.0, 7089.0, 862.0, 283.0, 165.0, 129.0, 96.0, 75.0, 49.0, 36.0, 27.0, 19.0, 17.0, 17.0, 12.0, 9.0, 9.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.357421875, -2.2813720703125, -2.205322265625, -2.1292724609375, -2.05322265625, -1.9771728515625, -1.901123046875, -1.8250732421875, -1.7490234375, -1.6729736328125, -1.596923828125, -1.5208740234375, -1.44482421875, -1.3687744140625, -1.292724609375, -1.2166748046875, -1.140625, -1.0645751953125, -0.988525390625, -0.9124755859375, -0.83642578125, -0.7603759765625, -0.684326171875, -0.6082763671875, -0.5322265625, -0.4561767578125, -0.380126953125, -0.3040771484375, -0.22802734375, -0.1519775390625, -0.075927734375, 0.0001220703125, 0.076171875, 0.1522216796875, 0.228271484375, 0.3043212890625, 0.38037109375, 0.4564208984375, 0.532470703125, 0.6085205078125, 0.6845703125, 0.7606201171875, 0.836669921875, 0.9127197265625, 0.98876953125, 1.0648193359375, 1.140869140625, 1.2169189453125, 1.29296875, 1.3690185546875, 1.445068359375, 1.5211181640625, 1.59716796875, 1.6732177734375, 1.749267578125, 1.8253173828125, 1.9013671875, 1.9774169921875, 2.053466796875, 2.1295166015625, 2.20556640625, 2.2816162109375, 2.357666015625, 2.4337158203125, 2.509765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 13.0, 11.0, 24.0, 53.0, 84.0, 219.0, 654.0, 2022.0, 524.0, 180.0, 83.0, 52.0, 50.0, 20.0, 22.0, 9.0, 6.0, 9.0, 12.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.243408203125, -0.23723602294921875, -0.2310638427734375, -0.22489166259765625, -0.218719482421875, -0.21254730224609375, -0.2063751220703125, -0.20020294189453125, -0.19403076171875, -0.18785858154296875, -0.1816864013671875, -0.17551422119140625, -0.169342041015625, -0.16316986083984375, -0.1569976806640625, -0.15082550048828125, -0.1446533203125, -0.13848114013671875, -0.1323089599609375, -0.12613677978515625, -0.119964599609375, -0.11379241943359375, -0.1076202392578125, -0.10144805908203125, -0.09527587890625, -0.08910369873046875, -0.0829315185546875, -0.07675933837890625, -0.070587158203125, -0.06441497802734375, -0.0582427978515625, -0.05207061767578125, -0.0458984375, -0.03972625732421875, -0.0335540771484375, -0.02738189697265625, -0.021209716796875, -0.01503753662109375, -0.0088653564453125, -0.00269317626953125, 0.00347900390625, 0.00965118408203125, 0.0158233642578125, 0.02199554443359375, 0.028167724609375, 0.03433990478515625, 0.0405120849609375, 0.04668426513671875, 0.0528564453125, 0.05902862548828125, 0.0652008056640625, 0.07137298583984375, 0.077545166015625, 0.08371734619140625, 0.0898895263671875, 0.09606170654296875, 0.10223388671875, 0.10840606689453125, 0.1145782470703125, 0.12075042724609375, 0.126922607421875, 0.13309478759765625, 0.1392669677734375, 0.14543914794921875, 0.151611328125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 13.0, 39.0, 116.0, 304.0, 311.0, 125.0, 39.0, 21.0, 15.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.244680643081665, -2.154935598373413, -2.065190553665161, -1.9754453897476196, -1.8857003450393677, -1.7959553003311157, -1.7062101364135742, -1.6164650917053223, -1.5267200469970703, -1.4369750022888184, -1.3472299575805664, -1.257484793663025, -1.167739748954773, -1.077994704246521, -0.9882495999336243, -0.8985044956207275, -0.8087594509124756, -0.7190144062042236, -0.6292693018913269, -0.5395241975784302, -0.4497791528701782, -0.3600340783596039, -0.27028900384902954, -0.1805438995361328, -0.09079885482788086, -0.0010537803173065186, 0.08869129419326782, 0.17843636870384216, 0.2681814432144165, 0.35792651772499084, 0.4476715922355652, 0.5374166965484619, 0.627161979675293, 0.7169070243835449, 0.8066521286964417, 0.8963972330093384, 0.9861422777175903, 1.0758873224258423, 1.1656324863433838, 1.2553775310516357, 1.3451225757598877, 1.4348676204681396, 1.5246126651763916, 1.614357829093933, 1.704102873802185, 1.793847918510437, 1.8835930824279785, 1.9733381271362305, 2.0630831718444824, 2.1528282165527344, 2.2425732612609863, 2.3323183059692383, 2.4220633506774902, 2.5118086338043213, 2.6015536785125732, 2.691298723220825, 2.781043767929077, 2.870788812637329, 2.960533857345581, 3.050278902053833, 3.140024185180664, 3.229769229888916, 3.319514274597168, 3.40925931930542, 3.499004364013672]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 8.0, 6.0, 12.0, 9.0, 22.0, 22.0, 42.0, 39.0, 52.0, 58.0, 56.0, 75.0, 68.0, 81.0, 87.0, 68.0, 61.0, 51.0, 44.0, 29.0, 27.0, 31.0, 14.0, 9.0, 8.0, 6.0, 9.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9387330412864685, -0.9107680320739746, -0.8828029632568359, -0.8548378944396973, -0.8268728852272034, -0.7989078760147095, -0.7709428071975708, -0.7429777383804321, -0.7150127291679382, -0.6870477199554443, -0.6590826511383057, -0.631117582321167, -0.6031525731086731, -0.5751875638961792, -0.5472224950790405, -0.5192574262619019, -0.49129241704940796, -0.4633273780345917, -0.4353623390197754, -0.4073973000049591, -0.3794322609901428, -0.35146722197532654, -0.32350218296051025, -0.29553714394569397, -0.2675721049308777, -0.2396070659160614, -0.21164202690124512, -0.18367698788642883, -0.15571194887161255, -0.12774690985679626, -0.09978187084197998, -0.0718168318271637, -0.04385173320770264, -0.015886694192886353, 0.012078344821929932, 0.040043383836746216, 0.0680084228515625, 0.09597346186637878, 0.12393850088119507, 0.15190353989601135, 0.17986857891082764, 0.20783361792564392, 0.2357986569404602, 0.2637636959552765, 0.2917287349700928, 0.31969377398490906, 0.34765881299972534, 0.3756238520145416, 0.4035888910293579, 0.4315539300441742, 0.4595189690589905, 0.48748400807380676, 0.515449047088623, 0.5434141159057617, 0.5713791251182556, 0.5993441343307495, 0.6273092031478882, 0.6552742719650269, 0.6832392811775208, 0.7112042903900146, 0.7391693592071533, 0.767134428024292, 0.7950994372367859, 0.8230644464492798, 0.8510295152664185]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 9.0, 9.0, 9.0, 2.0, 11.0, 14.0, 13.0, 15.0, 17.0, 42.0, 43.0, 80.0, 99.0, 141.0, 257.0, 423.0, 731.0, 1485.0, 3401.0, 9681.0, 45303.0, 338752.0, 541677.0, 82781.0, 14817.0, 4536.0, 1814.0, 919.0, 530.0, 312.0, 178.0, 114.0, 86.0, 62.0, 37.0, 27.0, 19.0, 20.0, 17.0, 10.0, 7.0, 10.0, 7.0, 8.0, 7.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.75537109375, -0.7325897216796875, -0.709808349609375, -0.6870269775390625, -0.66424560546875, -0.6414642333984375, -0.618682861328125, -0.5959014892578125, -0.5731201171875, -0.5503387451171875, -0.527557373046875, -0.5047760009765625, -0.48199462890625, -0.4592132568359375, -0.436431884765625, -0.4136505126953125, -0.390869140625, -0.3680877685546875, -0.345306396484375, -0.3225250244140625, -0.29974365234375, -0.2769622802734375, -0.254180908203125, -0.2313995361328125, -0.2086181640625, -0.1858367919921875, -0.163055419921875, -0.1402740478515625, -0.11749267578125, -0.0947113037109375, -0.071929931640625, -0.0491485595703125, -0.0263671875, -0.0035858154296875, 0.019195556640625, 0.0419769287109375, 0.06475830078125, 0.0875396728515625, 0.110321044921875, 0.1331024169921875, 0.1558837890625, 0.1786651611328125, 0.201446533203125, 0.2242279052734375, 0.24700927734375, 0.2697906494140625, 0.292572021484375, 0.3153533935546875, 0.338134765625, 0.3609161376953125, 0.383697509765625, 0.4064788818359375, 0.42926025390625, 0.4520416259765625, 0.474822998046875, 0.4976043701171875, 0.5203857421875, 0.5431671142578125, 0.565948486328125, 0.5887298583984375, 0.61151123046875, 0.6342926025390625, 0.657073974609375, 0.6798553466796875, 0.70263671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 10.0, 20.0, 50.0, 54.0, 84.0, 112.0, 119.0, 128.0, 122.0, 82.0, 65.0, 50.0, 28.0, 28.0, 15.0, 10.0, 5.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10821533203125, -0.10505867004394531, -0.10190200805664062, -0.09874534606933594, -0.09558868408203125, -0.09243202209472656, -0.08927536010742188, -0.08611869812011719, -0.0829620361328125, -0.07980537414550781, -0.07664871215820312, -0.07349205017089844, -0.07033538818359375, -0.06717872619628906, -0.06402206420898438, -0.06086540222167969, -0.057708740234375, -0.05455207824707031, -0.051395416259765625, -0.04823875427246094, -0.04508209228515625, -0.04192543029785156, -0.038768768310546875, -0.03561210632324219, -0.0324554443359375, -0.029298782348632812, -0.026142120361328125, -0.022985458374023438, -0.01982879638671875, -0.016672134399414062, -0.013515472412109375, -0.010358810424804688, -0.0072021484375, -0.0040454864501953125, -0.000888824462890625, 0.0022678375244140625, 0.00542449951171875, 0.008581161499023438, 0.011737823486328125, 0.014894485473632812, 0.0180511474609375, 0.021207809448242188, 0.024364471435546875, 0.027521133422851562, 0.03067779541015625, 0.03383445739746094, 0.036991119384765625, 0.04014778137207031, 0.043304443359375, 0.04646110534667969, 0.049617767333984375, 0.05277442932128906, 0.05593109130859375, 0.05908775329589844, 0.062244415283203125, 0.06540107727050781, 0.0685577392578125, 0.07171440124511719, 0.07487106323242188, 0.07802772521972656, 0.08118438720703125, 0.08434104919433594, 0.08749771118164062, 0.09065437316894531, 0.09381103515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 11.0, 18.0, 20.0, 30.0, 33.0, 45.0, 73.0, 157.0, 229.0, 509.0, 1066.0, 3143.0, 12878.0, 80590.0, 534803.0, 355994.0, 46104.0, 8616.0, 2345.0, 884.0, 390.0, 224.0, 106.0, 86.0, 53.0, 29.0, 35.0, 19.0, 15.0, 10.0, 4.0, 7.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.5845718383789062, -0.5656280517578125, -0.5466842651367188, -0.527740478515625, -0.5087966918945312, -0.4898529052734375, -0.47090911865234375, -0.45196533203125, -0.43302154541015625, -0.4140777587890625, -0.39513397216796875, -0.376190185546875, -0.35724639892578125, -0.3383026123046875, -0.31935882568359375, -0.3004150390625, -0.28147125244140625, -0.2625274658203125, -0.24358367919921875, -0.224639892578125, -0.20569610595703125, -0.1867523193359375, -0.16780853271484375, -0.14886474609375, -0.12992095947265625, -0.1109771728515625, -0.09203338623046875, -0.073089599609375, -0.05414581298828125, -0.0352020263671875, -0.01625823974609375, 0.002685546875, 0.02162933349609375, 0.0405731201171875, 0.05951690673828125, 0.078460693359375, 0.09740447998046875, 0.1163482666015625, 0.13529205322265625, 0.15423583984375, 0.17317962646484375, 0.1921234130859375, 0.21106719970703125, 0.230010986328125, 0.24895477294921875, 0.2678985595703125, 0.28684234619140625, 0.3057861328125, 0.32472991943359375, 0.3436737060546875, 0.36261749267578125, 0.381561279296875, 0.40050506591796875, 0.4194488525390625, 0.43839263916015625, 0.45733642578125, 0.47628021240234375, 0.4952239990234375, 0.5141677856445312, 0.533111572265625, 0.5520553588867188, 0.5709991455078125, 0.5899429321289062, 0.60888671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 11.0, 19.0, 12.0, 14.0, 28.0, 25.0, 29.0, 20.0, 25.0, 32.0, 39.0, 28.0, 51.0, 51.0, 49.0, 48.0, 52.0, 38.0, 48.0, 44.0, 42.0, 38.0, 34.0, 25.0, 28.0, 20.0, 20.0, 20.0, 13.0, 18.0, 8.0, 9.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2459716796875, -0.23764991760253906, -0.22932815551757812, -0.2210063934326172, -0.21268463134765625, -0.2043628692626953, -0.19604110717773438, -0.18771934509277344, -0.1793975830078125, -0.17107582092285156, -0.16275405883789062, -0.1544322967529297, -0.14611053466796875, -0.1377887725830078, -0.12946701049804688, -0.12114524841308594, -0.112823486328125, -0.10450172424316406, -0.09617996215820312, -0.08785820007324219, -0.07953643798828125, -0.07121467590332031, -0.06289291381835938, -0.05457115173339844, -0.0462493896484375, -0.03792762756347656, -0.029605865478515625, -0.021284103393554688, -0.01296234130859375, -0.0046405792236328125, 0.003681182861328125, 0.012002944946289062, 0.02032470703125, 0.028646469116210938, 0.036968231201171875, 0.04528999328613281, 0.05361175537109375, 0.06193351745605469, 0.07025527954101562, 0.07857704162597656, 0.0868988037109375, 0.09522056579589844, 0.10354232788085938, 0.11186408996582031, 0.12018585205078125, 0.1285076141357422, 0.13682937622070312, 0.14515113830566406, 0.153472900390625, 0.16179466247558594, 0.17011642456054688, 0.1784381866455078, 0.18675994873046875, 0.1950817108154297, 0.20340347290039062, 0.21172523498535156, 0.2200469970703125, 0.22836875915527344, 0.23669052124023438, 0.2450122833251953, 0.25333404541015625, 0.2616558074951172, 0.2699775695800781, 0.27829933166503906, 0.28662109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 6.0, 9.0, 16.0, 19.0, 66.0, 148.0, 343.0, 2027.0, 49772.0, 985876.0, 9026.0, 866.0, 218.0, 87.0, 43.0, 23.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.951171875, -1.902740478515625, -1.85430908203125, -1.805877685546875, -1.7574462890625, -1.709014892578125, -1.66058349609375, -1.612152099609375, -1.563720703125, -1.515289306640625, -1.46685791015625, -1.418426513671875, -1.3699951171875, -1.321563720703125, -1.27313232421875, -1.224700927734375, -1.17626953125, -1.127838134765625, -1.07940673828125, -1.030975341796875, -0.9825439453125, -0.934112548828125, -0.88568115234375, -0.837249755859375, -0.788818359375, -0.740386962890625, -0.69195556640625, -0.643524169921875, -0.5950927734375, -0.546661376953125, -0.49822998046875, -0.449798583984375, -0.4013671875, -0.352935791015625, -0.30450439453125, -0.256072998046875, -0.2076416015625, -0.159210205078125, -0.11077880859375, -0.062347412109375, -0.013916015625, 0.034515380859375, 0.08294677734375, 0.131378173828125, 0.1798095703125, 0.228240966796875, 0.27667236328125, 0.325103759765625, 0.37353515625, 0.421966552734375, 0.47039794921875, 0.518829345703125, 0.5672607421875, 0.615692138671875, 0.66412353515625, 0.712554931640625, 0.760986328125, 0.809417724609375, 0.85784912109375, 0.906280517578125, 0.9547119140625, 1.003143310546875, 1.05157470703125, 1.100006103515625, 1.1484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 16.0, 12.0, 28.0, 22.0, 39.0, 65.0, 61.0, 127.0, 132.0, 112.0, 99.0, 69.0, 55.0, 32.0, 30.0, 23.0, 10.0, 14.0, 9.0, 8.0, 2.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013816356658935547, -0.0001340806484222412, -0.00012999773025512695, -0.0001259148120880127, -0.00012183189392089844, -0.00011774897575378418, -0.00011366605758666992, -0.00010958313941955566, -0.0001055002212524414, -0.00010141730308532715, -9.733438491821289e-05, -9.325146675109863e-05, -8.916854858398438e-05, -8.508563041687012e-05, -8.100271224975586e-05, -7.69197940826416e-05, -7.283687591552734e-05, -6.875395774841309e-05, -6.467103958129883e-05, -6.058812141418457e-05, -5.650520324707031e-05, -5.2422285079956055e-05, -4.83393669128418e-05, -4.425644874572754e-05, -4.017353057861328e-05, -3.6090612411499023e-05, -3.2007694244384766e-05, -2.7924776077270508e-05, -2.384185791015625e-05, -1.9758939743041992e-05, -1.5676021575927734e-05, -1.1593103408813477e-05, -7.510185241699219e-06, -3.427267074584961e-06, 6.556510925292969e-07, 4.738569259643555e-06, 8.821487426757812e-06, 1.290440559387207e-05, 1.6987323760986328e-05, 2.1070241928100586e-05, 2.5153160095214844e-05, 2.92360782623291e-05, 3.331899642944336e-05, 3.740191459655762e-05, 4.1484832763671875e-05, 4.556775093078613e-05, 4.965066909790039e-05, 5.373358726501465e-05, 5.7816505432128906e-05, 6.189942359924316e-05, 6.598234176635742e-05, 7.006525993347168e-05, 7.414817810058594e-05, 7.82310962677002e-05, 8.231401443481445e-05, 8.639693260192871e-05, 9.047985076904297e-05, 9.456276893615723e-05, 9.864568710327148e-05, 0.00010272860527038574, 0.0001068115234375, 0.00011089444160461426, 0.00011497735977172852, 0.00011906027793884277, 0.00012314319610595703]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 16.0, 25.0, 29.0, 57.0, 75.0, 151.0, 284.0, 694.0, 1878.0, 6137.0, 29552.0, 652911.0, 330191.0, 19332.0, 4668.0, 1442.0, 549.0, 266.0, 103.0, 63.0, 45.0, 20.0, 14.0, 9.0, 3.0, 5.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.4602508544921875, -0.442474365234375, -0.4246978759765625, -0.40692138671875, -0.3891448974609375, -0.371368408203125, -0.3535919189453125, -0.3358154296875, -0.3180389404296875, -0.300262451171875, -0.2824859619140625, -0.26470947265625, -0.2469329833984375, -0.229156494140625, -0.2113800048828125, -0.193603515625, -0.1758270263671875, -0.158050537109375, -0.1402740478515625, -0.12249755859375, -0.1047210693359375, -0.086944580078125, -0.0691680908203125, -0.0513916015625, -0.0336151123046875, -0.015838623046875, 0.0019378662109375, 0.01971435546875, 0.0374908447265625, 0.055267333984375, 0.0730438232421875, 0.0908203125, 0.1085968017578125, 0.126373291015625, 0.1441497802734375, 0.16192626953125, 0.1797027587890625, 0.197479248046875, 0.2152557373046875, 0.2330322265625, 0.2508087158203125, 0.268585205078125, 0.2863616943359375, 0.30413818359375, 0.3219146728515625, 0.339691162109375, 0.3574676513671875, 0.375244140625, 0.3930206298828125, 0.410797119140625, 0.4285736083984375, 0.44635009765625, 0.4641265869140625, 0.481903076171875, 0.4996795654296875, 0.5174560546875, 0.5352325439453125, 0.553009033203125, 0.5707855224609375, 0.58856201171875, 0.6063385009765625, 0.624114990234375, 0.6418914794921875, 0.65966796875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 10.0, 15.0, 19.0, 45.0, 71.0, 84.0, 158.0, 156.0, 141.0, 112.0, 69.0, 35.0, 24.0, 12.0, 4.0, 5.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.330322265625, -0.32177162170410156, -0.3132209777832031, -0.3046703338623047, -0.29611968994140625, -0.2875690460205078, -0.2790184020996094, -0.27046775817871094, -0.2619171142578125, -0.25336647033691406, -0.24481582641601562, -0.2362651824951172, -0.22771453857421875, -0.2191638946533203, -0.21061325073242188, -0.20206260681152344, -0.193511962890625, -0.18496131896972656, -0.17641067504882812, -0.1678600311279297, -0.15930938720703125, -0.1507587432861328, -0.14220809936523438, -0.13365745544433594, -0.1251068115234375, -0.11655616760253906, -0.10800552368164062, -0.09945487976074219, -0.09090423583984375, -0.08235359191894531, -0.07380294799804688, -0.06525230407714844, -0.05670166015625, -0.04815101623535156, -0.039600372314453125, -0.031049728393554688, -0.02249908447265625, -0.013948440551757812, -0.005397796630859375, 0.0031528472900390625, 0.0117034912109375, 0.020254135131835938, 0.028804779052734375, 0.03735542297363281, 0.04590606689453125, 0.05445671081542969, 0.06300735473632812, 0.07155799865722656, 0.080108642578125, 0.08865928649902344, 0.09720993041992188, 0.10576057434082031, 0.11431121826171875, 0.12286186218261719, 0.13141250610351562, 0.13996315002441406, 0.1485137939453125, 0.15706443786621094, 0.16561508178710938, 0.1741657257080078, 0.18271636962890625, 0.1912670135498047, 0.19981765747070312, 0.20836830139160156, 0.2169189453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 20.0, 74.0, 323.0, 441.0, 108.0, 26.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.791337013244629, -13.51680850982666, -13.242279052734375, -12.967750549316406, -12.693221092224121, -12.418692588806152, -12.144163131713867, -11.869634628295898, -11.59510612487793, -11.320577621459961, -11.046048164367676, -10.771519660949707, -10.496990203857422, -10.222461700439453, -9.947932243347168, -9.6734037399292, -9.398874282836914, -9.124345779418945, -8.84981632232666, -8.575287818908691, -8.300758361816406, -8.026229858398438, -7.7517008781433105, -7.477171897888184, -7.202642917633057, -6.92811393737793, -6.653584957122803, -6.379055976867676, -6.104527473449707, -5.829998016357422, -5.555469512939453, -5.280940532684326, -5.006411552429199, -4.731882572174072, -4.457353591918945, -4.182824611663818, -3.9082958698272705, -3.6337668895721436, -3.3592381477355957, -3.0847091674804688, -2.810180425643921, -2.535651445388794, -2.261122703552246, -1.9865937232971191, -1.7120647430419922, -1.4375357627868652, -1.1630069017410278, -0.8884780406951904, -0.6139490604400635, -0.3394201397895813, -0.06489121913909912, 0.20963770151138306, 0.48416662216186523, 0.7586956024169922, 1.0332244634628296, 1.307753324508667, 1.582282304763794, 1.856811285018921, 2.1313400268554688, 2.4058690071105957, 2.6803979873657227, 2.9549269676208496, 3.2294559478759766, 3.5039846897125244, 3.7785136699676514]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 8.0, 15.0, 16.0, 23.0, 25.0, 33.0, 55.0, 42.0, 49.0, 58.0, 56.0, 80.0, 77.0, 65.0, 64.0, 55.0, 45.0, 44.0, 27.0, 36.0, 31.0, 26.0, 18.0, 15.0, 11.0, 5.0, 7.0, 6.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5152783393859863, -2.426679849624634, -2.3380813598632812, -2.2494828701019287, -2.160884380340576, -2.0722861289978027, -1.9836876392364502, -1.8950891494750977, -1.8064906597137451, -1.7178921699523926, -1.62929368019104, -1.540695309638977, -1.4520968198776245, -1.363498330116272, -1.274899959564209, -1.1863014698028564, -1.097702980041504, -1.0091044902801514, -0.9205060601234436, -0.8319076299667358, -0.7433091402053833, -0.6547106504440308, -0.566112220287323, -0.47751379013061523, -0.3889153003692627, -0.30031684041023254, -0.2117183804512024, -0.12311992049217224, -0.03452146053314209, 0.05407699942588806, 0.1426754593849182, 0.23127388954162598, 0.3198723793029785, 0.40847083926200867, 0.4970692992210388, 0.5856677293777466, 0.6742662191390991, 0.7628647089004517, 0.8514631390571594, 0.9400615692138672, 1.0286600589752197, 1.1172585487365723, 1.2058570384979248, 1.2944554090499878, 1.3830538988113403, 1.4716523885726929, 1.5602507591247559, 1.6488492488861084, 1.737447738647461, 1.8260462284088135, 1.914644718170166, 2.0032432079315186, 2.091841697692871, 2.1804399490356445, 2.269038438796997, 2.3576369285583496, 2.446235418319702, 2.5348339080810547, 2.6234323978424072, 2.7120308876037598, 2.800629138946533, 2.8892276287078857, 2.9778261184692383, 3.066424608230591, 3.1550230979919434]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 5.0, 7.0, 7.0, 9.0, 12.0, 12.0, 18.0, 22.0, 34.0, 42.0, 60.0, 82.0, 120.0, 171.0, 271.0, 475.0, 992.0, 2167.0, 6326.0, 28143.0, 375996.0, 3689679.0, 71808.0, 11951.0, 3389.0, 1309.0, 544.0, 238.0, 142.0, 88.0, 60.0, 36.0, 22.0, 14.0, 8.0, 4.0, 5.0, 5.0, 0.0, 2.0, 2.0], "bins": [-1.7431640625, -1.7037429809570312, -1.6643218994140625, -1.6249008178710938, -1.585479736328125, -1.5460586547851562, -1.5066375732421875, -1.4672164916992188, -1.42779541015625, -1.3883743286132812, -1.3489532470703125, -1.3095321655273438, -1.270111083984375, -1.2306900024414062, -1.1912689208984375, -1.1518478393554688, -1.1124267578125, -1.0730056762695312, -1.0335845947265625, -0.9941635131835938, -0.954742431640625, -0.9153213500976562, -0.8759002685546875, -0.8364791870117188, -0.79705810546875, -0.7576370239257812, -0.7182159423828125, -0.6787948608398438, -0.639373779296875, -0.5999526977539062, -0.5605316162109375, -0.5211105346679688, -0.481689453125, -0.44226837158203125, -0.4028472900390625, -0.36342620849609375, -0.324005126953125, -0.28458404541015625, -0.2451629638671875, -0.20574188232421875, -0.16632080078125, -0.12689971923828125, -0.0874786376953125, -0.04805755615234375, -0.008636474609375, 0.03078460693359375, 0.0702056884765625, 0.10962677001953125, 0.1490478515625, 0.18846893310546875, 0.2278900146484375, 0.26731109619140625, 0.306732177734375, 0.34615325927734375, 0.3855743408203125, 0.42499542236328125, 0.46441650390625, 0.5038375854492188, 0.5432586669921875, 0.5826797485351562, 0.622100830078125, 0.6615219116210938, 0.7009429931640625, 0.7403640747070312, 0.77978515625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 2.0, 6.0, 11.0, 18.0, 23.0, 34.0, 44.0, 56.0, 75.0, 83.0, 100.0, 68.0, 106.0, 85.0, 64.0, 58.0, 48.0, 35.0, 17.0, 19.0, 12.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10906982421875, -0.10572052001953125, -0.1023712158203125, -0.09902191162109375, -0.095672607421875, -0.09232330322265625, -0.0889739990234375, -0.08562469482421875, -0.082275390625, -0.07892608642578125, -0.0755767822265625, -0.07222747802734375, -0.068878173828125, -0.06552886962890625, -0.0621795654296875, -0.05883026123046875, -0.05548095703125, -0.05213165283203125, -0.0487823486328125, -0.04543304443359375, -0.042083740234375, -0.03873443603515625, -0.0353851318359375, -0.03203582763671875, -0.0286865234375, -0.02533721923828125, -0.0219879150390625, -0.01863861083984375, -0.015289306640625, -0.01194000244140625, -0.0085906982421875, -0.00524139404296875, -0.00189208984375, 0.00145721435546875, 0.0048065185546875, 0.00815582275390625, 0.011505126953125, 0.01485443115234375, 0.0182037353515625, 0.02155303955078125, 0.02490234375, 0.02825164794921875, 0.0316009521484375, 0.03495025634765625, 0.038299560546875, 0.04164886474609375, 0.0449981689453125, 0.04834747314453125, 0.05169677734375, 0.05504608154296875, 0.0583953857421875, 0.06174468994140625, 0.065093994140625, 0.06844329833984375, 0.0717926025390625, 0.07514190673828125, 0.0784912109375, 0.08184051513671875, 0.0851898193359375, 0.08853912353515625, 0.091888427734375, 0.09523773193359375, 0.0985870361328125, 0.10193634033203125, 0.10528564453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 5.0, 10.0, 16.0, 15.0, 22.0, 31.0, 34.0, 50.0, 68.0, 90.0, 135.0, 226.0, 505.0, 1265.0, 5009.0, 196005.0, 3973048.0, 14676.0, 1706.0, 586.0, 296.0, 160.0, 89.0, 67.0, 35.0, 24.0, 19.0, 18.0, 11.0, 11.0, 6.0, 10.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9853515625, -1.9173736572265625, -1.849395751953125, -1.7814178466796875, -1.71343994140625, -1.6454620361328125, -1.577484130859375, -1.5095062255859375, -1.4415283203125, -1.3735504150390625, -1.305572509765625, -1.2375946044921875, -1.16961669921875, -1.1016387939453125, -1.033660888671875, -0.9656829833984375, -0.897705078125, -0.8297271728515625, -0.761749267578125, -0.6937713623046875, -0.62579345703125, -0.5578155517578125, -0.489837646484375, -0.4218597412109375, -0.3538818359375, -0.2859039306640625, -0.217926025390625, -0.1499481201171875, -0.08197021484375, -0.0139923095703125, 0.053985595703125, 0.1219635009765625, 0.18994140625, 0.2579193115234375, 0.325897216796875, 0.3938751220703125, 0.46185302734375, 0.5298309326171875, 0.597808837890625, 0.6657867431640625, 0.7337646484375, 0.8017425537109375, 0.869720458984375, 0.9376983642578125, 1.00567626953125, 1.0736541748046875, 1.141632080078125, 1.2096099853515625, 1.277587890625, 1.3455657958984375, 1.413543701171875, 1.4815216064453125, 1.54949951171875, 1.6174774169921875, 1.685455322265625, 1.7534332275390625, 1.8214111328125, 1.8893890380859375, 1.957366943359375, 2.0253448486328125, 2.09332275390625, 2.1613006591796875, 2.229278564453125, 2.2972564697265625, 2.365234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 7.0, 4.0, 18.0, 21.0, 41.0, 67.0, 153.0, 408.0, 2172.0, 723.0, 231.0, 104.0, 69.0, 24.0, 15.0, 12.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43017578125, -0.4207496643066406, -0.41132354736328125, -0.4018974304199219, -0.3924713134765625, -0.3830451965332031, -0.37361907958984375, -0.3641929626464844, -0.354766845703125, -0.3453407287597656, -0.33591461181640625, -0.3264884948730469, -0.3170623779296875, -0.3076362609863281, -0.29821014404296875, -0.2887840270996094, -0.27935791015625, -0.2699317932128906, -0.26050567626953125, -0.2510795593261719, -0.2416534423828125, -0.23222732543945312, -0.22280120849609375, -0.21337509155273438, -0.203948974609375, -0.19452285766601562, -0.18509674072265625, -0.17567062377929688, -0.1662445068359375, -0.15681838989257812, -0.14739227294921875, -0.13796615600585938, -0.1285400390625, -0.11911392211914062, -0.10968780517578125, -0.10026168823242188, -0.0908355712890625, -0.08140945434570312, -0.07198333740234375, -0.06255722045898438, -0.053131103515625, -0.043704986572265625, -0.03427886962890625, -0.024852752685546875, -0.0154266357421875, -0.006000518798828125, 0.00342559814453125, 0.012851715087890625, 0.02227783203125, 0.031703948974609375, 0.04113006591796875, 0.050556182861328125, 0.0599822998046875, 0.06940841674804688, 0.07883453369140625, 0.08826065063476562, 0.097686767578125, 0.10711288452148438, 0.11653900146484375, 0.12596511840820312, 0.1353912353515625, 0.14481735229492188, 0.15424346923828125, 0.16366958618164062, 0.173095703125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 19.0, 50.0, 113.0, 234.0, 249.0, 168.0, 70.0, 31.0, 15.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6778669357299805, -1.6155760288238525, -1.553285002708435, -1.4909940958023071, -1.4287031888961792, -1.3664121627807617, -1.3041212558746338, -1.2418303489685059, -1.179539442062378, -1.11724853515625, -1.0549575090408325, -0.9926666021347046, -0.9303756952285767, -0.868084728717804, -0.8057937622070312, -0.7435028553009033, -0.6812118887901306, -0.6189209222793579, -0.55663001537323, -0.4943390488624573, -0.43204814195632935, -0.36975717544555664, -0.3074662387371063, -0.245175302028656, -0.1828843653202057, -0.12059342861175537, -0.05830248445272446, 0.0039884597063064575, 0.06627939641475677, 0.1285703480243683, 0.1908612847328186, 0.2531522214412689, 0.31544315814971924, 0.37773409485816956, 0.4400250315666199, 0.5023159980773926, 0.5646069049835205, 0.6268978714942932, 0.6891888380050659, 0.7514797449111938, 0.8137706518173218, 0.8760616183280945, 0.9383525252342224, 1.0006434917449951, 1.062934398651123, 1.125225305557251, 1.1875163316726685, 1.2498072385787964, 1.3120982646942139, 1.3743891716003418, 1.4366801977157593, 1.4989711046218872, 1.5612620115280151, 1.6235530376434326, 1.6858439445495605, 1.7481348514556885, 1.8104257583618164, 1.8727166652679443, 1.9350076913833618, 1.9972985982894897, 2.0595896244049072, 2.121880531311035, 2.184171438217163, 2.246462345123291, 2.308753252029419]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 2.0, 10.0, 11.0, 10.0, 9.0, 9.0, 21.0, 26.0, 24.0, 28.0, 23.0, 22.0, 34.0, 31.0, 55.0, 42.0, 61.0, 40.0, 56.0, 52.0, 41.0, 48.0, 36.0, 37.0, 36.0, 43.0, 33.0, 23.0, 22.0, 21.0, 15.0, 15.0, 10.0, 12.0, 14.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5707749128341675, -0.5530621409416199, -0.5353493094444275, -0.5176365375518799, -0.4999237060546875, -0.4822109341621399, -0.4644981324672699, -0.4467853307723999, -0.4290725290775299, -0.4113597273826599, -0.3936469256877899, -0.3759341239929199, -0.3582213521003723, -0.34050852060317993, -0.3227957487106323, -0.30508294701576233, -0.28737014532089233, -0.26965734362602234, -0.25194454193115234, -0.23423175513744354, -0.21651895344257355, -0.19880615174770355, -0.18109336495399475, -0.16338056325912476, -0.14566776156425476, -0.12795495986938477, -0.11024216562509537, -0.09252937138080597, -0.07481656968593597, -0.05710376799106598, -0.03939097374677658, -0.021678179502487183, -0.0039653778076171875, 0.01374742016196251, 0.031460218131542206, 0.0491730161011219, 0.0668858140707016, 0.0845986157655716, 0.10231141000986099, 0.12002420425415039, 0.13773700594902039, 0.15544980764389038, 0.17316260933876038, 0.19087539613246918, 0.20858819782733917, 0.22630099952220917, 0.24401378631591797, 0.26172658801078796, 0.27943938970565796, 0.29715219140052795, 0.31486499309539795, 0.33257779479026794, 0.35029059648513794, 0.36800336837768555, 0.38571617007255554, 0.40342897176742554, 0.42114177346229553, 0.4388545751571655, 0.4565673768520355, 0.4742801785469055, 0.4919929504394531, 0.5097057819366455, 0.5274185538291931, 0.5451313257217407, 0.5628441572189331]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 4.0, 3.0, 5.0, 14.0, 11.0, 18.0, 20.0, 34.0, 46.0, 65.0, 95.0, 151.0, 221.0, 417.0, 762.0, 1573.0, 4090.0, 13976.0, 82537.0, 571111.0, 319499.0, 39943.0, 8521.0, 2759.0, 1206.0, 557.0, 331.0, 192.0, 126.0, 81.0, 58.0, 36.0, 28.0, 13.0, 14.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.97998046875, -0.9533615112304688, -0.9267425537109375, -0.9001235961914062, -0.873504638671875, -0.8468856811523438, -0.8202667236328125, -0.7936477661132812, -0.76702880859375, -0.7404098510742188, -0.7137908935546875, -0.6871719360351562, -0.660552978515625, -0.6339340209960938, -0.6073150634765625, -0.5806961059570312, -0.5540771484375, -0.5274581909179688, -0.5008392333984375, -0.47422027587890625, -0.447601318359375, -0.42098236083984375, -0.3943634033203125, -0.36774444580078125, -0.34112548828125, -0.31450653076171875, -0.2878875732421875, -0.26126861572265625, -0.234649658203125, -0.20803070068359375, -0.1814117431640625, -0.15479278564453125, -0.128173828125, -0.10155487060546875, -0.0749359130859375, -0.04831695556640625, -0.021697998046875, 0.00492095947265625, 0.0315399169921875, 0.05815887451171875, 0.08477783203125, 0.11139678955078125, 0.1380157470703125, 0.16463470458984375, 0.191253662109375, 0.21787261962890625, 0.2444915771484375, 0.27111053466796875, 0.2977294921875, 0.32434844970703125, 0.3509674072265625, 0.37758636474609375, 0.404205322265625, 0.43082427978515625, 0.4574432373046875, 0.48406219482421875, 0.51068115234375, 0.5373001098632812, 0.5639190673828125, 0.5905380249023438, 0.617156982421875, 0.6437759399414062, 0.6703948974609375, 0.6970138549804688, 0.7236328125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 12.0, 8.0, 20.0, 28.0, 36.0, 51.0, 60.0, 81.0, 74.0, 76.0, 94.0, 95.0, 80.0, 59.0, 56.0, 33.0, 35.0, 31.0, 21.0, 10.0, 8.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10687255859375, -0.10346698760986328, -0.10006141662597656, -0.09665584564208984, -0.09325027465820312, -0.0898447036743164, -0.08643913269042969, -0.08303356170654297, -0.07962799072265625, -0.07622241973876953, -0.07281684875488281, -0.0694112777709961, -0.06600570678710938, -0.06260013580322266, -0.05919456481933594, -0.05578899383544922, -0.0523834228515625, -0.04897785186767578, -0.04557228088378906, -0.042166709899902344, -0.038761138916015625, -0.035355567932128906, -0.03194999694824219, -0.02854442596435547, -0.02513885498046875, -0.02173328399658203, -0.018327713012695312, -0.014922142028808594, -0.011516571044921875, -0.008111000061035156, -0.0047054290771484375, -0.0012998580932617188, 0.002105712890625, 0.005511283874511719, 0.008916854858398438, 0.012322425842285156, 0.015727996826171875, 0.019133567810058594, 0.022539138793945312, 0.02594470977783203, 0.02935028076171875, 0.03275585174560547, 0.03616142272949219, 0.039566993713378906, 0.042972564697265625, 0.046378135681152344, 0.04978370666503906, 0.05318927764892578, 0.0565948486328125, 0.06000041961669922, 0.06340599060058594, 0.06681156158447266, 0.07021713256835938, 0.0736227035522461, 0.07702827453613281, 0.08043384552001953, 0.08383941650390625, 0.08724498748779297, 0.09065055847167969, 0.0940561294555664, 0.09746170043945312, 0.10086727142333984, 0.10427284240722656, 0.10767841339111328, 0.111083984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 10.0, 13.0, 20.0, 18.0, 52.0, 64.0, 109.0, 154.0, 294.0, 514.0, 1135.0, 2956.0, 9347.0, 38819.0, 219569.0, 568778.0, 164318.0, 30161.0, 7441.0, 2499.0, 1042.0, 495.0, 292.0, 143.0, 99.0, 67.0, 33.0, 39.0, 22.0, 21.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5688095092773438, -0.5507049560546875, -0.5326004028320312, -0.514495849609375, -0.49639129638671875, -0.4782867431640625, -0.46018218994140625, -0.44207763671875, -0.42397308349609375, -0.4058685302734375, -0.38776397705078125, -0.369659423828125, -0.35155487060546875, -0.3334503173828125, -0.31534576416015625, -0.2972412109375, -0.27913665771484375, -0.2610321044921875, -0.24292755126953125, -0.224822998046875, -0.20671844482421875, -0.1886138916015625, -0.17050933837890625, -0.15240478515625, -0.13430023193359375, -0.1161956787109375, -0.09809112548828125, -0.079986572265625, -0.06188201904296875, -0.0437774658203125, -0.02567291259765625, -0.007568359375, 0.01053619384765625, 0.0286407470703125, 0.04674530029296875, 0.064849853515625, 0.08295440673828125, 0.1010589599609375, 0.11916351318359375, 0.13726806640625, 0.15537261962890625, 0.1734771728515625, 0.19158172607421875, 0.209686279296875, 0.22779083251953125, 0.2458953857421875, 0.26399993896484375, 0.2821044921875, 0.30020904541015625, 0.3183135986328125, 0.33641815185546875, 0.354522705078125, 0.37262725830078125, 0.3907318115234375, 0.40883636474609375, 0.42694091796875, 0.44504547119140625, 0.4631500244140625, 0.48125457763671875, 0.499359130859375, 0.5174636840820312, 0.5355682373046875, 0.5536727905273438, 0.57177734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 7.0, 10.0, 11.0, 16.0, 17.0, 16.0, 24.0, 26.0, 29.0, 32.0, 40.0, 32.0, 49.0, 57.0, 42.0, 68.0, 67.0, 56.0, 49.0, 59.0, 45.0, 31.0, 39.0, 25.0, 29.0, 20.0, 17.0, 19.0, 14.0, 8.0, 3.0, 8.0, 10.0, 3.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4521484375, -0.4392852783203125, -0.426422119140625, -0.4135589599609375, -0.40069580078125, -0.3878326416015625, -0.374969482421875, -0.3621063232421875, -0.3492431640625, -0.3363800048828125, -0.323516845703125, -0.3106536865234375, -0.29779052734375, -0.2849273681640625, -0.272064208984375, -0.2592010498046875, -0.246337890625, -0.2334747314453125, -0.220611572265625, -0.2077484130859375, -0.19488525390625, -0.1820220947265625, -0.169158935546875, -0.1562957763671875, -0.1434326171875, -0.1305694580078125, -0.117706298828125, -0.1048431396484375, -0.09197998046875, -0.0791168212890625, -0.066253662109375, -0.0533905029296875, -0.04052734375, -0.0276641845703125, -0.014801025390625, -0.0019378662109375, 0.01092529296875, 0.0237884521484375, 0.036651611328125, 0.0495147705078125, 0.0623779296875, 0.0752410888671875, 0.088104248046875, 0.1009674072265625, 0.11383056640625, 0.1266937255859375, 0.139556884765625, 0.1524200439453125, 0.165283203125, 0.1781463623046875, 0.191009521484375, 0.2038726806640625, 0.21673583984375, 0.2295989990234375, 0.242462158203125, 0.2553253173828125, 0.2681884765625, 0.2810516357421875, 0.293914794921875, 0.3067779541015625, 0.31964111328125, 0.3325042724609375, 0.345367431640625, 0.3582305908203125, 0.37109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 7.0, 18.0, 22.0, 44.0, 90.0, 190.0, 424.0, 1028.0, 2953.0, 10804.0, 67947.0, 804678.0, 138006.0, 15832.0, 4122.0, 1345.0, 528.0, 237.0, 108.0, 56.0, 35.0, 20.0, 13.0, 12.0, 3.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447509765625, -0.4333610534667969, -0.41921234130859375, -0.4050636291503906, -0.3909149169921875, -0.3767662048339844, -0.36261749267578125, -0.3484687805175781, -0.334320068359375, -0.3201713562011719, -0.30602264404296875, -0.2918739318847656, -0.2777252197265625, -0.2635765075683594, -0.24942779541015625, -0.23527908325195312, -0.22113037109375, -0.20698165893554688, -0.19283294677734375, -0.17868423461914062, -0.1645355224609375, -0.15038681030273438, -0.13623809814453125, -0.12208938598632812, -0.107940673828125, -0.09379196166992188, -0.07964324951171875, -0.06549453735351562, -0.0513458251953125, -0.037197113037109375, -0.02304840087890625, -0.008899688720703125, 0.0052490234375, 0.019397735595703125, 0.03354644775390625, 0.047695159912109375, 0.0618438720703125, 0.07599258422851562, 0.09014129638671875, 0.10429000854492188, 0.118438720703125, 0.13258743286132812, 0.14673614501953125, 0.16088485717773438, 0.1750335693359375, 0.18918228149414062, 0.20333099365234375, 0.21747970581054688, 0.23162841796875, 0.24577713012695312, 0.25992584228515625, 0.2740745544433594, 0.2882232666015625, 0.3023719787597656, 0.31652069091796875, 0.3306694030761719, 0.344818115234375, 0.3589668273925781, 0.37311553955078125, 0.3872642517089844, 0.4014129638671875, 0.4155616760253906, 0.42971038818359375, 0.4438591003417969, 0.4580078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 8.0, 9.0, 17.0, 17.0, 23.0, 51.0, 63.0, 72.0, 79.0, 89.0, 92.0, 103.0, 72.0, 57.0, 55.0, 57.0, 29.0, 17.0, 14.0, 14.0, 8.0, 12.0, 8.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010842084884643555, -0.00010530184954404831, -0.00010218285024166107, -9.906385093927383e-05, -9.59448516368866e-05, -9.282585233449936e-05, -8.970685303211212e-05, -8.658785372972488e-05, -8.346885442733765e-05, -8.034985512495041e-05, -7.723085582256317e-05, -7.411185652017593e-05, -7.09928572177887e-05, -6.787385791540146e-05, -6.475485861301422e-05, -6.163585931062698e-05, -5.8516860008239746e-05, -5.539786070585251e-05, -5.227886140346527e-05, -4.9159862101078033e-05, -4.6040862798690796e-05, -4.292186349630356e-05, -3.980286419391632e-05, -3.668386489152908e-05, -3.3564865589141846e-05, -3.0445866286754608e-05, -2.732686698436737e-05, -2.4207867681980133e-05, -2.1088868379592896e-05, -1.7969869077205658e-05, -1.485086977481842e-05, -1.1731870472431183e-05, -8.612871170043945e-06, -5.493871867656708e-06, -2.3748725652694702e-06, 7.441267371177673e-07, 3.863126039505005e-06, 6.9821253418922424e-06, 1.010112464427948e-05, 1.3220123946666718e-05, 1.6339123249053955e-05, 1.9458122551441193e-05, 2.257712185382843e-05, 2.5696121156215668e-05, 2.8815120458602905e-05, 3.193411976099014e-05, 3.505311906337738e-05, 3.817211836576462e-05, 4.1291117668151855e-05, 4.441011697053909e-05, 4.752911627292633e-05, 5.064811557531357e-05, 5.3767114877700806e-05, 5.688611418008804e-05, 6.000511348247528e-05, 6.312411278486252e-05, 6.624311208724976e-05, 6.9362111389637e-05, 7.248111069202423e-05, 7.560010999441147e-05, 7.87191092967987e-05, 8.183810859918594e-05, 8.495710790157318e-05, 8.807610720396042e-05, 9.119510650634766e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 5.0, 9.0, 15.0, 24.0, 27.0, 40.0, 62.0, 98.0, 145.0, 264.0, 472.0, 811.0, 1650.0, 3658.0, 9454.0, 29638.0, 169664.0, 687245.0, 108022.0, 23145.0, 7827.0, 3164.0, 1412.0, 681.0, 385.0, 240.0, 134.0, 82.0, 59.0, 36.0, 20.0, 13.0, 15.0, 12.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.282958984375, -0.2733345031738281, -0.26371002197265625, -0.2540855407714844, -0.2444610595703125, -0.23483657836914062, -0.22521209716796875, -0.21558761596679688, -0.205963134765625, -0.19633865356445312, -0.18671417236328125, -0.17708969116210938, -0.1674652099609375, -0.15784072875976562, -0.14821624755859375, -0.13859176635742188, -0.12896728515625, -0.11934280395507812, -0.10971832275390625, -0.10009384155273438, -0.0904693603515625, -0.08084487915039062, -0.07122039794921875, -0.061595916748046875, -0.051971435546875, -0.042346954345703125, -0.03272247314453125, -0.023097991943359375, -0.0134735107421875, -0.003849029541015625, 0.00577545166015625, 0.015399932861328125, 0.0250244140625, 0.034648895263671875, 0.04427337646484375, 0.053897857666015625, 0.0635223388671875, 0.07314682006835938, 0.08277130126953125, 0.09239578247070312, 0.102020263671875, 0.11164474487304688, 0.12126922607421875, 0.13089370727539062, 0.1405181884765625, 0.15014266967773438, 0.15976715087890625, 0.16939163208007812, 0.17901611328125, 0.18864059448242188, 0.19826507568359375, 0.20788955688476562, 0.2175140380859375, 0.22713851928710938, 0.23676300048828125, 0.24638748168945312, 0.256011962890625, 0.2656364440917969, 0.27526092529296875, 0.2848854064941406, 0.2945098876953125, 0.3041343688964844, 0.31375885009765625, 0.3233833312988281, 0.3330078125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 1.0, 5.0, 4.0, 2.0, 9.0, 7.0, 15.0, 31.0, 28.0, 45.0, 59.0, 92.0, 99.0, 142.0, 118.0, 92.0, 73.0, 53.0, 41.0, 25.0, 13.0, 6.0, 6.0, 6.0, 8.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2076416015625, -0.20068740844726562, -0.19373321533203125, -0.18677902221679688, -0.1798248291015625, -0.17287063598632812, -0.16591644287109375, -0.15896224975585938, -0.152008056640625, -0.14505386352539062, -0.13809967041015625, -0.13114547729492188, -0.1241912841796875, -0.11723709106445312, -0.11028289794921875, -0.10332870483398438, -0.09637451171875, -0.08942031860351562, -0.08246612548828125, -0.07551193237304688, -0.0685577392578125, -0.061603546142578125, -0.05464935302734375, -0.047695159912109375, -0.040740966796875, -0.033786773681640625, -0.02683258056640625, -0.019878387451171875, -0.0129241943359375, -0.005970001220703125, 0.00098419189453125, 0.007938385009765625, 0.014892578125, 0.021846771240234375, 0.02880096435546875, 0.035755157470703125, 0.0427093505859375, 0.049663543701171875, 0.05661773681640625, 0.06357192993164062, 0.070526123046875, 0.07748031616210938, 0.08443450927734375, 0.09138870239257812, 0.0983428955078125, 0.10529708862304688, 0.11225128173828125, 0.11920547485351562, 0.12615966796875, 0.13311386108398438, 0.14006805419921875, 0.14702224731445312, 0.1539764404296875, 0.16093063354492188, 0.16788482666015625, 0.17483901977539062, 0.181793212890625, 0.18874740600585938, 0.19570159912109375, 0.20265579223632812, 0.2096099853515625, 0.21656417846679688, 0.22351837158203125, 0.23047256469726562, 0.2374267578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 9.0, 68.0, 311.0, 423.0, 158.0, 28.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.710105895996094, -13.41294002532959, -13.115774154663086, -12.818608283996582, -12.521442413330078, -12.224276542663574, -11.92711067199707, -11.62994384765625, -11.332778930664062, -11.035613059997559, -10.738447189331055, -10.44128131866455, -10.144115447998047, -9.846949577331543, -9.549783706665039, -9.252616882324219, -8.955451011657715, -8.658285140991211, -8.361119270324707, -8.063953399658203, -7.766787528991699, -7.469621658325195, -7.172455310821533, -6.875289440155029, -6.578123569488525, -6.2809576988220215, -5.983791828155518, -5.686625957489014, -5.389459609985352, -5.092293739318848, -4.795127868652344, -4.49796199798584, -4.2007951736450195, -3.9036293029785156, -3.6064634323120117, -3.3092973232269287, -3.012131452560425, -2.714965581893921, -2.417799472808838, -2.120633602142334, -1.82346773147583, -1.5263018608093262, -1.2291358709335327, -0.931969940662384, -0.6348040103912354, -0.33763813972473145, -0.04047214984893799, 0.25669384002685547, 0.5538597106933594, 0.8510256409645081, 1.1481915712356567, 1.4453575611114502, 1.742523431777954, 2.039689302444458, 2.336855411529541, 2.634021282196045, 2.931187152862549, 3.2283530235290527, 3.5255188941955566, 3.8226850032806396, 4.119851112365723, 4.417016983032227, 4.7141828536987305, 5.011348724365234, 5.308514595031738]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 8.0, 10.0, 14.0, 24.0, 17.0, 22.0, 13.0, 30.0, 37.0, 36.0, 39.0, 54.0, 44.0, 48.0, 55.0, 57.0, 50.0, 46.0, 51.0, 47.0, 47.0, 33.0, 40.0, 29.0, 24.0, 23.0, 14.0, 15.0, 16.0, 12.0, 7.0, 4.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.1682190895080566, -2.0930838584899902, -2.017948865890503, -1.9428136348724365, -1.8676784038543701, -1.7925432920455933, -1.7174081802368164, -1.64227294921875, -1.5671378374099731, -1.4920027256011963, -1.4168674945831299, -1.341732382774353, -1.2665972709655762, -1.1914620399475098, -1.116326928138733, -1.041191816329956, -0.9660565853118896, -0.890921413898468, -0.8157862424850464, -0.7406511306762695, -0.6655159592628479, -0.5903807878494263, -0.5152456760406494, -0.4401105046272278, -0.36497533321380615, -0.2898401618003845, -0.21470502018928528, -0.13956986367702484, -0.0644347071647644, 0.010700464248657227, 0.08583560585975647, 0.1609707474708557, 0.23610591888427734, 0.311241090297699, 0.3863762319087982, 0.46151137351989746, 0.5366465449333191, 0.6117817163467407, 0.6869168281555176, 0.7620519995689392, 0.8371871709823608, 0.9123223423957825, 0.9874575138092041, 1.062592625617981, 1.1377277374267578, 1.2128629684448242, 1.287998080253601, 1.363133192062378, 1.4382684230804443, 1.5134035348892212, 1.5885387659072876, 1.6636738777160645, 1.7388091087341309, 1.8139442205429077, 1.8890793323516846, 1.964214563369751, 2.0393495559692383, 2.1144847869873047, 2.189619779586792, 2.2647550106048584, 2.339890241622925, 2.415025234222412, 2.4901604652404785, 2.565295696258545, 2.6404309272766113]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 6.0, 10.0, 15.0, 8.0, 14.0, 14.0, 13.0, 19.0, 35.0, 44.0, 57.0, 67.0, 83.0, 155.0, 212.0, 339.0, 656.0, 1297.0, 3190.0, 10635.0, 55863.0, 3707325.0, 374808.0, 28233.0, 6775.0, 2288.0, 923.0, 498.0, 269.0, 148.0, 86.0, 51.0, 37.0, 32.0, 25.0, 5.0, 12.0, 8.0, 10.0, 5.0, 3.0, 4.0, 2.0], "bins": [-1.4052734375, -1.3724441528320312, -1.3396148681640625, -1.3067855834960938, -1.273956298828125, -1.2411270141601562, -1.2082977294921875, -1.1754684448242188, -1.14263916015625, -1.1098098754882812, -1.0769805908203125, -1.0441513061523438, -1.011322021484375, -0.9784927368164062, -0.9456634521484375, -0.9128341674804688, -0.8800048828125, -0.8471755981445312, -0.8143463134765625, -0.7815170288085938, -0.748687744140625, -0.7158584594726562, -0.6830291748046875, -0.6501998901367188, -0.61737060546875, -0.5845413208007812, -0.5517120361328125, -0.5188827514648438, -0.486053466796875, -0.45322418212890625, -0.4203948974609375, -0.38756561279296875, -0.354736328125, -0.32190704345703125, -0.2890777587890625, -0.25624847412109375, -0.223419189453125, -0.19058990478515625, -0.1577606201171875, -0.12493133544921875, -0.09210205078125, -0.05927276611328125, -0.0264434814453125, 0.00638580322265625, 0.039215087890625, 0.07204437255859375, 0.1048736572265625, 0.13770294189453125, 0.1705322265625, 0.20336151123046875, 0.2361907958984375, 0.26902008056640625, 0.301849365234375, 0.33467864990234375, 0.3675079345703125, 0.40033721923828125, 0.43316650390625, 0.46599578857421875, 0.4988250732421875, 0.5316543579101562, 0.564483642578125, 0.5973129272460938, 0.6301422119140625, 0.6629714965820312, 0.69580078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 12.0, 13.0, 27.0, 33.0, 50.0, 56.0, 79.0, 85.0, 78.0, 84.0, 85.0, 88.0, 81.0, 78.0, 30.0, 36.0, 20.0, 21.0, 12.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11016845703125, -0.10618114471435547, -0.10219383239746094, -0.0982065200805664, -0.09421920776367188, -0.09023189544677734, -0.08624458312988281, -0.08225727081298828, -0.07826995849609375, -0.07428264617919922, -0.07029533386230469, -0.06630802154541016, -0.062320709228515625, -0.058333396911621094, -0.05434608459472656, -0.05035877227783203, -0.0463714599609375, -0.04238414764404297, -0.03839683532714844, -0.034409523010253906, -0.030422210693359375, -0.026434898376464844, -0.022447586059570312, -0.01846027374267578, -0.01447296142578125, -0.010485649108886719, -0.0064983367919921875, -0.0025110244750976562, 0.001476287841796875, 0.005463600158691406, 0.009450912475585938, 0.013438224792480469, 0.017425537109375, 0.02141284942626953, 0.025400161743164062, 0.029387474060058594, 0.033374786376953125, 0.037362098693847656, 0.04134941101074219, 0.04533672332763672, 0.04932403564453125, 0.05331134796142578, 0.05729866027832031, 0.061285972595214844, 0.06527328491210938, 0.0692605972290039, 0.07324790954589844, 0.07723522186279297, 0.0812225341796875, 0.08520984649658203, 0.08919715881347656, 0.0931844711303711, 0.09717178344726562, 0.10115909576416016, 0.10514640808105469, 0.10913372039794922, 0.11312103271484375, 0.11710834503173828, 0.12109565734863281, 0.12508296966552734, 0.12907028198242188, 0.1330575942993164, 0.13704490661621094, 0.14103221893310547, 0.14501953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 11.0, 24.0, 66.0, 119.0, 224.0, 638.0, 2163.0, 13994.0, 1709350.0, 2450420.0, 13989.0, 2232.0, 611.0, 227.0, 111.0, 33.0, 27.0, 16.0, 7.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.938262939453125, -1.88726806640625, -1.836273193359375, -1.7852783203125, -1.734283447265625, -1.68328857421875, -1.632293701171875, -1.581298828125, -1.530303955078125, -1.47930908203125, -1.428314208984375, -1.3773193359375, -1.326324462890625, -1.27532958984375, -1.224334716796875, -1.17333984375, -1.122344970703125, -1.07135009765625, -1.020355224609375, -0.9693603515625, -0.918365478515625, -0.86737060546875, -0.816375732421875, -0.765380859375, -0.714385986328125, -0.66339111328125, -0.612396240234375, -0.5614013671875, -0.510406494140625, -0.45941162109375, -0.408416748046875, -0.357421875, -0.306427001953125, -0.25543212890625, -0.204437255859375, -0.1534423828125, -0.102447509765625, -0.05145263671875, -0.000457763671875, 0.050537109375, 0.101531982421875, 0.15252685546875, 0.203521728515625, 0.2545166015625, 0.305511474609375, 0.35650634765625, 0.407501220703125, 0.45849609375, 0.509490966796875, 0.56048583984375, 0.611480712890625, 0.6624755859375, 0.713470458984375, 0.76446533203125, 0.815460205078125, 0.866455078125, 0.917449951171875, 0.96844482421875, 1.019439697265625, 1.0704345703125, 1.121429443359375, 1.17242431640625, 1.223419189453125, 1.2744140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 3.0, 9.0, 14.0, 25.0, 30.0, 64.0, 128.0, 343.0, 1747.0, 1188.0, 288.0, 108.0, 50.0, 33.0, 10.0, 11.0, 7.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.360107421875, -0.35190582275390625, -0.3437042236328125, -0.33550262451171875, -0.327301025390625, -0.31909942626953125, -0.3108978271484375, -0.30269622802734375, -0.29449462890625, -0.28629302978515625, -0.2780914306640625, -0.26988983154296875, -0.261688232421875, -0.25348663330078125, -0.2452850341796875, -0.23708343505859375, -0.2288818359375, -0.22068023681640625, -0.2124786376953125, -0.20427703857421875, -0.196075439453125, -0.18787384033203125, -0.1796722412109375, -0.17147064208984375, -0.16326904296875, -0.15506744384765625, -0.1468658447265625, -0.13866424560546875, -0.130462646484375, -0.12226104736328125, -0.1140594482421875, -0.10585784912109375, -0.09765625, -0.08945465087890625, -0.0812530517578125, -0.07305145263671875, -0.064849853515625, -0.05664825439453125, -0.0484466552734375, -0.04024505615234375, -0.03204345703125, -0.02384185791015625, -0.0156402587890625, -0.00743865966796875, 0.000762939453125, 0.00896453857421875, 0.0171661376953125, 0.02536773681640625, 0.0335693359375, 0.04177093505859375, 0.0499725341796875, 0.05817413330078125, 0.066375732421875, 0.07457733154296875, 0.0827789306640625, 0.09098052978515625, 0.09918212890625, 0.10738372802734375, 0.1155853271484375, 0.12378692626953125, 0.131988525390625, 0.14019012451171875, 0.1483917236328125, 0.15659332275390625, 0.164794921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 14.0, 33.0, 141.0, 388.0, 313.0, 88.0, 16.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.229099988937378, -1.1403254270553589, -1.0515507459640503, -0.9627761840820312, -0.8740015625953674, -0.7852269411087036, -0.6964523792266846, -0.6076777577400208, -0.5189031362533569, -0.4301285147666931, -0.3413539230823517, -0.25257933139801025, -0.16380470991134644, -0.07503008842468262, 0.013744473457336426, 0.10251909494400024, 0.19129371643066406, 0.2800683379173279, 0.3688429296016693, 0.45761752128601074, 0.5463921427726746, 0.6351667642593384, 0.7239413261413574, 0.8127159476280212, 0.9014905691146851, 0.9902651906013489, 1.0790398120880127, 1.1678143739700317, 1.2565889358520508, 1.3453636169433594, 1.4341381788253784, 1.5229127407073975, 1.611687183380127, 1.700461745262146, 1.7892364263534546, 1.8780109882354736, 1.9667856693267822, 2.0555601119995117, 2.1443347930908203, 2.233109474182129, 2.3218841552734375, 2.410658836364746, 2.4994332790374756, 2.588207960128784, 2.6769826412200928, 2.7657570838928223, 2.854531764984131, 2.9433064460754395, 3.032080888748169, 3.1208555698394775, 3.209630012512207, 3.2984046936035156, 3.387179374694824, 3.475954055786133, 3.5647284984588623, 3.653503179550171, 3.7422776222229004, 3.831052303314209, 3.9198267459869385, 4.008601188659668, 4.097375869750977, 4.186150550842285, 4.274925231933594, 4.363699913024902, 4.452474594116211]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 12.0, 8.0, 9.0, 14.0, 18.0, 29.0, 29.0, 41.0, 43.0, 55.0, 57.0, 55.0, 57.0, 61.0, 59.0, 51.0, 61.0, 41.0, 52.0, 54.0, 34.0, 24.0, 38.0, 23.0, 17.0, 14.0, 9.0, 9.0, 5.0, 6.0, 2.0, 0.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6174001693725586, -0.597888708114624, -0.5783773064613342, -0.5588658452033997, -0.5393544435501099, -0.5198429822921753, -0.5003315210342407, -0.48082008957862854, -0.46130865812301636, -0.4417972266674042, -0.422285795211792, -0.4027743339538574, -0.38326290249824524, -0.36375147104263306, -0.3442400097846985, -0.3247285783290863, -0.3052171468734741, -0.28570571541786194, -0.26619428396224976, -0.24668282270431519, -0.227171391248703, -0.20765995979309082, -0.18814851343631744, -0.16863706707954407, -0.14912563562393188, -0.1296142041683197, -0.11010275781154633, -0.09059131890535355, -0.07107987999916077, -0.05156844109296799, -0.03205700218677521, -0.012545555830001831, 0.006965935230255127, 0.026477374136447906, 0.045988813042640686, 0.06550025194883347, 0.08501169085502625, 0.10452312976121902, 0.1240345686674118, 0.14354601502418518, 0.16305744647979736, 0.18256887793540955, 0.20208032429218292, 0.2215917706489563, 0.24110320210456848, 0.26061463356018066, 0.28012609481811523, 0.2996375262737274, 0.3191489577293396, 0.3386603891849518, 0.35817182064056396, 0.37768328189849854, 0.3971947133541107, 0.4167061448097229, 0.43621760606765747, 0.45572903752326965, 0.47524046897888184, 0.494751900434494, 0.5142633318901062, 0.5337747931480408, 0.5532861948013306, 0.5727976560592651, 0.5923091173171997, 0.6118205785751343, 0.6313319802284241]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 9.0, 26.0, 36.0, 57.0, 92.0, 146.0, 264.0, 577.0, 1372.0, 3687.0, 14599.0, 128606.0, 726245.0, 150026.0, 16105.0, 3982.0, 1423.0, 592.0, 286.0, 147.0, 109.0, 51.0, 37.0, 19.0, 14.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.103515625, -1.0724563598632812, -1.0413970947265625, -1.0103378295898438, -0.979278564453125, -0.9482192993164062, -0.9171600341796875, -0.8861007690429688, -0.85504150390625, -0.8239822387695312, -0.7929229736328125, -0.7618637084960938, -0.730804443359375, -0.6997451782226562, -0.6686859130859375, -0.6376266479492188, -0.6065673828125, -0.5755081176757812, -0.5444488525390625, -0.5133895874023438, -0.482330322265625, -0.45127105712890625, -0.4202117919921875, -0.38915252685546875, -0.35809326171875, -0.32703399658203125, -0.2959747314453125, -0.26491546630859375, -0.233856201171875, -0.20279693603515625, -0.1717376708984375, -0.14067840576171875, -0.109619140625, -0.07855987548828125, -0.0475006103515625, -0.01644134521484375, 0.014617919921875, 0.04567718505859375, 0.0767364501953125, 0.10779571533203125, 0.13885498046875, 0.16991424560546875, 0.2009735107421875, 0.23203277587890625, 0.263092041015625, 0.29415130615234375, 0.3252105712890625, 0.35626983642578125, 0.3873291015625, 0.41838836669921875, 0.4494476318359375, 0.48050689697265625, 0.511566162109375, 0.5426254272460938, 0.5736846923828125, 0.6047439575195312, 0.63580322265625, 0.6668624877929688, 0.6979217529296875, 0.7289810180664062, 0.760040283203125, 0.7910995483398438, 0.8221588134765625, 0.8532180786132812, 0.88427734375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 11.0, 20.0, 30.0, 39.0, 40.0, 64.0, 63.0, 74.0, 88.0, 94.0, 77.0, 91.0, 86.0, 61.0, 43.0, 25.0, 23.0, 17.0, 12.0, 11.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.11161327362060547, -0.10756492614746094, -0.1035165786743164, -0.09946823120117188, -0.09541988372802734, -0.09137153625488281, -0.08732318878173828, -0.08327484130859375, -0.07922649383544922, -0.07517814636230469, -0.07112979888916016, -0.06708145141601562, -0.0630331039428711, -0.05898475646972656, -0.05493640899658203, -0.0508880615234375, -0.04683971405029297, -0.04279136657714844, -0.038743019104003906, -0.034694671630859375, -0.030646324157714844, -0.026597976684570312, -0.02254962921142578, -0.01850128173828125, -0.014452934265136719, -0.010404586791992188, -0.006356239318847656, -0.002307891845703125, 0.0017404556274414062, 0.0057888031005859375, 0.009837150573730469, 0.013885498046875, 0.01793384552001953, 0.021982192993164062, 0.026030540466308594, 0.030078887939453125, 0.034127235412597656, 0.03817558288574219, 0.04222393035888672, 0.04627227783203125, 0.05032062530517578, 0.05436897277832031, 0.058417320251464844, 0.062465667724609375, 0.0665140151977539, 0.07056236267089844, 0.07461071014404297, 0.0786590576171875, 0.08270740509033203, 0.08675575256347656, 0.0908041000366211, 0.09485244750976562, 0.09890079498291016, 0.10294914245605469, 0.10699748992919922, 0.11104583740234375, 0.11509418487548828, 0.11914253234863281, 0.12319087982177734, 0.12723922729492188, 0.1312875747680664, 0.13533592224121094, 0.13938426971435547, 0.1434326171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 7.0, 12.0, 12.0, 13.0, 29.0, 50.0, 75.0, 102.0, 235.0, 417.0, 819.0, 1923.0, 6106.0, 25630.0, 162382.0, 605198.0, 203736.0, 30748.0, 6923.0, 2202.0, 916.0, 448.0, 215.0, 119.0, 74.0, 59.0, 36.0, 15.0, 15.0, 8.0, 11.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6056671142578125, -0.585845947265625, -0.5660247802734375, -0.54620361328125, -0.5263824462890625, -0.506561279296875, -0.4867401123046875, -0.4669189453125, -0.4470977783203125, -0.427276611328125, -0.4074554443359375, -0.38763427734375, -0.3678131103515625, -0.347991943359375, -0.3281707763671875, -0.308349609375, -0.2885284423828125, -0.268707275390625, -0.2488861083984375, -0.22906494140625, -0.2092437744140625, -0.189422607421875, -0.1696014404296875, -0.1497802734375, -0.1299591064453125, -0.110137939453125, -0.0903167724609375, -0.07049560546875, -0.0506744384765625, -0.030853271484375, -0.0110321044921875, 0.0087890625, 0.0286102294921875, 0.048431396484375, 0.0682525634765625, 0.08807373046875, 0.1078948974609375, 0.127716064453125, 0.1475372314453125, 0.1673583984375, 0.1871795654296875, 0.207000732421875, 0.2268218994140625, 0.24664306640625, 0.2664642333984375, 0.286285400390625, 0.3061065673828125, 0.325927734375, 0.3457489013671875, 0.365570068359375, 0.3853912353515625, 0.40521240234375, 0.4250335693359375, 0.444854736328125, 0.4646759033203125, 0.4844970703125, 0.5043182373046875, 0.524139404296875, 0.5439605712890625, 0.56378173828125, 0.5836029052734375, 0.603424072265625, 0.6232452392578125, 0.64306640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 8.0, 6.0, 7.0, 8.0, 11.0, 8.0, 17.0, 31.0, 31.0, 31.0, 38.0, 65.0, 46.0, 60.0, 61.0, 73.0, 50.0, 70.0, 57.0, 48.0, 54.0, 31.0, 39.0, 26.0, 23.0, 18.0, 15.0, 23.0, 9.0, 7.0, 4.0, 4.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5009765625, -0.48709869384765625, -0.4732208251953125, -0.45934295654296875, -0.445465087890625, -0.43158721923828125, -0.4177093505859375, -0.40383148193359375, -0.38995361328125, -0.37607574462890625, -0.3621978759765625, -0.34832000732421875, -0.334442138671875, -0.32056427001953125, -0.3066864013671875, -0.29280853271484375, -0.2789306640625, -0.26505279541015625, -0.2511749267578125, -0.23729705810546875, -0.223419189453125, -0.20954132080078125, -0.1956634521484375, -0.18178558349609375, -0.16790771484375, -0.15402984619140625, -0.1401519775390625, -0.12627410888671875, -0.112396240234375, -0.09851837158203125, -0.0846405029296875, -0.07076263427734375, -0.056884765625, -0.04300689697265625, -0.0291290283203125, -0.01525115966796875, -0.001373291015625, 0.01250457763671875, 0.0263824462890625, 0.04026031494140625, 0.05413818359375, 0.06801605224609375, 0.0818939208984375, 0.09577178955078125, 0.109649658203125, 0.12352752685546875, 0.1374053955078125, 0.15128326416015625, 0.1651611328125, 0.17903900146484375, 0.1929168701171875, 0.20679473876953125, 0.220672607421875, 0.23455047607421875, 0.2484283447265625, 0.26230621337890625, 0.27618408203125, 0.29006195068359375, 0.3039398193359375, 0.31781768798828125, 0.331695556640625, 0.34557342529296875, 0.3594512939453125, 0.37332916259765625, 0.38720703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 8.0, 8.0, 15.0, 15.0, 32.0, 38.0, 91.0, 159.0, 254.0, 565.0, 1228.0, 3321.0, 10159.0, 46736.0, 426119.0, 489555.0, 52681.0, 11414.0, 3568.0, 1320.0, 590.0, 270.0, 152.0, 94.0, 45.0, 50.0, 17.0, 15.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318115234375, -0.3078651428222656, -0.29761505126953125, -0.2873649597167969, -0.2771148681640625, -0.2668647766113281, -0.25661468505859375, -0.24636459350585938, -0.236114501953125, -0.22586441040039062, -0.21561431884765625, -0.20536422729492188, -0.1951141357421875, -0.18486404418945312, -0.17461395263671875, -0.16436386108398438, -0.15411376953125, -0.14386367797851562, -0.13361358642578125, -0.12336349487304688, -0.1131134033203125, -0.10286331176757812, -0.09261322021484375, -0.08236312866210938, -0.072113037109375, -0.061862945556640625, -0.05161285400390625, -0.041362762451171875, -0.0311126708984375, -0.020862579345703125, -0.01061248779296875, -0.000362396240234375, 0.0098876953125, 0.020137786865234375, 0.03038787841796875, 0.040637969970703125, 0.0508880615234375, 0.061138153076171875, 0.07138824462890625, 0.08163833618164062, 0.091888427734375, 0.10213851928710938, 0.11238861083984375, 0.12263870239257812, 0.1328887939453125, 0.14313888549804688, 0.15338897705078125, 0.16363906860351562, 0.17388916015625, 0.18413925170898438, 0.19438934326171875, 0.20463943481445312, 0.2148895263671875, 0.22513961791992188, 0.23538970947265625, 0.24563980102539062, 0.255889892578125, 0.2661399841308594, 0.27639007568359375, 0.2866401672363281, 0.2968902587890625, 0.3071403503417969, 0.31739044189453125, 0.3276405334472656, 0.337890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 13.0, 14.0, 14.0, 19.0, 24.0, 38.0, 38.0, 69.0, 84.0, 100.0, 117.0, 107.0, 94.0, 68.0, 42.0, 34.0, 31.0, 18.0, 12.0, 10.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00012183189392089844, -0.00011867564171552658, -0.00011551938951015472, -0.00011236313730478287, -0.00010920688509941101, -0.00010605063289403915, -0.0001028943806886673, -9.973812848329544e-05, -9.658187627792358e-05, -9.342562407255173e-05, -9.026937186717987e-05, -8.711311966180801e-05, -8.395686745643616e-05, -8.08006152510643e-05, -7.764436304569244e-05, -7.448811084032059e-05, -7.133185863494873e-05, -6.817560642957687e-05, -6.501935422420502e-05, -6.186310201883316e-05, -5.8706849813461304e-05, -5.555059760808945e-05, -5.239434540271759e-05, -4.9238093197345734e-05, -4.608184099197388e-05, -4.292558878660202e-05, -3.9769336581230164e-05, -3.661308437585831e-05, -3.345683217048645e-05, -3.0300579965114594e-05, -2.7144327759742737e-05, -2.398807555437088e-05, -2.0831823348999023e-05, -1.7675571143627167e-05, -1.451931893825531e-05, -1.1363066732883453e-05, -8.206814527511597e-06, -5.05056232213974e-06, -1.8943101167678833e-06, 1.2619420886039734e-06, 4.41819429397583e-06, 7.574446499347687e-06, 1.0730698704719543e-05, 1.38869509100914e-05, 1.7043203115463257e-05, 2.0199455320835114e-05, 2.335570752620697e-05, 2.6511959731578827e-05, 2.9668211936950684e-05, 3.282446414232254e-05, 3.59807163476944e-05, 3.9136968553066254e-05, 4.229322075843811e-05, 4.544947296380997e-05, 4.8605725169181824e-05, 5.176197737455368e-05, 5.491822957992554e-05, 5.8074481785297394e-05, 6.123073399066925e-05, 6.438698619604111e-05, 6.754323840141296e-05, 7.069949060678482e-05, 7.385574281215668e-05, 7.701199501752853e-05, 8.016824722290039e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 8.0, 9.0, 7.0, 23.0, 25.0, 42.0, 70.0, 88.0, 160.0, 271.0, 521.0, 1053.0, 2436.0, 6909.0, 26744.0, 251382.0, 676568.0, 63349.0, 11930.0, 3756.0, 1508.0, 714.0, 391.0, 215.0, 127.0, 82.0, 58.0, 27.0, 21.0, 16.0, 4.0, 12.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2579383850097656, -0.24683380126953125, -0.23572921752929688, -0.2246246337890625, -0.21352005004882812, -0.20241546630859375, -0.19131088256835938, -0.180206298828125, -0.16910171508789062, -0.15799713134765625, -0.14689254760742188, -0.1357879638671875, -0.12468338012695312, -0.11357879638671875, -0.10247421264648438, -0.09136962890625, -0.08026504516601562, -0.06916046142578125, -0.058055877685546875, -0.0469512939453125, -0.035846710205078125, -0.02474212646484375, -0.013637542724609375, -0.002532958984375, 0.008571624755859375, 0.01967620849609375, 0.030780792236328125, 0.0418853759765625, 0.052989959716796875, 0.06409454345703125, 0.07519912719726562, 0.0863037109375, 0.09740829467773438, 0.10851287841796875, 0.11961746215820312, 0.1307220458984375, 0.14182662963867188, 0.15293121337890625, 0.16403579711914062, 0.175140380859375, 0.18624496459960938, 0.19734954833984375, 0.20845413208007812, 0.2195587158203125, 0.23066329956054688, 0.24176788330078125, 0.2528724670410156, 0.26397705078125, 0.2750816345214844, 0.28618621826171875, 0.2972908020019531, 0.3083953857421875, 0.3194999694824219, 0.33060455322265625, 0.3417091369628906, 0.352813720703125, 0.3639183044433594, 0.37502288818359375, 0.3861274719238281, 0.3972320556640625, 0.4083366394042969, 0.41944122314453125, 0.4305458068847656, 0.441650390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 8.0, 9.0, 11.0, 7.0, 19.0, 27.0, 40.0, 43.0, 59.0, 48.0, 82.0, 81.0, 92.0, 90.0, 85.0, 64.0, 49.0, 33.0, 24.0, 27.0, 22.0, 12.0, 17.0, 8.0, 6.0, 3.0, 5.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1312255859375, -0.1267852783203125, -0.122344970703125, -0.1179046630859375, -0.11346435546875, -0.1090240478515625, -0.104583740234375, -0.1001434326171875, -0.095703125, -0.0912628173828125, -0.086822509765625, -0.0823822021484375, -0.07794189453125, -0.0735015869140625, -0.069061279296875, -0.0646209716796875, -0.0601806640625, -0.0557403564453125, -0.051300048828125, -0.0468597412109375, -0.04241943359375, -0.0379791259765625, -0.033538818359375, -0.0290985107421875, -0.024658203125, -0.0202178955078125, -0.015777587890625, -0.0113372802734375, -0.00689697265625, -0.0024566650390625, 0.001983642578125, 0.0064239501953125, 0.0108642578125, 0.0153045654296875, 0.019744873046875, 0.0241851806640625, 0.02862548828125, 0.0330657958984375, 0.037506103515625, 0.0419464111328125, 0.04638671875, 0.0508270263671875, 0.055267333984375, 0.0597076416015625, 0.06414794921875, 0.0685882568359375, 0.073028564453125, 0.0774688720703125, 0.0819091796875, 0.0863494873046875, 0.090789794921875, 0.0952301025390625, 0.09967041015625, 0.1041107177734375, 0.108551025390625, 0.1129913330078125, 0.117431640625, 0.1218719482421875, 0.126312255859375, 0.1307525634765625, 0.13519287109375, 0.1396331787109375, 0.144073486328125, 0.1485137939453125, 0.1529541015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 6.0, 18.0, 18.0, 42.0, 90.0, 149.0, 150.0, 162.0, 126.0, 91.0, 54.0, 32.0, 17.0, 15.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.038255214691162, -2.9267897605895996, -2.815324306488037, -2.7038588523864746, -2.592393398284912, -2.4809279441833496, -2.369462490081787, -2.2579967975616455, -2.146531343460083, -2.0350658893585205, -1.923600435256958, -1.8121349811553955, -1.7006694078445435, -1.589203953742981, -1.4777384996414185, -1.3662729263305664, -1.2548075914382935, -1.143342137336731, -1.0318766832351685, -0.9204111695289612, -0.8089456558227539, -0.6974802017211914, -0.5860147476196289, -0.47454923391342163, -0.36308377981185913, -0.25161829590797424, -0.14015282690525055, -0.028687357902526855, 0.08277812600135803, 0.19424360990524292, 0.3057090640068054, 0.4171745777130127, 0.5286400318145752, 0.6401054859161377, 0.751570999622345, 0.8630364537239075, 0.9745019674301147, 1.0859674215316772, 1.1974328756332397, 1.3088984489440918, 1.4203639030456543, 1.5318293571472168, 1.6432948112487793, 1.7547602653503418, 1.8662258386611938, 1.9776912927627563, 2.0891566276550293, 2.200622320175171, 2.3120875358581543, 2.423552989959717, 2.5350184440612793, 2.646483898162842, 2.7579493522644043, 2.869414806365967, 2.9808802604675293, 3.092345952987671, 3.2038114070892334, 3.315276861190796, 3.4267423152923584, 3.538207769393921, 3.6496732234954834, 3.761138916015625, 3.8726043701171875, 3.98406982421875, 4.0955352783203125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 4.0, 13.0, 13.0, 11.0, 16.0, 20.0, 25.0, 24.0, 29.0, 41.0, 43.0, 51.0, 48.0, 66.0, 67.0, 75.0, 45.0, 50.0, 52.0, 44.0, 34.0, 44.0, 36.0, 27.0, 24.0, 19.0, 24.0, 11.0, 12.0, 5.0, 5.0, 2.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.997396945953369, -2.919171094894409, -2.840945243835449, -2.76271915435791, -2.68449330329895, -2.6062674522399902, -2.5280416011810303, -2.4498157501220703, -2.3715898990631104, -2.2933640480041504, -2.2151381969451904, -2.1369123458862305, -2.0586862564086914, -1.9804604053497314, -1.9022345542907715, -1.8240087032318115, -1.745782732963562, -1.667556881904602, -1.5893309116363525, -1.5111050605773926, -1.4328792095184326, -1.3546533584594727, -1.2764273881912231, -1.1982015371322632, -1.1199755668640137, -1.0417497158050537, -0.963523805141449, -0.8852978944778442, -0.8070720434188843, -0.7288461327552795, -0.6506202220916748, -0.5723943710327148, -0.4941685199737549, -0.41594263911247253, -0.3377167582511902, -0.25949084758758545, -0.1812649667263031, -0.10303908586502075, -0.024813175201416016, 0.053412675857543945, 0.13163858652114868, 0.20986446738243103, 0.2880903482437134, 0.3663162589073181, 0.44454213976860046, 0.5227680206298828, 0.6009939312934875, 0.6792197823524475, 0.7574456930160522, 0.835671603679657, 0.9138974547386169, 0.9921233654022217, 1.0703492164611816, 1.1485750675201416, 1.2268010377883911, 1.305026888847351, 1.3832528591156006, 1.4614787101745605, 1.53970468044281, 1.61793053150177, 1.69615638256073, 1.7743823528289795, 1.8526082038879395, 1.9308340549468994, 2.0090599060058594]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 10.0, 3.0, 4.0, 11.0, 21.0, 20.0, 25.0, 37.0, 42.0, 57.0, 100.0, 128.0, 184.0, 242.0, 394.0, 776.0, 1562.0, 3587.0, 10641.0, 46307.0, 701743.0, 3325839.0, 77429.0, 15901.0, 5036.0, 1975.0, 932.0, 487.0, 307.0, 156.0, 116.0, 66.0, 49.0, 28.0, 24.0, 13.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.3681640625, -1.33489990234375, -1.3016357421875, -1.26837158203125, -1.235107421875, -1.20184326171875, -1.1685791015625, -1.13531494140625, -1.10205078125, -1.06878662109375, -1.0355224609375, -1.00225830078125, -0.968994140625, -0.93572998046875, -0.9024658203125, -0.86920166015625, -0.8359375, -0.80267333984375, -0.7694091796875, -0.73614501953125, -0.702880859375, -0.66961669921875, -0.6363525390625, -0.60308837890625, -0.56982421875, -0.53656005859375, -0.5032958984375, -0.47003173828125, -0.436767578125, -0.40350341796875, -0.3702392578125, -0.33697509765625, -0.3037109375, -0.27044677734375, -0.2371826171875, -0.20391845703125, -0.170654296875, -0.13739013671875, -0.1041259765625, -0.07086181640625, -0.03759765625, -0.00433349609375, 0.0289306640625, 0.06219482421875, 0.095458984375, 0.12872314453125, 0.1619873046875, 0.19525146484375, 0.228515625, 0.26177978515625, 0.2950439453125, 0.32830810546875, 0.361572265625, 0.39483642578125, 0.4281005859375, 0.46136474609375, 0.49462890625, 0.52789306640625, 0.5611572265625, 0.59442138671875, 0.627685546875, 0.66094970703125, 0.6942138671875, 0.72747802734375, 0.7607421875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 14.0, 24.0, 26.0, 32.0, 47.0, 54.0, 68.0, 80.0, 87.0, 100.0, 83.0, 88.0, 63.0, 53.0, 54.0, 42.0, 24.0, 14.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.148193359375, -0.14391517639160156, -0.13963699340820312, -0.1353588104248047, -0.13108062744140625, -0.1268024444580078, -0.12252426147460938, -0.11824607849121094, -0.1139678955078125, -0.10968971252441406, -0.10541152954101562, -0.10113334655761719, -0.09685516357421875, -0.09257698059082031, -0.08829879760742188, -0.08402061462402344, -0.079742431640625, -0.07546424865722656, -0.07118606567382812, -0.06690788269042969, -0.06262969970703125, -0.05835151672363281, -0.054073333740234375, -0.04979515075683594, -0.0455169677734375, -0.04123878479003906, -0.036960601806640625, -0.03268241882324219, -0.02840423583984375, -0.024126052856445312, -0.019847869873046875, -0.015569686889648438, -0.01129150390625, -0.0070133209228515625, -0.002735137939453125, 0.0015430450439453125, 0.00582122802734375, 0.010099411010742188, 0.014377593994140625, 0.018655776977539062, 0.0229339599609375, 0.027212142944335938, 0.031490325927734375, 0.03576850891113281, 0.04004669189453125, 0.04432487487792969, 0.048603057861328125, 0.05288124084472656, 0.057159423828125, 0.06143760681152344, 0.06571578979492188, 0.06999397277832031, 0.07427215576171875, 0.07855033874511719, 0.08282852172851562, 0.08710670471191406, 0.0913848876953125, 0.09566307067871094, 0.09994125366210938, 0.10421943664550781, 0.10849761962890625, 0.11277580261230469, 0.11705398559570312, 0.12133216857910156, 0.1256103515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 7.0, 16.0, 13.0, 26.0, 41.0, 38.0, 69.0, 82.0, 101.0, 199.0, 337.0, 866.0, 2881.0, 22010.0, 4099753.0, 61964.0, 3762.0, 906.0, 408.0, 215.0, 141.0, 109.0, 69.0, 57.0, 49.0, 31.0, 30.0, 12.0, 16.0, 11.0, 10.0, 9.0, 8.0, 3.0, 3.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.796875, -2.711181640625, -2.62548828125, -2.539794921875, -2.4541015625, -2.368408203125, -2.28271484375, -2.197021484375, -2.111328125, -2.025634765625, -1.93994140625, -1.854248046875, -1.7685546875, -1.682861328125, -1.59716796875, -1.511474609375, -1.42578125, -1.340087890625, -1.25439453125, -1.168701171875, -1.0830078125, -0.997314453125, -0.91162109375, -0.825927734375, -0.740234375, -0.654541015625, -0.56884765625, -0.483154296875, -0.3974609375, -0.311767578125, -0.22607421875, -0.140380859375, -0.0546875, 0.031005859375, 0.11669921875, 0.202392578125, 0.2880859375, 0.373779296875, 0.45947265625, 0.545166015625, 0.630859375, 0.716552734375, 0.80224609375, 0.887939453125, 0.9736328125, 1.059326171875, 1.14501953125, 1.230712890625, 1.31640625, 1.402099609375, 1.48779296875, 1.573486328125, 1.6591796875, 1.744873046875, 1.83056640625, 1.916259765625, 2.001953125, 2.087646484375, 2.17333984375, 2.259033203125, 2.3447265625, 2.430419921875, 2.51611328125, 2.601806640625, 2.6875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 8.0, 14.0, 35.0, 104.0, 679.0, 2824.0, 318.0, 63.0, 20.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64697265625, -0.6165847778320312, -0.5861968994140625, -0.5558090209960938, -0.525421142578125, -0.49503326416015625, -0.4646453857421875, -0.43425750732421875, -0.40386962890625, -0.37348175048828125, -0.3430938720703125, -0.31270599365234375, -0.282318115234375, -0.25193023681640625, -0.2215423583984375, -0.19115447998046875, -0.1607666015625, -0.13037872314453125, -0.0999908447265625, -0.06960296630859375, -0.039215087890625, -0.00882720947265625, 0.0215606689453125, 0.05194854736328125, 0.08233642578125, 0.11272430419921875, 0.1431121826171875, 0.17350006103515625, 0.203887939453125, 0.23427581787109375, 0.2646636962890625, 0.29505157470703125, 0.325439453125, 0.35582733154296875, 0.3862152099609375, 0.41660308837890625, 0.446990966796875, 0.47737884521484375, 0.5077667236328125, 0.5381546020507812, 0.56854248046875, 0.5989303588867188, 0.6293182373046875, 0.6597061157226562, 0.690093994140625, 0.7204818725585938, 0.7508697509765625, 0.7812576293945312, 0.8116455078125, 0.8420333862304688, 0.8724212646484375, 0.9028091430664062, 0.933197021484375, 0.9635848999023438, 0.9939727783203125, 1.0243606567382812, 1.05474853515625, 1.0851364135742188, 1.1155242919921875, 1.1459121704101562, 1.176300048828125, 1.2066879272460938, 1.2370758056640625, 1.2674636840820312, 1.2978515625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 10.0, 16.0, 66.0, 165.0, 294.0, 263.0, 99.0, 45.0, 13.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.0675811767578125, -5.928643226623535, -5.7897047996521, -5.650766849517822, -5.511828422546387, -5.372890472412109, -5.233952045440674, -5.0950140953063965, -4.956075668334961, -4.817137718200684, -4.678199291229248, -4.539261341094971, -4.400322914123535, -4.261384963989258, -4.122446537017822, -3.983508586883545, -3.8445706367492676, -3.705632448196411, -3.5666942596435547, -3.4277560710906982, -3.288817882537842, -3.1498799324035645, -3.010941743850708, -2.8720035552978516, -2.733065366744995, -2.5941271781921387, -2.4551889896392822, -2.316250801086426, -2.1773128509521484, -2.038374423980713, -1.8994364738464355, -1.760498285293579, -1.6215603351593018, -1.4826221466064453, -1.3436839580535889, -1.204745888710022, -1.0658077001571655, -0.9268695116043091, -0.7879313826560974, -0.6489932537078857, -0.5100550651550293, -0.37111690640449524, -0.23217874765396118, -0.09324058890342712, 0.045697569847106934, 0.18463575839996338, 0.32357388734817505, 0.4625120162963867, 0.6014502048492432, 0.7403883934020996, 0.8793265223503113, 1.018264651298523, 1.1572028398513794, 1.2961410284042358, 1.4350790977478027, 1.5740172863006592, 1.7129554748535156, 1.851893663406372, 1.9908318519592285, 2.129770040512085, 2.2687082290649414, 2.4076461791992188, 2.546584367752075, 2.6855225563049316, 2.824460744857788]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 13.0, 25.0, 28.0, 22.0, 39.0, 37.0, 42.0, 52.0, 67.0, 56.0, 78.0, 76.0, 67.0, 68.0, 54.0, 50.0, 39.0, 33.0, 31.0, 15.0, 14.0, 14.0, 14.0, 13.0, 11.0, 7.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5844693183898926, -1.5345063209533691, -1.4845434427261353, -1.4345804452896118, -1.3846174478530884, -1.3346545696258545, -1.284691572189331, -1.2347285747528076, -1.1847655773162842, -1.1348025798797607, -1.0848397016525269, -1.0348767042160034, -0.98491370677948, -0.9349507689476013, -0.8849878311157227, -0.8350248336791992, -0.7850619554519653, -0.7350990176200867, -0.6851360201835632, -0.6351730823516846, -0.5852100849151611, -0.5352471470832825, -0.4852842092514038, -0.43532124161720276, -0.3853582739830017, -0.33539530634880066, -0.2854323387145996, -0.23546940088272095, -0.1855064332485199, -0.13554346561431885, -0.08558052778244019, -0.035617560148239136, 0.014345407485961914, 0.06430836766958237, 0.11427132785320282, 0.16423428058624268, 0.21419724822044373, 0.2641602158546448, 0.31412315368652344, 0.3640861213207245, 0.41404908895492554, 0.4640120565891266, 0.5139750242233276, 0.5639379620552063, 0.613900899887085, 0.6638638973236084, 0.7138268351554871, 0.7637897729873657, 0.8137527704238892, 0.8637157082557678, 0.9136787056922913, 0.9636416435241699, 1.0136046409606934, 1.0635676383972168, 1.1135305166244507, 1.1634935140609741, 1.213456392288208, 1.2634193897247314, 1.3133822679519653, 1.3633452653884888, 1.4133082628250122, 1.463271141052246, 1.5132341384887695, 1.563197135925293, 1.6131601333618164]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 15.0, 6.0, 17.0, 23.0, 46.0, 48.0, 64.0, 65.0, 102.0, 146.0, 234.0, 297.0, 457.0, 683.0, 975.0, 1597.0, 2796.0, 5607.0, 13141.0, 41889.0, 170146.0, 479220.0, 240897.0, 57614.0, 17085.0, 6778.0, 3233.0, 1884.0, 1024.0, 765.0, 476.0, 350.0, 222.0, 177.0, 121.0, 90.0, 58.0, 52.0, 37.0, 32.0, 15.0, 18.0, 8.0, 5.0, 4.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0], "bins": [-0.654296875, -0.6353988647460938, -0.6165008544921875, -0.5976028442382812, -0.578704833984375, -0.5598068237304688, -0.5409088134765625, -0.5220108032226562, -0.50311279296875, -0.48421478271484375, -0.4653167724609375, -0.44641876220703125, -0.427520751953125, -0.40862274169921875, -0.3897247314453125, -0.37082672119140625, -0.3519287109375, -0.33303070068359375, -0.3141326904296875, -0.29523468017578125, -0.276336669921875, -0.25743865966796875, -0.2385406494140625, -0.21964263916015625, -0.20074462890625, -0.18184661865234375, -0.1629486083984375, -0.14405059814453125, -0.125152587890625, -0.10625457763671875, -0.0873565673828125, -0.06845855712890625, -0.049560546875, -0.03066253662109375, -0.0117645263671875, 0.00713348388671875, 0.026031494140625, 0.04492950439453125, 0.0638275146484375, 0.08272552490234375, 0.10162353515625, 0.12052154541015625, 0.1394195556640625, 0.15831756591796875, 0.177215576171875, 0.19611358642578125, 0.2150115966796875, 0.23390960693359375, 0.2528076171875, 0.27170562744140625, 0.2906036376953125, 0.30950164794921875, 0.328399658203125, 0.34729766845703125, 0.3661956787109375, 0.38509368896484375, 0.40399169921875, 0.42288970947265625, 0.4417877197265625, 0.46068572998046875, 0.479583740234375, 0.49848175048828125, 0.5173797607421875, 0.5362777709960938, 0.55517578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 13.0, 31.0, 31.0, 43.0, 73.0, 83.0, 95.0, 126.0, 117.0, 113.0, 82.0, 55.0, 46.0, 28.0, 12.0, 8.0, 10.0, 3.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.223388671875, -0.217315673828125, -0.21124267578125, -0.205169677734375, -0.1990966796875, -0.193023681640625, -0.18695068359375, -0.180877685546875, -0.1748046875, -0.168731689453125, -0.16265869140625, -0.156585693359375, -0.1505126953125, -0.144439697265625, -0.13836669921875, -0.132293701171875, -0.126220703125, -0.120147705078125, -0.11407470703125, -0.108001708984375, -0.1019287109375, -0.095855712890625, -0.08978271484375, -0.083709716796875, -0.07763671875, -0.071563720703125, -0.06549072265625, -0.059417724609375, -0.0533447265625, -0.047271728515625, -0.04119873046875, -0.035125732421875, -0.029052734375, -0.022979736328125, -0.01690673828125, -0.010833740234375, -0.0047607421875, 0.001312255859375, 0.00738525390625, 0.013458251953125, 0.01953125, 0.025604248046875, 0.03167724609375, 0.037750244140625, 0.0438232421875, 0.049896240234375, 0.05596923828125, 0.062042236328125, 0.068115234375, 0.074188232421875, 0.08026123046875, 0.086334228515625, 0.0924072265625, 0.098480224609375, 0.10455322265625, 0.110626220703125, 0.11669921875, 0.122772216796875, 0.12884521484375, 0.134918212890625, 0.1409912109375, 0.147064208984375, 0.15313720703125, 0.159210205078125, 0.165283203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 8.0, 12.0, 18.0, 17.0, 30.0, 36.0, 51.0, 97.0, 126.0, 232.0, 379.0, 783.0, 1748.0, 4679.0, 15188.0, 55436.0, 224157.0, 478543.0, 197401.0, 48876.0, 13146.0, 4232.0, 1679.0, 733.0, 357.0, 226.0, 106.0, 64.0, 48.0, 42.0, 24.0, 20.0, 16.0, 9.0, 9.0, 8.0, 5.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.399993896484375, -0.38641357421875, -0.372833251953125, -0.3592529296875, -0.345672607421875, -0.33209228515625, -0.318511962890625, -0.304931640625, -0.291351318359375, -0.27777099609375, -0.264190673828125, -0.2506103515625, -0.237030029296875, -0.22344970703125, -0.209869384765625, -0.1962890625, -0.182708740234375, -0.16912841796875, -0.155548095703125, -0.1419677734375, -0.128387451171875, -0.11480712890625, -0.101226806640625, -0.087646484375, -0.074066162109375, -0.06048583984375, -0.046905517578125, -0.0333251953125, -0.019744873046875, -0.00616455078125, 0.007415771484375, 0.02099609375, 0.034576416015625, 0.04815673828125, 0.061737060546875, 0.0753173828125, 0.088897705078125, 0.10247802734375, 0.116058349609375, 0.129638671875, 0.143218994140625, 0.15679931640625, 0.170379638671875, 0.1839599609375, 0.197540283203125, 0.21112060546875, 0.224700927734375, 0.23828125, 0.251861572265625, 0.26544189453125, 0.279022216796875, 0.2926025390625, 0.306182861328125, 0.31976318359375, 0.333343505859375, 0.346923828125, 0.360504150390625, 0.37408447265625, 0.387664794921875, 0.4012451171875, 0.414825439453125, 0.42840576171875, 0.441986083984375, 0.45556640625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 6.0, 3.0, 8.0, 13.0, 9.0, 14.0, 13.0, 17.0, 12.0, 24.0, 21.0, 20.0, 22.0, 34.0, 38.0, 36.0, 40.0, 46.0, 39.0, 40.0, 57.0, 45.0, 43.0, 37.0, 35.0, 39.0, 37.0, 48.0, 31.0, 33.0, 26.0, 10.0, 18.0, 11.0, 10.0, 14.0, 10.0, 7.0, 7.0, 4.0, 8.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.2774620056152344, -0.26732635498046875, -0.2571907043457031, -0.2470550537109375, -0.23691940307617188, -0.22678375244140625, -0.21664810180664062, -0.206512451171875, -0.19637680053710938, -0.18624114990234375, -0.17610549926757812, -0.1659698486328125, -0.15583419799804688, -0.14569854736328125, -0.13556289672851562, -0.12542724609375, -0.11529159545898438, -0.10515594482421875, -0.09502029418945312, -0.0848846435546875, -0.07474899291992188, -0.06461334228515625, -0.054477691650390625, -0.044342041015625, -0.034206390380859375, -0.02407073974609375, -0.013935089111328125, -0.0037994384765625, 0.006336212158203125, 0.01647186279296875, 0.026607513427734375, 0.0367431640625, 0.046878814697265625, 0.05701446533203125, 0.06715011596679688, 0.0772857666015625, 0.08742141723632812, 0.09755706787109375, 0.10769271850585938, 0.117828369140625, 0.12796401977539062, 0.13809967041015625, 0.14823532104492188, 0.1583709716796875, 0.16850662231445312, 0.17864227294921875, 0.18877792358398438, 0.19891357421875, 0.20904922485351562, 0.21918487548828125, 0.22932052612304688, 0.2394561767578125, 0.24959182739257812, 0.25972747802734375, 0.2698631286621094, 0.279998779296875, 0.2901344299316406, 0.30027008056640625, 0.3104057312011719, 0.3205413818359375, 0.3306770324707031, 0.34081268310546875, 0.3509483337402344, 0.361083984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 5.0, 5.0, 4.0, 14.0, 16.0, 22.0, 41.0, 53.0, 95.0, 197.0, 365.0, 811.0, 1965.0, 5590.0, 19272.0, 100785.0, 642828.0, 228688.0, 34061.0, 8673.0, 2898.0, 1088.0, 490.0, 249.0, 145.0, 68.0, 46.0, 30.0, 14.0, 13.0, 5.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3447265625, -0.3347892761230469, -0.32485198974609375, -0.3149147033691406, -0.3049774169921875, -0.2950401306152344, -0.28510284423828125, -0.2751655578613281, -0.265228271484375, -0.2552909851074219, -0.24535369873046875, -0.23541641235351562, -0.2254791259765625, -0.21554183959960938, -0.20560455322265625, -0.19566726684570312, -0.18572998046875, -0.17579269409179688, -0.16585540771484375, -0.15591812133789062, -0.1459808349609375, -0.13604354858398438, -0.12610626220703125, -0.11616897583007812, -0.106231689453125, -0.09629440307617188, -0.08635711669921875, -0.07641983032226562, -0.0664825439453125, -0.056545257568359375, -0.04660797119140625, -0.036670684814453125, -0.0267333984375, -0.016796112060546875, -0.00685882568359375, 0.003078460693359375, 0.0130157470703125, 0.022953033447265625, 0.03289031982421875, 0.042827606201171875, 0.052764892578125, 0.06270217895507812, 0.07263946533203125, 0.08257675170898438, 0.0925140380859375, 0.10245132446289062, 0.11238861083984375, 0.12232589721679688, 0.13226318359375, 0.14220046997070312, 0.15213775634765625, 0.16207504272460938, 0.1720123291015625, 0.18194961547851562, 0.19188690185546875, 0.20182418823242188, 0.211761474609375, 0.22169876098632812, 0.23163604736328125, 0.24157333374023438, 0.2515106201171875, 0.2614479064941406, 0.27138519287109375, 0.2813224792480469, 0.291259765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 10.0, 11.0, 16.0, 23.0, 39.0, 32.0, 66.0, 67.0, 95.0, 126.0, 120.0, 104.0, 72.0, 56.0, 42.0, 31.0, 22.0, 16.0, 12.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171796798706055e-05, -7.890630513429642e-05, -7.609464228153229e-05, -7.328297942876816e-05, -7.047131657600403e-05, -6.76596537232399e-05, -6.484799087047577e-05, -6.203632801771164e-05, -5.922466516494751e-05, -5.641300231218338e-05, -5.360133945941925e-05, -5.078967660665512e-05, -4.797801375389099e-05, -4.516635090112686e-05, -4.235468804836273e-05, -3.95430251955986e-05, -3.673136234283447e-05, -3.391969949007034e-05, -3.110803663730621e-05, -2.8296373784542084e-05, -2.5484710931777954e-05, -2.2673048079013824e-05, -1.9861385226249695e-05, -1.7049722373485565e-05, -1.4238059520721436e-05, -1.1426396667957306e-05, -8.614733815193176e-06, -5.803070962429047e-06, -2.991408109664917e-06, -1.7974525690078735e-07, 2.6319175958633423e-06, 5.443580448627472e-06, 8.255243301391602e-06, 1.1066906154155731e-05, 1.387856900691986e-05, 1.669023185968399e-05, 1.950189471244812e-05, 2.231355756521225e-05, 2.512522041797638e-05, 2.793688327074051e-05, 3.074854612350464e-05, 3.356020897626877e-05, 3.63718718290329e-05, 3.918353468179703e-05, 4.199519753456116e-05, 4.480686038732529e-05, 4.7618523240089417e-05, 5.0430186092853546e-05, 5.3241848945617676e-05, 5.6053511798381805e-05, 5.8865174651145935e-05, 6.167683750391006e-05, 6.44885003566742e-05, 6.730016320943832e-05, 7.011182606220245e-05, 7.292348891496658e-05, 7.573515176773071e-05, 7.854681462049484e-05, 8.135847747325897e-05, 8.41701403260231e-05, 8.698180317878723e-05, 8.979346603155136e-05, 9.260512888431549e-05, 9.541679173707962e-05, 9.822845458984375e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 16.0, 16.0, 32.0, 60.0, 86.0, 133.0, 286.0, 684.0, 1489.0, 4428.0, 14838.0, 71256.0, 595927.0, 305539.0, 39146.0, 9489.0, 2951.0, 1178.0, 495.0, 233.0, 105.0, 53.0, 41.0, 25.0, 11.0, 11.0, 10.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41259765625, -0.4016914367675781, -0.39078521728515625, -0.3798789978027344, -0.3689727783203125, -0.3580665588378906, -0.34716033935546875, -0.3362541198730469, -0.325347900390625, -0.3144416809082031, -0.30353546142578125, -0.2926292419433594, -0.2817230224609375, -0.2708168029785156, -0.25991058349609375, -0.24900436401367188, -0.23809814453125, -0.22719192504882812, -0.21628570556640625, -0.20537948608398438, -0.1944732666015625, -0.18356704711914062, -0.17266082763671875, -0.16175460815429688, -0.150848388671875, -0.13994216918945312, -0.12903594970703125, -0.11812973022460938, -0.1072235107421875, -0.09631729125976562, -0.08541107177734375, -0.07450485229492188, -0.0635986328125, -0.052692413330078125, -0.04178619384765625, -0.030879974365234375, -0.0199737548828125, -0.009067535400390625, 0.00183868408203125, 0.012744903564453125, 0.023651123046875, 0.034557342529296875, 0.04546356201171875, 0.056369781494140625, 0.0672760009765625, 0.07818222045898438, 0.08908843994140625, 0.09999465942382812, 0.11090087890625, 0.12180709838867188, 0.13271331787109375, 0.14361953735351562, 0.1545257568359375, 0.16543197631835938, 0.17633819580078125, 0.18724441528320312, 0.198150634765625, 0.20905685424804688, 0.21996307373046875, 0.23086929321289062, 0.2417755126953125, 0.2526817321777344, 0.26358795166015625, 0.2744941711425781, 0.285400390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 7.0, 4.0, 7.0, 8.0, 4.0, 7.0, 7.0, 10.0, 18.0, 19.0, 18.0, 23.0, 41.0, 46.0, 51.0, 70.0, 77.0, 84.0, 79.0, 68.0, 68.0, 47.0, 42.0, 38.0, 23.0, 32.0, 25.0, 14.0, 9.0, 12.0, 7.0, 10.0, 4.0, 4.0, 7.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1729736328125, -0.1678619384765625, -0.162750244140625, -0.1576385498046875, -0.15252685546875, -0.1474151611328125, -0.142303466796875, -0.1371917724609375, -0.132080078125, -0.1269683837890625, -0.121856689453125, -0.1167449951171875, -0.11163330078125, -0.1065216064453125, -0.101409912109375, -0.0962982177734375, -0.0911865234375, -0.0860748291015625, -0.080963134765625, -0.0758514404296875, -0.07073974609375, -0.0656280517578125, -0.060516357421875, -0.0554046630859375, -0.05029296875, -0.0451812744140625, -0.040069580078125, -0.0349578857421875, -0.02984619140625, -0.0247344970703125, -0.019622802734375, -0.0145111083984375, -0.0093994140625, -0.0042877197265625, 0.000823974609375, 0.0059356689453125, 0.01104736328125, 0.0161590576171875, 0.021270751953125, 0.0263824462890625, 0.031494140625, 0.0366058349609375, 0.041717529296875, 0.0468292236328125, 0.05194091796875, 0.0570526123046875, 0.062164306640625, 0.0672760009765625, 0.0723876953125, 0.0774993896484375, 0.082611083984375, 0.0877227783203125, 0.09283447265625, 0.0979461669921875, 0.103057861328125, 0.1081695556640625, 0.11328125, 0.1183929443359375, 0.123504638671875, 0.1286163330078125, 0.13372802734375, 0.1388397216796875, 0.143951416015625, 0.1490631103515625, 0.1541748046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 22.0, 52.0, 86.0, 180.0, 219.0, 186.0, 132.0, 63.0, 24.0, 22.0, 9.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.021912097930908, -5.873057842254639, -5.724203586578369, -5.575348854064941, -5.426494598388672, -5.277640342712402, -5.128786087036133, -4.979931831359863, -4.831077575683594, -4.682223320007324, -4.533369064331055, -4.384514331817627, -4.235660076141357, -4.086805820465088, -3.9379515647888184, -3.789097309112549, -3.640242576599121, -3.4913883209228516, -3.342533826828003, -3.1936795711517334, -3.0448250770568848, -2.8959708213806152, -2.7471165657043457, -2.598262310028076, -2.4494078159332275, -2.300553560256958, -2.1516990661621094, -2.00284481048584, -1.8539904356002808, -1.7051360607147217, -1.5562818050384521, -1.407427430152893, -1.2585735321044922, -1.109719157218933, -0.9608648419380188, -0.8120105266571045, -0.6631561517715454, -0.5143017768859863, -0.365447461605072, -0.21659314632415771, -0.06773877143859863, 0.08111557364463806, 0.22996991872787476, 0.37882426381111145, 0.5276786088943481, 0.6765329837799072, 0.8253872990608215, 0.9742416143417358, 1.123095989227295, 1.271950364112854, 1.420804738998413, 1.5696589946746826, 1.7185133695602417, 1.8673677444458008, 2.0162220001220703, 2.16507625579834, 2.3139307498931885, 2.462785005569458, 2.6116394996643066, 2.760493755340576, 2.9093480110168457, 3.0582025051116943, 3.207056760787964, 3.3559112548828125, 3.504765510559082]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 5.0, 9.0, 5.0, 8.0, 10.0, 17.0, 15.0, 15.0, 21.0, 20.0, 33.0, 37.0, 29.0, 30.0, 39.0, 43.0, 48.0, 48.0, 33.0, 53.0, 37.0, 44.0, 50.0, 40.0, 39.0, 29.0, 25.0, 24.0, 25.0, 19.0, 19.0, 17.0, 20.0, 16.0, 9.0, 13.0, 16.0, 9.0, 8.0, 7.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.0773415565490723, -2.0180912017822266, -1.9588409662246704, -1.8995906114578247, -1.840340256690979, -1.7810900211334229, -1.7218396663665771, -1.6625893115997314, -1.6033389568328857, -1.54408860206604, -1.4848383665084839, -1.4255880117416382, -1.3663376569747925, -1.3070874214172363, -1.2478370666503906, -1.188586711883545, -1.1293364763259888, -1.070086121559143, -1.010835886001587, -0.9515855312347412, -0.8923351764678955, -0.8330848813056946, -0.7738345861434937, -0.714584231376648, -0.655333936214447, -0.5960836410522461, -0.5368332862854004, -0.47758299112319946, -0.41833266615867615, -0.35908234119415283, -0.2998320460319519, -0.2405817210674286, -0.18133139610290527, -0.12208107858896255, -0.06283076107501984, -0.003580451011657715, 0.0556698739528656, 0.11492019891738892, 0.17417049407958984, 0.23342081904411316, 0.2926711440086365, 0.3519214689731598, 0.4111717939376831, 0.47042208909988403, 0.529672384262085, 0.5889227390289307, 0.6481730341911316, 0.7074233293533325, 0.7666736841201782, 0.8259239792823792, 0.8851743340492249, 0.9444246292114258, 1.0036749839782715, 1.0629253387451172, 1.1221755743026733, 1.181425929069519, 1.2406761646270752, 1.299926519393921, 1.359176754951477, 1.4184271097183228, 1.4776774644851685, 1.5369277000427246, 1.5961780548095703, 1.655428409576416, 1.7146787643432617]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 17.0, 13.0, 15.0, 16.0, 26.0, 34.0, 52.0, 62.0, 103.0, 128.0, 199.0, 307.0, 500.0, 937.0, 1714.0, 4156.0, 12997.0, 79860.0, 3873505.0, 187265.0, 21336.0, 6079.0, 2345.0, 1127.0, 601.0, 314.0, 157.0, 107.0, 83.0, 55.0, 31.0, 29.0, 25.0, 15.0, 12.0, 13.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.041015625, -1.0109710693359375, -0.980926513671875, -0.9508819580078125, -0.92083740234375, -0.8907928466796875, -0.860748291015625, -0.8307037353515625, -0.8006591796875, -0.7706146240234375, -0.740570068359375, -0.7105255126953125, -0.68048095703125, -0.6504364013671875, -0.620391845703125, -0.5903472900390625, -0.560302734375, -0.5302581787109375, -0.500213623046875, -0.4701690673828125, -0.44012451171875, -0.4100799560546875, -0.380035400390625, -0.3499908447265625, -0.3199462890625, -0.2899017333984375, -0.259857177734375, -0.2298126220703125, -0.19976806640625, -0.1697235107421875, -0.139678955078125, -0.1096343994140625, -0.07958984375, -0.0495452880859375, -0.019500732421875, 0.0105438232421875, 0.04058837890625, 0.0706329345703125, 0.100677490234375, 0.1307220458984375, 0.1607666015625, 0.1908111572265625, 0.220855712890625, 0.2509002685546875, 0.28094482421875, 0.3109893798828125, 0.341033935546875, 0.3710784912109375, 0.401123046875, 0.4311676025390625, 0.461212158203125, 0.4912567138671875, 0.52130126953125, 0.5513458251953125, 0.581390380859375, 0.6114349365234375, 0.6414794921875, 0.6715240478515625, 0.701568603515625, 0.7316131591796875, 0.76165771484375, 0.7917022705078125, 0.821746826171875, 0.8517913818359375, 0.8818359375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 4.0, 7.0, 3.0, 16.0, 12.0, 28.0, 44.0, 46.0, 72.0, 110.0, 99.0, 98.0, 104.0, 86.0, 77.0, 71.0, 46.0, 26.0, 14.0, 8.0, 6.0, 7.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.215087890625, -0.2092113494873047, -0.20333480834960938, -0.19745826721191406, -0.19158172607421875, -0.18570518493652344, -0.17982864379882812, -0.1739521026611328, -0.1680755615234375, -0.1621990203857422, -0.15632247924804688, -0.15044593811035156, -0.14456939697265625, -0.13869285583496094, -0.13281631469726562, -0.1269397735595703, -0.121063232421875, -0.11518669128417969, -0.10931015014648438, -0.10343360900878906, -0.09755706787109375, -0.09168052673339844, -0.08580398559570312, -0.07992744445800781, -0.0740509033203125, -0.06817436218261719, -0.062297821044921875, -0.05642127990722656, -0.05054473876953125, -0.04466819763183594, -0.038791656494140625, -0.03291511535644531, -0.02703857421875, -0.021162033081054688, -0.015285491943359375, -0.009408950805664062, -0.00353240966796875, 0.0023441314697265625, 0.008220672607421875, 0.014097213745117188, 0.0199737548828125, 0.025850296020507812, 0.031726837158203125, 0.03760337829589844, 0.04347991943359375, 0.04935646057128906, 0.055233001708984375, 0.06110954284667969, 0.066986083984375, 0.07286262512207031, 0.07873916625976562, 0.08461570739746094, 0.09049224853515625, 0.09636878967285156, 0.10224533081054688, 0.10812187194824219, 0.1139984130859375, 0.11987495422363281, 0.12575149536132812, 0.13162803649902344, 0.13750457763671875, 0.14338111877441406, 0.14925765991210938, 0.1551342010498047, 0.1610107421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 9.0, 7.0, 12.0, 14.0, 23.0, 25.0, 19.0, 28.0, 42.0, 68.0, 123.0, 289.0, 853.0, 3681.0, 23061.0, 628259.0, 3492849.0, 37733.0, 5142.0, 1163.0, 407.0, 112.0, 72.0, 48.0, 49.0, 34.0, 24.0, 25.0, 18.0, 16.0, 15.0, 15.0, 5.0, 4.0, 9.0, 10.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.16015625, -1.1271133422851562, -1.0940704345703125, -1.0610275268554688, -1.027984619140625, -0.9949417114257812, -0.9618988037109375, -0.9288558959960938, -0.89581298828125, -0.8627700805664062, -0.8297271728515625, -0.7966842651367188, -0.763641357421875, -0.7305984497070312, -0.6975555419921875, -0.6645126342773438, -0.6314697265625, -0.5984268188476562, -0.5653839111328125, -0.5323410034179688, -0.499298095703125, -0.46625518798828125, -0.4332122802734375, -0.40016937255859375, -0.36712646484375, -0.33408355712890625, -0.3010406494140625, -0.26799774169921875, -0.234954833984375, -0.20191192626953125, -0.1688690185546875, -0.13582611083984375, -0.102783203125, -0.06974029541015625, -0.0366973876953125, -0.00365447998046875, 0.029388427734375, 0.06243133544921875, 0.0954742431640625, 0.12851715087890625, 0.16156005859375, 0.19460296630859375, 0.2276458740234375, 0.26068878173828125, 0.293731689453125, 0.32677459716796875, 0.3598175048828125, 0.39286041259765625, 0.4259033203125, 0.45894622802734375, 0.4919891357421875, 0.5250320434570312, 0.558074951171875, 0.5911178588867188, 0.6241607666015625, 0.6572036743164062, 0.69024658203125, 0.7232894897460938, 0.7563323974609375, 0.7893753051757812, 0.822418212890625, 0.8554611206054688, 0.8885040283203125, 0.9215469360351562, 0.95458984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 21.0, 20.0, 46.0, 102.0, 249.0, 1317.0, 1844.0, 253.0, 106.0, 52.0, 32.0, 8.0, 10.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.175537109375, -0.16304397583007812, -0.15055084228515625, -0.13805770874023438, -0.1255645751953125, -0.11307144165039062, -0.10057830810546875, -0.08808517456054688, -0.075592041015625, -0.06309890747070312, -0.05060577392578125, -0.038112640380859375, -0.0256195068359375, -0.013126373291015625, -0.00063323974609375, 0.011859893798828125, 0.02435302734375, 0.036846160888671875, 0.04933929443359375, 0.061832427978515625, 0.0743255615234375, 0.08681869506835938, 0.09931182861328125, 0.11180496215820312, 0.124298095703125, 0.13679122924804688, 0.14928436279296875, 0.16177749633789062, 0.1742706298828125, 0.18676376342773438, 0.19925689697265625, 0.21175003051757812, 0.2242431640625, 0.23673629760742188, 0.24922943115234375, 0.2617225646972656, 0.2742156982421875, 0.2867088317871094, 0.29920196533203125, 0.3116950988769531, 0.324188232421875, 0.3366813659667969, 0.34917449951171875, 0.3616676330566406, 0.3741607666015625, 0.3866539001464844, 0.39914703369140625, 0.4116401672363281, 0.42413330078125, 0.4366264343261719, 0.44911956787109375, 0.4616127014160156, 0.4741058349609375, 0.4865989685058594, 0.49909210205078125, 0.5115852355957031, 0.524078369140625, 0.5365715026855469, 0.5490646362304688, 0.5615577697753906, 0.5740509033203125, 0.5865440368652344, 0.5990371704101562, 0.6115303039550781, 0.6240234375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 3.0, 4.0, 20.0, 34.0, 85.0, 179.0, 236.0, 182.0, 131.0, 60.0, 27.0, 8.0, 10.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3731882572174072, -2.3117642402648926, -2.250340223312378, -2.1889162063598633, -2.1274919509887695, -2.066067934036255, -2.0046439170837402, -1.9432199001312256, -1.881795883178711, -1.8203718662261963, -1.7589478492736816, -1.6975237131118774, -1.6360996961593628, -1.5746756792068481, -1.513251543045044, -1.4518275260925293, -1.3904035091400146, -1.3289794921875, -1.2675554752349854, -1.2061313390731812, -1.1447073221206665, -1.0832833051681519, -1.0218591690063477, -0.960435152053833, -0.8990111351013184, -0.8375871181488037, -0.7761630415916443, -0.7147389650344849, -0.6533149480819702, -0.5918909311294556, -0.5304668545722961, -0.4690428078174591, -0.4076188802719116, -0.3461948335170746, -0.28477078676223755, -0.2233467400074005, -0.16192269325256348, -0.10049864649772644, -0.039074599742889404, 0.022349447011947632, 0.08377349376678467, 0.1451975405216217, 0.20662158727645874, 0.2680456340312958, 0.3294696807861328, 0.39089372754096985, 0.4523177742958069, 0.5137418508529663, 0.575165867805481, 0.6365898847579956, 0.698013961315155, 0.7594380378723145, 0.8208620548248291, 0.8822860717773438, 0.9437101483345032, 1.0051342248916626, 1.0665582418441772, 1.127982258796692, 1.189406394958496, 1.2508304119110107, 1.3122544288635254, 1.37367844581604, 1.4351024627685547, 1.4965265989303589, 1.5579506158828735]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 6.0, 20.0, 19.0, 31.0, 38.0, 49.0, 72.0, 70.0, 74.0, 80.0, 72.0, 93.0, 89.0, 58.0, 59.0, 46.0, 31.0, 32.0, 19.0, 11.0, 8.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3341453075408936, -1.2963017225265503, -1.258458137512207, -1.2206144332885742, -1.182770848274231, -1.1449272632598877, -1.1070836782455444, -1.0692400932312012, -1.0313963890075684, -0.9935528039932251, -0.9557091593742371, -0.9178655743598938, -0.8800219297409058, -0.8421783447265625, -0.8043347597122192, -0.7664911150932312, -0.7286475300788879, -0.6908039450645447, -0.6529603004455566, -0.6151167154312134, -0.5772730708122253, -0.5394294857978821, -0.501585841178894, -0.4637422561645508, -0.42589864134788513, -0.3880550265312195, -0.35021141171455383, -0.3123677968978882, -0.2745242118835449, -0.23668058216571808, -0.19883698225021362, -0.16099336743354797, -0.12314975261688232, -0.08530613780021667, -0.04746253043413162, -0.00961892306804657, 0.02822469174861908, 0.06606830656528473, 0.10391190648078918, 0.14175552129745483, 0.17959913611412048, 0.21744275093078613, 0.2552863657474518, 0.29312998056411743, 0.3309735655784607, 0.36881721019744873, 0.406660795211792, 0.44450441002845764, 0.4823480248451233, 0.5201916098594666, 0.5580352544784546, 0.5958788394927979, 0.6337224841117859, 0.6715660691261292, 0.7094097137451172, 0.7472532987594604, 0.7850968837738037, 0.822940468788147, 0.860784113407135, 0.8986276984214783, 0.9364713430404663, 0.9743149280548096, 1.0121585130691528, 1.050002098083496, 1.087845802307129]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 2.0, 6.0, 11.0, 6.0, 12.0, 21.0, 35.0, 46.0, 71.0, 106.0, 170.0, 265.0, 408.0, 674.0, 1124.0, 2062.0, 4698.0, 12620.0, 45812.0, 234993.0, 544810.0, 151321.0, 31689.0, 9486.0, 3751.0, 1806.0, 966.0, 625.0, 336.0, 218.0, 143.0, 87.0, 65.0, 38.0, 20.0, 15.0, 12.0, 5.0, 7.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6908340454101562, -0.6673126220703125, -0.6437911987304688, -0.620269775390625, -0.5967483520507812, -0.5732269287109375, -0.5497055053710938, -0.52618408203125, -0.5026626586914062, -0.4791412353515625, -0.45561981201171875, -0.432098388671875, -0.40857696533203125, -0.3850555419921875, -0.36153411865234375, -0.3380126953125, -0.31449127197265625, -0.2909698486328125, -0.26744842529296875, -0.243927001953125, -0.22040557861328125, -0.1968841552734375, -0.17336273193359375, -0.14984130859375, -0.12631988525390625, -0.1027984619140625, -0.07927703857421875, -0.055755615234375, -0.03223419189453125, -0.0087127685546875, 0.01480865478515625, 0.038330078125, 0.06185150146484375, 0.0853729248046875, 0.10889434814453125, 0.132415771484375, 0.15593719482421875, 0.1794586181640625, 0.20298004150390625, 0.22650146484375, 0.25002288818359375, 0.2735443115234375, 0.29706573486328125, 0.320587158203125, 0.34410858154296875, 0.3676300048828125, 0.39115142822265625, 0.4146728515625, 0.43819427490234375, 0.4617156982421875, 0.48523712158203125, 0.508758544921875, 0.5322799682617188, 0.5558013916015625, 0.5793228149414062, 0.60284423828125, 0.6263656616210938, 0.6498870849609375, 0.6734085083007812, 0.696929931640625, 0.7204513549804688, 0.7439727783203125, 0.7674942016601562, 0.791015625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 7.0, 18.0, 18.0, 26.0, 44.0, 58.0, 78.0, 104.0, 111.0, 102.0, 90.0, 89.0, 75.0, 55.0, 42.0, 21.0, 16.0, 9.0, 8.0, 3.0, 5.0, 1.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.22607421875, -0.21984481811523438, -0.21361541748046875, -0.20738601684570312, -0.2011566162109375, -0.19492721557617188, -0.18869781494140625, -0.18246841430664062, -0.176239013671875, -0.17000961303710938, -0.16378021240234375, -0.15755081176757812, -0.1513214111328125, -0.14509201049804688, -0.13886260986328125, -0.13263320922851562, -0.12640380859375, -0.12017440795898438, -0.11394500732421875, -0.10771560668945312, -0.1014862060546875, -0.09525680541992188, -0.08902740478515625, -0.08279800415039062, -0.076568603515625, -0.07033920288085938, -0.06410980224609375, -0.057880401611328125, -0.0516510009765625, -0.045421600341796875, -0.03919219970703125, -0.032962799072265625, -0.0267333984375, -0.020503997802734375, -0.01427459716796875, -0.008045196533203125, -0.0018157958984375, 0.004413604736328125, 0.01064300537109375, 0.016872406005859375, 0.023101806640625, 0.029331207275390625, 0.03556060791015625, 0.041790008544921875, 0.0480194091796875, 0.054248809814453125, 0.06047821044921875, 0.06670761108398438, 0.07293701171875, 0.07916641235351562, 0.08539581298828125, 0.09162521362304688, 0.0978546142578125, 0.10408401489257812, 0.11031341552734375, 0.11654281616210938, 0.122772216796875, 0.12900161743164062, 0.13523101806640625, 0.14146041870117188, 0.1476898193359375, 0.15391921997070312, 0.16014862060546875, 0.16637802124023438, 0.172607421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 12.0, 6.0, 14.0, 14.0, 20.0, 39.0, 49.0, 87.0, 85.0, 186.0, 298.0, 553.0, 1197.0, 3265.0, 10887.0, 51064.0, 278714.0, 524447.0, 140922.0, 26280.0, 6397.0, 2074.0, 841.0, 447.0, 230.0, 127.0, 88.0, 51.0, 29.0, 30.0, 26.0, 22.0, 16.0, 10.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54638671875, -0.528350830078125, -0.51031494140625, -0.492279052734375, -0.4742431640625, -0.456207275390625, -0.43817138671875, -0.420135498046875, -0.402099609375, -0.384063720703125, -0.36602783203125, -0.347991943359375, -0.3299560546875, -0.311920166015625, -0.29388427734375, -0.275848388671875, -0.2578125, -0.239776611328125, -0.22174072265625, -0.203704833984375, -0.1856689453125, -0.167633056640625, -0.14959716796875, -0.131561279296875, -0.113525390625, -0.095489501953125, -0.07745361328125, -0.059417724609375, -0.0413818359375, -0.023345947265625, -0.00531005859375, 0.012725830078125, 0.03076171875, 0.048797607421875, 0.06683349609375, 0.084869384765625, 0.1029052734375, 0.120941162109375, 0.13897705078125, 0.157012939453125, 0.175048828125, 0.193084716796875, 0.21112060546875, 0.229156494140625, 0.2471923828125, 0.265228271484375, 0.28326416015625, 0.301300048828125, 0.3193359375, 0.337371826171875, 0.35540771484375, 0.373443603515625, 0.3914794921875, 0.409515380859375, 0.42755126953125, 0.445587158203125, 0.463623046875, 0.481658935546875, 0.49969482421875, 0.517730712890625, 0.5357666015625, 0.553802490234375, 0.57183837890625, 0.589874267578125, 0.60791015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 8.0, 4.0, 10.0, 7.0, 6.0, 19.0, 19.0, 12.0, 33.0, 24.0, 36.0, 34.0, 40.0, 45.0, 41.0, 39.0, 44.0, 43.0, 47.0, 43.0, 52.0, 52.0, 46.0, 45.0, 33.0, 41.0, 28.0, 32.0, 33.0, 17.0, 14.0, 16.0, 10.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.41469573974609375, -0.4011688232421875, -0.38764190673828125, -0.374114990234375, -0.36058807373046875, -0.3470611572265625, -0.33353424072265625, -0.32000732421875, -0.30648040771484375, -0.2929534912109375, -0.27942657470703125, -0.265899658203125, -0.25237274169921875, -0.2388458251953125, -0.22531890869140625, -0.2117919921875, -0.19826507568359375, -0.1847381591796875, -0.17121124267578125, -0.157684326171875, -0.14415740966796875, -0.1306304931640625, -0.11710357666015625, -0.10357666015625, -0.09004974365234375, -0.0765228271484375, -0.06299591064453125, -0.049468994140625, -0.03594207763671875, -0.0224151611328125, -0.00888824462890625, 0.004638671875, 0.01816558837890625, 0.0316925048828125, 0.04521942138671875, 0.058746337890625, 0.07227325439453125, 0.0858001708984375, 0.09932708740234375, 0.11285400390625, 0.12638092041015625, 0.1399078369140625, 0.15343475341796875, 0.166961669921875, 0.18048858642578125, 0.1940155029296875, 0.20754241943359375, 0.2210693359375, 0.23459625244140625, 0.2481231689453125, 0.26165008544921875, 0.275177001953125, 0.28870391845703125, 0.3022308349609375, 0.31575775146484375, 0.32928466796875, 0.34281158447265625, 0.3563385009765625, 0.36986541748046875, 0.383392333984375, 0.39691925048828125, 0.4104461669921875, 0.42397308349609375, 0.4375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 1.0, 4.0, 8.0, 6.0, 9.0, 21.0, 18.0, 24.0, 48.0, 50.0, 90.0, 140.0, 228.0, 432.0, 885.0, 2199.0, 6141.0, 22992.0, 151949.0, 669502.0, 159574.0, 23658.0, 6353.0, 2196.0, 923.0, 425.0, 228.0, 147.0, 99.0, 59.0, 48.0, 26.0, 23.0, 20.0, 6.0, 8.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.2949104309082031, -0.28610992431640625, -0.2773094177246094, -0.2685089111328125, -0.2597084045410156, -0.25090789794921875, -0.24210739135742188, -0.233306884765625, -0.22450637817382812, -0.21570587158203125, -0.20690536499023438, -0.1981048583984375, -0.18930435180664062, -0.18050384521484375, -0.17170333862304688, -0.16290283203125, -0.15410232543945312, -0.14530181884765625, -0.13650131225585938, -0.1277008056640625, -0.11890029907226562, -0.11009979248046875, -0.10129928588867188, -0.092498779296875, -0.08369827270507812, -0.07489776611328125, -0.06609725952148438, -0.0572967529296875, -0.048496246337890625, -0.03969573974609375, -0.030895233154296875, -0.0220947265625, -0.013294219970703125, -0.00449371337890625, 0.004306793212890625, 0.0131072998046875, 0.021907806396484375, 0.03070831298828125, 0.039508819580078125, 0.048309326171875, 0.057109832763671875, 0.06591033935546875, 0.07471084594726562, 0.0835113525390625, 0.09231185913085938, 0.10111236572265625, 0.10991287231445312, 0.11871337890625, 0.12751388549804688, 0.13631439208984375, 0.14511489868164062, 0.1539154052734375, 0.16271591186523438, 0.17151641845703125, 0.18031692504882812, 0.189117431640625, 0.19791793823242188, 0.20671844482421875, 0.21551895141601562, 0.2243194580078125, 0.23311996459960938, 0.24192047119140625, 0.2507209777832031, 0.259521484375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 8.0, 10.0, 8.0, 14.0, 25.0, 24.0, 32.0, 26.0, 48.0, 41.0, 75.0, 72.0, 82.0, 79.0, 73.0, 51.0, 52.0, 40.0, 28.0, 34.0, 17.0, 21.0, 17.0, 7.0, 13.0, 17.0, 6.0, 11.0, 6.0, 3.0, 4.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.799531936645508e-05, -5.5985525250434875e-05, -5.397573113441467e-05, -5.196593701839447e-05, -4.995614290237427e-05, -4.7946348786354065e-05, -4.593655467033386e-05, -4.392676055431366e-05, -4.191696643829346e-05, -3.9907172322273254e-05, -3.789737820625305e-05, -3.588758409023285e-05, -3.3877789974212646e-05, -3.1867995858192444e-05, -2.985820174217224e-05, -2.784840762615204e-05, -2.5838613510131836e-05, -2.3828819394111633e-05, -2.181902527809143e-05, -1.9809231162071228e-05, -1.7799437046051025e-05, -1.5789642930030823e-05, -1.377984881401062e-05, -1.1770054697990417e-05, -9.760260581970215e-06, -7.750466465950012e-06, -5.7406723499298096e-06, -3.730878233909607e-06, -1.7210841178894043e-06, 2.8870999813079834e-07, 2.298504114151001e-06, 4.308298230171204e-06, 6.318092346191406e-06, 8.327886462211609e-06, 1.0337680578231812e-05, 1.2347474694252014e-05, 1.4357268810272217e-05, 1.636706292629242e-05, 1.8376857042312622e-05, 2.0386651158332825e-05, 2.2396445274353027e-05, 2.440623939037323e-05, 2.6416033506393433e-05, 2.8425827622413635e-05, 3.0435621738433838e-05, 3.244541585445404e-05, 3.445520997047424e-05, 3.6465004086494446e-05, 3.847479820251465e-05, 4.048459231853485e-05, 4.2494386434555054e-05, 4.4504180550575256e-05, 4.651397466659546e-05, 4.852376878261566e-05, 5.0533562898635864e-05, 5.254335701465607e-05, 5.455315113067627e-05, 5.656294524669647e-05, 5.8572739362716675e-05, 6.058253347873688e-05, 6.259232759475708e-05, 6.460212171077728e-05, 6.661191582679749e-05, 6.862170994281769e-05, 7.063150405883789e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 12.0, 15.0, 25.0, 41.0, 56.0, 111.0, 201.0, 403.0, 974.0, 2866.0, 14976.0, 218912.0, 750399.0, 50452.0, 6220.0, 1549.0, 640.0, 305.0, 154.0, 100.0, 57.0, 18.0, 23.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35595703125, -0.34336090087890625, -0.3307647705078125, -0.31816864013671875, -0.305572509765625, -0.29297637939453125, -0.2803802490234375, -0.26778411865234375, -0.25518798828125, -0.24259185791015625, -0.2299957275390625, -0.21739959716796875, -0.204803466796875, -0.19220733642578125, -0.1796112060546875, -0.16701507568359375, -0.1544189453125, -0.14182281494140625, -0.1292266845703125, -0.11663055419921875, -0.104034423828125, -0.09143829345703125, -0.0788421630859375, -0.06624603271484375, -0.05364990234375, -0.04105377197265625, -0.0284576416015625, -0.01586151123046875, -0.003265380859375, 0.00933074951171875, 0.0219268798828125, 0.03452301025390625, 0.047119140625, 0.05971527099609375, 0.0723114013671875, 0.08490753173828125, 0.097503662109375, 0.11009979248046875, 0.1226959228515625, 0.13529205322265625, 0.14788818359375, 0.16048431396484375, 0.1730804443359375, 0.18567657470703125, 0.198272705078125, 0.21086883544921875, 0.2234649658203125, 0.23606109619140625, 0.2486572265625, 0.26125335693359375, 0.2738494873046875, 0.28644561767578125, 0.299041748046875, 0.31163787841796875, 0.3242340087890625, 0.33683013916015625, 0.34942626953125, 0.36202239990234375, 0.3746185302734375, 0.38721466064453125, 0.399810791015625, 0.41240692138671875, 0.4250030517578125, 0.43759918212890625, 0.4501953125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 12.0, 20.0, 21.0, 37.0, 41.0, 60.0, 69.0, 106.0, 95.0, 107.0, 105.0, 72.0, 74.0, 58.0, 28.0, 34.0, 13.0, 20.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12646484375, -0.11955642700195312, -0.11264801025390625, -0.10573959350585938, -0.0988311767578125, -0.09192276000976562, -0.08501434326171875, -0.07810592651367188, -0.071197509765625, -0.06428909301757812, -0.05738067626953125, -0.050472259521484375, -0.0435638427734375, -0.036655426025390625, -0.02974700927734375, -0.022838592529296875, -0.01593017578125, -0.009021759033203125, -0.00211334228515625, 0.004795074462890625, 0.0117034912109375, 0.018611907958984375, 0.02552032470703125, 0.032428741455078125, 0.039337158203125, 0.046245574951171875, 0.05315399169921875, 0.060062408447265625, 0.0669708251953125, 0.07387924194335938, 0.08078765869140625, 0.08769607543945312, 0.0946044921875, 0.10151290893554688, 0.10842132568359375, 0.11532974243164062, 0.1222381591796875, 0.12914657592773438, 0.13605499267578125, 0.14296340942382812, 0.149871826171875, 0.15678024291992188, 0.16368865966796875, 0.17059707641601562, 0.1775054931640625, 0.18441390991210938, 0.19132232666015625, 0.19823074340820312, 0.20513916015625, 0.21204757690429688, 0.21895599365234375, 0.22586441040039062, 0.2327728271484375, 0.23968124389648438, 0.24658966064453125, 0.2534980773925781, 0.260406494140625, 0.2673149108886719, 0.27422332763671875, 0.2811317443847656, 0.2880401611328125, 0.2949485778808594, 0.30185699462890625, 0.3087654113769531, 0.315673828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 17.0, 19.0, 56.0, 111.0, 155.0, 233.0, 165.0, 111.0, 63.0, 32.0, 14.0, 11.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.191426753997803, -4.038639545440674, -3.885852575302124, -3.733065366744995, -3.5802783966064453, -3.4274911880493164, -3.2747039794921875, -3.1219170093536377, -2.969130039215088, -2.816342830657959, -2.663555860519409, -2.5107686519622803, -2.3579816818237305, -2.2051944732666016, -2.0524072647094727, -1.8996202945709229, -1.746833086013794, -1.5940459966659546, -1.4412589073181152, -1.2884716987609863, -1.1356847286224365, -0.9828975796699524, -0.8301104307174683, -0.6773233413696289, -0.5245362520217896, -0.3717491626739502, -0.21896204352378845, -0.06617492437362671, 0.08661216497421265, 0.239399254322052, 0.39218640327453613, 0.5449734926223755, 0.6977605819702148, 0.8505476713180542, 1.0033347606658936, 1.1561219692230225, 1.3089089393615723, 1.4616961479187012, 1.6144832372665405, 1.7672703266143799, 1.9200574159622192, 2.0728445053100586, 2.2256317138671875, 2.3784186840057373, 2.531205892562866, 2.683992862701416, 2.836780071258545, 2.989567279815674, 3.1423542499542236, 3.2951414585113525, 3.4479284286499023, 3.6007156372070312, 3.753502607345581, 3.90628981590271, 4.05907678604126, 4.211863994598389, 4.364651203155518, 4.5174384117126465, 4.670225620269775, 4.823012351989746, 4.975799560546875, 5.128586769104004, 5.281373977661133, 5.434161186218262, 5.586947917938232]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 8.0, 8.0, 8.0, 14.0, 13.0, 16.0, 21.0, 23.0, 28.0, 38.0, 34.0, 42.0, 47.0, 46.0, 45.0, 28.0, 49.0, 46.0, 49.0, 48.0, 48.0, 47.0, 43.0, 36.0, 22.0, 23.0, 24.0, 24.0, 26.0, 13.0, 15.0, 12.0, 11.0, 11.0, 10.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1554758548736572, -2.0817110538482666, -2.007946014404297, -1.9341812133789062, -1.8604164123535156, -1.7866514921188354, -1.7128865718841553, -1.6391217708587646, -1.5653568506240845, -1.4915919303894043, -1.4178271293640137, -1.3440622091293335, -1.2702972888946533, -1.1965324878692627, -1.1227675676345825, -1.0490026473999023, -0.9752378463745117, -0.9014729857444763, -0.8277081251144409, -0.7539432048797607, -0.6801783442497253, -0.6064134836196899, -0.5326485633850098, -0.45888370275497437, -0.38511884212493896, -0.31135398149490356, -0.23758909106254578, -0.16382421553134918, -0.09005934000015259, -0.016294479370117188, 0.0574704110622406, 0.1312353014945984, 0.2049999237060547, 0.2787647843360901, 0.3525296747684479, 0.42629456520080566, 0.5000594258308411, 0.5738242864608765, 0.6475892066955566, 0.721354067325592, 0.7951189279556274, 0.8688837885856628, 0.9426486492156982, 1.0164135694503784, 1.0901784896850586, 1.1639432907104492, 1.2377082109451294, 1.3114731311798096, 1.3852379322052002, 1.4590028524398804, 1.532767653465271, 1.6065325736999512, 1.6802973747253418, 1.754062294960022, 1.8278272151947021, 1.9015920162200928, 1.975356936454773, 2.049121856689453, 2.1228866577148438, 2.1966514587402344, 2.270416498184204, 2.3441812992095947, 2.4179461002349854, 2.491711139678955, 2.5654759407043457]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 9.0, 15.0, 34.0, 42.0, 62.0, 84.0, 142.0, 212.0, 337.0, 496.0, 1025.0, 2290.0, 6557.0, 28797.0, 477184.0, 3613937.0, 47457.0, 9776.0, 3171.0, 1263.0, 585.0, 296.0, 172.0, 122.0, 77.0, 44.0, 32.0, 20.0, 7.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.0642852783203125, -1.028961181640625, -0.9936370849609375, -0.95831298828125, -0.9229888916015625, -0.887664794921875, -0.8523406982421875, -0.8170166015625, -0.7816925048828125, -0.746368408203125, -0.7110443115234375, -0.67572021484375, -0.6403961181640625, -0.605072021484375, -0.5697479248046875, -0.534423828125, -0.4990997314453125, -0.463775634765625, -0.4284515380859375, -0.39312744140625, -0.3578033447265625, -0.322479248046875, -0.2871551513671875, -0.2518310546875, -0.2165069580078125, -0.181182861328125, -0.1458587646484375, -0.11053466796875, -0.0752105712890625, -0.039886474609375, -0.0045623779296875, 0.03076171875, 0.0660858154296875, 0.101409912109375, 0.1367340087890625, 0.17205810546875, 0.2073822021484375, 0.242706298828125, 0.2780303955078125, 0.3133544921875, 0.3486785888671875, 0.384002685546875, 0.4193267822265625, 0.45465087890625, 0.4899749755859375, 0.525299072265625, 0.5606231689453125, 0.595947265625, 0.6312713623046875, 0.666595458984375, 0.7019195556640625, 0.73724365234375, 0.7725677490234375, 0.807891845703125, 0.8432159423828125, 0.8785400390625, 0.9138641357421875, 0.949188232421875, 0.9845123291015625, 1.01983642578125, 1.0551605224609375, 1.090484619140625, 1.1258087158203125, 1.1611328125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 9.0, 22.0, 18.0, 33.0, 44.0, 69.0, 82.0, 92.0, 100.0, 101.0, 84.0, 95.0, 74.0, 62.0, 33.0, 25.0, 17.0, 13.0, 7.0, 1.0, 2.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.24013900756835938, -0.23332977294921875, -0.22652053833007812, -0.2197113037109375, -0.21290206909179688, -0.20609283447265625, -0.19928359985351562, -0.192474365234375, -0.18566513061523438, -0.17885589599609375, -0.17204666137695312, -0.1652374267578125, -0.15842819213867188, -0.15161895751953125, -0.14480972290039062, -0.13800048828125, -0.13119125366210938, -0.12438201904296875, -0.11757278442382812, -0.1107635498046875, -0.10395431518554688, -0.09714508056640625, -0.09033584594726562, -0.083526611328125, -0.07671737670898438, -0.06990814208984375, -0.06309890747070312, -0.0562896728515625, -0.049480438232421875, -0.04267120361328125, -0.035861968994140625, -0.029052734375, -0.022243499755859375, -0.01543426513671875, -0.008625030517578125, -0.0018157958984375, 0.004993438720703125, 0.01180267333984375, 0.018611907958984375, 0.025421142578125, 0.032230377197265625, 0.03903961181640625, 0.045848846435546875, 0.0526580810546875, 0.059467315673828125, 0.06627655029296875, 0.07308578491210938, 0.07989501953125, 0.08670425415039062, 0.09351348876953125, 0.10032272338867188, 0.1071319580078125, 0.11394119262695312, 0.12075042724609375, 0.12755966186523438, 0.134368896484375, 0.14117813110351562, 0.14798736572265625, 0.15479660034179688, 0.1616058349609375, 0.16841506958007812, 0.17522430419921875, 0.18203353881835938, 0.1888427734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 2.0, 10.0, 7.0, 12.0, 10.0, 23.0, 25.0, 38.0, 40.0, 74.0, 117.0, 175.0, 336.0, 643.0, 1345.0, 3054.0, 8001.0, 24568.0, 109648.0, 3042572.0, 898884.0, 74372.0, 18743.0, 6517.0, 2560.0, 1134.0, 605.0, 299.0, 163.0, 94.0, 60.0, 38.0, 25.0, 21.0, 14.0, 14.0, 5.0, 10.0, 5.0, 4.0, 3.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.52349853515625, -0.5059814453125, -0.48846435546875, -0.470947265625, -0.45343017578125, -0.4359130859375, -0.41839599609375, -0.40087890625, -0.38336181640625, -0.3658447265625, -0.34832763671875, -0.330810546875, -0.31329345703125, -0.2957763671875, -0.27825927734375, -0.2607421875, -0.24322509765625, -0.2257080078125, -0.20819091796875, -0.190673828125, -0.17315673828125, -0.1556396484375, -0.13812255859375, -0.12060546875, -0.10308837890625, -0.0855712890625, -0.06805419921875, -0.050537109375, -0.03302001953125, -0.0155029296875, 0.00201416015625, 0.01953125, 0.03704833984375, 0.0545654296875, 0.07208251953125, 0.089599609375, 0.10711669921875, 0.1246337890625, 0.14215087890625, 0.15966796875, 0.17718505859375, 0.1947021484375, 0.21221923828125, 0.229736328125, 0.24725341796875, 0.2647705078125, 0.28228759765625, 0.2998046875, 0.31732177734375, 0.3348388671875, 0.35235595703125, 0.369873046875, 0.38739013671875, 0.4049072265625, 0.42242431640625, 0.43994140625, 0.45745849609375, 0.4749755859375, 0.49249267578125, 0.510009765625, 0.52752685546875, 0.5450439453125, 0.56256103515625, 0.580078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 7.0, 4.0, 7.0, 9.0, 10.0, 20.0, 30.0, 38.0, 65.0, 89.0, 167.0, 357.0, 1143.0, 1384.0, 303.0, 156.0, 85.0, 45.0, 38.0, 24.0, 30.0, 21.0, 10.0, 14.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939453125, -0.28578758239746094, -0.2776298522949219, -0.2694721221923828, -0.26131439208984375, -0.2531566619873047, -0.24499893188476562, -0.23684120178222656, -0.2286834716796875, -0.22052574157714844, -0.21236801147460938, -0.2042102813720703, -0.19605255126953125, -0.1878948211669922, -0.17973709106445312, -0.17157936096191406, -0.163421630859375, -0.15526390075683594, -0.14710617065429688, -0.1389484405517578, -0.13079071044921875, -0.12263298034667969, -0.11447525024414062, -0.10631752014160156, -0.0981597900390625, -0.09000205993652344, -0.08184432983398438, -0.07368659973144531, -0.06552886962890625, -0.05737113952636719, -0.049213409423828125, -0.04105567932128906, -0.03289794921875, -0.024740219116210938, -0.016582489013671875, -0.008424758911132812, -0.00026702880859375, 0.007890701293945312, 0.016048431396484375, 0.024206161499023438, 0.0323638916015625, 0.04052162170410156, 0.048679351806640625, 0.05683708190917969, 0.06499481201171875, 0.07315254211425781, 0.08131027221679688, 0.08946800231933594, 0.097625732421875, 0.10578346252441406, 0.11394119262695312, 0.12209892272949219, 0.13025665283203125, 0.1384143829345703, 0.14657211303710938, 0.15472984313964844, 0.1628875732421875, 0.17104530334472656, 0.17920303344726562, 0.1873607635498047, 0.19551849365234375, 0.2036762237548828, 0.21183395385742188, 0.21999168395996094, 0.2281494140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 10.0, 5.0, 30.0, 93.0, 167.0, 276.0, 221.0, 115.0, 38.0, 23.0, 11.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66354501247406, -1.5745261907577515, -1.4855072498321533, -1.3964884281158447, -1.3074696063995361, -1.2184507846832275, -1.1294318437576294, -1.0404130220413208, -0.9513941407203674, -0.8623752593994141, -0.7733564376831055, -0.6843375563621521, -0.5953186750411987, -0.5062998533248901, -0.41728097200393677, -0.3282621502876282, -0.2392432689666748, -0.15022441744804382, -0.06120555102825165, 0.027813315391540527, 0.11683216691017151, 0.2058510184288025, 0.29486989974975586, 0.38388872146606445, 0.4729076027870178, 0.5619264841079712, 0.6509453058242798, 0.7399641871452332, 0.8289830684661865, 0.9180018901824951, 1.0070207118988037, 1.0960395336151123, 1.185058355331421, 1.2740771770477295, 1.3630961179733276, 1.4521149396896362, 1.5411337614059448, 1.630152702331543, 1.7191715240478516, 1.8081903457641602, 1.8972091674804688, 1.9862279891967773, 2.075246810913086, 2.1642656326293945, 2.2532846927642822, 2.342303514480591, 2.4313223361968994, 2.520341157913208, 2.6093602180480957, 2.6983790397644043, 2.787397861480713, 2.8764166831970215, 2.965435743331909, 3.0544545650482178, 3.1434733867645264, 3.232492208480835, 3.3215110301971436, 3.410529851913452, 3.4995486736297607, 3.5885677337646484, 3.677586555480957, 3.7666053771972656, 3.855624198913574, 3.944643020629883, 4.033661842346191]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 1.0, 5.0, 11.0, 10.0, 6.0, 13.0, 12.0, 24.0, 27.0, 27.0, 50.0, 45.0, 48.0, 41.0, 59.0, 59.0, 55.0, 52.0, 57.0, 59.0, 42.0, 48.0, 44.0, 31.0, 37.0, 25.0, 25.0, 18.0, 12.0, 16.0, 14.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8086709380149841, -0.7789427042007446, -0.7492144703865051, -0.7194862365722656, -0.6897580027580261, -0.6600297689437866, -0.6303015947341919, -0.6005733013153076, -0.5708451271057129, -0.5411168932914734, -0.5113886594772339, -0.4816604256629944, -0.4519321918487549, -0.4222039580345154, -0.39247575402259827, -0.36274752020835876, -0.3330192565917969, -0.3032910227775574, -0.27356278896331787, -0.24383457005023956, -0.21410633623600006, -0.18437810242176056, -0.15464988350868225, -0.12492164969444275, -0.09519341588020325, -0.06546518206596375, -0.03573695570230484, -0.006008729338645935, 0.023719504475593567, 0.05344773828983307, 0.08317595720291138, 0.11290419101715088, 0.1426323652267456, 0.1723605990409851, 0.2020888328552246, 0.23181705176830292, 0.2615453004837036, 0.2912735342979431, 0.32100173830986023, 0.35072997212409973, 0.38045820593833923, 0.41018643975257874, 0.43991467356681824, 0.46964287757873535, 0.49937111139297485, 0.5290993452072144, 0.5588275790214539, 0.5885558128356934, 0.6182840466499329, 0.6480122804641724, 0.6777405142784119, 0.7074687480926514, 0.7371969819068909, 0.7669252157211304, 0.7966533899307251, 0.8263816833496094, 0.8561098575592041, 0.8858380913734436, 0.9155663251876831, 0.9452945590019226, 0.9750227928161621, 1.0047509670257568, 1.0344792604446411, 1.0642074346542358, 1.0939357280731201]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 14.0, 9.0, 13.0, 26.0, 33.0, 50.0, 68.0, 114.0, 165.0, 229.0, 417.0, 748.0, 1463.0, 3252.0, 8688.0, 32391.0, 188988.0, 638882.0, 134575.0, 25350.0, 7324.0, 2773.0, 1306.0, 629.0, 386.0, 221.0, 162.0, 91.0, 54.0, 36.0, 24.0, 19.0, 15.0, 14.0, 11.0, 5.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.82470703125, -0.7984542846679688, -0.7722015380859375, -0.7459487915039062, -0.719696044921875, -0.6934432983398438, -0.6671905517578125, -0.6409378051757812, -0.61468505859375, -0.5884323120117188, -0.5621795654296875, -0.5359268188476562, -0.509674072265625, -0.48342132568359375, -0.4571685791015625, -0.43091583251953125, -0.4046630859375, -0.37841033935546875, -0.3521575927734375, -0.32590484619140625, -0.299652099609375, -0.27339935302734375, -0.2471466064453125, -0.22089385986328125, -0.19464111328125, -0.16838836669921875, -0.1421356201171875, -0.11588287353515625, -0.089630126953125, -0.06337738037109375, -0.0371246337890625, -0.01087188720703125, 0.015380859375, 0.04163360595703125, 0.0678863525390625, 0.09413909912109375, 0.120391845703125, 0.14664459228515625, 0.1728973388671875, 0.19915008544921875, 0.22540283203125, 0.25165557861328125, 0.2779083251953125, 0.30416107177734375, 0.330413818359375, 0.35666656494140625, 0.3829193115234375, 0.40917205810546875, 0.4354248046875, 0.46167755126953125, 0.4879302978515625, 0.5141830444335938, 0.540435791015625, 0.5666885375976562, 0.5929412841796875, 0.6191940307617188, 0.64544677734375, 0.6716995239257812, 0.6979522705078125, 0.7242050170898438, 0.750457763671875, 0.7767105102539062, 0.8029632568359375, 0.8292160034179688, 0.85546875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 14.0, 19.0, 31.0, 32.0, 59.0, 94.0, 90.0, 127.0, 121.0, 97.0, 95.0, 68.0, 47.0, 38.0, 27.0, 10.0, 5.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271240234375, -0.2635459899902344, -0.25585174560546875, -0.24815750122070312, -0.2404632568359375, -0.23276901245117188, -0.22507476806640625, -0.21738052368164062, -0.209686279296875, -0.20199203491210938, -0.19429779052734375, -0.18660354614257812, -0.1789093017578125, -0.17121505737304688, -0.16352081298828125, -0.15582656860351562, -0.14813232421875, -0.14043807983398438, -0.13274383544921875, -0.12504959106445312, -0.1173553466796875, -0.10966110229492188, -0.10196685791015625, -0.09427261352539062, -0.086578369140625, -0.07888412475585938, -0.07118988037109375, -0.06349563598632812, -0.0558013916015625, -0.048107147216796875, -0.04041290283203125, -0.032718658447265625, -0.0250244140625, -0.017330169677734375, -0.00963592529296875, -0.001941680908203125, 0.0057525634765625, 0.013446807861328125, 0.02114105224609375, 0.028835296630859375, 0.036529541015625, 0.044223785400390625, 0.05191802978515625, 0.059612274169921875, 0.0673065185546875, 0.07500076293945312, 0.08269500732421875, 0.09038925170898438, 0.09808349609375, 0.10577774047851562, 0.11347198486328125, 0.12116622924804688, 0.1288604736328125, 0.13655471801757812, 0.14424896240234375, 0.15194320678710938, 0.159637451171875, 0.16733169555664062, 0.17502593994140625, 0.18272018432617188, 0.1904144287109375, 0.19810867309570312, 0.20580291748046875, 0.21349716186523438, 0.22119140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 10.0, 19.0, 11.0, 20.0, 29.0, 24.0, 44.0, 51.0, 88.0, 156.0, 211.0, 372.0, 695.0, 1586.0, 4449.0, 15950.0, 82879.0, 484444.0, 377301.0, 60997.0, 12683.0, 3562.0, 1379.0, 616.0, 321.0, 203.0, 118.0, 100.0, 55.0, 40.0, 42.0, 22.0, 13.0, 9.0, 15.0, 7.0, 6.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.61572265625, -0.5964279174804688, -0.5771331787109375, -0.5578384399414062, -0.538543701171875, -0.5192489624023438, -0.4999542236328125, -0.48065948486328125, -0.46136474609375, -0.44207000732421875, -0.4227752685546875, -0.40348052978515625, -0.384185791015625, -0.36489105224609375, -0.3455963134765625, -0.32630157470703125, -0.3070068359375, -0.28771209716796875, -0.2684173583984375, -0.24912261962890625, -0.229827880859375, -0.21053314208984375, -0.1912384033203125, -0.17194366455078125, -0.15264892578125, -0.13335418701171875, -0.1140594482421875, -0.09476470947265625, -0.075469970703125, -0.05617523193359375, -0.0368804931640625, -0.01758575439453125, 0.001708984375, 0.02100372314453125, 0.0402984619140625, 0.05959320068359375, 0.078887939453125, 0.09818267822265625, 0.1174774169921875, 0.13677215576171875, 0.15606689453125, 0.17536163330078125, 0.1946563720703125, 0.21395111083984375, 0.233245849609375, 0.25254058837890625, 0.2718353271484375, 0.29113006591796875, 0.3104248046875, 0.32971954345703125, 0.3490142822265625, 0.36830902099609375, 0.387603759765625, 0.40689849853515625, 0.4261932373046875, 0.44548797607421875, 0.46478271484375, 0.48407745361328125, 0.5033721923828125, 0.5226669311523438, 0.541961669921875, 0.5612564086914062, 0.5805511474609375, 0.5998458862304688, 0.619140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 9.0, 8.0, 17.0, 9.0, 19.0, 17.0, 16.0, 29.0, 19.0, 15.0, 27.0, 37.0, 34.0, 43.0, 41.0, 35.0, 50.0, 38.0, 54.0, 45.0, 46.0, 54.0, 40.0, 32.0, 37.0, 33.0, 33.0, 29.0, 24.0, 22.0, 18.0, 20.0, 10.0, 12.0, 5.0, 10.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37890625, -0.3653297424316406, -0.35175323486328125, -0.3381767272949219, -0.3246002197265625, -0.3110237121582031, -0.29744720458984375, -0.2838706970214844, -0.270294189453125, -0.2567176818847656, -0.24314117431640625, -0.22956466674804688, -0.2159881591796875, -0.20241165161132812, -0.18883514404296875, -0.17525863647460938, -0.16168212890625, -0.14810562133789062, -0.13452911376953125, -0.12095260620117188, -0.1073760986328125, -0.09379959106445312, -0.08022308349609375, -0.06664657592773438, -0.053070068359375, -0.039493560791015625, -0.02591705322265625, -0.012340545654296875, 0.0012359619140625, 0.014812469482421875, 0.02838897705078125, 0.041965484619140625, 0.0555419921875, 0.06911849975585938, 0.08269500732421875, 0.09627151489257812, 0.1098480224609375, 0.12342453002929688, 0.13700103759765625, 0.15057754516601562, 0.164154052734375, 0.17773056030273438, 0.19130706787109375, 0.20488357543945312, 0.2184600830078125, 0.23203659057617188, 0.24561309814453125, 0.2591896057128906, 0.27276611328125, 0.2863426208496094, 0.29991912841796875, 0.3134956359863281, 0.3270721435546875, 0.3406486511230469, 0.35422515869140625, 0.3678016662597656, 0.381378173828125, 0.3949546813964844, 0.40853118896484375, 0.4221076965332031, 0.4356842041015625, 0.4492607116699219, 0.46283721923828125, 0.4764137268066406, 0.489990234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 4.0, 6.0, 11.0, 20.0, 32.0, 97.0, 159.0, 651.0, 5306.0, 1008243.0, 32193.0, 1308.0, 323.0, 97.0, 47.0, 26.0, 11.0, 7.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.078125, -1.0345001220703125, -0.990875244140625, -0.9472503662109375, -0.90362548828125, -0.8600006103515625, -0.816375732421875, -0.7727508544921875, -0.7291259765625, -0.6855010986328125, -0.641876220703125, -0.5982513427734375, -0.55462646484375, -0.5110015869140625, -0.467376708984375, -0.4237518310546875, -0.380126953125, -0.3365020751953125, -0.292877197265625, -0.2492523193359375, -0.20562744140625, -0.1620025634765625, -0.118377685546875, -0.0747528076171875, -0.0311279296875, 0.0124969482421875, 0.056121826171875, 0.0997467041015625, 0.14337158203125, 0.1869964599609375, 0.230621337890625, 0.2742462158203125, 0.31787109375, 0.3614959716796875, 0.405120849609375, 0.4487457275390625, 0.49237060546875, 0.5359954833984375, 0.579620361328125, 0.6232452392578125, 0.6668701171875, 0.7104949951171875, 0.754119873046875, 0.7977447509765625, 0.84136962890625, 0.8849945068359375, 0.928619384765625, 0.9722442626953125, 1.015869140625, 1.0594940185546875, 1.103118896484375, 1.1467437744140625, 1.19036865234375, 1.2339935302734375, 1.277618408203125, 1.3212432861328125, 1.3648681640625, 1.4084930419921875, 1.452117919921875, 1.4957427978515625, 1.53936767578125, 1.5829925537109375, 1.626617431640625, 1.6702423095703125, 1.7138671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 9.0, 17.0, 30.0, 62.0, 88.0, 213.0, 265.0, 163.0, 74.0, 27.0, 14.0, 18.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019884109497070312, -0.0001941230148077011, -0.0001894049346446991, -0.00018468685448169708, -0.00017996877431869507, -0.00017525069415569305, -0.00017053261399269104, -0.00016581453382968903, -0.000161096453666687, -0.000156378373503685, -0.00015166029334068298, -0.00014694221317768097, -0.00014222413301467896, -0.00013750605285167694, -0.00013278797268867493, -0.0001280698925256729, -0.0001233518123626709, -0.00011863373219966888, -0.00011391565203666687, -0.00010919757187366486, -0.00010447949171066284, -9.976141154766083e-05, -9.504333138465881e-05, -9.03252512216568e-05, -8.560717105865479e-05, -8.088909089565277e-05, -7.617101073265076e-05, -7.145293056964874e-05, -6.673485040664673e-05, -6.201677024364471e-05, -5.72986900806427e-05, -5.2580609917640686e-05, -4.786252975463867e-05, -4.314444959163666e-05, -3.8426369428634644e-05, -3.370828926563263e-05, -2.8990209102630615e-05, -2.42721289396286e-05, -1.9554048776626587e-05, -1.4835968613624573e-05, -1.0117888450622559e-05, -5.3998082876205444e-06, -6.817281246185303e-07, 4.036352038383484e-06, 8.754432201385498e-06, 1.3472512364387512e-05, 1.8190592527389526e-05, 2.290867269039154e-05, 2.7626752853393555e-05, 3.234483301639557e-05, 3.706291317939758e-05, 4.17809933423996e-05, 4.649907350540161e-05, 5.1217153668403625e-05, 5.593523383140564e-05, 6.0653313994407654e-05, 6.537139415740967e-05, 7.008947432041168e-05, 7.48075544834137e-05, 7.952563464641571e-05, 8.424371480941772e-05, 8.896179497241974e-05, 9.367987513542175e-05, 9.839795529842377e-05, 0.00010311603546142578]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 13.0, 24.0, 27.0, 80.0, 173.0, 411.0, 2444.0, 841682.0, 201377.0, 1663.0, 329.0, 162.0, 79.0, 36.0, 15.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7578125, -1.7102203369140625, -1.662628173828125, -1.6150360107421875, -1.56744384765625, -1.5198516845703125, -1.472259521484375, -1.4246673583984375, -1.3770751953125, -1.3294830322265625, -1.281890869140625, -1.2342987060546875, -1.18670654296875, -1.1391143798828125, -1.091522216796875, -1.0439300537109375, -0.996337890625, -0.9487457275390625, -0.901153564453125, -0.8535614013671875, -0.80596923828125, -0.7583770751953125, -0.710784912109375, -0.6631927490234375, -0.6156005859375, -0.5680084228515625, -0.520416259765625, -0.4728240966796875, -0.42523193359375, -0.3776397705078125, -0.330047607421875, -0.2824554443359375, -0.23486328125, -0.1872711181640625, -0.139678955078125, -0.0920867919921875, -0.04449462890625, 0.0030975341796875, 0.050689697265625, 0.0982818603515625, 0.1458740234375, 0.1934661865234375, 0.241058349609375, 0.2886505126953125, 0.33624267578125, 0.3838348388671875, 0.431427001953125, 0.4790191650390625, 0.526611328125, 0.5742034912109375, 0.621795654296875, 0.6693878173828125, 0.71697998046875, 0.7645721435546875, 0.812164306640625, 0.8597564697265625, 0.9073486328125, 0.9549407958984375, 1.002532958984375, 1.0501251220703125, 1.09771728515625, 1.1453094482421875, 1.192901611328125, 1.2404937744140625, 1.2880859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 13.0, 17.0, 63.0, 171.0, 440.0, 202.0, 66.0, 18.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8994140625, -0.874786376953125, -0.85015869140625, -0.825531005859375, -0.8009033203125, -0.776275634765625, -0.75164794921875, -0.727020263671875, -0.702392578125, -0.677764892578125, -0.65313720703125, -0.628509521484375, -0.6038818359375, -0.579254150390625, -0.55462646484375, -0.529998779296875, -0.50537109375, -0.480743408203125, -0.45611572265625, -0.431488037109375, -0.4068603515625, -0.382232666015625, -0.35760498046875, -0.332977294921875, -0.308349609375, -0.283721923828125, -0.25909423828125, -0.234466552734375, -0.2098388671875, -0.185211181640625, -0.16058349609375, -0.135955810546875, -0.111328125, -0.086700439453125, -0.06207275390625, -0.037445068359375, -0.0128173828125, 0.011810302734375, 0.03643798828125, 0.061065673828125, 0.085693359375, 0.110321044921875, 0.13494873046875, 0.159576416015625, 0.1842041015625, 0.208831787109375, 0.23345947265625, 0.258087158203125, 0.28271484375, 0.307342529296875, 0.33197021484375, 0.356597900390625, 0.3812255859375, 0.405853271484375, 0.43048095703125, 0.455108642578125, 0.479736328125, 0.504364013671875, 0.52899169921875, 0.553619384765625, 0.5782470703125, 0.602874755859375, 0.62750244140625, 0.652130126953125, 0.6767578125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 11.0, 22.0, 102.0, 303.0, 319.0, 182.0, 46.0, 13.0, 4.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.225072860717773, -9.93333625793457, -9.641600608825684, -9.34986400604248, -9.058128356933594, -8.76639175415039, -8.474655151367188, -8.1829195022583, -7.891182899475098, -7.599446773529053, -7.307710647583008, -7.015974044799805, -6.72423791885376, -6.432501792907715, -6.14076566696167, -5.849029541015625, -5.55729341506958, -5.265557289123535, -4.97382116317749, -4.682085037231445, -4.390348434448242, -4.098612308502197, -3.8068761825561523, -3.5151398181915283, -3.2234036922454834, -2.9316675662994385, -2.6399312019348145, -2.3481950759887695, -2.0564589500427246, -1.7647225856781006, -1.4729864597320557, -1.1812500953674316, -0.8895139694213867, -0.5977777242660522, -0.30604153871536255, -0.014305353164672852, 0.2774308919906616, 0.5691671371459961, 0.860903263092041, 1.152639627456665, 1.44437575340271, 1.7361119985580444, 2.027848243713379, 2.319584369659424, 2.6113204956054688, 2.9030568599700928, 3.1947929859161377, 3.4865293502807617, 3.7782654762268066, 4.070001602172852, 4.3617377281188965, 4.653473854064941, 4.9452104568481445, 5.2369465827941895, 5.528682708740234, 5.8204193115234375, 6.112154960632324, 6.403891086578369, 6.695627212524414, 6.987363815307617, 7.279099941253662, 7.570836067199707, 7.862572193145752, 8.154308319091797, 8.446044921875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 3.0, 6.0, 8.0, 16.0, 16.0, 12.0, 12.0, 25.0, 19.0, 16.0, 18.0, 27.0, 32.0, 37.0, 45.0, 35.0, 49.0, 34.0, 40.0, 49.0, 42.0, 41.0, 33.0, 46.0, 44.0, 37.0, 29.0, 30.0, 35.0, 28.0, 22.0, 22.0, 14.0, 16.0, 11.0, 11.0, 6.0, 10.0, 7.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.5423927307128906, -2.471569538116455, -2.4007463455200195, -2.329922914505005, -2.2590997219085693, -2.188276529312134, -2.1174533367156982, -2.0466301441192627, -1.9758068323135376, -1.904983639717102, -1.834160327911377, -1.7633371353149414, -1.6925139427185059, -1.6216906309127808, -1.5508674383163452, -1.4800441265106201, -1.4092209339141846, -1.338397741317749, -1.267574429512024, -1.1967512369155884, -1.1259279251098633, -1.0551047325134277, -0.9842815399169922, -0.9134582877159119, -0.8426350355148315, -0.7718117833137512, -0.7009885311126709, -0.6301653385162354, -0.559342086315155, -0.4885188341140747, -0.4176956117153168, -0.34687238931655884, -0.2760488986968994, -0.20522566139698029, -0.13440242409706116, -0.06357918679714203, 0.0072440505027771, 0.07806730270385742, 0.14889052510261536, 0.2197137475013733, 0.2905369997024536, 0.36136025190353394, 0.43218347430229187, 0.5030066967010498, 0.5738299489021301, 0.6446532011032104, 0.715476393699646, 0.7862996459007263, 0.8571228981018066, 0.927946150302887, 0.9987694025039673, 1.0695925951004028, 1.140415906906128, 1.2112390995025635, 1.282062292098999, 1.3528854846954346, 1.4237087965011597, 1.4945319890975952, 1.5653553009033203, 1.6361784934997559, 1.7070016860961914, 1.7778249979019165, 1.848648190498352, 1.9194715023040771, 1.9902946949005127]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 9.0, 16.0, 18.0, 28.0, 47.0, 60.0, 70.0, 99.0, 167.0, 238.0, 374.0, 594.0, 1148.0, 2502.0, 7198.0, 28234.0, 510631.0, 3585873.0, 40956.0, 9626.0, 3231.0, 1310.0, 742.0, 375.0, 269.0, 130.0, 117.0, 60.0, 39.0, 23.0, 26.0, 18.0, 14.0, 3.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8349609375, -0.8041534423828125, -0.773345947265625, -0.7425384521484375, -0.71173095703125, -0.6809234619140625, -0.650115966796875, -0.6193084716796875, -0.5885009765625, -0.5576934814453125, -0.526885986328125, -0.4960784912109375, -0.46527099609375, -0.4344635009765625, -0.403656005859375, -0.3728485107421875, -0.342041015625, -0.3112335205078125, -0.280426025390625, -0.2496185302734375, -0.21881103515625, -0.1880035400390625, -0.157196044921875, -0.1263885498046875, -0.0955810546875, -0.0647735595703125, -0.033966064453125, -0.0031585693359375, 0.02764892578125, 0.0584564208984375, 0.089263916015625, 0.1200714111328125, 0.15087890625, 0.1816864013671875, 0.212493896484375, 0.2433013916015625, 0.27410888671875, 0.3049163818359375, 0.335723876953125, 0.3665313720703125, 0.3973388671875, 0.4281463623046875, 0.458953857421875, 0.4897613525390625, 0.52056884765625, 0.5513763427734375, 0.582183837890625, 0.6129913330078125, 0.643798828125, 0.6746063232421875, 0.705413818359375, 0.7362213134765625, 0.76702880859375, 0.7978363037109375, 0.828643798828125, 0.8594512939453125, 0.8902587890625, 0.9210662841796875, 0.951873779296875, 0.9826812744140625, 1.01348876953125, 1.0442962646484375, 1.075103759765625, 1.1059112548828125, 1.13671875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 9.0, 19.0, 34.0, 46.0, 70.0, 78.0, 96.0, 121.0, 116.0, 92.0, 94.0, 66.0, 50.0, 48.0, 15.0, 11.0, 9.0, 6.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2777442932128906, -0.26935577392578125, -0.2609672546386719, -0.2525787353515625, -0.24419021606445312, -0.23580169677734375, -0.22741317749023438, -0.219024658203125, -0.21063613891601562, -0.20224761962890625, -0.19385910034179688, -0.1854705810546875, -0.17708206176757812, -0.16869354248046875, -0.16030502319335938, -0.15191650390625, -0.14352798461914062, -0.13513946533203125, -0.12675094604492188, -0.1183624267578125, -0.10997390747070312, -0.10158538818359375, -0.09319686889648438, -0.084808349609375, -0.07641983032226562, -0.06803131103515625, -0.059642791748046875, -0.0512542724609375, -0.042865753173828125, -0.03447723388671875, -0.026088714599609375, -0.0177001953125, -0.009311676025390625, -0.00092315673828125, 0.007465362548828125, 0.0158538818359375, 0.024242401123046875, 0.03263092041015625, 0.041019439697265625, 0.049407958984375, 0.057796478271484375, 0.06618499755859375, 0.07457351684570312, 0.0829620361328125, 0.09135055541992188, 0.09973907470703125, 0.10812759399414062, 0.11651611328125, 0.12490463256835938, 0.13329315185546875, 0.14168167114257812, 0.1500701904296875, 0.15845870971679688, 0.16684722900390625, 0.17523574829101562, 0.183624267578125, 0.19201278686523438, 0.20040130615234375, 0.20878982543945312, 0.2171783447265625, 0.22556686401367188, 0.23395538330078125, 0.24234390258789062, 0.250732421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 5.0, 9.0, 19.0, 11.0, 12.0, 39.0, 33.0, 38.0, 64.0, 96.0, 108.0, 151.0, 221.0, 527.0, 2729.0, 57911.0, 4111878.0, 17726.0, 1455.0, 381.0, 225.0, 158.0, 113.0, 79.0, 78.0, 39.0, 32.0, 35.0, 28.0, 26.0, 20.0, 5.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7666015625, -1.6909637451171875, -1.615325927734375, -1.5396881103515625, -1.46405029296875, -1.3884124755859375, -1.312774658203125, -1.2371368408203125, -1.1614990234375, -1.0858612060546875, -1.010223388671875, -0.9345855712890625, -0.85894775390625, -0.7833099365234375, -0.707672119140625, -0.6320343017578125, -0.556396484375, -0.4807586669921875, -0.405120849609375, -0.3294830322265625, -0.25384521484375, -0.1782073974609375, -0.102569580078125, -0.0269317626953125, 0.0487060546875, 0.1243438720703125, 0.199981689453125, 0.2756195068359375, 0.35125732421875, 0.4268951416015625, 0.502532958984375, 0.5781707763671875, 0.65380859375, 0.7294464111328125, 0.805084228515625, 0.8807220458984375, 0.95635986328125, 1.0319976806640625, 1.107635498046875, 1.1832733154296875, 1.2589111328125, 1.3345489501953125, 1.410186767578125, 1.4858245849609375, 1.56146240234375, 1.6371002197265625, 1.712738037109375, 1.7883758544921875, 1.864013671875, 1.9396514892578125, 2.015289306640625, 2.0909271240234375, 2.16656494140625, 2.2422027587890625, 2.317840576171875, 2.3934783935546875, 2.4691162109375, 2.5447540283203125, 2.620391845703125, 2.6960296630859375, 2.77166748046875, 2.8473052978515625, 2.922943115234375, 2.9985809326171875, 3.07421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 20.0, 37.0, 96.0, 416.0, 3233.0, 182.0, 48.0, 19.0, 10.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26611328125, -0.24033355712890625, -0.2145538330078125, -0.18877410888671875, -0.162994384765625, -0.13721466064453125, -0.1114349365234375, -0.08565521240234375, -0.05987548828125, -0.03409576416015625, -0.0083160400390625, 0.01746368408203125, 0.043243408203125, 0.06902313232421875, 0.0948028564453125, 0.12058258056640625, 0.1463623046875, 0.17214202880859375, 0.1979217529296875, 0.22370147705078125, 0.249481201171875, 0.27526092529296875, 0.3010406494140625, 0.32682037353515625, 0.35260009765625, 0.37837982177734375, 0.4041595458984375, 0.42993927001953125, 0.455718994140625, 0.48149871826171875, 0.5072784423828125, 0.5330581665039062, 0.558837890625, 0.5846176147460938, 0.6103973388671875, 0.6361770629882812, 0.661956787109375, 0.6877365112304688, 0.7135162353515625, 0.7392959594726562, 0.76507568359375, 0.7908554077148438, 0.8166351318359375, 0.8424148559570312, 0.868194580078125, 0.8939743041992188, 0.9197540283203125, 0.9455337524414062, 0.9713134765625, 0.9970932006835938, 1.0228729248046875, 1.0486526489257812, 1.074432373046875, 1.1002120971679688, 1.1259918212890625, 1.1517715454101562, 1.17755126953125, 1.2033309936523438, 1.2291107177734375, 1.2548904418945312, 1.280670166015625, 1.3064498901367188, 1.3322296142578125, 1.3580093383789062, 1.3837890625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 35.0, 93.0, 480.0, 314.0, 50.0, 9.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.217049598693848, -9.024659156799316, -8.832267761230469, -8.639877319335938, -8.447486877441406, -8.255096435546875, -8.062705039978027, -7.870314598083496, -7.677923679351807, -7.485532760620117, -7.293142318725586, -7.1007513999938965, -6.908360958099365, -6.715970039367676, -6.5235795974731445, -6.331188678741455, -6.138797760009766, -5.946406841278076, -5.754016399383545, -5.5616254806518555, -5.369235038757324, -5.176844120025635, -4.984453201293945, -4.792062759399414, -4.599672317504883, -4.407281398773193, -4.214890956878662, -4.022500038146973, -3.8301093578338623, -3.637718677520752, -3.4453279972076416, -3.2529373168945312, -3.060546398162842, -2.8681557178497314, -2.675765037536621, -2.4833741188049316, -2.2909834384918213, -2.098592758178711, -1.9062020778656006, -1.7138112783432007, -1.5214205980300903, -1.32902991771698, -1.13663911819458, -0.9442484378814697, -0.7518576979637146, -0.5594669580459595, -0.3670762777328491, -0.17468547821044922, 0.017705202102661133, 0.21009592711925507, 0.402486652135849, 0.5948773622512817, 0.7872681021690369, 0.979658842086792, 1.1720495223999023, 1.3644403219223022, 1.5568310022354126, 1.749221682548523, 1.9416124820709229, 2.134003162384033, 2.3263938426971436, 2.518784523010254, 2.7111754417419434, 2.9035661220550537, 3.095956802368164]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 5.0, 6.0, 12.0, 25.0, 30.0, 45.0, 63.0, 71.0, 102.0, 95.0, 111.0, 103.0, 82.0, 83.0, 52.0, 43.0, 23.0, 12.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.7313365936279297, -2.6597084999084473, -2.588080406188965, -2.5164523124694824, -2.44482421875, -2.3731958866119385, -2.301567792892456, -2.2299396991729736, -2.158311605453491, -2.086683511734009, -2.0150554180145264, -1.9434272050857544, -1.871799111366272, -1.8001710176467896, -1.7285428047180176, -1.6569147109985352, -1.5852866172790527, -1.5136585235595703, -1.442030429840088, -1.370402216911316, -1.2987741231918335, -1.227146029472351, -1.155517816543579, -1.0838897228240967, -1.0122616291046143, -0.9406335353851318, -0.8690053820610046, -0.7973772287368774, -0.725749135017395, -0.6541210412979126, -0.5824928879737854, -0.5108647346496582, -0.43923652172088623, -0.3676083981990814, -0.2959802746772766, -0.2243521511554718, -0.152724027633667, -0.08109590411186218, -0.009467780590057373, 0.062160372734069824, 0.13378846645355225, 0.20541658997535706, 0.27704471349716187, 0.3486728370189667, 0.4203009605407715, 0.4919290840625763, 0.5635572075843811, 0.6351853609085083, 0.7068134546279907, 0.7784415483474731, 0.8500697016716003, 0.9216978549957275, 0.99332594871521, 1.0649540424346924, 1.1365821361541748, 1.2082103490829468, 1.2798384428024292, 1.3514665365219116, 1.4230947494506836, 1.494722843170166, 1.5663509368896484, 1.6379790306091309, 1.7096071243286133, 1.7812353372573853, 1.8528634309768677]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 8.0, 7.0, 10.0, 30.0, 42.0, 80.0, 179.0, 377.0, 926.0, 2734.0, 11834.0, 127020.0, 801689.0, 90394.0, 9367.0, 2351.0, 856.0, 340.0, 152.0, 81.0, 41.0, 18.0, 11.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4521484375, -1.408721923828125, -1.36529541015625, -1.321868896484375, -1.2784423828125, -1.235015869140625, -1.19158935546875, -1.148162841796875, -1.104736328125, -1.061309814453125, -1.01788330078125, -0.974456787109375, -0.9310302734375, -0.887603759765625, -0.84417724609375, -0.800750732421875, -0.75732421875, -0.713897705078125, -0.67047119140625, -0.627044677734375, -0.5836181640625, -0.540191650390625, -0.49676513671875, -0.453338623046875, -0.409912109375, -0.366485595703125, -0.32305908203125, -0.279632568359375, -0.2362060546875, -0.192779541015625, -0.14935302734375, -0.105926513671875, -0.0625, -0.019073486328125, 0.02435302734375, 0.067779541015625, 0.1112060546875, 0.154632568359375, 0.19805908203125, 0.241485595703125, 0.284912109375, 0.328338623046875, 0.37176513671875, 0.415191650390625, 0.4586181640625, 0.502044677734375, 0.54547119140625, 0.588897705078125, 0.63232421875, 0.675750732421875, 0.71917724609375, 0.762603759765625, 0.8060302734375, 0.849456787109375, 0.89288330078125, 0.936309814453125, 0.979736328125, 1.023162841796875, 1.06658935546875, 1.110015869140625, 1.1534423828125, 1.196868896484375, 1.24029541015625, 1.283721923828125, 1.3271484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 1.0, 6.0, 10.0, 33.0, 24.0, 64.0, 81.0, 76.0, 118.0, 122.0, 105.0, 100.0, 84.0, 55.0, 47.0, 22.0, 20.0, 12.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.321044921875, -0.3115119934082031, -0.30197906494140625, -0.2924461364746094, -0.2829132080078125, -0.2733802795410156, -0.26384735107421875, -0.2543144226074219, -0.244781494140625, -0.23524856567382812, -0.22571563720703125, -0.21618270874023438, -0.2066497802734375, -0.19711685180664062, -0.18758392333984375, -0.17805099487304688, -0.16851806640625, -0.15898513793945312, -0.14945220947265625, -0.13991928100585938, -0.1303863525390625, -0.12085342407226562, -0.11132049560546875, -0.10178756713867188, -0.092254638671875, -0.08272171020507812, -0.07318878173828125, -0.06365585327148438, -0.0541229248046875, -0.044589996337890625, -0.03505706787109375, -0.025524139404296875, -0.0159912109375, -0.006458282470703125, 0.00307464599609375, 0.012607574462890625, 0.0221405029296875, 0.031673431396484375, 0.04120635986328125, 0.050739288330078125, 0.060272216796875, 0.06980514526367188, 0.07933807373046875, 0.08887100219726562, 0.0984039306640625, 0.10793685913085938, 0.11746978759765625, 0.12700271606445312, 0.13653564453125, 0.14606857299804688, 0.15560150146484375, 0.16513442993164062, 0.1746673583984375, 0.18420028686523438, 0.19373321533203125, 0.20326614379882812, 0.212799072265625, 0.22233200073242188, 0.23186492919921875, 0.24139785766601562, 0.2509307861328125, 0.2604637145996094, 0.26999664306640625, 0.2795295715332031, 0.2890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 10.0, 7.0, 12.0, 22.0, 36.0, 44.0, 58.0, 96.0, 173.0, 273.0, 532.0, 1318.0, 3694.0, 12156.0, 49471.0, 246758.0, 550338.0, 141330.0, 29811.0, 7858.0, 2537.0, 960.0, 431.0, 224.0, 118.0, 81.0, 68.0, 44.0, 25.0, 22.0, 17.0, 5.0, 7.0, 4.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.6115798950195312, -0.5937652587890625, -0.5759506225585938, -0.558135986328125, -0.5403213500976562, -0.5225067138671875, -0.5046920776367188, -0.48687744140625, -0.46906280517578125, -0.4512481689453125, -0.43343353271484375, -0.415618896484375, -0.39780426025390625, -0.3799896240234375, -0.36217498779296875, -0.3443603515625, -0.32654571533203125, -0.3087310791015625, -0.29091644287109375, -0.273101806640625, -0.25528717041015625, -0.2374725341796875, -0.21965789794921875, -0.20184326171875, -0.18402862548828125, -0.1662139892578125, -0.14839935302734375, -0.130584716796875, -0.11277008056640625, -0.0949554443359375, -0.07714080810546875, -0.059326171875, -0.04151153564453125, -0.0236968994140625, -0.00588226318359375, 0.011932373046875, 0.02974700927734375, 0.0475616455078125, 0.06537628173828125, 0.08319091796875, 0.10100555419921875, 0.1188201904296875, 0.13663482666015625, 0.154449462890625, 0.17226409912109375, 0.1900787353515625, 0.20789337158203125, 0.2257080078125, 0.24352264404296875, 0.2613372802734375, 0.27915191650390625, 0.296966552734375, 0.31478118896484375, 0.3325958251953125, 0.35041046142578125, 0.36822509765625, 0.38603973388671875, 0.4038543701171875, 0.42166900634765625, 0.439483642578125, 0.45729827880859375, 0.4751129150390625, 0.49292755126953125, 0.5107421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 14.0, 13.0, 9.0, 14.0, 24.0, 31.0, 21.0, 36.0, 41.0, 26.0, 43.0, 43.0, 40.0, 39.0, 51.0, 42.0, 52.0, 43.0, 44.0, 53.0, 36.0, 27.0, 30.0, 34.0, 29.0, 29.0, 25.0, 20.0, 16.0, 15.0, 14.0, 8.0, 7.0, 9.0, 6.0, 3.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.484222412109375, -0.46917724609375, -0.454132080078125, -0.4390869140625, -0.424041748046875, -0.40899658203125, -0.393951416015625, -0.37890625, -0.363861083984375, -0.34881591796875, -0.333770751953125, -0.3187255859375, -0.303680419921875, -0.28863525390625, -0.273590087890625, -0.258544921875, -0.243499755859375, -0.22845458984375, -0.213409423828125, -0.1983642578125, -0.183319091796875, -0.16827392578125, -0.153228759765625, -0.13818359375, -0.123138427734375, -0.10809326171875, -0.093048095703125, -0.0780029296875, -0.062957763671875, -0.04791259765625, -0.032867431640625, -0.017822265625, -0.002777099609375, 0.01226806640625, 0.027313232421875, 0.0423583984375, 0.057403564453125, 0.07244873046875, 0.087493896484375, 0.1025390625, 0.117584228515625, 0.13262939453125, 0.147674560546875, 0.1627197265625, 0.177764892578125, 0.19281005859375, 0.207855224609375, 0.222900390625, 0.237945556640625, 0.25299072265625, 0.268035888671875, 0.2830810546875, 0.298126220703125, 0.31317138671875, 0.328216552734375, 0.34326171875, 0.358306884765625, 0.37335205078125, 0.388397216796875, 0.4034423828125, 0.418487548828125, 0.43353271484375, 0.448577880859375, 0.463623046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 17.0, 18.0, 30.0, 79.0, 129.0, 268.0, 608.0, 1773.0, 5763.0, 30109.0, 266830.0, 643936.0, 81997.0, 12207.0, 2951.0, 1008.0, 400.0, 184.0, 95.0, 55.0, 25.0, 18.0, 13.0, 8.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.17286109924316406, -0.16542434692382812, -0.1579875946044922, -0.15055084228515625, -0.1431140899658203, -0.13567733764648438, -0.12824058532714844, -0.1208038330078125, -0.11336708068847656, -0.10593032836914062, -0.09849357604980469, -0.09105682373046875, -0.08362007141113281, -0.07618331909179688, -0.06874656677246094, -0.061309814453125, -0.05387306213378906, -0.046436309814453125, -0.03899955749511719, -0.03156280517578125, -0.024126052856445312, -0.016689300537109375, -0.009252548217773438, -0.0018157958984375, 0.0056209564208984375, 0.013057708740234375, 0.020494461059570312, 0.02793121337890625, 0.03536796569824219, 0.042804718017578125, 0.05024147033691406, 0.05767822265625, 0.06511497497558594, 0.07255172729492188, 0.07998847961425781, 0.08742523193359375, 0.09486198425292969, 0.10229873657226562, 0.10973548889160156, 0.1171722412109375, 0.12460899353027344, 0.13204574584960938, 0.1394824981689453, 0.14691925048828125, 0.1543560028076172, 0.16179275512695312, 0.16922950744628906, 0.176666259765625, 0.18410301208496094, 0.19153976440429688, 0.1989765167236328, 0.20641326904296875, 0.2138500213623047, 0.22128677368164062, 0.22872352600097656, 0.2361602783203125, 0.24359703063964844, 0.2510337829589844, 0.2584705352783203, 0.26590728759765625, 0.2733440399169922, 0.2807807922363281, 0.28821754455566406, 0.295654296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 0.0, 10.0, 13.0, 13.0, 28.0, 33.0, 52.0, 98.0, 177.0, 189.0, 151.0, 83.0, 50.0, 30.0, 17.0, 14.0, 9.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010573863983154297, -0.00010226946324110031, -9.880028665065765e-05, -9.5331110060215e-05, -9.186193346977234e-05, -8.839275687932968e-05, -8.492358028888702e-05, -8.145440369844437e-05, -7.798522710800171e-05, -7.451605051755905e-05, -7.10468739271164e-05, -6.757769733667374e-05, -6.410852074623108e-05, -6.063934415578842e-05, -5.7170167565345764e-05, -5.370099097490311e-05, -5.023181438446045e-05, -4.676263779401779e-05, -4.3293461203575134e-05, -3.982428461313248e-05, -3.635510802268982e-05, -3.288593143224716e-05, -2.9416754841804504e-05, -2.5947578251361847e-05, -2.247840166091919e-05, -1.9009225070476532e-05, -1.5540048480033875e-05, -1.2070871889591217e-05, -8.60169529914856e-06, -5.132518708705902e-06, -1.6633421182632446e-06, 1.8058344721794128e-06, 5.27501106262207e-06, 8.744187653064728e-06, 1.2213364243507385e-05, 1.5682540833950043e-05, 1.91517174243927e-05, 2.2620894014835358e-05, 2.6090070605278015e-05, 2.9559247195720673e-05, 3.302842378616333e-05, 3.649760037660599e-05, 3.9966776967048645e-05, 4.34359535574913e-05, 4.690513014793396e-05, 5.037430673837662e-05, 5.3843483328819275e-05, 5.731265991926193e-05, 6.078183650970459e-05, 6.425101310014725e-05, 6.77201896905899e-05, 7.118936628103256e-05, 7.465854287147522e-05, 7.812771946191788e-05, 8.159689605236053e-05, 8.506607264280319e-05, 8.853524923324585e-05, 9.200442582368851e-05, 9.547360241413116e-05, 9.894277900457382e-05, 0.00010241195559501648, 0.00010588113218545914, 0.0001093503087759018, 0.00011281948536634445, 0.00011628866195678711]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 10.0, 10.0, 12.0, 12.0, 27.0, 40.0, 50.0, 84.0, 148.0, 216.0, 377.0, 657.0, 1121.0, 2381.0, 6229.0, 21410.0, 114416.0, 637456.0, 214248.0, 34253.0, 8807.0, 3239.0, 1462.0, 754.0, 423.0, 257.0, 146.0, 93.0, 66.0, 46.0, 30.0, 14.0, 21.0, 11.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2191162109375, -0.21279335021972656, -0.20647048950195312, -0.2001476287841797, -0.19382476806640625, -0.1875019073486328, -0.18117904663085938, -0.17485618591308594, -0.1685333251953125, -0.16221046447753906, -0.15588760375976562, -0.1495647430419922, -0.14324188232421875, -0.1369190216064453, -0.13059616088867188, -0.12427330017089844, -0.117950439453125, -0.11162757873535156, -0.10530471801757812, -0.09898185729980469, -0.09265899658203125, -0.08633613586425781, -0.08001327514648438, -0.07369041442871094, -0.0673675537109375, -0.06104469299316406, -0.054721832275390625, -0.04839897155761719, -0.04207611083984375, -0.03575325012207031, -0.029430389404296875, -0.023107528686523438, -0.01678466796875, -0.010461807250976562, -0.004138946533203125, 0.0021839141845703125, 0.00850677490234375, 0.014829635620117188, 0.021152496337890625, 0.027475357055664062, 0.0337982177734375, 0.04012107849121094, 0.046443939208984375, 0.05276679992675781, 0.05908966064453125, 0.06541252136230469, 0.07173538208007812, 0.07805824279785156, 0.084381103515625, 0.09070396423339844, 0.09702682495117188, 0.10334968566894531, 0.10967254638671875, 0.11599540710449219, 0.12231826782226562, 0.12864112854003906, 0.1349639892578125, 0.14128684997558594, 0.14760971069335938, 0.1539325714111328, 0.16025543212890625, 0.1665782928466797, 0.17290115356445312, 0.17922401428222656, 0.185546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 10.0, 5.0, 16.0, 25.0, 41.0, 63.0, 76.0, 129.0, 161.0, 145.0, 105.0, 77.0, 52.0, 40.0, 18.0, 8.0, 10.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2989997863769531, -0.29111480712890625, -0.2832298278808594, -0.2753448486328125, -0.2674598693847656, -0.25957489013671875, -0.2516899108886719, -0.243804931640625, -0.23591995239257812, -0.22803497314453125, -0.22014999389648438, -0.2122650146484375, -0.20438003540039062, -0.19649505615234375, -0.18861007690429688, -0.18072509765625, -0.17284011840820312, -0.16495513916015625, -0.15707015991210938, -0.1491851806640625, -0.14130020141601562, -0.13341522216796875, -0.12553024291992188, -0.117645263671875, -0.10976028442382812, -0.10187530517578125, -0.09399032592773438, -0.0861053466796875, -0.07822036743164062, -0.07033538818359375, -0.062450408935546875, -0.0545654296875, -0.046680450439453125, -0.03879547119140625, -0.030910491943359375, -0.0230255126953125, -0.015140533447265625, -0.00725555419921875, 0.000629425048828125, 0.008514404296875, 0.016399383544921875, 0.02428436279296875, 0.032169342041015625, 0.0400543212890625, 0.047939300537109375, 0.05582427978515625, 0.06370925903320312, 0.07159423828125, 0.07947921752929688, 0.08736419677734375, 0.09524917602539062, 0.1031341552734375, 0.11101913452148438, 0.11890411376953125, 0.12678909301757812, 0.134674072265625, 0.14255905151367188, 0.15044403076171875, 0.15832901000976562, 0.1662139892578125, 0.17409896850585938, 0.18198394775390625, 0.18986892700195312, 0.19775390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 19.0, 58.0, 280.0, 413.0, 171.0, 54.0, 10.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-17.599308013916016, -17.281082153320312, -16.962854385375977, -16.644628524780273, -16.326400756835938, -16.008174896240234, -15.689948081970215, -15.371721267700195, -15.053495407104492, -14.735268592834473, -14.417041778564453, -14.09881591796875, -13.78058910369873, -13.462362289428711, -13.144135475158691, -12.825908660888672, -12.507682800292969, -12.18945598602295, -11.87122917175293, -11.553003311157227, -11.234776496887207, -10.916549682617188, -10.598322868347168, -10.280096054077148, -9.961869239807129, -9.64364242553711, -9.32541561126709, -9.007189750671387, -8.688962936401367, -8.370736122131348, -8.052509307861328, -7.734282970428467, -7.416055679321289, -7.0978288650512695, -6.779602527618408, -6.461375713348389, -6.143149375915527, -5.824922561645508, -5.506695747375488, -5.188469409942627, -4.870243072509766, -4.552016258239746, -4.233789920806885, -3.9155631065368652, -3.597336769104004, -3.2791099548339844, -2.960883378982544, -2.6426568031311035, -2.324430227279663, -2.0062036514282227, -1.6879770755767822, -1.3697503805160522, -1.0515238046646118, -0.7332972288131714, -0.4150705337524414, -0.09684395790100098, 0.22138261795043945, 0.5396091938018799, 0.8578358292579651, 1.1760624647140503, 1.4942890405654907, 1.8125156164169312, 2.130742311477661, 2.4489688873291016, 2.767195463180542]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 10.0, 7.0, 9.0, 11.0, 13.0, 19.0, 28.0, 19.0, 19.0, 21.0, 30.0, 26.0, 34.0, 31.0, 45.0, 47.0, 46.0, 35.0, 46.0, 35.0, 32.0, 39.0, 43.0, 46.0, 33.0, 36.0, 36.0, 25.0, 23.0, 30.0, 17.0, 17.0, 20.0, 11.0, 11.0, 9.0, 8.0, 5.0, 7.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.072415828704834, -2.0087406635284424, -1.9450654983520508, -1.8813903331756592, -1.8177151679992676, -1.754040002822876, -1.6903648376464844, -1.6266896724700928, -1.5630145072937012, -1.4993393421173096, -1.435664176940918, -1.3719890117645264, -1.3083138465881348, -1.2446386814117432, -1.1809635162353516, -1.11728835105896, -1.0536130666732788, -0.9899379014968872, -0.9262627363204956, -0.862587571144104, -0.7989124059677124, -0.7352372407913208, -0.6715620160102844, -0.6078868508338928, -0.5442116856575012, -0.4805365204811096, -0.416861355304718, -0.35318616032600403, -0.2895109951496124, -0.22583582997322083, -0.16216063499450684, -0.09848546981811523, -0.03481030464172363, 0.028864867985248566, 0.09254004061222076, 0.15621522068977356, 0.21989038586616516, 0.28356555104255676, 0.34724074602127075, 0.41091591119766235, 0.47459107637405396, 0.5382662415504456, 0.6019414067268372, 0.6656166315078735, 0.7292917966842651, 0.7929669618606567, 0.8566421270370483, 0.9203172922134399, 0.9839924573898315, 1.0476676225662231, 1.1113427877426147, 1.1750179529190063, 1.238693118095398, 1.3023682832717896, 1.3660435676574707, 1.4297187328338623, 1.493393898010254, 1.5570690631866455, 1.620744228363037, 1.6844193935394287, 1.7480945587158203, 1.811769723892212, 1.8754448890686035, 1.9391200542449951, 2.0027952194213867]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 5.0, 8.0, 15.0, 15.0, 19.0, 37.0, 34.0, 57.0, 105.0, 122.0, 165.0, 271.0, 441.0, 732.0, 1423.0, 3144.0, 8770.0, 38735.0, 3704456.0, 394783.0, 28051.0, 7286.0, 2646.0, 1267.0, 630.0, 388.0, 201.0, 141.0, 102.0, 63.0, 46.0, 24.0, 27.0, 15.0, 13.0, 10.0, 9.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3828125, -1.3349609375, -1.287109375, -1.2392578125, -1.19140625, -1.1435546875, -1.095703125, -1.0478515625, -1.0, -0.9521484375, -0.904296875, -0.8564453125, -0.80859375, -0.7607421875, -0.712890625, -0.6650390625, -0.6171875, -0.5693359375, -0.521484375, -0.4736328125, -0.42578125, -0.3779296875, -0.330078125, -0.2822265625, -0.234375, -0.1865234375, -0.138671875, -0.0908203125, -0.04296875, 0.0048828125, 0.052734375, 0.1005859375, 0.1484375, 0.1962890625, 0.244140625, 0.2919921875, 0.33984375, 0.3876953125, 0.435546875, 0.4833984375, 0.53125, 0.5791015625, 0.626953125, 0.6748046875, 0.72265625, 0.7705078125, 0.818359375, 0.8662109375, 0.9140625, 0.9619140625, 1.009765625, 1.0576171875, 1.10546875, 1.1533203125, 1.201171875, 1.2490234375, 1.296875, 1.3447265625, 1.392578125, 1.4404296875, 1.48828125, 1.5361328125, 1.583984375, 1.6318359375, 1.6796875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 17.0, 21.0, 36.0, 43.0, 72.0, 95.0, 95.0, 108.0, 89.0, 107.0, 88.0, 69.0, 57.0, 31.0, 22.0, 15.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.30707550048828125, -0.2975006103515625, -0.28792572021484375, -0.278350830078125, -0.26877593994140625, -0.2592010498046875, -0.24962615966796875, -0.24005126953125, -0.23047637939453125, -0.2209014892578125, -0.21132659912109375, -0.201751708984375, -0.19217681884765625, -0.1826019287109375, -0.17302703857421875, -0.1634521484375, -0.15387725830078125, -0.1443023681640625, -0.13472747802734375, -0.125152587890625, -0.11557769775390625, -0.1060028076171875, -0.09642791748046875, -0.08685302734375, -0.07727813720703125, -0.0677032470703125, -0.05812835693359375, -0.048553466796875, -0.03897857666015625, -0.0294036865234375, -0.01982879638671875, -0.01025390625, -0.00067901611328125, 0.0088958740234375, 0.01847076416015625, 0.028045654296875, 0.03762054443359375, 0.0471954345703125, 0.05677032470703125, 0.06634521484375, 0.07592010498046875, 0.0854949951171875, 0.09506988525390625, 0.104644775390625, 0.11421966552734375, 0.1237945556640625, 0.13336944580078125, 0.1429443359375, 0.15251922607421875, 0.1620941162109375, 0.17166900634765625, 0.181243896484375, 0.19081878662109375, 0.2003936767578125, 0.20996856689453125, 0.21954345703125, 0.22911834716796875, 0.2386932373046875, 0.24826812744140625, 0.257843017578125, 0.26741790771484375, 0.2769927978515625, 0.28656768798828125, 0.296142578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 4.0, 3.0, 9.0, 16.0, 13.0, 11.0, 32.0, 29.0, 42.0, 49.0, 52.0, 85.0, 108.0, 188.0, 343.0, 624.0, 1337.0, 3063.0, 8976.0, 35117.0, 314446.0, 3737059.0, 69186.0, 14884.0, 4636.0, 1907.0, 859.0, 427.0, 257.0, 144.0, 86.0, 65.0, 52.0, 45.0, 30.0, 18.0, 16.0, 12.0, 18.0, 5.0, 4.0, 6.0, 10.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9659423828125, -0.932861328125, -0.8997802734375, -0.86669921875, -0.8336181640625, -0.800537109375, -0.7674560546875, -0.734375, -0.7012939453125, -0.668212890625, -0.6351318359375, -0.60205078125, -0.5689697265625, -0.535888671875, -0.5028076171875, -0.4697265625, -0.4366455078125, -0.403564453125, -0.3704833984375, -0.33740234375, -0.3043212890625, -0.271240234375, -0.2381591796875, -0.205078125, -0.1719970703125, -0.138916015625, -0.1058349609375, -0.07275390625, -0.0396728515625, -0.006591796875, 0.0264892578125, 0.0595703125, 0.0926513671875, 0.125732421875, 0.1588134765625, 0.19189453125, 0.2249755859375, 0.258056640625, 0.2911376953125, 0.32421875, 0.3572998046875, 0.390380859375, 0.4234619140625, 0.45654296875, 0.4896240234375, 0.522705078125, 0.5557861328125, 0.5888671875, 0.6219482421875, 0.655029296875, 0.6881103515625, 0.72119140625, 0.7542724609375, 0.787353515625, 0.8204345703125, 0.853515625, 0.8865966796875, 0.919677734375, 0.9527587890625, 0.98583984375, 1.0189208984375, 1.052001953125, 1.0850830078125, 1.1181640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 9.0, 10.0, 25.0, 49.0, 83.0, 273.0, 3137.0, 285.0, 83.0, 45.0, 28.0, 12.0, 10.0, 5.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73486328125, -0.7135543823242188, -0.6922454833984375, -0.6709365844726562, -0.649627685546875, -0.6283187866210938, -0.6070098876953125, -0.5857009887695312, -0.56439208984375, -0.5430831909179688, -0.5217742919921875, -0.5004653930664062, -0.479156494140625, -0.45784759521484375, -0.4365386962890625, -0.41522979736328125, -0.3939208984375, -0.37261199951171875, -0.3513031005859375, -0.32999420166015625, -0.308685302734375, -0.28737640380859375, -0.2660675048828125, -0.24475860595703125, -0.22344970703125, -0.20214080810546875, -0.1808319091796875, -0.15952301025390625, -0.138214111328125, -0.11690521240234375, -0.0955963134765625, -0.07428741455078125, -0.052978515625, -0.03166961669921875, -0.0103607177734375, 0.01094818115234375, 0.032257080078125, 0.05356597900390625, 0.0748748779296875, 0.09618377685546875, 0.11749267578125, 0.13880157470703125, 0.1601104736328125, 0.18141937255859375, 0.202728271484375, 0.22403717041015625, 0.2453460693359375, 0.26665496826171875, 0.2879638671875, 0.30927276611328125, 0.3305816650390625, 0.35189056396484375, 0.373199462890625, 0.39450836181640625, 0.4158172607421875, 0.43712615966796875, 0.45843505859375, 0.47974395751953125, 0.5010528564453125, 0.5223617553710938, 0.543670654296875, 0.5649795532226562, 0.5862884521484375, 0.6075973510742188, 0.62890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 18.0, 36.0, 112.0, 282.0, 310.0, 126.0, 61.0, 22.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.302706718444824, -4.185956001281738, -4.069204807281494, -3.952453851699829, -3.835702896118164, -3.718951940536499, -3.602200984954834, -3.485450029373169, -3.368699073791504, -3.251948118209839, -3.135197162628174, -3.018446207046509, -2.9016952514648438, -2.7849442958831787, -2.6681933403015137, -2.5514423847198486, -2.4346914291381836, -2.3179404735565186, -2.2011895179748535, -2.0844385623931885, -1.9676876068115234, -1.8509366512298584, -1.7341856956481934, -1.6174347400665283, -1.5006837844848633, -1.3839328289031982, -1.2671818733215332, -1.1504309177398682, -1.0336799621582031, -0.9169290065765381, -0.800178050994873, -0.683427095413208, -0.566676139831543, -0.44992518424987793, -0.3331742286682129, -0.21642327308654785, -0.09967231750488281, 0.017078638076782227, 0.13382959365844727, 0.2505805492401123, 0.36733150482177734, 0.4840824604034424, 0.6008334159851074, 0.7175843715667725, 0.8343353271484375, 0.9510862827301025, 1.0678372383117676, 1.1845881938934326, 1.3013391494750977, 1.4180901050567627, 1.5348410606384277, 1.6515920162200928, 1.7683429718017578, 1.8850939273834229, 2.001844882965088, 2.118595838546753, 2.235346794128418, 2.352097749710083, 2.468848705291748, 2.585599660873413, 2.702350616455078, 2.819101572036743, 2.935852527618408, 3.0526034832000732, 3.1693544387817383]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 7.0, 2.0, 9.0, 6.0, 9.0, 22.0, 27.0, 39.0, 30.0, 39.0, 55.0, 77.0, 74.0, 76.0, 65.0, 76.0, 72.0, 64.0, 53.0, 48.0, 33.0, 35.0, 25.0, 20.0, 16.0, 11.0, 5.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9575942754745483, -1.9025774002075195, -1.8475606441497803, -1.7925437688827515, -1.7375268936157227, -1.6825101375579834, -1.6274932622909546, -1.5724763870239258, -1.5174596309661865, -1.4624427556991577, -1.4074259996414185, -1.3524091243743896, -1.2973922491073608, -1.242375373840332, -1.1873586177825928, -1.132341742515564, -1.0773248672485352, -1.0223079919815063, -0.9672911763191223, -0.9122743606567383, -0.8572574853897095, -0.8022406697273254, -0.7472238540649414, -0.6922069787979126, -0.6371901631355286, -0.5821733474731445, -0.5271564722061157, -0.4721396565437317, -0.41712281107902527, -0.36210596561431885, -0.3070891499519348, -0.2520723044872284, -0.19705533981323242, -0.142038494348526, -0.08702166378498077, -0.03200483322143555, 0.023012012243270874, 0.0780288577079773, 0.13304567337036133, 0.18806251883506775, 0.24307936429977417, 0.2980962097644806, 0.353113055229187, 0.40812987089157104, 0.46314671635627747, 0.5181635618209839, 0.5731803774833679, 0.628197193145752, 0.6832140684127808, 0.7382308840751648, 0.7932477593421936, 0.8482645750045776, 0.9032814502716064, 0.9582982659339905, 1.0133150815963745, 1.0683319568634033, 1.1233487129211426, 1.1783655881881714, 1.2333823442459106, 1.2883992195129395, 1.3434160947799683, 1.398432970046997, 1.4534497261047363, 1.5084666013717651, 1.563483476638794]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 13.0, 11.0, 13.0, 23.0, 24.0, 30.0, 64.0, 125.0, 255.0, 416.0, 752.0, 1689.0, 3970.0, 12467.0, 62390.0, 452704.0, 434590.0, 59696.0, 12071.0, 3858.0, 1632.0, 840.0, 360.0, 237.0, 116.0, 75.0, 39.0, 26.0, 18.0, 13.0, 10.0, 12.0, 7.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.10699462890625, -1.0723876953125, -1.03778076171875, -1.003173828125, -0.96856689453125, -0.9339599609375, -0.89935302734375, -0.86474609375, -0.83013916015625, -0.7955322265625, -0.76092529296875, -0.726318359375, -0.69171142578125, -0.6571044921875, -0.62249755859375, -0.587890625, -0.55328369140625, -0.5186767578125, -0.48406982421875, -0.449462890625, -0.41485595703125, -0.3802490234375, -0.34564208984375, -0.31103515625, -0.27642822265625, -0.2418212890625, -0.20721435546875, -0.172607421875, -0.13800048828125, -0.1033935546875, -0.06878662109375, -0.0341796875, 0.00042724609375, 0.0350341796875, 0.06964111328125, 0.104248046875, 0.13885498046875, 0.1734619140625, 0.20806884765625, 0.24267578125, 0.27728271484375, 0.3118896484375, 0.34649658203125, 0.381103515625, 0.41571044921875, 0.4503173828125, 0.48492431640625, 0.51953125, 0.55413818359375, 0.5887451171875, 0.62335205078125, 0.657958984375, 0.69256591796875, 0.7271728515625, 0.76177978515625, 0.79638671875, 0.83099365234375, 0.8656005859375, 0.90020751953125, 0.934814453125, 0.96942138671875, 1.0040283203125, 1.03863525390625, 1.0732421875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 10.0, 21.0, 33.0, 50.0, 68.0, 74.0, 90.0, 119.0, 95.0, 107.0, 77.0, 63.0, 49.0, 40.0, 29.0, 27.0, 14.0, 7.0, 9.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343994140625, -0.3333625793457031, -0.32273101806640625, -0.3120994567871094, -0.3014678955078125, -0.2908363342285156, -0.28020477294921875, -0.2695732116699219, -0.258941650390625, -0.24831008911132812, -0.23767852783203125, -0.22704696655273438, -0.2164154052734375, -0.20578384399414062, -0.19515228271484375, -0.18452072143554688, -0.17388916015625, -0.16325759887695312, -0.15262603759765625, -0.14199447631835938, -0.1313629150390625, -0.12073135375976562, -0.11009979248046875, -0.09946823120117188, -0.088836669921875, -0.07820510864257812, -0.06757354736328125, -0.056941986083984375, -0.0463104248046875, -0.035678863525390625, -0.02504730224609375, -0.014415740966796875, -0.0037841796875, 0.006847381591796875, 0.01747894287109375, 0.028110504150390625, 0.0387420654296875, 0.049373626708984375, 0.06000518798828125, 0.07063674926757812, 0.081268310546875, 0.09189987182617188, 0.10253143310546875, 0.11316299438476562, 0.1237945556640625, 0.13442611694335938, 0.14505767822265625, 0.15568923950195312, 0.16632080078125, 0.17695236206054688, 0.18758392333984375, 0.19821548461914062, 0.2088470458984375, 0.21947860717773438, 0.23011016845703125, 0.24074172973632812, 0.251373291015625, 0.2620048522949219, 0.27263641357421875, 0.2832679748535156, 0.2938995361328125, 0.3045310974121094, 0.31516265869140625, 0.3257942199707031, 0.33642578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 10.0, 10.0, 5.0, 11.0, 14.0, 18.0, 19.0, 26.0, 56.0, 58.0, 90.0, 126.0, 165.0, 287.0, 543.0, 1046.0, 2764.0, 8936.0, 39362.0, 227995.0, 580688.0, 148498.0, 26886.0, 6693.0, 2105.0, 864.0, 453.0, 250.0, 166.0, 114.0, 72.0, 57.0, 40.0, 30.0, 23.0, 16.0, 22.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6722259521484375, -0.647674560546875, -0.6231231689453125, -0.59857177734375, -0.5740203857421875, -0.549468994140625, -0.5249176025390625, -0.5003662109375, -0.4758148193359375, -0.451263427734375, -0.4267120361328125, -0.40216064453125, -0.3776092529296875, -0.353057861328125, -0.3285064697265625, -0.303955078125, -0.2794036865234375, -0.254852294921875, -0.2303009033203125, -0.20574951171875, -0.1811981201171875, -0.156646728515625, -0.1320953369140625, -0.1075439453125, -0.0829925537109375, -0.058441162109375, -0.0338897705078125, -0.00933837890625, 0.0152130126953125, 0.039764404296875, 0.0643157958984375, 0.0888671875, 0.1134185791015625, 0.137969970703125, 0.1625213623046875, 0.18707275390625, 0.2116241455078125, 0.236175537109375, 0.2607269287109375, 0.2852783203125, 0.3098297119140625, 0.334381103515625, 0.3589324951171875, 0.38348388671875, 0.4080352783203125, 0.432586669921875, 0.4571380615234375, 0.481689453125, 0.5062408447265625, 0.530792236328125, 0.5553436279296875, 0.57989501953125, 0.6044464111328125, 0.628997802734375, 0.6535491943359375, 0.6781005859375, 0.7026519775390625, 0.727203369140625, 0.7517547607421875, 0.77630615234375, 0.8008575439453125, 0.825408935546875, 0.8499603271484375, 0.87451171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 5.0, 8.0, 13.0, 28.0, 27.0, 36.0, 34.0, 54.0, 58.0, 49.0, 69.0, 85.0, 69.0, 65.0, 69.0, 64.0, 59.0, 49.0, 37.0, 40.0, 22.0, 16.0, 5.0, 13.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1572265625, -1.1213836669921875, -1.085540771484375, -1.0496978759765625, -1.01385498046875, -0.9780120849609375, -0.942169189453125, -0.9063262939453125, -0.8704833984375, -0.8346405029296875, -0.798797607421875, -0.7629547119140625, -0.72711181640625, -0.6912689208984375, -0.655426025390625, -0.6195831298828125, -0.583740234375, -0.5478973388671875, -0.512054443359375, -0.4762115478515625, -0.44036865234375, -0.4045257568359375, -0.368682861328125, -0.3328399658203125, -0.2969970703125, -0.2611541748046875, -0.225311279296875, -0.1894683837890625, -0.15362548828125, -0.1177825927734375, -0.081939697265625, -0.0460968017578125, -0.01025390625, 0.0255889892578125, 0.061431884765625, 0.0972747802734375, 0.13311767578125, 0.1689605712890625, 0.204803466796875, 0.2406463623046875, 0.2764892578125, 0.3123321533203125, 0.348175048828125, 0.3840179443359375, 0.41986083984375, 0.4557037353515625, 0.491546630859375, 0.5273895263671875, 0.563232421875, 0.5990753173828125, 0.634918212890625, 0.6707611083984375, 0.70660400390625, 0.7424468994140625, 0.778289794921875, 0.8141326904296875, 0.8499755859375, 0.8858184814453125, 0.921661376953125, 0.9575042724609375, 0.99334716796875, 1.0291900634765625, 1.065032958984375, 1.1008758544921875, 1.13671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 17.0, 34.0, 47.0, 71.0, 162.0, 329.0, 730.0, 2036.0, 7248.0, 38267.0, 475714.0, 474842.0, 38407.0, 7248.0, 2009.0, 739.0, 292.0, 151.0, 83.0, 46.0, 17.0, 19.0, 8.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.421142578125, -0.4066200256347656, -0.39209747314453125, -0.3775749206542969, -0.3630523681640625, -0.3485298156738281, -0.33400726318359375, -0.3194847106933594, -0.304962158203125, -0.2904396057128906, -0.27591705322265625, -0.2613945007324219, -0.2468719482421875, -0.23234939575195312, -0.21782684326171875, -0.20330429077148438, -0.18878173828125, -0.17425918579101562, -0.15973663330078125, -0.14521408081054688, -0.1306915283203125, -0.11616897583007812, -0.10164642333984375, -0.08712387084960938, -0.072601318359375, -0.058078765869140625, -0.04355621337890625, -0.029033660888671875, -0.0145111083984375, 1.1444091796875e-05, 0.01453399658203125, 0.029056549072265625, 0.0435791015625, 0.058101654052734375, 0.07262420654296875, 0.08714675903320312, 0.1016693115234375, 0.11619186401367188, 0.13071441650390625, 0.14523696899414062, 0.159759521484375, 0.17428207397460938, 0.18880462646484375, 0.20332717895507812, 0.2178497314453125, 0.23237228393554688, 0.24689483642578125, 0.2614173889160156, 0.27593994140625, 0.2904624938964844, 0.30498504638671875, 0.3195075988769531, 0.3340301513671875, 0.3485527038574219, 0.36307525634765625, 0.3775978088378906, 0.392120361328125, 0.4066429138183594, 0.42116546630859375, 0.4356880187988281, 0.4502105712890625, 0.4647331237792969, 0.47925567626953125, 0.4937782287597656, 0.50830078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 4.0, 9.0, 9.0, 9.0, 11.0, 9.0, 21.0, 24.0, 36.0, 39.0, 54.0, 67.0, 81.0, 80.0, 99.0, 84.0, 72.0, 46.0, 39.0, 34.0, 25.0, 41.0, 17.0, 17.0, 11.0, 10.0, 15.0, 6.0, 5.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-7.50422477722168e-05, -7.307622581720352e-05, -7.111020386219025e-05, -6.914418190717697e-05, -6.71781599521637e-05, -6.521213799715042e-05, -6.324611604213715e-05, -6.128009408712387e-05, -5.9314072132110596e-05, -5.734805017709732e-05, -5.5382028222084045e-05, -5.341600626707077e-05, -5.1449984312057495e-05, -4.948396235704422e-05, -4.7517940402030945e-05, -4.555191844701767e-05, -4.3585896492004395e-05, -4.161987453699112e-05, -3.9653852581977844e-05, -3.768783062696457e-05, -3.5721808671951294e-05, -3.375578671693802e-05, -3.1789764761924744e-05, -2.982374280691147e-05, -2.7857720851898193e-05, -2.5891698896884918e-05, -2.3925676941871643e-05, -2.1959654986858368e-05, -1.9993633031845093e-05, -1.8027611076831818e-05, -1.6061589121818542e-05, -1.4095567166805267e-05, -1.2129545211791992e-05, -1.0163523256778717e-05, -8.197501301765442e-06, -6.231479346752167e-06, -4.265457391738892e-06, -2.2994354367256165e-06, -3.334134817123413e-07, 1.6326084733009338e-06, 3.598630428314209e-06, 5.564652383327484e-06, 7.530674338340759e-06, 9.496696293354034e-06, 1.146271824836731e-05, 1.3428740203380585e-05, 1.539476215839386e-05, 1.7360784113407135e-05, 1.932680606842041e-05, 2.1292828023433685e-05, 2.325884997844696e-05, 2.5224871933460236e-05, 2.719089388847351e-05, 2.9156915843486786e-05, 3.112293779850006e-05, 3.3088959753513336e-05, 3.505498170852661e-05, 3.7021003663539886e-05, 3.898702561855316e-05, 4.095304757356644e-05, 4.291906952857971e-05, 4.488509148359299e-05, 4.685111343860626e-05, 4.881713539361954e-05, 5.078315734863281e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 12.0, 11.0, 20.0, 28.0, 38.0, 58.0, 101.0, 222.0, 424.0, 1064.0, 3316.0, 17384.0, 208123.0, 751823.0, 55464.0, 7359.0, 1722.0, 674.0, 298.0, 162.0, 79.0, 57.0, 45.0, 26.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51708984375, -0.50054931640625, -0.4840087890625, -0.46746826171875, -0.450927734375, -0.43438720703125, -0.4178466796875, -0.40130615234375, -0.384765625, -0.36822509765625, -0.3516845703125, -0.33514404296875, -0.318603515625, -0.30206298828125, -0.2855224609375, -0.26898193359375, -0.25244140625, -0.23590087890625, -0.2193603515625, -0.20281982421875, -0.186279296875, -0.16973876953125, -0.1531982421875, -0.13665771484375, -0.1201171875, -0.10357666015625, -0.0870361328125, -0.07049560546875, -0.053955078125, -0.03741455078125, -0.0208740234375, -0.00433349609375, 0.01220703125, 0.02874755859375, 0.0452880859375, 0.06182861328125, 0.078369140625, 0.09490966796875, 0.1114501953125, 0.12799072265625, 0.14453125, 0.16107177734375, 0.1776123046875, 0.19415283203125, 0.210693359375, 0.22723388671875, 0.2437744140625, 0.26031494140625, 0.27685546875, 0.29339599609375, 0.3099365234375, 0.32647705078125, 0.343017578125, 0.35955810546875, 0.3760986328125, 0.39263916015625, 0.4091796875, 0.42572021484375, 0.4422607421875, 0.45880126953125, 0.475341796875, 0.49188232421875, 0.5084228515625, 0.52496337890625, 0.54150390625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 9.0, 10.0, 8.0, 18.0, 18.0, 36.0, 46.0, 72.0, 111.0, 139.0, 141.0, 111.0, 84.0, 59.0, 46.0, 21.0, 11.0, 13.0, 10.0, 4.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40283203125, -0.3898963928222656, -0.37696075439453125, -0.3640251159667969, -0.3510894775390625, -0.3381538391113281, -0.32521820068359375, -0.3122825622558594, -0.299346923828125, -0.2864112854003906, -0.27347564697265625, -0.2605400085449219, -0.2476043701171875, -0.23466873168945312, -0.22173309326171875, -0.20879745483398438, -0.19586181640625, -0.18292617797851562, -0.16999053955078125, -0.15705490112304688, -0.1441192626953125, -0.13118362426757812, -0.11824798583984375, -0.10531234741210938, -0.092376708984375, -0.07944107055664062, -0.06650543212890625, -0.053569793701171875, -0.0406341552734375, -0.027698516845703125, -0.01476287841796875, -0.001827239990234375, 0.0111083984375, 0.024044036865234375, 0.03697967529296875, 0.049915313720703125, 0.0628509521484375, 0.07578659057617188, 0.08872222900390625, 0.10165786743164062, 0.114593505859375, 0.12752914428710938, 0.14046478271484375, 0.15340042114257812, 0.1663360595703125, 0.17927169799804688, 0.19220733642578125, 0.20514297485351562, 0.21807861328125, 0.23101425170898438, 0.24394989013671875, 0.2568855285644531, 0.2698211669921875, 0.2827568054199219, 0.29569244384765625, 0.3086280822753906, 0.321563720703125, 0.3344993591308594, 0.34743499755859375, 0.3603706359863281, 0.3733062744140625, 0.3862419128417969, 0.39917755126953125, 0.4121131896972656, 0.425048828125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 28.0, 83.0, 220.0, 315.0, 228.0, 77.0, 29.0, 10.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.811117172241211, -12.45047664642334, -12.089836120605469, -11.729194641113281, -11.36855411529541, -11.007913589477539, -10.647273063659668, -10.286632537841797, -9.925992012023926, -9.565351486206055, -9.204710960388184, -8.844070434570312, -8.483428955078125, -8.122788429260254, -7.762147903442383, -7.401507377624512, -7.040866374969482, -6.680225849151611, -6.319584846496582, -5.958944320678711, -5.59830379486084, -5.237663269042969, -4.8770222663879395, -4.516381740570068, -4.155740737915039, -3.795099973678589, -3.4344594478607178, -3.0738186836242676, -2.7131781578063965, -2.3525373935699463, -1.991896629333496, -1.631256103515625, -1.270615577697754, -0.9099749326705933, -0.5493342280387878, -0.18869352340698242, 0.17194712162017822, 0.5325877666473389, 0.8932285308837891, 1.2538690567016602, 1.6145098209381104, 1.975150465965271, 2.3357911109924316, 2.696431875228882, 3.057072639465332, 3.417713165283203, 3.7783539295196533, 4.138994216918945, 4.499635219573975, 4.860275745391846, 5.220916748046875, 5.581557273864746, 5.942197799682617, 6.302838325500488, 6.663479328155518, 7.024119853973389, 7.384760856628418, 7.745401382446289, 8.10604190826416, 8.466682434082031, 8.827323913574219, 9.18796443939209, 9.548604965209961, 9.909245491027832, 10.269886016845703]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 3.0, 10.0, 13.0, 9.0, 8.0, 16.0, 22.0, 20.0, 26.0, 29.0, 28.0, 36.0, 27.0, 44.0, 43.0, 44.0, 32.0, 39.0, 56.0, 47.0, 40.0, 39.0, 48.0, 45.0, 40.0, 34.0, 28.0, 30.0, 24.0, 14.0, 21.0, 20.0, 8.0, 12.0, 9.0, 10.0, 6.0, 1.0, 5.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0], "bins": [-4.976199150085449, -4.836032390594482, -4.695866107940674, -4.555699348449707, -4.415533065795898, -4.275366306304932, -4.135200023651123, -3.9950332641601562, -3.8548667430877686, -3.714700222015381, -3.574533700942993, -3.4343671798706055, -3.2942004203796387, -3.15403413772583, -3.0138673782348633, -2.8737008571624756, -2.733534336090088, -2.5933678150177, -2.4532012939453125, -2.313034772872925, -2.172868251800537, -2.0327014923095703, -1.8925349712371826, -1.752368450164795, -1.6122019290924072, -1.4720354080200195, -1.3318688869476318, -1.1917022466659546, -1.051535725593567, -0.9113692045211792, -0.7712026238441467, -0.6310360431671143, -0.49086976051330566, -0.3507032096385956, -0.2105366587638855, -0.07037010788917542, 0.06979644298553467, 0.20996296405792236, 0.35012954473495483, 0.4902961254119873, 0.630462646484375, 0.7706291675567627, 0.9107957482337952, 1.0509623289108276, 1.1911288499832153, 1.331295371055603, 1.4714620113372803, 1.611628532409668, 1.7517950534820557, 1.8919615745544434, 2.032128095626831, 2.1722946166992188, 2.3124613761901855, 2.452627658843994, 2.592794418334961, 2.7329609394073486, 2.8731274604797363, 3.013293981552124, 3.1534605026245117, 3.2936270236968994, 3.433793544769287, 3.573960304260254, 3.7141268253326416, 3.8542933464050293, 3.994459867477417]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 10.0, 5.0, 13.0, 17.0, 28.0, 47.0, 69.0, 84.0, 146.0, 214.0, 331.0, 688.0, 1304.0, 3074.0, 9290.0, 48389.0, 3886556.0, 214688.0, 19877.0, 5331.0, 2027.0, 861.0, 466.0, 259.0, 153.0, 101.0, 73.0, 52.0, 33.0, 32.0, 18.0, 13.0, 5.0, 7.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2998046875, -1.251220703125, -1.20263671875, -1.154052734375, -1.10546875, -1.056884765625, -1.00830078125, -0.959716796875, -0.9111328125, -0.862548828125, -0.81396484375, -0.765380859375, -0.716796875, -0.668212890625, -0.61962890625, -0.571044921875, -0.5224609375, -0.473876953125, -0.42529296875, -0.376708984375, -0.328125, -0.279541015625, -0.23095703125, -0.182373046875, -0.1337890625, -0.085205078125, -0.03662109375, 0.011962890625, 0.060546875, 0.109130859375, 0.15771484375, 0.206298828125, 0.2548828125, 0.303466796875, 0.35205078125, 0.400634765625, 0.44921875, 0.497802734375, 0.54638671875, 0.594970703125, 0.6435546875, 0.692138671875, 0.74072265625, 0.789306640625, 0.837890625, 0.886474609375, 0.93505859375, 0.983642578125, 1.0322265625, 1.080810546875, 1.12939453125, 1.177978515625, 1.2265625, 1.275146484375, 1.32373046875, 1.372314453125, 1.4208984375, 1.469482421875, 1.51806640625, 1.566650390625, 1.615234375, 1.663818359375, 1.71240234375, 1.760986328125, 1.8095703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 4.0, 10.0, 14.0, 23.0, 30.0, 52.0, 52.0, 54.0, 75.0, 100.0, 96.0, 72.0, 84.0, 82.0, 52.0, 43.0, 34.0, 26.0, 31.0, 16.0, 14.0, 12.0, 7.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3450355529785156, -0.33386993408203125, -0.3227043151855469, -0.3115386962890625, -0.3003730773925781, -0.28920745849609375, -0.2780418395996094, -0.266876220703125, -0.2557106018066406, -0.24454498291015625, -0.23337936401367188, -0.2222137451171875, -0.21104812622070312, -0.19988250732421875, -0.18871688842773438, -0.17755126953125, -0.16638565063476562, -0.15522003173828125, -0.14405441284179688, -0.1328887939453125, -0.12172317504882812, -0.11055755615234375, -0.09939193725585938, -0.088226318359375, -0.07706069946289062, -0.06589508056640625, -0.054729461669921875, -0.0435638427734375, -0.032398223876953125, -0.02123260498046875, -0.010066986083984375, 0.0010986328125, 0.012264251708984375, 0.02342987060546875, 0.034595489501953125, 0.0457611083984375, 0.056926727294921875, 0.06809234619140625, 0.07925796508789062, 0.090423583984375, 0.10158920288085938, 0.11275482177734375, 0.12392044067382812, 0.1350860595703125, 0.14625167846679688, 0.15741729736328125, 0.16858291625976562, 0.17974853515625, 0.19091415405273438, 0.20207977294921875, 0.21324539184570312, 0.2244110107421875, 0.23557662963867188, 0.24674224853515625, 0.2579078674316406, 0.269073486328125, 0.2802391052246094, 0.29140472412109375, 0.3025703430175781, 0.3137359619140625, 0.3249015808105469, 0.33606719970703125, 0.3472328186035156, 0.3583984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 11.0, 29.0, 61.0, 118.0, 236.0, 508.0, 1203.0, 3353.0, 13054.0, 90786.0, 3918735.0, 143077.0, 16596.0, 4032.0, 1395.0, 531.0, 278.0, 116.0, 72.0, 39.0, 14.0, 9.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.546875, -1.5008087158203125, -1.454742431640625, -1.4086761474609375, -1.36260986328125, -1.3165435791015625, -1.270477294921875, -1.2244110107421875, -1.1783447265625, -1.1322784423828125, -1.086212158203125, -1.0401458740234375, -0.99407958984375, -0.9480133056640625, -0.901947021484375, -0.8558807373046875, -0.809814453125, -0.7637481689453125, -0.717681884765625, -0.6716156005859375, -0.62554931640625, -0.5794830322265625, -0.533416748046875, -0.4873504638671875, -0.4412841796875, -0.3952178955078125, -0.349151611328125, -0.3030853271484375, -0.25701904296875, -0.2109527587890625, -0.164886474609375, -0.1188201904296875, -0.07275390625, -0.0266876220703125, 0.019378662109375, 0.0654449462890625, 0.11151123046875, 0.1575775146484375, 0.203643798828125, 0.2497100830078125, 0.2957763671875, 0.3418426513671875, 0.387908935546875, 0.4339752197265625, 0.48004150390625, 0.5261077880859375, 0.572174072265625, 0.6182403564453125, 0.664306640625, 0.7103729248046875, 0.756439208984375, 0.8025054931640625, 0.84857177734375, 0.8946380615234375, 0.940704345703125, 0.9867706298828125, 1.0328369140625, 1.0789031982421875, 1.124969482421875, 1.1710357666015625, 1.21710205078125, 1.2631683349609375, 1.309234619140625, 1.3553009033203125, 1.4013671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 8.0, 4.0, 17.0, 12.0, 20.0, 43.0, 80.0, 180.0, 613.0, 2564.0, 266.0, 93.0, 60.0, 32.0, 18.0, 23.0, 9.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7412109375, -0.7195892333984375, -0.697967529296875, -0.6763458251953125, -0.65472412109375, -0.6331024169921875, -0.611480712890625, -0.5898590087890625, -0.5682373046875, -0.5466156005859375, -0.524993896484375, -0.5033721923828125, -0.48175048828125, -0.4601287841796875, -0.438507080078125, -0.4168853759765625, -0.395263671875, -0.3736419677734375, -0.352020263671875, -0.3303985595703125, -0.30877685546875, -0.2871551513671875, -0.265533447265625, -0.2439117431640625, -0.2222900390625, -0.2006683349609375, -0.179046630859375, -0.1574249267578125, -0.13580322265625, -0.1141815185546875, -0.092559814453125, -0.0709381103515625, -0.04931640625, -0.0276947021484375, -0.006072998046875, 0.0155487060546875, 0.03717041015625, 0.0587921142578125, 0.080413818359375, 0.1020355224609375, 0.1236572265625, 0.1452789306640625, 0.166900634765625, 0.1885223388671875, 0.21014404296875, 0.2317657470703125, 0.253387451171875, 0.2750091552734375, 0.296630859375, 0.3182525634765625, 0.339874267578125, 0.3614959716796875, 0.38311767578125, 0.4047393798828125, 0.426361083984375, 0.4479827880859375, 0.4696044921875, 0.4912261962890625, 0.512847900390625, 0.5344696044921875, 0.55609130859375, 0.5777130126953125, 0.599334716796875, 0.6209564208984375, 0.642578125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 12.0, 28.0, 108.0, 377.0, 322.0, 109.0, 36.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.398108959197998, -3.1711981296539307, -2.9442873001098633, -2.717376708984375, -2.4904658794403076, -2.2635550498962402, -2.036644458770752, -1.8097336292266846, -1.5828227996826172, -1.3559119701385498, -1.129001259803772, -0.9020904898643494, -0.6751797199249268, -0.4482688903808594, -0.22135818004608154, 0.005552530288696289, 0.23246335983276367, 0.4593741297721863, 0.6862848997116089, 0.9131956696510315, 1.140106439590454, 1.3670172691345215, 1.5939279794692993, 1.8208386898040771, 2.0477495193481445, 2.274660348892212, 2.5015711784362793, 2.7284817695617676, 2.955392599105835, 3.1823034286499023, 3.4092140197753906, 3.636124849319458, 3.863035202026367, 4.0899457931518555, 4.316856861114502, 4.54376745223999, 4.770678520202637, 4.997589111328125, 5.224499702453613, 5.451410293579102, 5.678321361541748, 5.905231952667236, 6.132143020629883, 6.359053611755371, 6.585964202880859, 6.812875270843506, 7.039785861968994, 7.266696929931641, 7.493607521057129, 7.720518112182617, 7.947429180145264, 8.17434024810791, 8.401250839233398, 8.628161430358887, 8.855072021484375, 9.081982612609863, 9.308893203735352, 9.53580379486084, 9.762714385986328, 9.989625930786133, 10.216536521911621, 10.44344711303711, 10.670357704162598, 10.897268295288086, 11.12417984008789]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 7.0, 8.0, 8.0, 15.0, 23.0, 22.0, 15.0, 28.0, 22.0, 30.0, 45.0, 32.0, 39.0, 41.0, 43.0, 49.0, 50.0, 58.0, 55.0, 45.0, 42.0, 40.0, 45.0, 28.0, 24.0, 34.0, 25.0, 17.0, 21.0, 18.0, 11.0, 11.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6619577407836914, -1.6124058961868286, -1.5628540515899658, -1.5133020877838135, -1.4637502431869507, -1.414198398590088, -1.364646553993225, -1.3150947093963623, -1.2655428647994995, -1.2159910202026367, -1.166439175605774, -1.1168873310089111, -1.0673353672027588, -1.017783522605896, -0.9682316780090332, -0.9186798334121704, -0.8691279292106628, -0.8195760846138, -0.7700241804122925, -0.7204723358154297, -0.6709204912185669, -0.6213686466217041, -0.5718167424201965, -0.5222648978233337, -0.47271302342414856, -0.4231611490249634, -0.3736093044281006, -0.3240574300289154, -0.2745055556297302, -0.22495371103286743, -0.17540183663368225, -0.12584999203681946, -0.07629811763763428, -0.026746254414319992, 0.022805608808994293, 0.07235747575759888, 0.12190933525562286, 0.17146119475364685, 0.22101306915283203, 0.2705649137496948, 0.32011678814888, 0.3696686625480652, 0.419220507144928, 0.46877238154411316, 0.5183242559432983, 0.5678761005401611, 0.6174279451370239, 0.6669797897338867, 0.7165316939353943, 0.7660835385322571, 0.8156354427337646, 0.8651872873306274, 0.9147391319274902, 0.964290976524353, 1.0138428211212158, 1.0633947849273682, 1.112946629524231, 1.1624984741210938, 1.2120503187179565, 1.2616021633148193, 1.3111541271209717, 1.3607059717178345, 1.4102578163146973, 1.45980966091156, 1.5093615055084229]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 12.0, 13.0, 24.0, 41.0, 48.0, 102.0, 122.0, 224.0, 399.0, 687.0, 1162.0, 2311.0, 5095.0, 12152.0, 34633.0, 109519.0, 325699.0, 361120.0, 129551.0, 40238.0, 14045.0, 5655.0, 2623.0, 1339.0, 703.0, 399.0, 225.0, 157.0, 93.0, 47.0, 33.0, 24.0, 24.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.80029296875, -0.776092529296875, -0.75189208984375, -0.727691650390625, -0.7034912109375, -0.679290771484375, -0.65509033203125, -0.630889892578125, -0.606689453125, -0.582489013671875, -0.55828857421875, -0.534088134765625, -0.5098876953125, -0.485687255859375, -0.46148681640625, -0.437286376953125, -0.4130859375, -0.388885498046875, -0.36468505859375, -0.340484619140625, -0.3162841796875, -0.292083740234375, -0.26788330078125, -0.243682861328125, -0.219482421875, -0.195281982421875, -0.17108154296875, -0.146881103515625, -0.1226806640625, -0.098480224609375, -0.07427978515625, -0.050079345703125, -0.02587890625, -0.001678466796875, 0.02252197265625, 0.046722412109375, 0.0709228515625, 0.095123291015625, 0.11932373046875, 0.143524169921875, 0.167724609375, 0.191925048828125, 0.21612548828125, 0.240325927734375, 0.2645263671875, 0.288726806640625, 0.31292724609375, 0.337127685546875, 0.361328125, 0.385528564453125, 0.40972900390625, 0.433929443359375, 0.4581298828125, 0.482330322265625, 0.50653076171875, 0.530731201171875, 0.554931640625, 0.579132080078125, 0.60333251953125, 0.627532958984375, 0.6517333984375, 0.675933837890625, 0.70013427734375, 0.724334716796875, 0.74853515625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 6.0, 6.0, 3.0, 11.0, 13.0, 27.0, 18.0, 34.0, 40.0, 59.0, 63.0, 69.0, 78.0, 84.0, 74.0, 72.0, 79.0, 59.0, 47.0, 35.0, 36.0, 25.0, 19.0, 13.0, 11.0, 9.0, 5.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.3504638671875, -0.339111328125, -0.3277587890625, -0.31640625, -0.3050537109375, -0.293701171875, -0.2823486328125, -0.27099609375, -0.2596435546875, -0.248291015625, -0.2369384765625, -0.2255859375, -0.2142333984375, -0.202880859375, -0.1915283203125, -0.18017578125, -0.1688232421875, -0.157470703125, -0.1461181640625, -0.134765625, -0.1234130859375, -0.112060546875, -0.1007080078125, -0.08935546875, -0.0780029296875, -0.066650390625, -0.0552978515625, -0.0439453125, -0.0325927734375, -0.021240234375, -0.0098876953125, 0.00146484375, 0.0128173828125, 0.024169921875, 0.0355224609375, 0.046875, 0.0582275390625, 0.069580078125, 0.0809326171875, 0.09228515625, 0.1036376953125, 0.114990234375, 0.1263427734375, 0.1376953125, 0.1490478515625, 0.160400390625, 0.1717529296875, 0.18310546875, 0.1944580078125, 0.205810546875, 0.2171630859375, 0.228515625, 0.2398681640625, 0.251220703125, 0.2625732421875, 0.27392578125, 0.2852783203125, 0.296630859375, 0.3079833984375, 0.3193359375, 0.3306884765625, 0.342041015625, 0.3533935546875, 0.36474609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 3.0, 9.0, 16.0, 13.0, 15.0, 28.0, 51.0, 39.0, 76.0, 111.0, 163.0, 289.0, 524.0, 937.0, 2397.0, 7165.0, 28366.0, 152170.0, 574612.0, 225972.0, 40619.0, 9514.0, 2877.0, 1077.0, 543.0, 297.0, 213.0, 130.0, 83.0, 74.0, 54.0, 34.0, 25.0, 12.0, 9.0, 8.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0], "bins": [-1.2734375, -1.2386550903320312, -1.2038726806640625, -1.1690902709960938, -1.134307861328125, -1.0995254516601562, -1.0647430419921875, -1.0299606323242188, -0.99517822265625, -0.9603958129882812, -0.9256134033203125, -0.8908309936523438, -0.856048583984375, -0.8212661743164062, -0.7864837646484375, -0.7517013549804688, -0.7169189453125, -0.6821365356445312, -0.6473541259765625, -0.6125717163085938, -0.577789306640625, -0.5430068969726562, -0.5082244873046875, -0.47344207763671875, -0.43865966796875, -0.40387725830078125, -0.3690948486328125, -0.33431243896484375, -0.299530029296875, -0.26474761962890625, -0.2299652099609375, -0.19518280029296875, -0.160400390625, -0.12561798095703125, -0.0908355712890625, -0.05605316162109375, -0.021270751953125, 0.01351165771484375, 0.0482940673828125, 0.08307647705078125, 0.11785888671875, 0.15264129638671875, 0.1874237060546875, 0.22220611572265625, 0.256988525390625, 0.29177093505859375, 0.3265533447265625, 0.36133575439453125, 0.3961181640625, 0.43090057373046875, 0.4656829833984375, 0.5004653930664062, 0.535247802734375, 0.5700302124023438, 0.6048126220703125, 0.6395950317382812, 0.67437744140625, 0.7091598510742188, 0.7439422607421875, 0.7787246704101562, 0.813507080078125, 0.8482894897460938, 0.8830718994140625, 0.9178543090820312, 0.95263671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 1.0, 10.0, 8.0, 13.0, 15.0, 16.0, 17.0, 18.0, 26.0, 37.0, 32.0, 39.0, 33.0, 46.0, 40.0, 47.0, 42.0, 45.0, 41.0, 52.0, 46.0, 38.0, 29.0, 37.0, 33.0, 29.0, 32.0, 31.0, 19.0, 15.0, 21.0, 15.0, 14.0, 12.0, 10.0, 8.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.3134765625, -1.2726593017578125, -1.231842041015625, -1.1910247802734375, -1.15020751953125, -1.1093902587890625, -1.068572998046875, -1.0277557373046875, -0.9869384765625, -0.9461212158203125, -0.905303955078125, -0.8644866943359375, -0.82366943359375, -0.7828521728515625, -0.742034912109375, -0.7012176513671875, -0.660400390625, -0.6195831298828125, -0.578765869140625, -0.5379486083984375, -0.49713134765625, -0.4563140869140625, -0.415496826171875, -0.3746795654296875, -0.3338623046875, -0.2930450439453125, -0.252227783203125, -0.2114105224609375, -0.17059326171875, -0.1297760009765625, -0.088958740234375, -0.0481414794921875, -0.00732421875, 0.0334930419921875, 0.074310302734375, 0.1151275634765625, 0.15594482421875, 0.1967620849609375, 0.237579345703125, 0.2783966064453125, 0.3192138671875, 0.3600311279296875, 0.400848388671875, 0.4416656494140625, 0.48248291015625, 0.5233001708984375, 0.564117431640625, 0.6049346923828125, 0.645751953125, 0.6865692138671875, 0.727386474609375, 0.7682037353515625, 0.80902099609375, 0.8498382568359375, 0.890655517578125, 0.9314727783203125, 0.9722900390625, 1.0131072998046875, 1.053924560546875, 1.0947418212890625, 1.13555908203125, 1.1763763427734375, 1.217193603515625, 1.2580108642578125, 1.298828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 14.0, 20.0, 27.0, 48.0, 81.0, 160.0, 410.0, 1258.0, 7709.0, 188516.0, 826559.0, 20253.0, 2372.0, 631.0, 242.0, 95.0, 57.0, 34.0, 12.0, 6.0, 9.0, 8.0, 9.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.50921630859375, -1.4637451171875, -1.41827392578125, -1.372802734375, -1.32733154296875, -1.2818603515625, -1.23638916015625, -1.19091796875, -1.14544677734375, -1.0999755859375, -1.05450439453125, -1.009033203125, -0.96356201171875, -0.9180908203125, -0.87261962890625, -0.8271484375, -0.78167724609375, -0.7362060546875, -0.69073486328125, -0.645263671875, -0.59979248046875, -0.5543212890625, -0.50885009765625, -0.46337890625, -0.41790771484375, -0.3724365234375, -0.32696533203125, -0.281494140625, -0.23602294921875, -0.1905517578125, -0.14508056640625, -0.099609375, -0.05413818359375, -0.0086669921875, 0.03680419921875, 0.082275390625, 0.12774658203125, 0.1732177734375, 0.21868896484375, 0.26416015625, 0.30963134765625, 0.3551025390625, 0.40057373046875, 0.446044921875, 0.49151611328125, 0.5369873046875, 0.58245849609375, 0.6279296875, 0.67340087890625, 0.7188720703125, 0.76434326171875, 0.809814453125, 0.85528564453125, 0.9007568359375, 0.94622802734375, 0.99169921875, 1.03717041015625, 1.0826416015625, 1.12811279296875, 1.173583984375, 1.21905517578125, 1.2645263671875, 1.30999755859375, 1.35546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 11.0, 14.0, 21.0, 28.0, 79.0, 117.0, 186.0, 223.0, 156.0, 76.0, 36.0, 18.0, 16.0, 6.0, 9.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026226043701171875, -0.00025477074086666107, -0.0002472810447216034, -0.00023979134857654572, -0.00023230165243148804, -0.00022481195628643036, -0.00021732226014137268, -0.000209832563996315, -0.00020234286785125732, -0.00019485317170619965, -0.00018736347556114197, -0.0001798737794160843, -0.0001723840832710266, -0.00016489438712596893, -0.00015740469098091125, -0.00014991499483585358, -0.0001424252986907959, -0.00013493560254573822, -0.00012744590640068054, -0.00011995621025562286, -0.00011246651411056519, -0.00010497681796550751, -9.748712182044983e-05, -8.999742567539215e-05, -8.250772953033447e-05, -7.50180333852768e-05, -6.752833724021912e-05, -6.003864109516144e-05, -5.254894495010376e-05, -4.505924880504608e-05, -3.75695526599884e-05, -3.0079856514930725e-05, -2.2590160369873047e-05, -1.5100464224815369e-05, -7.6107680797576904e-06, -1.210719347000122e-07, 7.368624210357666e-06, 1.4858320355415344e-05, 2.2348016500473022e-05, 2.98377126455307e-05, 3.732740879058838e-05, 4.481710493564606e-05, 5.2306801080703735e-05, 5.9796497225761414e-05, 6.728619337081909e-05, 7.477588951587677e-05, 8.226558566093445e-05, 8.975528180599213e-05, 9.72449779510498e-05, 0.00010473467409610748, 0.00011222437024116516, 0.00011971406638622284, 0.00012720376253128052, 0.0001346934586763382, 0.00014218315482139587, 0.00014967285096645355, 0.00015716254711151123, 0.0001646522432565689, 0.0001721419394016266, 0.00017963163554668427, 0.00018712133169174194, 0.00019461102783679962, 0.0002021007239818573, 0.00020959042012691498, 0.00021708011627197266]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 6.0, 8.0, 25.0, 40.0, 65.0, 127.0, 280.0, 819.0, 4590.0, 146880.0, 880701.0, 12794.0, 1527.0, 362.0, 154.0, 77.0, 38.0, 25.0, 11.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9775390625, -1.921356201171875, -1.86517333984375, -1.808990478515625, -1.7528076171875, -1.696624755859375, -1.64044189453125, -1.584259033203125, -1.528076171875, -1.471893310546875, -1.41571044921875, -1.359527587890625, -1.3033447265625, -1.247161865234375, -1.19097900390625, -1.134796142578125, -1.07861328125, -1.022430419921875, -0.96624755859375, -0.910064697265625, -0.8538818359375, -0.797698974609375, -0.74151611328125, -0.685333251953125, -0.629150390625, -0.572967529296875, -0.51678466796875, -0.460601806640625, -0.4044189453125, -0.348236083984375, -0.29205322265625, -0.235870361328125, -0.1796875, -0.123504638671875, -0.06732177734375, -0.011138916015625, 0.0450439453125, 0.101226806640625, 0.15740966796875, 0.213592529296875, 0.269775390625, 0.325958251953125, 0.38214111328125, 0.438323974609375, 0.4945068359375, 0.550689697265625, 0.60687255859375, 0.663055419921875, 0.71923828125, 0.775421142578125, 0.83160400390625, 0.887786865234375, 0.9439697265625, 1.000152587890625, 1.05633544921875, 1.112518310546875, 1.168701171875, 1.224884033203125, 1.28106689453125, 1.337249755859375, 1.3934326171875, 1.449615478515625, 1.50579833984375, 1.561981201171875, 1.6181640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 14.0, 23.0, 35.0, 61.0, 118.0, 190.0, 218.0, 138.0, 77.0, 36.0, 19.0, 18.0, 11.0, 5.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.603515625, -1.5653915405273438, -1.5272674560546875, -1.4891433715820312, -1.451019287109375, -1.4128952026367188, -1.3747711181640625, -1.3366470336914062, -1.29852294921875, -1.2603988647460938, -1.2222747802734375, -1.1841506958007812, -1.146026611328125, -1.1079025268554688, -1.0697784423828125, -1.0316543579101562, -0.9935302734375, -0.9554061889648438, -0.9172821044921875, -0.8791580200195312, -0.841033935546875, -0.8029098510742188, -0.7647857666015625, -0.7266616821289062, -0.68853759765625, -0.6504135131835938, -0.6122894287109375, -0.5741653442382812, -0.536041259765625, -0.49791717529296875, -0.4597930908203125, -0.42166900634765625, -0.383544921875, -0.34542083740234375, -0.3072967529296875, -0.26917266845703125, -0.231048583984375, -0.19292449951171875, -0.1548004150390625, -0.11667633056640625, -0.07855224609375, -0.04042816162109375, -0.0023040771484375, 0.03582000732421875, 0.073944091796875, 0.11206817626953125, 0.1501922607421875, 0.18831634521484375, 0.2264404296875, 0.26456451416015625, 0.3026885986328125, 0.34081268310546875, 0.378936767578125, 0.41706085205078125, 0.4551849365234375, 0.49330902099609375, 0.53143310546875, 0.5695571899414062, 0.6076812744140625, 0.6458053588867188, 0.683929443359375, 0.7220535278320312, 0.7601776123046875, 0.7983016967773438, 0.83642578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 51.0, 290.0, 529.0, 121.0, 13.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.90468978881836, -49.825355529785156, -48.74602127075195, -47.66668701171875, -46.58735656738281, -45.50802230834961, -44.428688049316406, -43.3493537902832, -42.27001953125, -41.1906852722168, -40.111351013183594, -39.03201675415039, -37.95268249511719, -36.87335205078125, -35.79401779174805, -34.714683532714844, -33.63534927368164, -32.55601501464844, -31.476680755615234, -30.397348403930664, -29.31801414489746, -28.238679885864258, -27.159347534179688, -26.080013275146484, -25.00067901611328, -23.921344757080078, -22.842010498046875, -21.762678146362305, -20.6833438873291, -19.6040096282959, -18.524677276611328, -17.445343017578125, -16.366012573242188, -15.286678314208984, -14.207345008850098, -13.128011703491211, -12.048677444458008, -10.969343185424805, -9.890009880065918, -8.810676574707031, -7.731342315673828, -6.652008533477783, -5.572674751281738, -4.493340969085693, -3.4140071868896484, -2.3346734046936035, -1.2553396224975586, -0.17600584030151367, 0.9033279418945312, 1.9826617240905762, 3.061995506286621, 4.141329288482666, 5.220663070678711, 6.299996852874756, 7.379330635070801, 8.458663940429688, 9.53799819946289, 10.617332458496094, 11.69666576385498, 12.775999069213867, 13.85533332824707, 14.934667587280273, 16.013999938964844, 17.093334197998047, 18.17266845703125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 4.0, 9.0, 7.0, 7.0, 15.0, 19.0, 20.0, 23.0, 22.0, 21.0, 27.0, 31.0, 38.0, 41.0, 40.0, 47.0, 43.0, 44.0, 55.0, 48.0, 48.0, 32.0, 35.0, 44.0, 36.0, 25.0, 35.0, 29.0, 28.0, 21.0, 17.0, 15.0, 16.0, 20.0, 6.0, 4.0, 9.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.251477241516113, -7.036263942718506, -6.821050643920898, -6.605837345123291, -6.390624046325684, -6.175411224365234, -5.960197448730469, -5.7449846267700195, -5.529771327972412, -5.314558029174805, -5.099344730377197, -4.88413143157959, -4.668918132781982, -4.453704833984375, -4.238492012023926, -4.023278713226318, -3.808065176010132, -3.5928518772125244, -3.377638578414917, -3.1624255180358887, -2.9472122192382812, -2.731998920440674, -2.5167856216430664, -2.301572322845459, -2.0863590240478516, -1.8711457252502441, -1.6559325456619263, -1.4407192468643188, -1.225506067276001, -1.0102927684783936, -0.7950794696807861, -0.5798662900924683, -0.3646531105041504, -0.14943985641002655, 0.06577339768409729, 0.2809866666793823, 0.49619990587234497, 0.7114131450653076, 0.926626443862915, 1.141839623451233, 1.3570529222488403, 1.5722662210464478, 1.7874794006347656, 2.002692699432373, 2.2179059982299805, 2.433119297027588, 2.6483325958251953, 2.8635456562042236, 3.078758955001831, 3.2939722537994385, 3.509185552597046, 3.724398612976074, 3.9396119117736816, 4.154825210571289, 4.3700385093688965, 4.585251808166504, 4.800465106964111, 5.015678405761719, 5.230891704559326, 5.446105003356934, 5.661318302154541, 5.876531600952148, 6.091744422912598, 6.306957721710205, 6.5221710205078125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 9.0, 11.0, 17.0, 21.0, 23.0, 41.0, 50.0, 95.0, 106.0, 164.0, 296.0, 496.0, 951.0, 2008.0, 5371.0, 23045.0, 3914794.0, 223786.0, 15130.0, 4207.0, 1701.0, 814.0, 397.0, 263.0, 135.0, 92.0, 75.0, 52.0, 30.0, 23.0, 18.0, 16.0, 9.0, 6.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.2890625, -1.252105712890625, -1.21514892578125, -1.178192138671875, -1.1412353515625, -1.104278564453125, -1.06732177734375, -1.030364990234375, -0.993408203125, -0.956451416015625, -0.91949462890625, -0.882537841796875, -0.8455810546875, -0.808624267578125, -0.77166748046875, -0.734710693359375, -0.69775390625, -0.660797119140625, -0.62384033203125, -0.586883544921875, -0.5499267578125, -0.512969970703125, -0.47601318359375, -0.439056396484375, -0.402099609375, -0.365142822265625, -0.32818603515625, -0.291229248046875, -0.2542724609375, -0.217315673828125, -0.18035888671875, -0.143402099609375, -0.1064453125, -0.069488525390625, -0.03253173828125, 0.004425048828125, 0.0413818359375, 0.078338623046875, 0.11529541015625, 0.152252197265625, 0.189208984375, 0.226165771484375, 0.26312255859375, 0.300079345703125, 0.3370361328125, 0.373992919921875, 0.41094970703125, 0.447906494140625, 0.48486328125, 0.521820068359375, 0.55877685546875, 0.595733642578125, 0.6326904296875, 0.669647216796875, 0.70660400390625, 0.743560791015625, 0.780517578125, 0.817474365234375, 0.85443115234375, 0.891387939453125, 0.9283447265625, 0.965301513671875, 1.00225830078125, 1.039215087890625, 1.076171875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 4.0, 6.0, 5.0, 6.0, 7.0, 14.0, 18.0, 16.0, 17.0, 36.0, 45.0, 51.0, 47.0, 68.0, 61.0, 68.0, 66.0, 59.0, 70.0, 59.0, 58.0, 25.0, 41.0, 31.0, 22.0, 16.0, 14.0, 24.0, 15.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37744140625, -0.36418914794921875, -0.3509368896484375, -0.33768463134765625, -0.324432373046875, -0.31118011474609375, -0.2979278564453125, -0.28467559814453125, -0.27142333984375, -0.25817108154296875, -0.2449188232421875, -0.23166656494140625, -0.218414306640625, -0.20516204833984375, -0.1919097900390625, -0.17865753173828125, -0.1654052734375, -0.15215301513671875, -0.1389007568359375, -0.12564849853515625, -0.112396240234375, -0.09914398193359375, -0.0858917236328125, -0.07263946533203125, -0.05938720703125, -0.04613494873046875, -0.0328826904296875, -0.01963043212890625, -0.006378173828125, 0.00687408447265625, 0.0201263427734375, 0.03337860107421875, 0.046630859375, 0.05988311767578125, 0.0731353759765625, 0.08638763427734375, 0.099639892578125, 0.11289215087890625, 0.1261444091796875, 0.13939666748046875, 0.15264892578125, 0.16590118408203125, 0.1791534423828125, 0.19240570068359375, 0.205657958984375, 0.21891021728515625, 0.2321624755859375, 0.24541473388671875, 0.2586669921875, 0.27191925048828125, 0.2851715087890625, 0.29842376708984375, 0.311676025390625, 0.32492828369140625, 0.3381805419921875, 0.35143280029296875, 0.36468505859375, 0.37793731689453125, 0.3911895751953125, 0.40444183349609375, 0.417694091796875, 0.43094635009765625, 0.4441986083984375, 0.45745086669921875, 0.470703125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 11.0, 16.0, 15.0, 16.0, 22.0, 34.0, 36.0, 56.0, 86.0, 123.0, 195.0, 366.0, 693.0, 1773.0, 6449.0, 51682.0, 4096239.0, 28807.0, 4520.0, 1425.0, 638.0, 347.0, 231.0, 147.0, 98.0, 56.0, 50.0, 26.0, 29.0, 20.0, 15.0, 16.0, 14.0, 6.0, 9.0, 3.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.529296875, -2.461669921875, -2.39404296875, -2.326416015625, -2.2587890625, -2.191162109375, -2.12353515625, -2.055908203125, -1.98828125, -1.920654296875, -1.85302734375, -1.785400390625, -1.7177734375, -1.650146484375, -1.58251953125, -1.514892578125, -1.447265625, -1.379638671875, -1.31201171875, -1.244384765625, -1.1767578125, -1.109130859375, -1.04150390625, -0.973876953125, -0.90625, -0.838623046875, -0.77099609375, -0.703369140625, -0.6357421875, -0.568115234375, -0.50048828125, -0.432861328125, -0.365234375, -0.297607421875, -0.22998046875, -0.162353515625, -0.0947265625, -0.027099609375, 0.04052734375, 0.108154296875, 0.17578125, 0.243408203125, 0.31103515625, 0.378662109375, 0.4462890625, 0.513916015625, 0.58154296875, 0.649169921875, 0.716796875, 0.784423828125, 0.85205078125, 0.919677734375, 0.9873046875, 1.054931640625, 1.12255859375, 1.190185546875, 1.2578125, 1.325439453125, 1.39306640625, 1.460693359375, 1.5283203125, 1.595947265625, 1.66357421875, 1.731201171875, 1.798828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 13.0, 11.0, 24.0, 66.0, 364.0, 3479.0, 66.0, 21.0, 16.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2083740234375, -0.1925525665283203, -0.17673110961914062, -0.16090965270996094, -0.14508819580078125, -0.12926673889160156, -0.11344528198242188, -0.09762382507324219, -0.0818023681640625, -0.06598091125488281, -0.050159454345703125, -0.03433799743652344, -0.01851654052734375, -0.0026950836181640625, 0.013126373291015625, 0.028947830200195312, 0.044769287109375, 0.06059074401855469, 0.07641220092773438, 0.09223365783691406, 0.10805511474609375, 0.12387657165527344, 0.13969802856445312, 0.1555194854736328, 0.1713409423828125, 0.1871623992919922, 0.20298385620117188, 0.21880531311035156, 0.23462677001953125, 0.25044822692871094, 0.2662696838378906, 0.2820911407470703, 0.29791259765625, 0.3137340545654297, 0.3295555114746094, 0.34537696838378906, 0.36119842529296875, 0.37701988220214844, 0.3928413391113281, 0.4086627960205078, 0.4244842529296875, 0.4403057098388672, 0.4561271667480469, 0.47194862365722656, 0.48777008056640625, 0.5035915374755859, 0.5194129943847656, 0.5352344512939453, 0.551055908203125, 0.5668773651123047, 0.5826988220214844, 0.5985202789306641, 0.6143417358398438, 0.6301631927490234, 0.6459846496582031, 0.6618061065673828, 0.6776275634765625, 0.6934490203857422, 0.7092704772949219, 0.7250919342041016, 0.7409133911132812, 0.7567348480224609, 0.7725563049316406, 0.7883777618408203, 0.80419921875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 13.0, 43.0, 159.0, 326.0, 270.0, 134.0, 34.0, 18.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7480933666229248, -1.646098017692566, -1.544102668762207, -1.4421074390411377, -1.3401119709014893, -1.23811674118042, -1.136121392250061, -1.0341260433197021, -0.9321306943893433, -0.8301353454589844, -0.7281399965286255, -0.6261447072029114, -0.5241493582725525, -0.4221540093421936, -0.3201587200164795, -0.2181633710861206, -0.11616802215576172, -0.014172688126564026, 0.08782264590263367, 0.18981796503067017, 0.29181331396102905, 0.39380866289138794, 0.49580395221710205, 0.5977993011474609, 0.6997946500778198, 0.8017899990081787, 0.9037853479385376, 1.0057806968688965, 1.1077759265899658, 1.2097713947296143, 1.3117666244506836, 1.4137619733810425, 1.5157570838928223, 1.6177524328231812, 1.71974778175354, 1.8217430114746094, 1.9237384796142578, 2.025733709335327, 2.1277289390563965, 2.229724407196045, 2.3317198753356934, 2.4337151050567627, 2.535710573196411, 2.6377058029174805, 2.739701271057129, 2.8416965007781982, 2.9436917304992676, 3.045687198638916, 3.1476824283599854, 3.2496776580810547, 3.351673126220703, 3.4536683559417725, 3.555663824081421, 3.6576590538024902, 3.7596545219421387, 3.861649751663208, 3.9636449813842773, 4.065640449523926, 4.167635440826416, 4.2696309089660645, 4.371626377105713, 4.473621845245361, 4.575616836547852, 4.6776123046875, 4.779607772827148]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 10.0, 6.0, 17.0, 18.0, 15.0, 22.0, 22.0, 21.0, 35.0, 38.0, 45.0, 46.0, 48.0, 56.0, 62.0, 44.0, 61.0, 61.0, 42.0, 42.0, 51.0, 44.0, 30.0, 25.0, 31.0, 29.0, 19.0, 19.0, 9.0, 7.0, 9.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.3548306226730347, -1.3214133977890015, -1.2879961729049683, -1.254578948020935, -1.2211617231369019, -1.1877444982528687, -1.1543272733688354, -1.1209100484848022, -1.087492823600769, -1.0540755987167358, -1.0206583738327026, -0.9872411489486694, -0.9538239240646362, -0.920406699180603, -0.8869894742965698, -0.8535722494125366, -0.8201550245285034, -0.7867377996444702, -0.753320574760437, -0.7199033498764038, -0.6864861249923706, -0.6530689001083374, -0.6196516752243042, -0.586234450340271, -0.5528172254562378, -0.5194000005722046, -0.4859827756881714, -0.4525655508041382, -0.419148325920105, -0.3857311010360718, -0.3523138761520386, -0.31889665126800537, -0.28547942638397217, -0.25206220149993896, -0.21864497661590576, -0.18522775173187256, -0.15181052684783936, -0.11839330196380615, -0.08497607707977295, -0.051558852195739746, -0.018141627311706543, 0.01527559757232666, 0.04869282245635986, 0.08211004734039307, 0.11552727222442627, 0.14894449710845947, 0.18236172199249268, 0.21577894687652588, 0.24919617176055908, 0.2826133966445923, 0.3160306215286255, 0.3494478464126587, 0.3828650712966919, 0.4162822961807251, 0.4496995210647583, 0.4831167459487915, 0.5165339708328247, 0.5499511957168579, 0.5833684206008911, 0.6167856454849243, 0.6502028703689575, 0.6836200952529907, 0.7170373201370239, 0.7504545450210571, 0.7838717699050903]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 17.0, 16.0, 23.0, 34.0, 50.0, 73.0, 132.0, 238.0, 582.0, 1372.0, 3962.0, 14039.0, 55747.0, 236986.0, 479460.0, 193560.0, 45185.0, 11593.0, 3305.0, 1154.0, 498.0, 208.0, 107.0, 74.0, 48.0, 34.0, 19.0, 17.0, 11.0, 5.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3330078125, -1.295379638671875, -1.25775146484375, -1.220123291015625, -1.1824951171875, -1.144866943359375, -1.10723876953125, -1.069610595703125, -1.031982421875, -0.994354248046875, -0.95672607421875, -0.919097900390625, -0.8814697265625, -0.843841552734375, -0.80621337890625, -0.768585205078125, -0.73095703125, -0.693328857421875, -0.65570068359375, -0.618072509765625, -0.5804443359375, -0.542816162109375, -0.50518798828125, -0.467559814453125, -0.429931640625, -0.392303466796875, -0.35467529296875, -0.317047119140625, -0.2794189453125, -0.241790771484375, -0.20416259765625, -0.166534423828125, -0.12890625, -0.091278076171875, -0.05364990234375, -0.016021728515625, 0.0216064453125, 0.059234619140625, 0.09686279296875, 0.134490966796875, 0.172119140625, 0.209747314453125, 0.24737548828125, 0.285003662109375, 0.3226318359375, 0.360260009765625, 0.39788818359375, 0.435516357421875, 0.47314453125, 0.510772705078125, 0.54840087890625, 0.586029052734375, 0.6236572265625, 0.661285400390625, 0.69891357421875, 0.736541748046875, 0.774169921875, 0.811798095703125, 0.84942626953125, 0.887054443359375, 0.9246826171875, 0.962310791015625, 0.99993896484375, 1.037567138671875, 1.0751953125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 17.0, 16.0, 16.0, 15.0, 18.0, 41.0, 31.0, 51.0, 60.0, 74.0, 59.0, 75.0, 71.0, 61.0, 49.0, 60.0, 73.0, 44.0, 37.0, 29.0, 24.0, 15.0, 24.0, 12.0, 7.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56884765625, -0.551727294921875, -0.53460693359375, -0.517486572265625, -0.5003662109375, -0.483245849609375, -0.46612548828125, -0.449005126953125, -0.431884765625, -0.414764404296875, -0.39764404296875, -0.380523681640625, -0.3634033203125, -0.346282958984375, -0.32916259765625, -0.312042236328125, -0.294921875, -0.277801513671875, -0.26068115234375, -0.243560791015625, -0.2264404296875, -0.209320068359375, -0.19219970703125, -0.175079345703125, -0.157958984375, -0.140838623046875, -0.12371826171875, -0.106597900390625, -0.0894775390625, -0.072357177734375, -0.05523681640625, -0.038116455078125, -0.02099609375, -0.003875732421875, 0.01324462890625, 0.030364990234375, 0.0474853515625, 0.064605712890625, 0.08172607421875, 0.098846435546875, 0.115966796875, 0.133087158203125, 0.15020751953125, 0.167327880859375, 0.1844482421875, 0.201568603515625, 0.21868896484375, 0.235809326171875, 0.2529296875, 0.270050048828125, 0.28717041015625, 0.304290771484375, 0.3214111328125, 0.338531494140625, 0.35565185546875, 0.372772216796875, 0.389892578125, 0.407012939453125, 0.42413330078125, 0.441253662109375, 0.4583740234375, 0.475494384765625, 0.49261474609375, 0.509735107421875, 0.52685546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 5.0, 14.0, 9.0, 19.0, 23.0, 28.0, 41.0, 50.0, 66.0, 104.0, 150.0, 211.0, 302.0, 467.0, 852.0, 1734.0, 4388.0, 12889.0, 53707.0, 310449.0, 532149.0, 98714.0, 20817.0, 6127.0, 2352.0, 1071.0, 582.0, 349.0, 242.0, 151.0, 130.0, 90.0, 55.0, 52.0, 35.0, 33.0, 21.0, 21.0, 5.0, 11.0, 11.0, 10.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5654296875, -1.5135650634765625, -1.461700439453125, -1.4098358154296875, -1.35797119140625, -1.3061065673828125, -1.254241943359375, -1.2023773193359375, -1.1505126953125, -1.0986480712890625, -1.046783447265625, -0.9949188232421875, -0.94305419921875, -0.8911895751953125, -0.839324951171875, -0.7874603271484375, -0.735595703125, -0.6837310791015625, -0.631866455078125, -0.5800018310546875, -0.52813720703125, -0.4762725830078125, -0.424407958984375, -0.3725433349609375, -0.3206787109375, -0.2688140869140625, -0.216949462890625, -0.1650848388671875, -0.11322021484375, -0.0613555908203125, -0.009490966796875, 0.0423736572265625, 0.09423828125, 0.1461029052734375, 0.197967529296875, 0.2498321533203125, 0.30169677734375, 0.3535614013671875, 0.405426025390625, 0.4572906494140625, 0.5091552734375, 0.5610198974609375, 0.612884521484375, 0.6647491455078125, 0.71661376953125, 0.7684783935546875, 0.820343017578125, 0.8722076416015625, 0.924072265625, 0.9759368896484375, 1.027801513671875, 1.0796661376953125, 1.13153076171875, 1.1833953857421875, 1.235260009765625, 1.2871246337890625, 1.3389892578125, 1.3908538818359375, 1.442718505859375, 1.4945831298828125, 1.54644775390625, 1.5983123779296875, 1.650177001953125, 1.7020416259765625, 1.75390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 7.0, 14.0, 13.0, 12.0, 13.0, 30.0, 27.0, 23.0, 39.0, 58.0, 42.0, 63.0, 54.0, 58.0, 58.0, 50.0, 68.0, 54.0, 35.0, 39.0, 42.0, 47.0, 30.0, 23.0, 20.0, 15.0, 9.0, 7.0, 5.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.80078125, -2.70947265625, -2.6181640625, -2.52685546875, -2.435546875, -2.34423828125, -2.2529296875, -2.16162109375, -2.0703125, -1.97900390625, -1.8876953125, -1.79638671875, -1.705078125, -1.61376953125, -1.5224609375, -1.43115234375, -1.33984375, -1.24853515625, -1.1572265625, -1.06591796875, -0.974609375, -0.88330078125, -0.7919921875, -0.70068359375, -0.609375, -0.51806640625, -0.4267578125, -0.33544921875, -0.244140625, -0.15283203125, -0.0615234375, 0.02978515625, 0.12109375, 0.21240234375, 0.3037109375, 0.39501953125, 0.486328125, 0.57763671875, 0.6689453125, 0.76025390625, 0.8515625, 0.94287109375, 1.0341796875, 1.12548828125, 1.216796875, 1.30810546875, 1.3994140625, 1.49072265625, 1.58203125, 1.67333984375, 1.7646484375, 1.85595703125, 1.947265625, 2.03857421875, 2.1298828125, 2.22119140625, 2.3125, 2.40380859375, 2.4951171875, 2.58642578125, 2.677734375, 2.76904296875, 2.8603515625, 2.95166015625, 3.04296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 12.0, 49.0, 112.0, 341.0, 1871.0, 389321.0, 653964.0, 2332.0, 341.0, 111.0, 45.0, 16.0, 8.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.14691162109375, -3.0516357421875, -2.95635986328125, -2.861083984375, -2.76580810546875, -2.6705322265625, -2.57525634765625, -2.47998046875, -2.38470458984375, -2.2894287109375, -2.19415283203125, -2.098876953125, -2.00360107421875, -1.9083251953125, -1.81304931640625, -1.7177734375, -1.62249755859375, -1.5272216796875, -1.43194580078125, -1.336669921875, -1.24139404296875, -1.1461181640625, -1.05084228515625, -0.95556640625, -0.86029052734375, -0.7650146484375, -0.66973876953125, -0.574462890625, -0.47918701171875, -0.3839111328125, -0.28863525390625, -0.193359375, -0.09808349609375, -0.0028076171875, 0.09246826171875, 0.187744140625, 0.28302001953125, 0.3782958984375, 0.47357177734375, 0.56884765625, 0.66412353515625, 0.7593994140625, 0.85467529296875, 0.949951171875, 1.04522705078125, 1.1405029296875, 1.23577880859375, 1.3310546875, 1.42633056640625, 1.5216064453125, 1.61688232421875, 1.712158203125, 1.80743408203125, 1.9027099609375, 1.99798583984375, 2.09326171875, 2.18853759765625, 2.2838134765625, 2.37908935546875, 2.474365234375, 2.56964111328125, 2.6649169921875, 2.76019287109375, 2.85546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 17.0, 11.0, 16.0, 22.0, 19.0, 33.0, 38.0, 52.0, 57.0, 71.0, 74.0, 90.0, 88.0, 70.0, 66.0, 66.0, 35.0, 40.0, 19.0, 25.0, 19.0, 13.0, 12.0, 10.0, 5.0, 6.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00010478496551513672, -0.00010221172124147415, -9.963847696781158e-05, -9.706523269414902e-05, -9.449198842048645e-05, -9.191874414682388e-05, -8.934549987316132e-05, -8.677225559949875e-05, -8.419901132583618e-05, -8.162576705217361e-05, -7.905252277851105e-05, -7.647927850484848e-05, -7.390603423118591e-05, -7.133278995752335e-05, -6.875954568386078e-05, -6.618630141019821e-05, -6.361305713653564e-05, -6.103981286287308e-05, -5.846656858921051e-05, -5.589332431554794e-05, -5.3320080041885376e-05, -5.074683576822281e-05, -4.817359149456024e-05, -4.5600347220897675e-05, -4.302710294723511e-05, -4.045385867357254e-05, -3.788061439990997e-05, -3.5307370126247406e-05, -3.273412585258484e-05, -3.0160881578922272e-05, -2.7587637305259705e-05, -2.5014393031597137e-05, -2.244114875793457e-05, -1.9867904484272003e-05, -1.7294660210609436e-05, -1.4721415936946869e-05, -1.2148171663284302e-05, -9.574927389621735e-06, -7.0016831159591675e-06, -4.4284388422966e-06, -1.8551945686340332e-06, 7.180497050285339e-07, 3.291293978691101e-06, 5.864538252353668e-06, 8.437782526016235e-06, 1.1011026799678802e-05, 1.358427107334137e-05, 1.6157515347003937e-05, 1.8730759620666504e-05, 2.130400389432907e-05, 2.3877248167991638e-05, 2.6450492441654205e-05, 2.9023736715316772e-05, 3.159698098897934e-05, 3.417022526264191e-05, 3.6743469536304474e-05, 3.931671380996704e-05, 4.188995808362961e-05, 4.4463202357292175e-05, 4.703644663095474e-05, 4.960969090461731e-05, 5.218293517827988e-05, 5.4756179451942444e-05, 5.732942372560501e-05, 5.990266799926758e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 12.0, 11.0, 9.0, 16.0, 44.0, 70.0, 130.0, 348.0, 748.0, 2549.0, 25461.0, 936338.0, 77229.0, 3835.0, 1005.0, 387.0, 155.0, 75.0, 45.0, 25.0, 14.0, 8.0, 10.0, 8.0, 7.0, 4.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.087677001953125, -1.04351806640625, -0.999359130859375, -0.9552001953125, -0.911041259765625, -0.86688232421875, -0.822723388671875, -0.778564453125, -0.734405517578125, -0.69024658203125, -0.646087646484375, -0.6019287109375, -0.557769775390625, -0.51361083984375, -0.469451904296875, -0.42529296875, -0.381134033203125, -0.33697509765625, -0.292816162109375, -0.2486572265625, -0.204498291015625, -0.16033935546875, -0.116180419921875, -0.072021484375, -0.027862548828125, 0.01629638671875, 0.060455322265625, 0.1046142578125, 0.148773193359375, 0.19293212890625, 0.237091064453125, 0.28125, 0.325408935546875, 0.36956787109375, 0.413726806640625, 0.4578857421875, 0.502044677734375, 0.54620361328125, 0.590362548828125, 0.634521484375, 0.678680419921875, 0.72283935546875, 0.766998291015625, 0.8111572265625, 0.855316162109375, 0.89947509765625, 0.943634033203125, 0.98779296875, 1.031951904296875, 1.07611083984375, 1.120269775390625, 1.1644287109375, 1.208587646484375, 1.25274658203125, 1.296905517578125, 1.341064453125, 1.385223388671875, 1.42938232421875, 1.473541259765625, 1.5177001953125, 1.561859130859375, 1.60601806640625, 1.650177001953125, 1.6943359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 9.0, 19.0, 24.0, 71.0, 90.0, 145.0, 176.0, 181.0, 118.0, 70.0, 25.0, 31.0, 11.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.07421875, -1.0306243896484375, -0.987030029296875, -0.9434356689453125, -0.89984130859375, -0.8562469482421875, -0.812652587890625, -0.7690582275390625, -0.7254638671875, -0.6818695068359375, -0.638275146484375, -0.5946807861328125, -0.55108642578125, -0.5074920654296875, -0.463897705078125, -0.4203033447265625, -0.376708984375, -0.3331146240234375, -0.289520263671875, -0.2459259033203125, -0.20233154296875, -0.1587371826171875, -0.115142822265625, -0.0715484619140625, -0.0279541015625, 0.0156402587890625, 0.059234619140625, 0.1028289794921875, 0.14642333984375, 0.1900177001953125, 0.233612060546875, 0.2772064208984375, 0.32080078125, 0.3643951416015625, 0.407989501953125, 0.4515838623046875, 0.49517822265625, 0.5387725830078125, 0.582366943359375, 0.6259613037109375, 0.6695556640625, 0.7131500244140625, 0.756744384765625, 0.8003387451171875, 0.84393310546875, 0.8875274658203125, 0.931121826171875, 0.9747161865234375, 1.018310546875, 1.0619049072265625, 1.105499267578125, 1.1490936279296875, 1.19268798828125, 1.2362823486328125, 1.279876708984375, 1.3234710693359375, 1.3670654296875, 1.4106597900390625, 1.454254150390625, 1.4978485107421875, 1.54144287109375, 1.5850372314453125, 1.628631591796875, 1.6722259521484375, 1.7158203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 25.0, 58.0, 196.0, 285.0, 272.0, 104.0, 40.0, 14.0, 9.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.416728973388672, -15.627541542053223, -14.83835506439209, -14.04916763305664, -13.259981155395508, -12.470793724060059, -11.68160629272461, -10.892419815063477, -10.103232383728027, -9.314044952392578, -8.524858474731445, -7.735671043395996, -6.946484088897705, -6.157297134399414, -5.368109703063965, -4.578922748565674, -3.789735794067383, -3.000548839569092, -2.2113616466522217, -1.4221744537353516, -0.6329874992370605, 0.15619945526123047, 0.9453868865966797, 1.7345738410949707, 2.5237607955932617, 3.3129477500915527, 4.102134704589844, 4.891322135925293, 5.680509090423584, 6.469696044921875, 7.258883476257324, 8.048070907592773, 8.837257385253906, 9.626444816589355, 10.415631294250488, 11.204818725585938, 11.99400520324707, 12.78319263458252, 13.572380065917969, 14.361566543579102, 15.15075397491455, 15.93994140625, 16.729127883911133, 17.518314361572266, 18.30750274658203, 19.096689224243164, 19.885875701904297, 20.675064086914062, 21.464250564575195, 22.253437042236328, 23.042625427246094, 23.831811904907227, 24.62099838256836, 25.410186767578125, 26.199373245239258, 26.98855972290039, 27.777748107910156, 28.56693458557129, 29.356122970581055, 30.145309448242188, 30.93449592590332, 31.723682403564453, 32.51287078857422, 33.302059173583984, 34.091243743896484]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 5.0, 5.0, 7.0, 6.0, 8.0, 9.0, 11.0, 14.0, 14.0, 13.0, 21.0, 23.0, 22.0, 23.0, 39.0, 42.0, 37.0, 44.0, 49.0, 49.0, 36.0, 42.0, 38.0, 42.0, 49.0, 35.0, 37.0, 38.0, 33.0, 21.0, 22.0, 26.0, 20.0, 15.0, 17.0, 9.0, 12.0, 14.0, 6.0, 6.0, 10.0, 9.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-9.822504043579102, -9.513459205627441, -9.204414367675781, -8.895368576049805, -8.586323738098145, -8.277278900146484, -7.968234062194824, -7.659189224243164, -7.350143909454346, -7.0410990715026855, -6.732053756713867, -6.423008918762207, -6.113964080810547, -5.8049187660217285, -5.495873928070068, -5.18682861328125, -4.87778377532959, -4.56873893737793, -4.259693622589111, -3.950648784637451, -3.641603708267212, -3.3325586318969727, -3.0235137939453125, -2.7144687175750732, -2.405423641204834, -2.0963785648345947, -1.787333607673645, -1.4782886505126953, -1.169243574142456, -0.8601984977722168, -0.5511535406112671, -0.24210858345031738, 0.06693649291992188, 0.37598150968551636, 0.6850265264511108, 0.9940715432167053, 1.3031165599822998, 1.612161636352539, 1.9212065935134888, 2.2302515506744385, 2.5392966270446777, 2.848341703414917, 3.1573867797851562, 3.4664316177368164, 3.7754766941070557, 4.084521770477295, 4.393566608428955, 4.702611923217773, 5.011656761169434, 5.320701599121094, 5.629746913909912, 5.938791751861572, 6.247837066650391, 6.556881904602051, 6.865926742553711, 7.174971580505371, 7.4840168952941895, 7.79306173324585, 8.102107048034668, 8.411151885986328, 8.720196723937988, 9.029241561889648, 9.338287353515625, 9.647332191467285, 9.956377029418945]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 2.0, 4.0, 15.0, 16.0, 37.0, 51.0, 82.0, 143.0, 303.0, 682.0, 1938.0, 7495.0, 56502.0, 4066841.0, 49790.0, 7100.0, 1969.0, 641.0, 318.0, 147.0, 74.0, 46.0, 25.0, 23.0, 17.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.00390625, -0.9571685791015625, -0.910430908203125, -0.8636932373046875, -0.81695556640625, -0.7702178955078125, -0.723480224609375, -0.6767425537109375, -0.6300048828125, -0.5832672119140625, -0.536529541015625, -0.4897918701171875, -0.44305419921875, -0.3963165283203125, -0.349578857421875, -0.3028411865234375, -0.256103515625, -0.2093658447265625, -0.162628173828125, -0.1158905029296875, -0.06915283203125, -0.0224151611328125, 0.024322509765625, 0.0710601806640625, 0.1177978515625, 0.1645355224609375, 0.211273193359375, 0.2580108642578125, 0.30474853515625, 0.3514862060546875, 0.398223876953125, 0.4449615478515625, 0.49169921875, 0.5384368896484375, 0.585174560546875, 0.6319122314453125, 0.67864990234375, 0.7253875732421875, 0.772125244140625, 0.8188629150390625, 0.8656005859375, 0.9123382568359375, 0.959075927734375, 1.0058135986328125, 1.05255126953125, 1.0992889404296875, 1.146026611328125, 1.1927642822265625, 1.239501953125, 1.2862396240234375, 1.332977294921875, 1.3797149658203125, 1.42645263671875, 1.4731903076171875, 1.519927978515625, 1.5666656494140625, 1.6134033203125, 1.6601409912109375, 1.706878662109375, 1.7536163330078125, 1.80035400390625, 1.8470916748046875, 1.893829345703125, 1.9405670166015625, 1.9873046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 3.0, 3.0, 6.0, 4.0, 16.0, 15.0, 13.0, 19.0, 26.0, 27.0, 43.0, 52.0, 55.0, 55.0, 75.0, 74.0, 75.0, 74.0, 55.0, 47.0, 49.0, 37.0, 37.0, 28.0, 24.0, 21.0, 18.0, 14.0, 5.0, 5.0, 6.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5517578125, -0.5328216552734375, -0.513885498046875, -0.4949493408203125, -0.47601318359375, -0.4570770263671875, -0.438140869140625, -0.4192047119140625, -0.4002685546875, -0.3813323974609375, -0.362396240234375, -0.3434600830078125, -0.32452392578125, -0.3055877685546875, -0.286651611328125, -0.2677154541015625, -0.248779296875, -0.2298431396484375, -0.210906982421875, -0.1919708251953125, -0.17303466796875, -0.1540985107421875, -0.135162353515625, -0.1162261962890625, -0.0972900390625, -0.0783538818359375, -0.059417724609375, -0.0404815673828125, -0.02154541015625, -0.0026092529296875, 0.016326904296875, 0.0352630615234375, 0.05419921875, 0.0731353759765625, 0.092071533203125, 0.1110076904296875, 0.12994384765625, 0.1488800048828125, 0.167816162109375, 0.1867523193359375, 0.2056884765625, 0.2246246337890625, 0.243560791015625, 0.2624969482421875, 0.28143310546875, 0.3003692626953125, 0.319305419921875, 0.3382415771484375, 0.357177734375, 0.3761138916015625, 0.395050048828125, 0.4139862060546875, 0.43292236328125, 0.4518585205078125, 0.470794677734375, 0.4897308349609375, 0.5086669921875, 0.5276031494140625, 0.546539306640625, 0.5654754638671875, 0.58441162109375, 0.6033477783203125, 0.622283935546875, 0.6412200927734375, 0.66015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 6.0, 10.0, 16.0, 12.0, 13.0, 23.0, 31.0, 37.0, 39.0, 46.0, 49.0, 92.0, 124.0, 274.0, 870.0, 3410.0, 23026.0, 4082474.0, 74914.0, 6374.0, 1405.0, 398.0, 173.0, 114.0, 71.0, 53.0, 50.0, 48.0, 37.0, 21.0, 15.0, 11.0, 4.0, 11.0, 5.0, 11.0, 1.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.087890625, -2.998870849609375, -2.90985107421875, -2.820831298828125, -2.7318115234375, -2.642791748046875, -2.55377197265625, -2.464752197265625, -2.375732421875, -2.286712646484375, -2.19769287109375, -2.108673095703125, -2.0196533203125, -1.930633544921875, -1.84161376953125, -1.752593994140625, -1.66357421875, -1.574554443359375, -1.48553466796875, -1.396514892578125, -1.3074951171875, -1.218475341796875, -1.12945556640625, -1.040435791015625, -0.951416015625, -0.862396240234375, -0.77337646484375, -0.684356689453125, -0.5953369140625, -0.506317138671875, -0.41729736328125, -0.328277587890625, -0.2392578125, -0.150238037109375, -0.06121826171875, 0.027801513671875, 0.1168212890625, 0.205841064453125, 0.29486083984375, 0.383880615234375, 0.472900390625, 0.561920166015625, 0.65093994140625, 0.739959716796875, 0.8289794921875, 0.917999267578125, 1.00701904296875, 1.096038818359375, 1.18505859375, 1.274078369140625, 1.36309814453125, 1.452117919921875, 1.5411376953125, 1.630157470703125, 1.71917724609375, 1.808197021484375, 1.897216796875, 1.986236572265625, 2.07525634765625, 2.164276123046875, 2.2532958984375, 2.342315673828125, 2.43133544921875, 2.520355224609375, 2.609375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 11.0, 22.0, 49.0, 159.0, 3502.0, 203.0, 57.0, 28.0, 17.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.239013671875, -0.21838760375976562, -0.19776153564453125, -0.17713546752929688, -0.1565093994140625, -0.13588333129882812, -0.11525726318359375, -0.09463119506835938, -0.074005126953125, -0.053379058837890625, -0.03275299072265625, -0.012126922607421875, 0.0084991455078125, 0.029125213623046875, 0.04975128173828125, 0.07037734985351562, 0.09100341796875, 0.11162948608398438, 0.13225555419921875, 0.15288162231445312, 0.1735076904296875, 0.19413375854492188, 0.21475982666015625, 0.23538589477539062, 0.256011962890625, 0.2766380310058594, 0.29726409912109375, 0.3178901672363281, 0.3385162353515625, 0.3591423034667969, 0.37976837158203125, 0.4003944396972656, 0.4210205078125, 0.4416465759277344, 0.46227264404296875, 0.4828987121582031, 0.5035247802734375, 0.5241508483886719, 0.5447769165039062, 0.5654029846191406, 0.586029052734375, 0.6066551208496094, 0.6272811889648438, 0.6479072570800781, 0.6685333251953125, 0.6891593933105469, 0.7097854614257812, 0.7304115295410156, 0.75103759765625, 0.7716636657714844, 0.7922897338867188, 0.8129158020019531, 0.8335418701171875, 0.8541679382324219, 0.8747940063476562, 0.8954200744628906, 0.916046142578125, 0.9366722106933594, 0.9572982788085938, 0.9779243469238281, 0.9985504150390625, 1.0191764831542969, 1.0398025512695312, 1.0604286193847656, 1.0810546875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 12.0, 19.0, 26.0, 91.0, 123.0, 186.0, 172.0, 151.0, 72.0, 48.0, 46.0, 15.0, 14.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.157376766204834, -2.0742225646972656, -1.9910684823989868, -1.907914400100708, -1.8247601985931396, -1.7416061162948608, -1.658452033996582, -1.5752978324890137, -1.4921437501907349, -1.408989667892456, -1.3258354663848877, -1.2426813840866089, -1.15952730178833, -1.0763731002807617, -0.9932190179824829, -0.9100648760795593, -0.8269107341766357, -0.7437565922737122, -0.6606024503707886, -0.5774483680725098, -0.4942942261695862, -0.4111400842666626, -0.3279859721660614, -0.2448318600654602, -0.16167771816253662, -0.07852359116077423, 0.004630535840988159, 0.08778466284275055, 0.17093878984451294, 0.2540929317474365, 0.3372470438480377, 0.4204011559486389, 0.5035550594329834, 0.586709201335907, 0.6698633432388306, 0.7530174255371094, 0.836171567440033, 0.9193257093429565, 1.0024797916412354, 1.0856339931488037, 1.1687880754470825, 1.2519421577453613, 1.3350963592529297, 1.4182504415512085, 1.5014045238494873, 1.5845587253570557, 1.6677128076553345, 1.7508668899536133, 1.8340210914611816, 1.9171751737594604, 2.0003292560577393, 2.0834834575653076, 2.166637659072876, 2.2497916221618652, 2.3329458236694336, 2.416100025177002, 2.4992542266845703, 2.5824084281921387, 2.665562391281128, 2.7487165927886963, 2.8318707942962646, 2.915024757385254, 2.9981789588928223, 3.0813331604003906, 3.16448712348938]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 9.0, 4.0, 14.0, 11.0, 10.0, 21.0, 23.0, 19.0, 11.0, 12.0, 22.0, 26.0, 24.0, 32.0, 37.0, 40.0, 31.0, 38.0, 42.0, 39.0, 45.0, 44.0, 31.0, 37.0, 36.0, 41.0, 39.0, 45.0, 19.0, 26.0, 31.0, 19.0, 19.0, 22.0, 16.0, 9.0, 10.0, 8.0, 8.0, 6.0, 2.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0084989070892334, -0.9751836657524109, -0.9418684244155884, -0.9085532426834106, -0.8752380013465881, -0.8419227600097656, -0.8086075782775879, -0.7752923369407654, -0.7419770956039429, -0.7086618542671204, -0.6753466129302979, -0.6420314311981201, -0.6087161898612976, -0.5754009485244751, -0.5420857667922974, -0.5087705254554749, -0.47545528411865234, -0.44214004278182983, -0.4088248312473297, -0.3755096197128296, -0.3421943783760071, -0.30887913703918457, -0.27556392550468445, -0.24224869906902313, -0.20893347263336182, -0.1756182461977005, -0.14230301976203918, -0.10898779332637787, -0.07567256689071655, -0.04235734045505524, -0.009042114019393921, 0.024273112416267395, 0.05758833885192871, 0.09090356528759003, 0.12421879172325134, 0.15753401815891266, 0.19084924459457397, 0.2241644710302353, 0.2574796974658966, 0.29079490900039673, 0.32411015033721924, 0.35742539167404175, 0.39074060320854187, 0.424055814743042, 0.4573710560798645, 0.490686297416687, 0.5240014791488647, 0.5573167204856873, 0.5906319618225098, 0.6239472031593323, 0.6572624444961548, 0.6905776262283325, 0.723892867565155, 0.7572081089019775, 0.7905232906341553, 0.8238385319709778, 0.8571537733078003, 0.8904690146446228, 0.9237842559814453, 0.957099437713623, 0.9904146790504456, 1.023729920387268, 1.0570451021194458, 1.090360403060913, 1.1236755847930908]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 4.0, 6.0, 12.0, 16.0, 25.0, 33.0, 46.0, 64.0, 84.0, 144.0, 241.0, 439.0, 783.0, 1604.0, 3273.0, 7951.0, 20609.0, 57729.0, 171547.0, 374991.0, 263556.0, 92403.0, 31746.0, 11881.0, 4837.0, 2084.0, 1076.0, 502.0, 330.0, 166.0, 133.0, 76.0, 58.0, 21.0, 25.0, 15.0, 14.0, 8.0, 8.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97998046875, -0.9490814208984375, -0.918182373046875, -0.8872833251953125, -0.85638427734375, -0.8254852294921875, -0.794586181640625, -0.7636871337890625, -0.7327880859375, -0.7018890380859375, -0.670989990234375, -0.6400909423828125, -0.60919189453125, -0.5782928466796875, -0.547393798828125, -0.5164947509765625, -0.485595703125, -0.4546966552734375, -0.423797607421875, -0.3928985595703125, -0.36199951171875, -0.3311004638671875, -0.300201416015625, -0.2693023681640625, -0.2384033203125, -0.2075042724609375, -0.176605224609375, -0.1457061767578125, -0.11480712890625, -0.0839080810546875, -0.053009033203125, -0.0221099853515625, 0.0087890625, 0.0396881103515625, 0.070587158203125, 0.1014862060546875, 0.13238525390625, 0.1632843017578125, 0.194183349609375, 0.2250823974609375, 0.2559814453125, 0.2868804931640625, 0.317779541015625, 0.3486785888671875, 0.37957763671875, 0.4104766845703125, 0.441375732421875, 0.4722747802734375, 0.503173828125, 0.5340728759765625, 0.564971923828125, 0.5958709716796875, 0.62677001953125, 0.6576690673828125, 0.688568115234375, 0.7194671630859375, 0.7503662109375, 0.7812652587890625, 0.812164306640625, 0.8430633544921875, 0.87396240234375, 0.9048614501953125, 0.935760498046875, 0.9666595458984375, 0.99755859375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 7.0, 1.0, 2.0, 4.0, 7.0, 5.0, 11.0, 17.0, 21.0, 24.0, 29.0, 38.0, 38.0, 57.0, 55.0, 71.0, 63.0, 74.0, 74.0, 56.0, 54.0, 59.0, 47.0, 36.0, 42.0, 22.0, 29.0, 18.0, 14.0, 11.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53515625, -0.51361083984375, -0.4920654296875, -0.47052001953125, -0.448974609375, -0.42742919921875, -0.4058837890625, -0.38433837890625, -0.36279296875, -0.34124755859375, -0.3197021484375, -0.29815673828125, -0.276611328125, -0.25506591796875, -0.2335205078125, -0.21197509765625, -0.1904296875, -0.16888427734375, -0.1473388671875, -0.12579345703125, -0.104248046875, -0.08270263671875, -0.0611572265625, -0.03961181640625, -0.01806640625, 0.00347900390625, 0.0250244140625, 0.04656982421875, 0.068115234375, 0.08966064453125, 0.1112060546875, 0.13275146484375, 0.154296875, 0.17584228515625, 0.1973876953125, 0.21893310546875, 0.240478515625, 0.26202392578125, 0.2835693359375, 0.30511474609375, 0.32666015625, 0.34820556640625, 0.3697509765625, 0.39129638671875, 0.412841796875, 0.43438720703125, 0.4559326171875, 0.47747802734375, 0.4990234375, 0.52056884765625, 0.5421142578125, 0.56365966796875, 0.585205078125, 0.60675048828125, 0.6282958984375, 0.64984130859375, 0.67138671875, 0.69293212890625, 0.7144775390625, 0.73602294921875, 0.757568359375, 0.77911376953125, 0.8006591796875, 0.82220458984375, 0.84375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 14.0, 8.0, 17.0, 23.0, 57.0, 110.0, 200.0, 319.0, 635.0, 1494.0, 6865.0, 137816.0, 861666.0, 33901.0, 3357.0, 1017.0, 461.0, 252.0, 147.0, 64.0, 35.0, 30.0, 22.0, 14.0, 10.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.875, -3.73809814453125, -3.6011962890625, -3.46429443359375, -3.327392578125, -3.19049072265625, -3.0535888671875, -2.91668701171875, -2.77978515625, -2.64288330078125, -2.5059814453125, -2.36907958984375, -2.232177734375, -2.09527587890625, -1.9583740234375, -1.82147216796875, -1.6845703125, -1.54766845703125, -1.4107666015625, -1.27386474609375, -1.136962890625, -1.00006103515625, -0.8631591796875, -0.72625732421875, -0.58935546875, -0.45245361328125, -0.3155517578125, -0.17864990234375, -0.041748046875, 0.09515380859375, 0.2320556640625, 0.36895751953125, 0.505859375, 0.64276123046875, 0.7796630859375, 0.91656494140625, 1.053466796875, 1.19036865234375, 1.3272705078125, 1.46417236328125, 1.60107421875, 1.73797607421875, 1.8748779296875, 2.01177978515625, 2.148681640625, 2.28558349609375, 2.4224853515625, 2.55938720703125, 2.6962890625, 2.83319091796875, 2.9700927734375, 3.10699462890625, 3.243896484375, 3.38079833984375, 3.5177001953125, 3.65460205078125, 3.79150390625, 3.92840576171875, 4.0653076171875, 4.20220947265625, 4.339111328125, 4.47601318359375, 4.6129150390625, 4.74981689453125, 4.88671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 9.0, 13.0, 14.0, 18.0, 22.0, 21.0, 25.0, 41.0, 37.0, 51.0, 54.0, 58.0, 52.0, 44.0, 63.0, 55.0, 69.0, 45.0, 45.0, 47.0, 35.0, 41.0, 26.0, 13.0, 14.0, 12.0, 18.0, 9.0, 6.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.64453125, -3.54345703125, -3.4423828125, -3.34130859375, -3.240234375, -3.13916015625, -3.0380859375, -2.93701171875, -2.8359375, -2.73486328125, -2.6337890625, -2.53271484375, -2.431640625, -2.33056640625, -2.2294921875, -2.12841796875, -2.02734375, -1.92626953125, -1.8251953125, -1.72412109375, -1.623046875, -1.52197265625, -1.4208984375, -1.31982421875, -1.21875, -1.11767578125, -1.0166015625, -0.91552734375, -0.814453125, -0.71337890625, -0.6123046875, -0.51123046875, -0.41015625, -0.30908203125, -0.2080078125, -0.10693359375, -0.005859375, 0.09521484375, 0.1962890625, 0.29736328125, 0.3984375, 0.49951171875, 0.6005859375, 0.70166015625, 0.802734375, 0.90380859375, 1.0048828125, 1.10595703125, 1.20703125, 1.30810546875, 1.4091796875, 1.51025390625, 1.611328125, 1.71240234375, 1.8134765625, 1.91455078125, 2.015625, 2.11669921875, 2.2177734375, 2.31884765625, 2.419921875, 2.52099609375, 2.6220703125, 2.72314453125, 2.82421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 10.0, 6.0, 12.0, 20.0, 34.0, 56.0, 116.0, 252.0, 658.0, 2723.0, 45465.0, 965389.0, 30502.0, 2265.0, 599.0, 232.0, 100.0, 47.0, 29.0, 14.0, 10.0, 9.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.7421875, -2.6804962158203125, -2.618804931640625, -2.5571136474609375, -2.49542236328125, -2.4337310791015625, -2.372039794921875, -2.3103485107421875, -2.2486572265625, -2.1869659423828125, -2.125274658203125, -2.0635833740234375, -2.00189208984375, -1.9402008056640625, -1.878509521484375, -1.8168182373046875, -1.755126953125, -1.6934356689453125, -1.631744384765625, -1.5700531005859375, -1.50836181640625, -1.4466705322265625, -1.384979248046875, -1.3232879638671875, -1.2615966796875, -1.1999053955078125, -1.138214111328125, -1.0765228271484375, -1.01483154296875, -0.9531402587890625, -0.891448974609375, -0.8297576904296875, -0.76806640625, -0.7063751220703125, -0.644683837890625, -0.5829925537109375, -0.52130126953125, -0.4596099853515625, -0.397918701171875, -0.3362274169921875, -0.2745361328125, -0.2128448486328125, -0.151153564453125, -0.0894622802734375, -0.02777099609375, 0.0339202880859375, 0.095611572265625, 0.1573028564453125, 0.218994140625, 0.2806854248046875, 0.342376708984375, 0.4040679931640625, 0.46575927734375, 0.5274505615234375, 0.589141845703125, 0.6508331298828125, 0.7125244140625, 0.7742156982421875, 0.835906982421875, 0.8975982666015625, 0.95928955078125, 1.0209808349609375, 1.082672119140625, 1.1443634033203125, 1.2060546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 7.0, 15.0, 23.0, 19.0, 22.0, 34.0, 59.0, 48.0, 71.0, 87.0, 94.0, 90.0, 81.0, 72.0, 61.0, 58.0, 40.0, 30.0, 21.0, 11.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00011938810348510742, -0.0001163482666015625, -0.00011330842971801758, -0.00011026859283447266, -0.00010722875595092773, -0.00010418891906738281, -0.00010114908218383789, -9.810924530029297e-05, -9.506940841674805e-05, -9.202957153320312e-05, -8.89897346496582e-05, -8.594989776611328e-05, -8.291006088256836e-05, -7.987022399902344e-05, -7.683038711547852e-05, -7.37905502319336e-05, -7.075071334838867e-05, -6.771087646484375e-05, -6.467103958129883e-05, -6.16312026977539e-05, -5.8591365814208984e-05, -5.555152893066406e-05, -5.251169204711914e-05, -4.947185516357422e-05, -4.64320182800293e-05, -4.3392181396484375e-05, -4.035234451293945e-05, -3.731250762939453e-05, -3.427267074584961e-05, -3.123283386230469e-05, -2.8192996978759766e-05, -2.5153160095214844e-05, -2.2113323211669922e-05, -1.9073486328125e-05, -1.6033649444580078e-05, -1.2993812561035156e-05, -9.953975677490234e-06, -6.9141387939453125e-06, -3.874301910400391e-06, -8.344650268554688e-07, 2.205371856689453e-06, 5.245208740234375e-06, 8.285045623779297e-06, 1.1324882507324219e-05, 1.436471939086914e-05, 1.7404556274414062e-05, 2.0444393157958984e-05, 2.3484230041503906e-05, 2.6524066925048828e-05, 2.956390380859375e-05, 3.260374069213867e-05, 3.5643577575683594e-05, 3.8683414459228516e-05, 4.172325134277344e-05, 4.476308822631836e-05, 4.780292510986328e-05, 5.08427619934082e-05, 5.3882598876953125e-05, 5.692243576049805e-05, 5.996227264404297e-05, 6.300210952758789e-05, 6.604194641113281e-05, 6.908178329467773e-05, 7.212162017822266e-05, 7.516145706176758e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 11.0, 18.0, 32.0, 32.0, 81.0, 198.0, 390.0, 1028.0, 3564.0, 52889.0, 957295.0, 28620.0, 2799.0, 839.0, 347.0, 165.0, 80.0, 53.0, 24.0, 20.0, 15.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4833984375, -1.4272613525390625, -1.371124267578125, -1.3149871826171875, -1.25885009765625, -1.2027130126953125, -1.146575927734375, -1.0904388427734375, -1.0343017578125, -0.9781646728515625, -0.922027587890625, -0.8658905029296875, -0.80975341796875, -0.7536163330078125, -0.697479248046875, -0.6413421630859375, -0.585205078125, -0.5290679931640625, -0.472930908203125, -0.4167938232421875, -0.36065673828125, -0.3045196533203125, -0.248382568359375, -0.1922454833984375, -0.1361083984375, -0.0799713134765625, -0.023834228515625, 0.0323028564453125, 0.08843994140625, 0.1445770263671875, 0.200714111328125, 0.2568511962890625, 0.31298828125, 0.3691253662109375, 0.425262451171875, 0.4813995361328125, 0.53753662109375, 0.5936737060546875, 0.649810791015625, 0.7059478759765625, 0.7620849609375, 0.8182220458984375, 0.874359130859375, 0.9304962158203125, 0.98663330078125, 1.0427703857421875, 1.098907470703125, 1.1550445556640625, 1.211181640625, 1.2673187255859375, 1.323455810546875, 1.3795928955078125, 1.43572998046875, 1.4918670654296875, 1.548004150390625, 1.6041412353515625, 1.6602783203125, 1.7164154052734375, 1.772552490234375, 1.8286895751953125, 1.88482666015625, 1.9409637451171875, 1.997100830078125, 2.0532379150390625, 2.109375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 10.0, 15.0, 41.0, 111.0, 225.0, 287.0, 173.0, 79.0, 37.0, 10.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.0917816162109375, -1.020477294921875, -0.9491729736328125, -0.87786865234375, -0.8065643310546875, -0.735260009765625, -0.6639556884765625, -0.5926513671875, -0.5213470458984375, -0.450042724609375, -0.3787384033203125, -0.30743408203125, -0.2361297607421875, -0.164825439453125, -0.0935211181640625, -0.022216796875, 0.0490875244140625, 0.120391845703125, 0.1916961669921875, 0.26300048828125, 0.3343048095703125, 0.405609130859375, 0.4769134521484375, 0.5482177734375, 0.6195220947265625, 0.690826416015625, 0.7621307373046875, 0.83343505859375, 0.9047393798828125, 0.976043701171875, 1.0473480224609375, 1.11865234375, 1.1899566650390625, 1.261260986328125, 1.3325653076171875, 1.40386962890625, 1.4751739501953125, 1.546478271484375, 1.6177825927734375, 1.6890869140625, 1.7603912353515625, 1.831695556640625, 1.9029998779296875, 1.97430419921875, 2.0456085205078125, 2.116912841796875, 2.1882171630859375, 2.259521484375, 2.3308258056640625, 2.402130126953125, 2.4734344482421875, 2.54473876953125, 2.6160430908203125, 2.687347412109375, 2.7586517333984375, 2.8299560546875, 2.9012603759765625, 2.972564697265625, 3.0438690185546875, 3.11517333984375, 3.1864776611328125, 3.257781982421875, 3.3290863037109375, 3.400390625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 15.0, 36.0, 116.0, 286.0, 285.0, 167.0, 53.0, 26.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.66199493408203, -47.604583740234375, -46.54716873168945, -45.48975372314453, -44.432342529296875, -43.37493133544922, -42.3175163269043, -41.260101318359375, -40.20269012451172, -39.14527893066406, -38.08786392211914, -37.03044891357422, -35.97303771972656, -34.915626525878906, -33.858211517333984, -32.80079650878906, -31.743385314941406, -30.685972213745117, -29.628559112548828, -28.57114601135254, -27.51373291015625, -26.45631980895996, -25.398906707763672, -24.341493606567383, -23.284080505371094, -22.226667404174805, -21.169254302978516, -20.111841201782227, -19.054428100585938, -17.99701499938965, -16.93960189819336, -15.88218879699707, -14.824775695800781, -13.767362594604492, -12.709949493408203, -11.652536392211914, -10.595123291015625, -9.537710189819336, -8.480297088623047, -7.422883987426758, -6.365470886230469, -5.30805778503418, -4.250644683837891, -3.1932315826416016, -2.1358184814453125, -1.0784053802490234, -0.020992279052734375, 1.0364208221435547, 2.0938339233398438, 3.151247024536133, 4.208660125732422, 5.266073226928711, 6.323486328125, 7.380899429321289, 8.438312530517578, 9.495725631713867, 10.553138732910156, 11.610551834106445, 12.667964935302734, 13.725378036499023, 14.782791137695312, 15.840204238891602, 16.89761734008789, 17.95503044128418, 19.01244354248047]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 8.0, 10.0, 11.0, 17.0, 28.0, 15.0, 27.0, 28.0, 34.0, 29.0, 36.0, 55.0, 48.0, 37.0, 52.0, 59.0, 50.0, 60.0, 53.0, 30.0, 47.0, 27.0, 34.0, 29.0, 26.0, 18.0, 19.0, 25.0, 7.0, 16.0, 14.0, 12.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.751487731933594, -11.368470191955566, -10.985453605651855, -10.602436065673828, -10.219419479370117, -9.83640193939209, -9.453385353088379, -9.070367813110352, -8.68735122680664, -8.304333686828613, -7.921317100524902, -7.538300037384033, -7.155282974243164, -6.772265911102295, -6.389248847961426, -6.006231307983398, -5.623214244842529, -5.24019718170166, -4.857180118560791, -4.474163055419922, -4.091145992279053, -3.7081289291381836, -3.3251116275787354, -2.942094564437866, -2.559077501296997, -2.176060438156128, -1.7930433750152588, -1.4100261926651, -1.027009129524231, -0.6439920663833618, -0.2609748840332031, 0.12204217910766602, 0.5050592422485352, 0.8880763053894043, 1.2710933685302734, 1.6541105508804321, 2.0371274948120117, 2.420144557952881, 2.803161859512329, 3.1861789226531982, 3.5691959857940674, 3.9522130489349365, 4.335230350494385, 4.718247413635254, 5.101264476776123, 5.484281539916992, 5.867298603057861, 6.2503156661987305, 6.6333327293396, 7.016349792480469, 7.399366855621338, 7.782383918762207, 8.165401458740234, 8.548418045043945, 8.931435585021973, 9.314452171325684, 9.697469711303711, 10.080487251281738, 10.46350383758545, 10.846521377563477, 11.229537963867188, 11.612555503845215, 11.995572090148926, 12.378589630126953, 12.761606216430664]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 6.0, 14.0, 15.0, 21.0, 29.0, 50.0, 79.0, 110.0, 205.0, 366.0, 757.0, 1668.0, 5640.0, 41848.0, 4115561.0, 21144.0, 3968.0, 1382.0, 583.0, 320.0, 178.0, 113.0, 63.0, 56.0, 31.0, 24.0, 15.0, 7.0, 9.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3984375, -1.341064453125, -1.28369140625, -1.226318359375, -1.1689453125, -1.111572265625, -1.05419921875, -0.996826171875, -0.939453125, -0.882080078125, -0.82470703125, -0.767333984375, -0.7099609375, -0.652587890625, -0.59521484375, -0.537841796875, -0.48046875, -0.423095703125, -0.36572265625, -0.308349609375, -0.2509765625, -0.193603515625, -0.13623046875, -0.078857421875, -0.021484375, 0.035888671875, 0.09326171875, 0.150634765625, 0.2080078125, 0.265380859375, 0.32275390625, 0.380126953125, 0.4375, 0.494873046875, 0.55224609375, 0.609619140625, 0.6669921875, 0.724365234375, 0.78173828125, 0.839111328125, 0.896484375, 0.953857421875, 1.01123046875, 1.068603515625, 1.1259765625, 1.183349609375, 1.24072265625, 1.298095703125, 1.35546875, 1.412841796875, 1.47021484375, 1.527587890625, 1.5849609375, 1.642333984375, 1.69970703125, 1.757080078125, 1.814453125, 1.871826171875, 1.92919921875, 1.986572265625, 2.0439453125, 2.101318359375, 2.15869140625, 2.216064453125, 2.2734375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 7.0, 9.0, 13.0, 7.0, 24.0, 18.0, 28.0, 32.0, 32.0, 42.0, 52.0, 46.0, 62.0, 69.0, 62.0, 59.0, 69.0, 54.0, 47.0, 33.0, 30.0, 30.0, 37.0, 26.0, 26.0, 16.0, 11.0, 5.0, 12.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0], "bins": [-0.7314453125, -0.7130622863769531, -0.6946792602539062, -0.6762962341308594, -0.6579132080078125, -0.6395301818847656, -0.6211471557617188, -0.6027641296386719, -0.584381103515625, -0.5659980773925781, -0.5476150512695312, -0.5292320251464844, -0.5108489990234375, -0.4924659729003906, -0.47408294677734375, -0.4556999206542969, -0.43731689453125, -0.4189338684082031, -0.40055084228515625, -0.3821678161621094, -0.3637847900390625, -0.3454017639160156, -0.32701873779296875, -0.3086357116699219, -0.290252685546875, -0.2718696594238281, -0.25348663330078125, -0.23510360717773438, -0.2167205810546875, -0.19833755493164062, -0.17995452880859375, -0.16157150268554688, -0.1431884765625, -0.12480545043945312, -0.10642242431640625, -0.08803939819335938, -0.0696563720703125, -0.051273345947265625, -0.03289031982421875, -0.014507293701171875, 0.003875732421875, 0.022258758544921875, 0.04064178466796875, 0.059024810791015625, 0.0774078369140625, 0.09579086303710938, 0.11417388916015625, 0.13255691528320312, 0.15093994140625, 0.16932296752929688, 0.18770599365234375, 0.20608901977539062, 0.2244720458984375, 0.24285507202148438, 0.26123809814453125, 0.2796211242675781, 0.298004150390625, 0.3163871765136719, 0.33477020263671875, 0.3531532287597656, 0.3715362548828125, 0.3899192810058594, 0.40830230712890625, 0.4266853332519531, 0.445068359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 6.0, 7.0, 8.0, 15.0, 12.0, 20.0, 29.0, 34.0, 38.0, 65.0, 84.0, 125.0, 170.0, 261.0, 448.0, 709.0, 1284.0, 2527.0, 5580.0, 15515.0, 101414.0, 4015701.0, 33288.0, 9029.0, 3614.0, 1799.0, 994.0, 491.0, 326.0, 192.0, 149.0, 103.0, 65.0, 52.0, 25.0, 30.0, 21.0, 13.0, 17.0, 9.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.158203125, -1.117218017578125, -1.07623291015625, -1.035247802734375, -0.9942626953125, -0.953277587890625, -0.91229248046875, -0.871307373046875, -0.830322265625, -0.789337158203125, -0.74835205078125, -0.707366943359375, -0.6663818359375, -0.625396728515625, -0.58441162109375, -0.543426513671875, -0.50244140625, -0.461456298828125, -0.42047119140625, -0.379486083984375, -0.3385009765625, -0.297515869140625, -0.25653076171875, -0.215545654296875, -0.174560546875, -0.133575439453125, -0.09259033203125, -0.051605224609375, -0.0106201171875, 0.030364990234375, 0.07135009765625, 0.112335205078125, 0.1533203125, 0.194305419921875, 0.23529052734375, 0.276275634765625, 0.3172607421875, 0.358245849609375, 0.39923095703125, 0.440216064453125, 0.481201171875, 0.522186279296875, 0.56317138671875, 0.604156494140625, 0.6451416015625, 0.686126708984375, 0.72711181640625, 0.768096923828125, 0.80908203125, 0.850067138671875, 0.89105224609375, 0.932037353515625, 0.9730224609375, 1.014007568359375, 1.05499267578125, 1.095977783203125, 1.136962890625, 1.177947998046875, 1.21893310546875, 1.259918212890625, 1.3009033203125, 1.341888427734375, 1.38287353515625, 1.423858642578125, 1.46484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 14.0, 8.0, 17.0, 40.0, 106.0, 3574.0, 165.0, 55.0, 28.0, 16.0, 7.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395751953125, -0.3852348327636719, -0.37471771240234375, -0.3642005920410156, -0.3536834716796875, -0.3431663513183594, -0.33264923095703125, -0.3221321105957031, -0.311614990234375, -0.3010978698730469, -0.29058074951171875, -0.2800636291503906, -0.2695465087890625, -0.2590293884277344, -0.24851226806640625, -0.23799514770507812, -0.22747802734375, -0.21696090698242188, -0.20644378662109375, -0.19592666625976562, -0.1854095458984375, -0.17489242553710938, -0.16437530517578125, -0.15385818481445312, -0.143341064453125, -0.13282394409179688, -0.12230682373046875, -0.11178970336914062, -0.1012725830078125, -0.09075546264648438, -0.08023834228515625, -0.06972122192382812, -0.0592041015625, -0.048686981201171875, -0.03816986083984375, -0.027652740478515625, -0.0171356201171875, -0.006618499755859375, 0.00389862060546875, 0.014415740966796875, 0.024932861328125, 0.035449981689453125, 0.04596710205078125, 0.056484222412109375, 0.0670013427734375, 0.07751846313476562, 0.08803558349609375, 0.09855270385742188, 0.10906982421875, 0.11958694458007812, 0.13010406494140625, 0.14062118530273438, 0.1511383056640625, 0.16165542602539062, 0.17217254638671875, 0.18268966674804688, 0.193206787109375, 0.20372390747070312, 0.21424102783203125, 0.22475814819335938, 0.2352752685546875, 0.24579238891601562, 0.25630950927734375, 0.2668266296386719, 0.27734375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 17.0, 49.0, 83.0, 133.0, 177.0, 182.0, 152.0, 108.0, 50.0, 21.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3476784229278564, -1.296535849571228, -1.2453932762145996, -1.1942508220672607, -1.1431082487106323, -1.091965675354004, -1.040823221206665, -0.9896806478500366, -0.9385380744934082, -0.8873955011367798, -0.8362529873847961, -0.7851104736328125, -0.7339679002761841, -0.6828253269195557, -0.631682813167572, -0.5805402994155884, -0.52939772605896, -0.47825518250465393, -0.4271126389503479, -0.37597009539604187, -0.32482755184173584, -0.2736850082874298, -0.22254246473312378, -0.17139992117881775, -0.12025737762451172, -0.06911483407020569, -0.017972290515899658, 0.03317025303840637, 0.0843127965927124, 0.13545534014701843, 0.18659788370132446, 0.2377404272556305, 0.2888830900192261, 0.3400256335735321, 0.39116817712783813, 0.44231072068214417, 0.4934532642364502, 0.5445958375930786, 0.5957383513450623, 0.6468808650970459, 0.6980234384536743, 0.7491660118103027, 0.8003085255622864, 0.85145103931427, 0.9025936126708984, 0.9537361860275269, 1.0048787593841553, 1.0560212135314941, 1.1071637868881226, 1.158306360244751, 1.2094488143920898, 1.2605913877487183, 1.3117339611053467, 1.362876534461975, 1.4140191078186035, 1.4651615619659424, 1.5163041353225708, 1.5674467086791992, 1.618589162826538, 1.6697317361831665, 1.720874309539795, 1.7720168828964233, 1.8231594562530518, 1.8743019104003906, 1.925444483757019]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 12.0, 10.0, 21.0, 26.0, 27.0, 32.0, 22.0, 37.0, 22.0, 48.0, 58.0, 55.0, 52.0, 54.0, 49.0, 65.0, 39.0, 50.0, 39.0, 38.0, 41.0, 41.0, 25.0, 24.0, 24.0, 22.0, 16.0, 11.0, 5.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8112097382545471, -0.7889202833175659, -0.7666308283805847, -0.7443413734436035, -0.7220519781112671, -0.6997625231742859, -0.6774730682373047, -0.6551836133003235, -0.6328941583633423, -0.6106047034263611, -0.5883152484893799, -0.5660258531570435, -0.5437363982200623, -0.521446943283081, -0.49915748834609985, -0.47686803340911865, -0.4545786380767822, -0.432289183139801, -0.4099997580051422, -0.387710303068161, -0.3654208779335022, -0.343131422996521, -0.3208419680595398, -0.2985525131225586, -0.2762630879878998, -0.2539736330509186, -0.23168420791625977, -0.20939475297927856, -0.18710531294345856, -0.16481587290763855, -0.14252641797065735, -0.12023697793483734, -0.09794747829437256, -0.07565803825855255, -0.05336859077215195, -0.031079143285751343, -0.008789703249931335, 0.013499736785888672, 0.03578919172286987, 0.05807863175868988, 0.08036807179450989, 0.1026575118303299, 0.1249469593167305, 0.1472364068031311, 0.1695258468389511, 0.19181528687477112, 0.21410474181175232, 0.23639418184757233, 0.25868362188339233, 0.28097307682037354, 0.30326250195503235, 0.32555195689201355, 0.34784138202667236, 0.37013083696365356, 0.39242029190063477, 0.41470974683761597, 0.4369991719722748, 0.459288626909256, 0.4815780520439148, 0.503867506980896, 0.5261569619178772, 0.5484464168548584, 0.5707358121871948, 0.593025267124176, 0.6153147220611572]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 9.0, 7.0, 15.0, 16.0, 29.0, 22.0, 40.0, 63.0, 107.0, 138.0, 209.0, 292.0, 558.0, 947.0, 1573.0, 2800.0, 5037.0, 9575.0, 19173.0, 40986.0, 90164.0, 199665.0, 304360.0, 199790.0, 90982.0, 41049.0, 19463.0, 9636.0, 5102.0, 2715.0, 1557.0, 919.0, 555.0, 352.0, 209.0, 149.0, 83.0, 59.0, 54.0, 34.0, 18.0, 11.0, 8.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.677734375, -0.6547622680664062, -0.6317901611328125, -0.6088180541992188, -0.585845947265625, -0.5628738403320312, -0.5399017333984375, -0.5169296264648438, -0.49395751953125, -0.47098541259765625, -0.4480133056640625, -0.42504119873046875, -0.402069091796875, -0.37909698486328125, -0.3561248779296875, -0.33315277099609375, -0.3101806640625, -0.28720855712890625, -0.2642364501953125, -0.24126434326171875, -0.218292236328125, -0.19532012939453125, -0.1723480224609375, -0.14937591552734375, -0.12640380859375, -0.10343170166015625, -0.0804595947265625, -0.05748748779296875, -0.034515380859375, -0.01154327392578125, 0.0114288330078125, 0.03440093994140625, 0.057373046875, 0.08034515380859375, 0.1033172607421875, 0.12628936767578125, 0.149261474609375, 0.17223358154296875, 0.1952056884765625, 0.21817779541015625, 0.24114990234375, 0.26412200927734375, 0.2870941162109375, 0.31006622314453125, 0.333038330078125, 0.35601043701171875, 0.3789825439453125, 0.40195465087890625, 0.4249267578125, 0.44789886474609375, 0.4708709716796875, 0.49384307861328125, 0.516815185546875, 0.5397872924804688, 0.5627593994140625, 0.5857315063476562, 0.60870361328125, 0.6316757202148438, 0.6546478271484375, 0.6776199340820312, 0.700592041015625, 0.7235641479492188, 0.7465362548828125, 0.7695083618164062, 0.79248046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 5.0, 8.0, 11.0, 14.0, 19.0, 25.0, 27.0, 29.0, 38.0, 40.0, 37.0, 48.0, 62.0, 59.0, 60.0, 63.0, 72.0, 56.0, 46.0, 40.0, 32.0, 39.0, 31.0, 20.0, 31.0, 14.0, 13.0, 10.0, 8.0, 6.0, 8.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.7197265625, -0.7012672424316406, -0.6828079223632812, -0.6643486022949219, -0.6458892822265625, -0.6274299621582031, -0.6089706420898438, -0.5905113220214844, -0.572052001953125, -0.5535926818847656, -0.5351333618164062, -0.5166740417480469, -0.4982147216796875, -0.4797554016113281, -0.46129608154296875, -0.4428367614746094, -0.42437744140625, -0.4059181213378906, -0.38745880126953125, -0.3689994812011719, -0.3505401611328125, -0.3320808410644531, -0.31362152099609375, -0.2951622009277344, -0.276702880859375, -0.2582435607910156, -0.23978424072265625, -0.22132492065429688, -0.2028656005859375, -0.18440628051757812, -0.16594696044921875, -0.14748764038085938, -0.1290283203125, -0.11056900024414062, -0.09210968017578125, -0.07365036010742188, -0.0551910400390625, -0.036731719970703125, -0.01827239990234375, 0.000186920166015625, 0.018646240234375, 0.037105560302734375, 0.05556488037109375, 0.07402420043945312, 0.0924835205078125, 0.11094284057617188, 0.12940216064453125, 0.14786148071289062, 0.16632080078125, 0.18478012084960938, 0.20323944091796875, 0.22169876098632812, 0.2401580810546875, 0.2586174011230469, 0.27707672119140625, 0.2955360412597656, 0.313995361328125, 0.3324546813964844, 0.35091400146484375, 0.3693733215332031, 0.3878326416015625, 0.4062919616699219, 0.42475128173828125, 0.4432106018066406, 0.461669921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 6.0, 10.0, 13.0, 16.0, 16.0, 27.0, 36.0, 42.0, 66.0, 107.0, 128.0, 156.0, 245.0, 298.0, 437.0, 799.0, 1614.0, 5027.0, 25102.0, 188968.0, 663299.0, 135657.0, 18798.0, 4107.0, 1379.0, 688.0, 426.0, 269.0, 219.0, 164.0, 126.0, 74.0, 50.0, 46.0, 42.0, 24.0, 28.0, 17.0, 9.0, 7.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.798309326171875, -1.73919677734375, -1.680084228515625, -1.6209716796875, -1.561859130859375, -1.50274658203125, -1.443634033203125, -1.384521484375, -1.325408935546875, -1.26629638671875, -1.207183837890625, -1.1480712890625, -1.088958740234375, -1.02984619140625, -0.970733642578125, -0.91162109375, -0.852508544921875, -0.79339599609375, -0.734283447265625, -0.6751708984375, -0.616058349609375, -0.55694580078125, -0.497833251953125, -0.438720703125, -0.379608154296875, -0.32049560546875, -0.261383056640625, -0.2022705078125, -0.143157958984375, -0.08404541015625, -0.024932861328125, 0.0341796875, 0.093292236328125, 0.15240478515625, 0.211517333984375, 0.2706298828125, 0.329742431640625, 0.38885498046875, 0.447967529296875, 0.507080078125, 0.566192626953125, 0.62530517578125, 0.684417724609375, 0.7435302734375, 0.802642822265625, 0.86175537109375, 0.920867919921875, 0.97998046875, 1.039093017578125, 1.09820556640625, 1.157318115234375, 1.2164306640625, 1.275543212890625, 1.33465576171875, 1.393768310546875, 1.452880859375, 1.511993408203125, 1.57110595703125, 1.630218505859375, 1.6893310546875, 1.748443603515625, 1.80755615234375, 1.866668701171875, 1.92578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 0.0, 1.0, 9.0, 9.0, 4.0, 8.0, 12.0, 12.0, 9.0, 16.0, 18.0, 22.0, 19.0, 26.0, 17.0, 37.0, 38.0, 32.0, 45.0, 35.0, 28.0, 31.0, 41.0, 34.0, 24.0, 42.0, 36.0, 26.0, 46.0, 32.0, 34.0, 27.0, 20.0, 22.0, 21.0, 32.0, 26.0, 17.0, 16.0, 13.0, 6.0, 20.0, 6.0, 7.0, 5.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.0390625, -1.9803009033203125, -1.921539306640625, -1.8627777099609375, -1.80401611328125, -1.7452545166015625, -1.686492919921875, -1.6277313232421875, -1.5689697265625, -1.5102081298828125, -1.451446533203125, -1.3926849365234375, -1.33392333984375, -1.2751617431640625, -1.216400146484375, -1.1576385498046875, -1.098876953125, -1.0401153564453125, -0.981353759765625, -0.9225921630859375, -0.86383056640625, -0.8050689697265625, -0.746307373046875, -0.6875457763671875, -0.6287841796875, -0.5700225830078125, -0.511260986328125, -0.4524993896484375, -0.39373779296875, -0.3349761962890625, -0.276214599609375, -0.2174530029296875, -0.15869140625, -0.0999298095703125, -0.041168212890625, 0.0175933837890625, 0.07635498046875, 0.1351165771484375, 0.193878173828125, 0.2526397705078125, 0.3114013671875, 0.3701629638671875, 0.428924560546875, 0.4876861572265625, 0.54644775390625, 0.6052093505859375, 0.663970947265625, 0.7227325439453125, 0.781494140625, 0.8402557373046875, 0.899017333984375, 0.9577789306640625, 1.01654052734375, 1.0753021240234375, 1.134063720703125, 1.1928253173828125, 1.2515869140625, 1.3103485107421875, 1.369110107421875, 1.4278717041015625, 1.48663330078125, 1.5453948974609375, 1.604156494140625, 1.6629180908203125, 1.7216796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 12.0, 19.0, 39.0, 74.0, 207.0, 672.0, 3949.0, 348695.0, 688651.0, 5040.0, 773.0, 219.0, 88.0, 45.0, 24.0, 10.0, 8.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.86328125, -2.7917938232421875, -2.720306396484375, -2.6488189697265625, -2.57733154296875, -2.5058441162109375, -2.434356689453125, -2.3628692626953125, -2.2913818359375, -2.2198944091796875, -2.148406982421875, -2.0769195556640625, -2.00543212890625, -1.9339447021484375, -1.862457275390625, -1.7909698486328125, -1.719482421875, -1.6479949951171875, -1.576507568359375, -1.5050201416015625, -1.43353271484375, -1.3620452880859375, -1.290557861328125, -1.2190704345703125, -1.1475830078125, -1.0760955810546875, -1.004608154296875, -0.9331207275390625, -0.86163330078125, -0.7901458740234375, -0.718658447265625, -0.6471710205078125, -0.57568359375, -0.5041961669921875, -0.432708740234375, -0.3612213134765625, -0.28973388671875, -0.2182464599609375, -0.146759033203125, -0.0752716064453125, -0.0037841796875, 0.0677032470703125, 0.139190673828125, 0.2106781005859375, 0.28216552734375, 0.3536529541015625, 0.425140380859375, 0.4966278076171875, 0.568115234375, 0.6396026611328125, 0.711090087890625, 0.7825775146484375, 0.85406494140625, 0.9255523681640625, 0.997039794921875, 1.0685272216796875, 1.1400146484375, 1.2115020751953125, 1.282989501953125, 1.3544769287109375, 1.42596435546875, 1.4974517822265625, 1.568939208984375, 1.6404266357421875, 1.7119140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 13.0, 19.0, 19.0, 33.0, 57.0, 81.0, 89.0, 126.0, 141.0, 101.0, 78.0, 64.0, 53.0, 39.0, 27.0, 18.0, 7.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.33272933959961e-05, -7.992424070835114e-05, -7.652118802070618e-05, -7.311813533306122e-05, -6.971508264541626e-05, -6.63120299577713e-05, -6.290897727012634e-05, -5.9505924582481384e-05, -5.6102871894836426e-05, -5.269981920719147e-05, -4.929676651954651e-05, -4.589371383190155e-05, -4.249066114425659e-05, -3.908760845661163e-05, -3.5684555768966675e-05, -3.2281503081321716e-05, -2.8878450393676758e-05, -2.54753977060318e-05, -2.207234501838684e-05, -1.8669292330741882e-05, -1.5266239643096924e-05, -1.1863186955451965e-05, -8.460134267807007e-06, -5.057081580162048e-06, -1.6540288925170898e-06, 1.7490237951278687e-06, 5.152076482772827e-06, 8.555129170417786e-06, 1.1958181858062744e-05, 1.5361234545707703e-05, 1.876428723335266e-05, 2.216733992099762e-05, 2.5570392608642578e-05, 2.8973445296287537e-05, 3.2376497983932495e-05, 3.5779550671577454e-05, 3.918260335922241e-05, 4.258565604686737e-05, 4.598870873451233e-05, 4.939176142215729e-05, 5.2794814109802246e-05, 5.6197866797447205e-05, 5.960091948509216e-05, 6.300397217273712e-05, 6.640702486038208e-05, 6.981007754802704e-05, 7.3213130235672e-05, 7.661618292331696e-05, 8.001923561096191e-05, 8.342228829860687e-05, 8.682534098625183e-05, 9.022839367389679e-05, 9.363144636154175e-05, 9.70344990491867e-05, 0.00010043755173683167, 0.00010384060442447662, 0.00010724365711212158, 0.00011064670979976654, 0.0001140497624874115, 0.00011745281517505646, 0.00012085586786270142, 0.00012425892055034637, 0.00012766197323799133, 0.0001310650259256363, 0.00013446807861328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 0.0, 3.0, 7.0, 6.0, 6.0, 10.0, 5.0, 13.0, 14.0, 15.0, 28.0, 39.0, 51.0, 71.0, 109.0, 247.0, 583.0, 1464.0, 4884.0, 38880.0, 886479.0, 104539.0, 7623.0, 2007.0, 687.0, 301.0, 173.0, 90.0, 59.0, 39.0, 32.0, 22.0, 17.0, 14.0, 5.0, 4.0, 4.0, 5.0, 4.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.197265625, -1.1581878662109375, -1.119110107421875, -1.0800323486328125, -1.04095458984375, -1.0018768310546875, -0.962799072265625, -0.9237213134765625, -0.8846435546875, -0.8455657958984375, -0.806488037109375, -0.7674102783203125, -0.72833251953125, -0.6892547607421875, -0.650177001953125, -0.6110992431640625, -0.572021484375, -0.5329437255859375, -0.493865966796875, -0.4547882080078125, -0.41571044921875, -0.3766326904296875, -0.337554931640625, -0.2984771728515625, -0.2593994140625, -0.2203216552734375, -0.181243896484375, -0.1421661376953125, -0.10308837890625, -0.0640106201171875, -0.024932861328125, 0.0141448974609375, 0.05322265625, 0.0923004150390625, 0.131378173828125, 0.1704559326171875, 0.20953369140625, 0.2486114501953125, 0.287689208984375, 0.3267669677734375, 0.3658447265625, 0.4049224853515625, 0.444000244140625, 0.4830780029296875, 0.52215576171875, 0.5612335205078125, 0.600311279296875, 0.6393890380859375, 0.678466796875, 0.7175445556640625, 0.756622314453125, 0.7957000732421875, 0.83477783203125, 0.8738555908203125, 0.912933349609375, 0.9520111083984375, 0.9910888671875, 1.0301666259765625, 1.069244384765625, 1.1083221435546875, 1.14739990234375, 1.1864776611328125, 1.225555419921875, 1.2646331787109375, 1.3037109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 17.0, 25.0, 41.0, 86.0, 127.0, 188.0, 186.0, 130.0, 97.0, 52.0, 10.0, 9.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4072265625, -1.3589324951171875, -1.310638427734375, -1.2623443603515625, -1.21405029296875, -1.1657562255859375, -1.117462158203125, -1.0691680908203125, -1.0208740234375, -0.9725799560546875, -0.924285888671875, -0.8759918212890625, -0.82769775390625, -0.7794036865234375, -0.731109619140625, -0.6828155517578125, -0.634521484375, -0.5862274169921875, -0.537933349609375, -0.4896392822265625, -0.44134521484375, -0.3930511474609375, -0.344757080078125, -0.2964630126953125, -0.2481689453125, -0.1998748779296875, -0.151580810546875, -0.1032867431640625, -0.05499267578125, -0.0066986083984375, 0.041595458984375, 0.0898895263671875, 0.13818359375, 0.1864776611328125, 0.234771728515625, 0.2830657958984375, 0.33135986328125, 0.3796539306640625, 0.427947998046875, 0.4762420654296875, 0.5245361328125, 0.5728302001953125, 0.621124267578125, 0.6694183349609375, 0.71771240234375, 0.7660064697265625, 0.814300537109375, 0.8625946044921875, 0.910888671875, 0.9591827392578125, 1.007476806640625, 1.0557708740234375, 1.10406494140625, 1.1523590087890625, 1.200653076171875, 1.2489471435546875, 1.2972412109375, 1.3455352783203125, 1.393829345703125, 1.4421234130859375, 1.49041748046875, 1.5387115478515625, 1.587005615234375, 1.6352996826171875, 1.68359375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 11.0, 12.0, 21.0, 63.0, 93.0, 155.0, 187.0, 189.0, 134.0, 71.0, 26.0, 17.0, 11.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.43998146057129, -24.940895080566406, -24.44180679321289, -23.942720413208008, -23.443632125854492, -22.94454574584961, -22.445459365844727, -21.94637107849121, -21.447284698486328, -20.948198318481445, -20.44911003112793, -19.950023651123047, -19.45093536376953, -18.95184898376465, -18.452762603759766, -17.95367431640625, -17.454587936401367, -16.955501556396484, -16.45641326904297, -15.957326889038086, -15.458239555358887, -14.959152221679688, -14.460064888000488, -13.960977554321289, -13.46189022064209, -12.96280288696289, -12.463715553283691, -11.964629173278809, -11.46554183959961, -10.96645450592041, -10.467367172241211, -9.968280792236328, -9.469193458557129, -8.97010612487793, -8.47101879119873, -7.9719319343566895, -7.472845077514648, -6.973757743835449, -6.47467041015625, -5.975583553314209, -5.476496696472168, -4.977409362792969, -4.478322505950928, -3.9792351722717285, -3.4801483154296875, -2.9810609817504883, -2.481973886489868, -1.982886791229248, -1.4837994575500488, -0.9847123622894287, -0.4856252074241638, 0.013461947441101074, 0.5125490427017212, 1.0116362571716309, 1.510723352432251, 2.009810447692871, 2.508897542953491, 3.0079846382141113, 3.5070717334747314, 4.006158828735352, 4.505246162414551, 5.00433349609375, 5.503420352935791, 6.002507209777832, 6.501594543457031]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 10.0, 8.0, 9.0, 8.0, 15.0, 17.0, 23.0, 25.0, 24.0, 30.0, 40.0, 36.0, 30.0, 36.0, 53.0, 54.0, 54.0, 54.0, 35.0, 56.0, 46.0, 39.0, 37.0, 41.0, 28.0, 24.0, 19.0, 22.0, 23.0, 10.0, 24.0, 7.0, 12.0, 5.0, 10.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-10.5196533203125, -10.20052719116211, -9.881400108337402, -9.562273979187012, -9.243146896362305, -8.924020767211914, -8.604894638061523, -8.285768508911133, -7.966641426086426, -7.647514820098877, -7.328388214111328, -7.0092620849609375, -6.690135478973389, -6.37100887298584, -6.051882743835449, -5.7327561378479, -5.413629531860352, -5.094502925872803, -4.775376319885254, -4.456250190734863, -4.1371235847473145, -3.8179969787597656, -3.498870611190796, -3.179744243621826, -2.8606176376342773, -2.5414910316467285, -2.222364664077759, -1.9032381772994995, -1.5841116905212402, -1.264985203742981, -0.9458587169647217, -0.626732349395752, -0.3076057434082031, 0.011520743370056152, 0.33064723014831543, 0.6497737169265747, 0.968900203704834, 1.2880266904830933, 1.6071531772613525, 1.9262795448303223, 2.245406150817871, 2.56453275680542, 2.8836591243743896, 3.2027854919433594, 3.521912097930908, 3.841038703918457, 4.160164833068848, 4.4792914390563965, 4.798418045043945, 5.117544651031494, 5.436671257019043, 5.755797386169434, 6.074923992156982, 6.394050598144531, 6.713176727294922, 7.032303333282471, 7.3514299392700195, 7.670556545257568, 7.989683151245117, 8.308809280395508, 8.627935409545898, 8.947062492370605, 9.266188621520996, 9.585315704345703, 9.904441833496094]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 7.0, 8.0, 10.0, 12.0, 19.0, 15.0, 38.0, 48.0, 65.0, 96.0, 141.0, 213.0, 407.0, 712.0, 1368.0, 2977.0, 7335.0, 23751.0, 178255.0, 3903273.0, 53792.0, 12604.0, 4715.0, 1986.0, 981.0, 523.0, 315.0, 187.0, 123.0, 82.0, 46.0, 47.0, 25.0, 20.0, 20.0, 18.0, 5.0, 9.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85400390625, -0.825775146484375, -0.79754638671875, -0.769317626953125, -0.7410888671875, -0.712860107421875, -0.68463134765625, -0.656402587890625, -0.628173828125, -0.599945068359375, -0.57171630859375, -0.543487548828125, -0.5152587890625, -0.487030029296875, -0.45880126953125, -0.430572509765625, -0.40234375, -0.374114990234375, -0.34588623046875, -0.317657470703125, -0.2894287109375, -0.261199951171875, -0.23297119140625, -0.204742431640625, -0.176513671875, -0.148284912109375, -0.12005615234375, -0.091827392578125, -0.0635986328125, -0.035369873046875, -0.00714111328125, 0.021087646484375, 0.04931640625, 0.077545166015625, 0.10577392578125, 0.134002685546875, 0.1622314453125, 0.190460205078125, 0.21868896484375, 0.246917724609375, 0.275146484375, 0.303375244140625, 0.33160400390625, 0.359832763671875, 0.3880615234375, 0.416290283203125, 0.44451904296875, 0.472747802734375, 0.5009765625, 0.529205322265625, 0.55743408203125, 0.585662841796875, 0.6138916015625, 0.642120361328125, 0.67034912109375, 0.698577880859375, 0.726806640625, 0.755035400390625, 0.78326416015625, 0.811492919921875, 0.8397216796875, 0.867950439453125, 0.89617919921875, 0.924407958984375, 0.95263671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 11.0, 12.0, 14.0, 22.0, 31.0, 48.0, 47.0, 57.0, 81.0, 96.0, 100.0, 104.0, 81.0, 64.0, 52.0, 43.0, 45.0, 34.0, 15.0, 13.0, 14.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.673583984375, -0.6474609375, -0.621337890625, -0.59521484375, -0.569091796875, -0.54296875, -0.516845703125, -0.49072265625, -0.464599609375, -0.4384765625, -0.412353515625, -0.38623046875, -0.360107421875, -0.333984375, -0.307861328125, -0.28173828125, -0.255615234375, -0.2294921875, -0.203369140625, -0.17724609375, -0.151123046875, -0.125, -0.098876953125, -0.07275390625, -0.046630859375, -0.0205078125, 0.005615234375, 0.03173828125, 0.057861328125, 0.083984375, 0.110107421875, 0.13623046875, 0.162353515625, 0.1884765625, 0.214599609375, 0.24072265625, 0.266845703125, 0.29296875, 0.319091796875, 0.34521484375, 0.371337890625, 0.3974609375, 0.423583984375, 0.44970703125, 0.475830078125, 0.501953125, 0.528076171875, 0.55419921875, 0.580322265625, 0.6064453125, 0.632568359375, 0.65869140625, 0.684814453125, 0.7109375, 0.737060546875, 0.76318359375, 0.789306640625, 0.8154296875, 0.841552734375, 0.86767578125, 0.893798828125, 0.919921875, 0.946044921875, 0.97216796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 6.0, 6.0, 12.0, 17.0, 19.0, 15.0, 30.0, 27.0, 45.0, 71.0, 94.0, 123.0, 160.0, 231.0, 434.0, 876.0, 2038.0, 5577.0, 22464.0, 244949.0, 3861036.0, 42030.0, 8464.0, 2843.0, 1133.0, 563.0, 302.0, 188.0, 134.0, 84.0, 73.0, 47.0, 46.0, 31.0, 26.0, 18.0, 13.0, 10.0, 17.0, 6.0, 3.0, 1.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.1354827880859375, -1.095184326171875, -1.0548858642578125, -1.01458740234375, -0.9742889404296875, -0.933990478515625, -0.8936920166015625, -0.8533935546875, -0.8130950927734375, -0.772796630859375, -0.7324981689453125, -0.69219970703125, -0.6519012451171875, -0.611602783203125, -0.5713043212890625, -0.531005859375, -0.4907073974609375, -0.450408935546875, -0.4101104736328125, -0.36981201171875, -0.3295135498046875, -0.289215087890625, -0.2489166259765625, -0.2086181640625, -0.1683197021484375, -0.128021240234375, -0.0877227783203125, -0.04742431640625, -0.0071258544921875, 0.033172607421875, 0.0734710693359375, 0.11376953125, 0.1540679931640625, 0.194366455078125, 0.2346649169921875, 0.27496337890625, 0.3152618408203125, 0.355560302734375, 0.3958587646484375, 0.4361572265625, 0.4764556884765625, 0.516754150390625, 0.5570526123046875, 0.59735107421875, 0.6376495361328125, 0.677947998046875, 0.7182464599609375, 0.758544921875, 0.7988433837890625, 0.839141845703125, 0.8794403076171875, 0.91973876953125, 0.9600372314453125, 1.000335693359375, 1.0406341552734375, 1.0809326171875, 1.1212310791015625, 1.161529541015625, 1.2018280029296875, 1.24212646484375, 1.2824249267578125, 1.322723388671875, 1.3630218505859375, 1.4033203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 6.0, 13.0, 13.0, 27.0, 71.0, 166.0, 3389.0, 251.0, 81.0, 27.0, 16.0, 10.0, 4.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7902297973632812, -0.7625885009765625, -0.7349472045898438, -0.707305908203125, -0.6796646118164062, -0.6520233154296875, -0.6243820190429688, -0.59674072265625, -0.5690994262695312, -0.5414581298828125, -0.5138168334960938, -0.486175537109375, -0.45853424072265625, -0.4308929443359375, -0.40325164794921875, -0.3756103515625, -0.34796905517578125, -0.3203277587890625, -0.29268646240234375, -0.265045166015625, -0.23740386962890625, -0.2097625732421875, -0.18212127685546875, -0.15447998046875, -0.12683868408203125, -0.0991973876953125, -0.07155609130859375, -0.043914794921875, -0.01627349853515625, 0.0113677978515625, 0.03900909423828125, 0.066650390625, 0.09429168701171875, 0.1219329833984375, 0.14957427978515625, 0.177215576171875, 0.20485687255859375, 0.2324981689453125, 0.26013946533203125, 0.28778076171875, 0.31542205810546875, 0.3430633544921875, 0.37070465087890625, 0.398345947265625, 0.42598724365234375, 0.4536285400390625, 0.48126983642578125, 0.5089111328125, 0.5365524291992188, 0.5641937255859375, 0.5918350219726562, 0.619476318359375, 0.6471176147460938, 0.6747589111328125, 0.7024002075195312, 0.73004150390625, 0.7576828002929688, 0.7853240966796875, 0.8129653930664062, 0.840606689453125, 0.8682479858398438, 0.8958892822265625, 0.9235305786132812, 0.951171875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 11.0, 9.0, 20.0, 32.0, 60.0, 100.0, 161.0, 160.0, 159.0, 103.0, 82.0, 44.0, 22.0, 14.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623303174972534, -2.545696258544922, -2.4680893421173096, -2.390482187271118, -2.312875270843506, -2.2352683544158936, -2.1576614379882812, -2.080054521560669, -2.0024476051330566, -1.9248406887054443, -1.8472336530685425, -1.7696267366409302, -1.6920197010040283, -1.614412784576416, -1.5368058681488037, -1.4591989517211914, -1.381591796875, -1.3039848804473877, -1.2263778448104858, -1.1487709283828735, -1.0711638927459717, -0.9935569763183594, -0.9159500598907471, -0.83834308385849, -0.7607361078262329, -0.6831291317939758, -0.6055221557617188, -0.5279152393341064, -0.45030826330184937, -0.3727012872695923, -0.2950943410396576, -0.2174873948097229, -0.13988041877746582, -0.062273457646369934, 0.015333503484725952, 0.09294046461582184, 0.17054742574691772, 0.2481544017791748, 0.3257613480091095, 0.4033682942390442, 0.48097527027130127, 0.5585822463035583, 0.6361892223358154, 0.7137961387634277, 0.7914031147956848, 0.8690100908279419, 0.9466170072555542, 1.024224042892456, 1.1018309593200684, 1.1794378757476807, 1.2570449113845825, 1.3346518278121948, 1.4122588634490967, 1.489865779876709, 1.5674726963043213, 1.6450796127319336, 1.7226866483688354, 1.8002935647964478, 1.8779006004333496, 1.955507516860962, 2.033114433288574, 2.1107215881347656, 2.188328504562378, 2.2659354209899902, 2.3435423374176025]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 8.0, 6.0, 11.0, 11.0, 6.0, 7.0, 16.0, 14.0, 14.0, 19.0, 9.0, 20.0, 18.0, 18.0, 28.0, 41.0, 31.0, 32.0, 34.0, 51.0, 47.0, 40.0, 32.0, 37.0, 28.0, 37.0, 33.0, 49.0, 29.0, 24.0, 24.0, 31.0, 23.0, 21.0, 21.0, 24.0, 20.0, 8.0, 13.0, 10.0, 11.0, 9.0, 6.0, 2.0, 5.0, 3.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.9943637251853943, -0.9639459848403931, -0.9335281848907471, -0.9031103849411011, -0.8726926445960999, -0.8422749042510986, -0.8118571043014526, -0.7814393043518066, -0.7510215640068054, -0.7206038236618042, -0.6901860237121582, -0.6597682237625122, -0.629350483417511, -0.5989327430725098, -0.5685149431228638, -0.5380971431732178, -0.5076794028282166, -0.47726163268089294, -0.44684386253356934, -0.4164260923862457, -0.3860083222389221, -0.3555905520915985, -0.3251727819442749, -0.2947550117969513, -0.2643372416496277, -0.23391947150230408, -0.20350170135498047, -0.17308393120765686, -0.14266616106033325, -0.11224839091300964, -0.08183062076568604, -0.05141285061836243, -0.020995140075683594, 0.009422630071640015, 0.03984040021896362, 0.07025817036628723, 0.10067594051361084, 0.13109371066093445, 0.16151148080825806, 0.19192925095558167, 0.22234702110290527, 0.2527647912502289, 0.2831825613975525, 0.3136003315448761, 0.3440181016921997, 0.3744358718395233, 0.4048536419868469, 0.43527141213417053, 0.46568918228149414, 0.49610695242881775, 0.5265247225761414, 0.5569424629211426, 0.5873602628707886, 0.6177780628204346, 0.6481958031654358, 0.678613543510437, 0.709031343460083, 0.739449143409729, 0.7698668837547302, 0.8002846240997314, 0.8307024240493774, 0.8611202239990234, 0.8915379643440247, 0.9219557046890259, 0.9523735046386719]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 9.0, 6.0, 9.0, 29.0, 17.0, 37.0, 63.0, 111.0, 147.0, 322.0, 582.0, 1233.0, 2850.0, 8828.0, 36461.0, 214402.0, 582502.0, 160400.0, 28433.0, 7297.0, 2473.0, 1080.0, 520.0, 281.0, 158.0, 104.0, 60.0, 34.0, 19.0, 13.0, 17.0, 11.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.6416015625, -1.5924835205078125, -1.543365478515625, -1.4942474365234375, -1.44512939453125, -1.3960113525390625, -1.346893310546875, -1.2977752685546875, -1.2486572265625, -1.1995391845703125, -1.150421142578125, -1.1013031005859375, -1.05218505859375, -1.0030670166015625, -0.953948974609375, -0.9048309326171875, -0.855712890625, -0.8065948486328125, -0.757476806640625, -0.7083587646484375, -0.65924072265625, -0.6101226806640625, -0.561004638671875, -0.5118865966796875, -0.4627685546875, -0.4136505126953125, -0.364532470703125, -0.3154144287109375, -0.26629638671875, -0.2171783447265625, -0.168060302734375, -0.1189422607421875, -0.06982421875, -0.0207061767578125, 0.028411865234375, 0.0775299072265625, 0.12664794921875, 0.1757659912109375, 0.224884033203125, 0.2740020751953125, 0.3231201171875, 0.3722381591796875, 0.421356201171875, 0.4704742431640625, 0.51959228515625, 0.5687103271484375, 0.617828369140625, 0.6669464111328125, 0.716064453125, 0.7651824951171875, 0.814300537109375, 0.8634185791015625, 0.91253662109375, 0.9616546630859375, 1.010772705078125, 1.0598907470703125, 1.1090087890625, 1.1581268310546875, 1.207244873046875, 1.2563629150390625, 1.30548095703125, 1.3545989990234375, 1.403717041015625, 1.4528350830078125, 1.501953125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 9.0, 11.0, 14.0, 18.0, 25.0, 35.0, 52.0, 60.0, 63.0, 85.0, 89.0, 92.0, 77.0, 94.0, 56.0, 49.0, 49.0, 42.0, 22.0, 22.0, 9.0, 8.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6497344970703125, -0.624176025390625, -0.5986175537109375, -0.57305908203125, -0.5475006103515625, -0.521942138671875, -0.4963836669921875, -0.4708251953125, -0.4452667236328125, -0.419708251953125, -0.3941497802734375, -0.36859130859375, -0.3430328369140625, -0.317474365234375, -0.2919158935546875, -0.266357421875, -0.2407989501953125, -0.215240478515625, -0.1896820068359375, -0.16412353515625, -0.1385650634765625, -0.113006591796875, -0.0874481201171875, -0.0618896484375, -0.0363311767578125, -0.010772705078125, 0.0147857666015625, 0.04034423828125, 0.0659027099609375, 0.091461181640625, 0.1170196533203125, 0.142578125, 0.1681365966796875, 0.193695068359375, 0.2192535400390625, 0.24481201171875, 0.2703704833984375, 0.295928955078125, 0.3214874267578125, 0.3470458984375, 0.3726043701171875, 0.398162841796875, 0.4237213134765625, 0.44927978515625, 0.4748382568359375, 0.500396728515625, 0.5259552001953125, 0.551513671875, 0.5770721435546875, 0.602630615234375, 0.6281890869140625, 0.65374755859375, 0.6793060302734375, 0.704864501953125, 0.7304229736328125, 0.7559814453125, 0.7815399169921875, 0.807098388671875, 0.8326568603515625, 0.85821533203125, 0.8837738037109375, 0.909332275390625, 0.9348907470703125, 0.96044921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 4.0, 12.0, 13.0, 8.0, 22.0, 31.0, 41.0, 37.0, 48.0, 111.0, 152.0, 220.0, 395.0, 768.0, 1806.0, 5749.0, 28573.0, 292724.0, 635094.0, 67610.0, 9957.0, 2708.0, 1105.0, 517.0, 311.0, 154.0, 101.0, 69.0, 61.0, 33.0, 32.0, 23.0, 14.0, 18.0, 9.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.968170166015625, -1.90509033203125, -1.842010498046875, -1.7789306640625, -1.715850830078125, -1.65277099609375, -1.589691162109375, -1.526611328125, -1.463531494140625, -1.40045166015625, -1.337371826171875, -1.2742919921875, -1.211212158203125, -1.14813232421875, -1.085052490234375, -1.02197265625, -0.958892822265625, -0.89581298828125, -0.832733154296875, -0.7696533203125, -0.706573486328125, -0.64349365234375, -0.580413818359375, -0.517333984375, -0.454254150390625, -0.39117431640625, -0.328094482421875, -0.2650146484375, -0.201934814453125, -0.13885498046875, -0.075775146484375, -0.0126953125, 0.050384521484375, 0.11346435546875, 0.176544189453125, 0.2396240234375, 0.302703857421875, 0.36578369140625, 0.428863525390625, 0.491943359375, 0.555023193359375, 0.61810302734375, 0.681182861328125, 0.7442626953125, 0.807342529296875, 0.87042236328125, 0.933502197265625, 0.99658203125, 1.059661865234375, 1.12274169921875, 1.185821533203125, 1.2489013671875, 1.311981201171875, 1.37506103515625, 1.438140869140625, 1.501220703125, 1.564300537109375, 1.62738037109375, 1.690460205078125, 1.7535400390625, 1.816619873046875, 1.87969970703125, 1.942779541015625, 2.005859375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 11.0, 10.0, 15.0, 15.0, 13.0, 28.0, 28.0, 30.0, 36.0, 44.0, 41.0, 41.0, 59.0, 61.0, 57.0, 49.0, 56.0, 56.0, 44.0, 57.0, 50.0, 37.0, 37.0, 22.0, 22.0, 21.0, 16.0, 12.0, 1.0, 5.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.391998291015625, -2.31915283203125, -2.246307373046875, -2.1734619140625, -2.100616455078125, -2.02777099609375, -1.954925537109375, -1.882080078125, -1.809234619140625, -1.73638916015625, -1.663543701171875, -1.5906982421875, -1.517852783203125, -1.44500732421875, -1.372161865234375, -1.29931640625, -1.226470947265625, -1.15362548828125, -1.080780029296875, -1.0079345703125, -0.935089111328125, -0.86224365234375, -0.789398193359375, -0.716552734375, -0.643707275390625, -0.57086181640625, -0.498016357421875, -0.4251708984375, -0.352325439453125, -0.27947998046875, -0.206634521484375, -0.1337890625, -0.060943603515625, 0.01190185546875, 0.084747314453125, 0.1575927734375, 0.230438232421875, 0.30328369140625, 0.376129150390625, 0.448974609375, 0.521820068359375, 0.59466552734375, 0.667510986328125, 0.7403564453125, 0.813201904296875, 0.88604736328125, 0.958892822265625, 1.03173828125, 1.104583740234375, 1.17742919921875, 1.250274658203125, 1.3231201171875, 1.395965576171875, 1.46881103515625, 1.541656494140625, 1.614501953125, 1.687347412109375, 1.76019287109375, 1.833038330078125, 1.9058837890625, 1.978729248046875, 2.05157470703125, 2.124420166015625, 2.197265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 11.0, 19.0, 17.0, 35.0, 42.0, 99.0, 142.0, 284.0, 604.0, 1401.0, 4762.0, 36000.0, 708524.0, 275783.0, 15865.0, 2942.0, 1034.0, 401.0, 256.0, 114.0, 76.0, 48.0, 26.0, 19.0, 13.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.806640625, -0.783477783203125, -0.76031494140625, -0.737152099609375, -0.7139892578125, -0.690826416015625, -0.66766357421875, -0.644500732421875, -0.621337890625, -0.598175048828125, -0.57501220703125, -0.551849365234375, -0.5286865234375, -0.505523681640625, -0.48236083984375, -0.459197998046875, -0.43603515625, -0.412872314453125, -0.38970947265625, -0.366546630859375, -0.3433837890625, -0.320220947265625, -0.29705810546875, -0.273895263671875, -0.250732421875, -0.227569580078125, -0.20440673828125, -0.181243896484375, -0.1580810546875, -0.134918212890625, -0.11175537109375, -0.088592529296875, -0.0654296875, -0.042266845703125, -0.01910400390625, 0.004058837890625, 0.0272216796875, 0.050384521484375, 0.07354736328125, 0.096710205078125, 0.119873046875, 0.143035888671875, 0.16619873046875, 0.189361572265625, 0.2125244140625, 0.235687255859375, 0.25885009765625, 0.282012939453125, 0.30517578125, 0.328338623046875, 0.35150146484375, 0.374664306640625, 0.3978271484375, 0.420989990234375, 0.44415283203125, 0.467315673828125, 0.490478515625, 0.513641357421875, 0.53680419921875, 0.559967041015625, 0.5831298828125, 0.606292724609375, 0.62945556640625, 0.652618408203125, 0.67578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 4.0, 10.0, 8.0, 10.0, 20.0, 25.0, 22.0, 20.0, 42.0, 54.0, 58.0, 65.0, 80.0, 90.0, 79.0, 80.0, 79.0, 47.0, 44.0, 32.0, 21.0, 22.0, 15.0, 22.0, 16.0, 5.0, 5.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.577108383178711e-05, -8.344557136297226e-05, -8.112005889415741e-05, -7.879454642534256e-05, -7.646903395652771e-05, -7.414352148771286e-05, -7.181800901889801e-05, -6.949249655008316e-05, -6.716698408126831e-05, -6.484147161245346e-05, -6.251595914363861e-05, -6.019044667482376e-05, -5.786493420600891e-05, -5.553942173719406e-05, -5.321390926837921e-05, -5.088839679956436e-05, -4.856288433074951e-05, -4.623737186193466e-05, -4.391185939311981e-05, -4.158634692430496e-05, -3.926083445549011e-05, -3.693532198667526e-05, -3.460980951786041e-05, -3.228429704904556e-05, -2.9958784580230713e-05, -2.7633272111415863e-05, -2.5307759642601013e-05, -2.2982247173786163e-05, -2.0656734704971313e-05, -1.8331222236156464e-05, -1.6005709767341614e-05, -1.3680197298526764e-05, -1.1354684829711914e-05, -9.029172360897064e-06, -6.703659892082214e-06, -4.3781474232673645e-06, -2.0526349544525146e-06, 2.728775143623352e-07, 2.598389983177185e-06, 4.923902451992035e-06, 7.249414920806885e-06, 9.574927389621735e-06, 1.1900439858436584e-05, 1.4225952327251434e-05, 1.6551464796066284e-05, 1.8876977264881134e-05, 2.1202489733695984e-05, 2.3528002202510834e-05, 2.5853514671325684e-05, 2.8179027140140533e-05, 3.0504539608955383e-05, 3.283005207777023e-05, 3.515556454658508e-05, 3.748107701539993e-05, 3.980658948421478e-05, 4.213210195302963e-05, 4.445761442184448e-05, 4.678312689065933e-05, 4.910863935947418e-05, 5.143415182828903e-05, 5.375966429710388e-05, 5.608517676591873e-05, 5.841068923473358e-05, 6.073620170354843e-05, 6.306171417236328e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 17.0, 17.0, 23.0, 34.0, 68.0, 152.0, 314.0, 781.0, 2696.0, 19631.0, 642307.0, 366499.0, 12659.0, 2094.0, 647.0, 277.0, 140.0, 67.0, 43.0, 29.0, 17.0, 11.0, 8.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7205886840820312, -0.6916656494140625, -0.6627426147460938, -0.633819580078125, -0.6048965454101562, -0.5759735107421875, -0.5470504760742188, -0.51812744140625, -0.48920440673828125, -0.4602813720703125, -0.43135833740234375, -0.402435302734375, -0.37351226806640625, -0.3445892333984375, -0.31566619873046875, -0.2867431640625, -0.25782012939453125, -0.2288970947265625, -0.19997406005859375, -0.171051025390625, -0.14212799072265625, -0.1132049560546875, -0.08428192138671875, -0.05535888671875, -0.02643585205078125, 0.0024871826171875, 0.03141021728515625, 0.060333251953125, 0.08925628662109375, 0.1181793212890625, 0.14710235595703125, 0.176025390625, 0.20494842529296875, 0.2338714599609375, 0.26279449462890625, 0.291717529296875, 0.32064056396484375, 0.3495635986328125, 0.37848663330078125, 0.40740966796875, 0.43633270263671875, 0.4652557373046875, 0.49417877197265625, 0.523101806640625, 0.5520248413085938, 0.5809478759765625, 0.6098709106445312, 0.6387939453125, 0.6677169799804688, 0.6966400146484375, 0.7255630493164062, 0.754486083984375, 0.7834091186523438, 0.8123321533203125, 0.8412551879882812, 0.87017822265625, 0.8991012573242188, 0.9280242919921875, 0.9569473266601562, 0.985870361328125, 1.0147933959960938, 1.0437164306640625, 1.0726394653320312, 1.1015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 0.0, 2.0, 9.0, 7.0, 11.0, 14.0, 23.0, 30.0, 39.0, 51.0, 58.0, 56.0, 81.0, 110.0, 100.0, 95.0, 80.0, 63.0, 44.0, 27.0, 22.0, 18.0, 17.0, 11.0, 7.0, 6.0, 7.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4180488586425781, -0.39884185791015625, -0.3796348571777344, -0.3604278564453125, -0.3412208557128906, -0.32201385498046875, -0.3028068542480469, -0.283599853515625, -0.2643928527832031, -0.24518585205078125, -0.22597885131835938, -0.2067718505859375, -0.18756484985351562, -0.16835784912109375, -0.14915084838867188, -0.12994384765625, -0.11073684692382812, -0.09152984619140625, -0.07232284545898438, -0.0531158447265625, -0.033908843994140625, -0.01470184326171875, 0.004505157470703125, 0.023712158203125, 0.042919158935546875, 0.06212615966796875, 0.08133316040039062, 0.1005401611328125, 0.11974716186523438, 0.13895416259765625, 0.15816116333007812, 0.1773681640625, 0.19657516479492188, 0.21578216552734375, 0.23498916625976562, 0.2541961669921875, 0.2734031677246094, 0.29261016845703125, 0.3118171691894531, 0.331024169921875, 0.3502311706542969, 0.36943817138671875, 0.3886451721191406, 0.4078521728515625, 0.4270591735839844, 0.44626617431640625, 0.4654731750488281, 0.48468017578125, 0.5038871765136719, 0.5230941772460938, 0.5423011779785156, 0.5615081787109375, 0.5807151794433594, 0.5999221801757812, 0.6191291809082031, 0.638336181640625, 0.6575431823730469, 0.6767501831054688, 0.6959571838378906, 0.7151641845703125, 0.7343711853027344, 0.7535781860351562, 0.7727851867675781, 0.7919921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 13.0, 18.0, 23.0, 42.0, 86.0, 94.0, 132.0, 147.0, 141.0, 123.0, 79.0, 42.0, 29.0, 10.0, 12.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.766450881958008, -12.386005401611328, -12.005559921264648, -11.625114440917969, -11.244668006896973, -10.864222526550293, -10.483777046203613, -10.103331565856934, -9.722885131835938, -9.342439651489258, -8.961994171142578, -8.581548690795898, -8.201102256774902, -7.820656776428223, -7.440211296081543, -7.059765815734863, -6.679320335388184, -6.298874855041504, -5.918428897857666, -5.537983417510986, -5.157537460327148, -4.777091979980469, -4.396646499633789, -4.016201019287109, -3.6357550621032715, -3.2553093433380127, -2.874863624572754, -2.494418144226074, -2.1139724254608154, -1.7335267066955566, -1.353081226348877, -0.9726355075836182, -0.5921897888183594, -0.21174412965774536, 0.16870152950286865, 0.5491471290588379, 0.9295928478240967, 1.3100385665893555, 1.6904840469360352, 2.070929765701294, 2.4513754844665527, 2.8318212032318115, 3.2122669219970703, 3.59271240234375, 3.973158121109009, 4.353603839874268, 4.734049320220947, 5.114495277404785, 5.494940757751465, 5.8753862380981445, 6.255832195281982, 6.636277675628662, 7.0167236328125, 7.39716911315918, 7.777614593505859, 8.158060073852539, 8.538505554199219, 8.918951034545898, 9.299396514892578, 9.679841995239258, 10.060288429260254, 10.440733909606934, 10.821179389953613, 11.201624870300293, 11.582071304321289]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 0.0, 3.0, 6.0, 11.0, 8.0, 19.0, 20.0, 25.0, 27.0, 44.0, 66.0, 54.0, 63.0, 70.0, 69.0, 65.0, 64.0, 67.0, 51.0, 53.0, 37.0, 37.0, 27.0, 30.0, 20.0, 12.0, 15.0, 6.0, 11.0, 5.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.205841064453125, -13.823945045471191, -13.442049026489258, -13.06015396118164, -12.678257942199707, -12.296361923217773, -11.91446590423584, -11.532569885253906, -11.150674819946289, -10.768778800964355, -10.386882781982422, -10.004987716674805, -9.623091697692871, -9.241195678710938, -8.859299659729004, -8.47740364074707, -8.095507621765137, -7.713611602783203, -7.331716060638428, -6.949820041656494, -6.567924499511719, -6.186028480529785, -5.804132461547852, -5.422236442565918, -5.040340900421143, -4.658444881439209, -4.276549339294434, -3.8946533203125, -3.5127575397491455, -3.130861759185791, -2.7489657402038574, -2.367069959640503, -1.9851751327514648, -1.6032793521881104, -1.2213834524154663, -0.8394875526428223, -0.4575917720794678, -0.07569599151611328, 0.3062000274658203, 0.6880958080291748, 1.0699915885925293, 1.4518873691558838, 1.8337832689285278, 2.215679168701172, 2.5975749492645264, 2.979470729827881, 3.3613667488098145, 3.743262529373169, 4.125158309936523, 4.507054328918457, 4.888949871063232, 5.270845890045166, 5.652741432189941, 6.034637451171875, 6.416533470153809, 6.798429489135742, 7.180325031280518, 7.562221050262451, 7.944116592407227, 8.32601261138916, 8.707908630371094, 9.089803695678711, 9.471700668334961, 9.853595733642578, 10.235491752624512]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 7.0, 11.0, 11.0, 17.0, 18.0, 21.0, 38.0, 69.0, 96.0, 183.0, 427.0, 1098.0, 3735.0, 18700.0, 400397.0, 3699672.0, 59432.0, 7446.0, 1771.0, 530.0, 239.0, 107.0, 87.0, 40.0, 29.0, 24.0, 20.0, 11.0, 10.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.904296875, -1.8531646728515625, -1.802032470703125, -1.7509002685546875, -1.69976806640625, -1.6486358642578125, -1.597503662109375, -1.5463714599609375, -1.4952392578125, -1.4441070556640625, -1.392974853515625, -1.3418426513671875, -1.29071044921875, -1.2395782470703125, -1.188446044921875, -1.1373138427734375, -1.086181640625, -1.0350494384765625, -0.983917236328125, -0.9327850341796875, -0.88165283203125, -0.8305206298828125, -0.779388427734375, -0.7282562255859375, -0.6771240234375, -0.6259918212890625, -0.574859619140625, -0.5237274169921875, -0.47259521484375, -0.4214630126953125, -0.370330810546875, -0.3191986083984375, -0.26806640625, -0.2169342041015625, -0.165802001953125, -0.1146697998046875, -0.06353759765625, -0.0124053955078125, 0.038726806640625, 0.0898590087890625, 0.1409912109375, 0.1921234130859375, 0.243255615234375, 0.2943878173828125, 0.34552001953125, 0.3966522216796875, 0.447784423828125, 0.4989166259765625, 0.550048828125, 0.6011810302734375, 0.652313232421875, 0.7034454345703125, 0.75457763671875, 0.8057098388671875, 0.856842041015625, 0.9079742431640625, 0.9591064453125, 1.0102386474609375, 1.061370849609375, 1.1125030517578125, 1.16363525390625, 1.2147674560546875, 1.265899658203125, 1.3170318603515625, 1.3681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 7.0, 6.0, 16.0, 15.0, 19.0, 23.0, 23.0, 29.0, 36.0, 42.0, 42.0, 44.0, 55.0, 57.0, 62.0, 73.0, 49.0, 68.0, 42.0, 48.0, 59.0, 40.0, 38.0, 21.0, 15.0, 22.0, 12.0, 12.0, 8.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49267578125, -0.47628021240234375, -0.4598846435546875, -0.44348907470703125, -0.427093505859375, -0.41069793701171875, -0.3943023681640625, -0.37790679931640625, -0.36151123046875, -0.34511566162109375, -0.3287200927734375, -0.31232452392578125, -0.295928955078125, -0.27953338623046875, -0.2631378173828125, -0.24674224853515625, -0.2303466796875, -0.21395111083984375, -0.1975555419921875, -0.18115997314453125, -0.164764404296875, -0.14836883544921875, -0.1319732666015625, -0.11557769775390625, -0.09918212890625, -0.08278656005859375, -0.0663909912109375, -0.04999542236328125, -0.033599853515625, -0.01720428466796875, -0.0008087158203125, 0.01558685302734375, 0.031982421875, 0.04837799072265625, 0.0647735595703125, 0.08116912841796875, 0.097564697265625, 0.11396026611328125, 0.1303558349609375, 0.14675140380859375, 0.16314697265625, 0.17954254150390625, 0.1959381103515625, 0.21233367919921875, 0.228729248046875, 0.24512481689453125, 0.2615203857421875, 0.27791595458984375, 0.2943115234375, 0.31070709228515625, 0.3271026611328125, 0.34349822998046875, 0.359893798828125, 0.37628936767578125, 0.3926849365234375, 0.40908050537109375, 0.42547607421875, 0.44187164306640625, 0.4582672119140625, 0.47466278076171875, 0.491058349609375, 0.5074539184570312, 0.5238494873046875, 0.5402450561523438, 0.556640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 9.0, 25.0, 20.0, 32.0, 76.0, 150.0, 376.0, 1869.0, 14956.0, 1293940.0, 2861273.0, 18560.0, 2238.0, 457.0, 125.0, 61.0, 39.0, 23.0, 18.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.251953125, -2.171630859375, -2.09130859375, -2.010986328125, -1.9306640625, -1.850341796875, -1.77001953125, -1.689697265625, -1.609375, -1.529052734375, -1.44873046875, -1.368408203125, -1.2880859375, -1.207763671875, -1.12744140625, -1.047119140625, -0.966796875, -0.886474609375, -0.80615234375, -0.725830078125, -0.6455078125, -0.565185546875, -0.48486328125, -0.404541015625, -0.32421875, -0.243896484375, -0.16357421875, -0.083251953125, -0.0029296875, 0.077392578125, 0.15771484375, 0.238037109375, 0.318359375, 0.398681640625, 0.47900390625, 0.559326171875, 0.6396484375, 0.719970703125, 0.80029296875, 0.880615234375, 0.9609375, 1.041259765625, 1.12158203125, 1.201904296875, 1.2822265625, 1.362548828125, 1.44287109375, 1.523193359375, 1.603515625, 1.683837890625, 1.76416015625, 1.844482421875, 1.9248046875, 2.005126953125, 2.08544921875, 2.165771484375, 2.24609375, 2.326416015625, 2.40673828125, 2.487060546875, 2.5673828125, 2.647705078125, 2.72802734375, 2.808349609375, 2.888671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 13.0, 11.0, 8.0, 10.0, 18.0, 26.0, 37.0, 70.0, 141.0, 323.0, 850.0, 1229.0, 623.0, 257.0, 142.0, 80.0, 57.0, 34.0, 28.0, 24.0, 17.0, 13.0, 8.0, 8.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.2490234375, -1.2127227783203125, -1.176422119140625, -1.1401214599609375, -1.10382080078125, -1.0675201416015625, -1.031219482421875, -0.9949188232421875, -0.9586181640625, -0.9223175048828125, -0.886016845703125, -0.8497161865234375, -0.81341552734375, -0.7771148681640625, -0.740814208984375, -0.7045135498046875, -0.668212890625, -0.6319122314453125, -0.595611572265625, -0.5593109130859375, -0.52301025390625, -0.4867095947265625, -0.450408935546875, -0.4141082763671875, -0.3778076171875, -0.3415069580078125, -0.305206298828125, -0.2689056396484375, -0.23260498046875, -0.1963043212890625, -0.160003662109375, -0.1237030029296875, -0.08740234375, -0.0511016845703125, -0.014801025390625, 0.0214996337890625, 0.05780029296875, 0.0941009521484375, 0.130401611328125, 0.1667022705078125, 0.2030029296875, 0.2393035888671875, 0.275604248046875, 0.3119049072265625, 0.34820556640625, 0.3845062255859375, 0.420806884765625, 0.4571075439453125, 0.493408203125, 0.5297088623046875, 0.566009521484375, 0.6023101806640625, 0.63861083984375, 0.6749114990234375, 0.711212158203125, 0.7475128173828125, 0.7838134765625, 0.8201141357421875, 0.856414794921875, 0.8927154541015625, 0.92901611328125, 0.9653167724609375, 1.001617431640625, 1.0379180908203125, 1.07421875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 7.0, 14.0, 26.0, 37.0, 49.0, 104.0, 153.0, 166.0, 127.0, 119.0, 69.0, 41.0, 17.0, 21.0, 14.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.436581611633301, -5.194671154022217, -4.952760219573975, -4.710849761962891, -4.468938827514648, -4.2270283699035645, -3.9851179122924805, -3.7432072162628174, -3.5012965202331543, -3.259385824203491, -3.017475128173828, -2.775564670562744, -2.533653974533081, -2.291743278503418, -2.049832820892334, -1.807922124862671, -1.5660114288330078, -1.3241007328033447, -1.0821901559829712, -0.8402795195579529, -0.5983688831329346, -0.3564581871032715, -0.11454761028289795, 0.12736296653747559, 0.36927366256713867, 0.611184298992157, 0.8530949354171753, 1.0950055122375488, 1.336916208267212, 1.578826904296875, 1.8207374811172485, 2.062648057937622, 2.304558753967285, 2.5464694499969482, 2.7883801460266113, 3.0302906036376953, 3.2722012996673584, 3.5141119956970215, 3.7560224533081055, 3.9979331493377686, 4.239843845367432, 4.481754302978516, 4.723665237426758, 4.965575695037842, 5.207486152648926, 5.449397087097168, 5.691307544708252, 5.933218002319336, 6.175128936767578, 6.417039394378662, 6.658950328826904, 6.900860786437988, 7.1427717208862305, 7.3846821784973145, 7.626592636108398, 7.868503570556641, 8.110414505004883, 8.352325439453125, 8.59423542022705, 8.836146354675293, 9.078057289123535, 9.319967269897461, 9.561878204345703, 9.803789138793945, 10.045699119567871]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 6.0, 8.0, 4.0, 6.0, 6.0, 8.0, 11.0, 16.0, 15.0, 24.0, 22.0, 17.0, 35.0, 37.0, 35.0, 36.0, 46.0, 35.0, 55.0, 50.0, 59.0, 56.0, 39.0, 51.0, 48.0, 47.0, 27.0, 46.0, 29.0, 24.0, 13.0, 18.0, 15.0, 17.0, 17.0, 10.0, 0.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.054336071014404, -4.8941826820373535, -4.734029293060303, -4.57387638092041, -4.413722991943359, -4.253569602966309, -4.093416213989258, -3.933262825012207, -3.7731096744537354, -3.6129562854766846, -3.452803134918213, -3.292649745941162, -3.1324963569641113, -2.9723432064056396, -2.812189817428589, -2.652036666870117, -2.4918832778930664, -2.3317298889160156, -2.171576738357544, -2.011423349380493, -1.851270079612732, -1.6911168098449707, -1.53096342086792, -1.3708101511001587, -1.2106568813323975, -1.0505036115646362, -0.8903502821922302, -0.7301969528198242, -0.570043683052063, -0.40989041328430176, -0.24973708391189575, -0.08958375453948975, 0.07056951522827148, 0.2307228147983551, 0.3908761143684387, 0.5510294437408447, 0.711182713508606, 0.8713359832763672, 1.031489372253418, 1.1916426420211792, 1.3517959117889404, 1.5119491815567017, 1.672102451324463, 1.8322558403015137, 1.992409110069275, 2.152562379837036, 2.312715768814087, 2.4728689193725586, 2.6330223083496094, 2.79317569732666, 2.953328847885132, 3.1134822368621826, 3.2736353874206543, 3.433788776397705, 3.593942165374756, 3.7540955543518066, 3.9142487049102783, 4.07440185546875, 4.234555244445801, 4.394708633422852, 4.554862022399902, 4.715015411376953, 4.875168323516846, 5.0353217124938965, 5.195475101470947]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 18.0, 36.0, 43.0, 60.0, 117.0, 189.0, 359.0, 644.0, 1299.0, 2778.0, 6281.0, 15842.0, 42752.0, 122893.0, 326856.0, 331217.0, 125572.0, 43379.0, 15980.0, 6479.0, 2808.0, 1384.0, 708.0, 365.0, 196.0, 108.0, 72.0, 36.0, 33.0, 12.0, 11.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.783203125, -0.7587356567382812, -0.7342681884765625, -0.7098007202148438, -0.685333251953125, -0.6608657836914062, -0.6363983154296875, -0.6119308471679688, -0.58746337890625, -0.5629959106445312, -0.5385284423828125, -0.5140609741210938, -0.489593505859375, -0.46512603759765625, -0.4406585693359375, -0.41619110107421875, -0.3917236328125, -0.36725616455078125, -0.3427886962890625, -0.31832122802734375, -0.293853759765625, -0.26938629150390625, -0.2449188232421875, -0.22045135498046875, -0.19598388671875, -0.17151641845703125, -0.1470489501953125, -0.12258148193359375, -0.098114013671875, -0.07364654541015625, -0.0491790771484375, -0.02471160888671875, -0.000244140625, 0.02422332763671875, 0.0486907958984375, 0.07315826416015625, 0.097625732421875, 0.12209320068359375, 0.1465606689453125, 0.17102813720703125, 0.19549560546875, 0.21996307373046875, 0.2444305419921875, 0.26889801025390625, 0.293365478515625, 0.31783294677734375, 0.3423004150390625, 0.36676788330078125, 0.3912353515625, 0.41570281982421875, 0.4401702880859375, 0.46463775634765625, 0.489105224609375, 0.5135726928710938, 0.5380401611328125, 0.5625076293945312, 0.58697509765625, 0.6114425659179688, 0.6359100341796875, 0.6603775024414062, 0.684844970703125, 0.7093124389648438, 0.7337799072265625, 0.7582473754882812, 0.78271484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 2.0, 12.0, 7.0, 20.0, 15.0, 29.0, 28.0, 30.0, 32.0, 36.0, 40.0, 50.0, 60.0, 56.0, 58.0, 76.0, 60.0, 58.0, 52.0, 49.0, 38.0, 33.0, 44.0, 27.0, 18.0, 12.0, 18.0, 11.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.402099609375, -0.3860588073730469, -0.37001800537109375, -0.3539772033691406, -0.3379364013671875, -0.3218955993652344, -0.30585479736328125, -0.2898139953613281, -0.273773193359375, -0.2577323913574219, -0.24169158935546875, -0.22565078735351562, -0.2096099853515625, -0.19356918334960938, -0.17752838134765625, -0.16148757934570312, -0.14544677734375, -0.12940597534179688, -0.11336517333984375, -0.09732437133789062, -0.0812835693359375, -0.06524276733398438, -0.04920196533203125, -0.033161163330078125, -0.017120361328125, -0.001079559326171875, 0.01496124267578125, 0.031002044677734375, 0.0470428466796875, 0.06308364868164062, 0.07912445068359375, 0.09516525268554688, 0.1112060546875, 0.12724685668945312, 0.14328765869140625, 0.15932846069335938, 0.1753692626953125, 0.19141006469726562, 0.20745086669921875, 0.22349166870117188, 0.239532470703125, 0.2555732727050781, 0.27161407470703125, 0.2876548767089844, 0.3036956787109375, 0.3197364807128906, 0.33577728271484375, 0.3518180847167969, 0.36785888671875, 0.3838996887207031, 0.39994049072265625, 0.4159812927246094, 0.4320220947265625, 0.4480628967285156, 0.46410369873046875, 0.4801445007324219, 0.496185302734375, 0.5122261047363281, 0.5282669067382812, 0.5443077087402344, 0.5603485107421875, 0.5763893127441406, 0.5924301147460938, 0.6084709167480469, 0.62451171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 15.0, 14.0, 32.0, 56.0, 83.0, 192.0, 432.0, 1286.0, 5336.0, 83530.0, 906973.0, 44845.0, 3962.0, 1043.0, 385.0, 169.0, 65.0, 57.0, 26.0, 23.0, 12.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.927276611328125, -2.83697509765625, -2.746673583984375, -2.6563720703125, -2.566070556640625, -2.47576904296875, -2.385467529296875, -2.295166015625, -2.204864501953125, -2.11456298828125, -2.024261474609375, -1.9339599609375, -1.843658447265625, -1.75335693359375, -1.663055419921875, -1.57275390625, -1.482452392578125, -1.39215087890625, -1.301849365234375, -1.2115478515625, -1.121246337890625, -1.03094482421875, -0.940643310546875, -0.850341796875, -0.760040283203125, -0.66973876953125, -0.579437255859375, -0.4891357421875, -0.398834228515625, -0.30853271484375, -0.218231201171875, -0.1279296875, -0.037628173828125, 0.05267333984375, 0.142974853515625, 0.2332763671875, 0.323577880859375, 0.41387939453125, 0.504180908203125, 0.594482421875, 0.684783935546875, 0.77508544921875, 0.865386962890625, 0.9556884765625, 1.045989990234375, 1.13629150390625, 1.226593017578125, 1.31689453125, 1.407196044921875, 1.49749755859375, 1.587799072265625, 1.6781005859375, 1.768402099609375, 1.85870361328125, 1.949005126953125, 2.039306640625, 2.129608154296875, 2.21990966796875, 2.310211181640625, 2.4005126953125, 2.490814208984375, 2.58111572265625, 2.671417236328125, 2.76171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 14.0, 20.0, 14.0, 16.0, 23.0, 29.0, 25.0, 27.0, 32.0, 36.0, 39.0, 45.0, 43.0, 37.0, 56.0, 60.0, 49.0, 55.0, 46.0, 38.0, 33.0, 43.0, 32.0, 28.0, 31.0, 23.0, 22.0, 12.0, 4.0, 5.0, 10.0, 7.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.65234375, -1.59686279296875, -1.5413818359375, -1.48590087890625, -1.430419921875, -1.37493896484375, -1.3194580078125, -1.26397705078125, -1.20849609375, -1.15301513671875, -1.0975341796875, -1.04205322265625, -0.986572265625, -0.93109130859375, -0.8756103515625, -0.82012939453125, -0.7646484375, -0.70916748046875, -0.6536865234375, -0.59820556640625, -0.542724609375, -0.48724365234375, -0.4317626953125, -0.37628173828125, -0.32080078125, -0.26531982421875, -0.2098388671875, -0.15435791015625, -0.098876953125, -0.04339599609375, 0.0120849609375, 0.06756591796875, 0.123046875, 0.17852783203125, 0.2340087890625, 0.28948974609375, 0.344970703125, 0.40045166015625, 0.4559326171875, 0.51141357421875, 0.56689453125, 0.62237548828125, 0.6778564453125, 0.73333740234375, 0.788818359375, 0.84429931640625, 0.8997802734375, 0.95526123046875, 1.0107421875, 1.06622314453125, 1.1217041015625, 1.17718505859375, 1.232666015625, 1.28814697265625, 1.3436279296875, 1.39910888671875, 1.45458984375, 1.51007080078125, 1.5655517578125, 1.62103271484375, 1.676513671875, 1.73199462890625, 1.7874755859375, 1.84295654296875, 1.8984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 15.0, 24.0, 33.0, 56.0, 92.0, 167.0, 482.0, 2213.0, 32988.0, 976941.0, 32326.0, 2292.0, 492.0, 181.0, 89.0, 57.0, 30.0, 19.0, 11.0, 7.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.033966064453125, -0.99176025390625, -0.949554443359375, -0.9073486328125, -0.865142822265625, -0.82293701171875, -0.780731201171875, -0.738525390625, -0.696319580078125, -0.65411376953125, -0.611907958984375, -0.5697021484375, -0.527496337890625, -0.48529052734375, -0.443084716796875, -0.40087890625, -0.358673095703125, -0.31646728515625, -0.274261474609375, -0.2320556640625, -0.189849853515625, -0.14764404296875, -0.105438232421875, -0.063232421875, -0.021026611328125, 0.02117919921875, 0.063385009765625, 0.1055908203125, 0.147796630859375, 0.19000244140625, 0.232208251953125, 0.2744140625, 0.316619873046875, 0.35882568359375, 0.401031494140625, 0.4432373046875, 0.485443115234375, 0.52764892578125, 0.569854736328125, 0.612060546875, 0.654266357421875, 0.69647216796875, 0.738677978515625, 0.7808837890625, 0.823089599609375, 0.86529541015625, 0.907501220703125, 0.94970703125, 0.991912841796875, 1.03411865234375, 1.076324462890625, 1.1185302734375, 1.160736083984375, 1.20294189453125, 1.245147705078125, 1.287353515625, 1.329559326171875, 1.37176513671875, 1.413970947265625, 1.4561767578125, 1.498382568359375, 1.54058837890625, 1.582794189453125, 1.625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 6.0, 12.0, 13.0, 21.0, 25.0, 39.0, 41.0, 72.0, 70.0, 111.0, 140.0, 132.0, 78.0, 59.0, 46.0, 29.0, 18.0, 14.0, 9.0, 6.0, 15.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.255243301391602e-05, -7.983110845088959e-05, -7.710978388786316e-05, -7.438845932483673e-05, -7.16671347618103e-05, -6.894581019878387e-05, -6.622448563575745e-05, -6.350316107273102e-05, -6.078183650970459e-05, -5.806051194667816e-05, -5.5339187383651733e-05, -5.2617862820625305e-05, -4.989653825759888e-05, -4.717521369457245e-05, -4.445388913154602e-05, -4.173256456851959e-05, -3.9011240005493164e-05, -3.6289915442466736e-05, -3.356859087944031e-05, -3.084726631641388e-05, -2.812594175338745e-05, -2.5404617190361023e-05, -2.2683292627334595e-05, -1.9961968064308167e-05, -1.7240643501281738e-05, -1.451931893825531e-05, -1.1797994375228882e-05, -9.076669812202454e-06, -6.355345249176025e-06, -3.634020686149597e-06, -9.126961231231689e-07, 1.8086284399032593e-06, 4.5299530029296875e-06, 7.251277565956116e-06, 9.972602128982544e-06, 1.2693926692008972e-05, 1.54152512550354e-05, 1.813657581806183e-05, 2.0857900381088257e-05, 2.3579224944114685e-05, 2.6300549507141113e-05, 2.902187407016754e-05, 3.174319863319397e-05, 3.44645231962204e-05, 3.7185847759246826e-05, 3.9907172322273254e-05, 4.262849688529968e-05, 4.534982144832611e-05, 4.807114601135254e-05, 5.079247057437897e-05, 5.3513795137405396e-05, 5.6235119700431824e-05, 5.895644426345825e-05, 6.167776882648468e-05, 6.439909338951111e-05, 6.712041795253754e-05, 6.984174251556396e-05, 7.256306707859039e-05, 7.528439164161682e-05, 7.800571620464325e-05, 8.072704076766968e-05, 8.34483653306961e-05, 8.616968989372253e-05, 8.889101445674896e-05, 9.161233901977539e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 7.0, 3.0, 5.0, 7.0, 15.0, 35.0, 52.0, 126.0, 396.0, 1372.0, 13101.0, 966863.0, 63007.0, 2612.0, 585.0, 214.0, 65.0, 39.0, 21.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7587890625, -1.710845947265625, -1.66290283203125, -1.614959716796875, -1.5670166015625, -1.519073486328125, -1.47113037109375, -1.423187255859375, -1.375244140625, -1.327301025390625, -1.27935791015625, -1.231414794921875, -1.1834716796875, -1.135528564453125, -1.08758544921875, -1.039642333984375, -0.99169921875, -0.943756103515625, -0.89581298828125, -0.847869873046875, -0.7999267578125, -0.751983642578125, -0.70404052734375, -0.656097412109375, -0.608154296875, -0.560211181640625, -0.51226806640625, -0.464324951171875, -0.4163818359375, -0.368438720703125, -0.32049560546875, -0.272552490234375, -0.224609375, -0.176666259765625, -0.12872314453125, -0.080780029296875, -0.0328369140625, 0.015106201171875, 0.06304931640625, 0.110992431640625, 0.158935546875, 0.206878662109375, 0.25482177734375, 0.302764892578125, 0.3507080078125, 0.398651123046875, 0.44659423828125, 0.494537353515625, 0.54248046875, 0.590423583984375, 0.63836669921875, 0.686309814453125, 0.7342529296875, 0.782196044921875, 0.83013916015625, 0.878082275390625, 0.926025390625, 0.973968505859375, 1.02191162109375, 1.069854736328125, 1.1177978515625, 1.165740966796875, 1.21368408203125, 1.261627197265625, 1.3095703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 7.0, 11.0, 18.0, 29.0, 26.0, 37.0, 51.0, 74.0, 117.0, 120.0, 128.0, 94.0, 79.0, 51.0, 42.0, 26.0, 22.0, 16.0, 12.0, 14.0, 7.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.5563583374023438, -0.5350799560546875, -0.5138015747070312, -0.492523193359375, -0.47124481201171875, -0.4499664306640625, -0.42868804931640625, -0.40740966796875, -0.38613128662109375, -0.3648529052734375, -0.34357452392578125, -0.322296142578125, -0.30101776123046875, -0.2797393798828125, -0.25846099853515625, -0.2371826171875, -0.21590423583984375, -0.1946258544921875, -0.17334747314453125, -0.152069091796875, -0.13079071044921875, -0.1095123291015625, -0.08823394775390625, -0.06695556640625, -0.04567718505859375, -0.0243988037109375, -0.00312042236328125, 0.018157958984375, 0.03943634033203125, 0.0607147216796875, 0.08199310302734375, 0.103271484375, 0.12454986572265625, 0.1458282470703125, 0.16710662841796875, 0.188385009765625, 0.20966339111328125, 0.2309417724609375, 0.25222015380859375, 0.27349853515625, 0.29477691650390625, 0.3160552978515625, 0.33733367919921875, 0.358612060546875, 0.37989044189453125, 0.4011688232421875, 0.42244720458984375, 0.4437255859375, 0.46500396728515625, 0.4862823486328125, 0.5075607299804688, 0.528839111328125, 0.5501174926757812, 0.5713958740234375, 0.5926742553710938, 0.61395263671875, 0.6352310180664062, 0.6565093994140625, 0.6777877807617188, 0.699066162109375, 0.7203445434570312, 0.7416229248046875, 0.7629013061523438, 0.7841796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 36.0, 174.0, 353.0, 281.0, 95.0, 38.0, 15.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5160493850708, -7.850541591644287, -7.185033798217773, -6.519525527954102, -5.854017734527588, -5.188509941101074, -4.523001670837402, -3.8574938774108887, -3.191986083984375, -2.5264782905578613, -1.8609702587127686, -1.1954623460769653, -0.5299544334411621, 0.13555335998535156, 0.8010613918304443, 1.466569423675537, 2.132077217102051, 2.7975850105285645, 3.4630930423736572, 4.12860107421875, 4.794108867645264, 5.459616661071777, 6.125124931335449, 6.790632724761963, 7.456140518188477, 8.121648788452148, 8.787156105041504, 9.452664375305176, 10.118171691894531, 10.783679962158203, 11.449188232421875, 12.114696502685547, 12.780204772949219, 13.44571304321289, 14.111220359802246, 14.776728630065918, 15.442235946655273, 16.107744216918945, 16.773252487182617, 17.43876075744629, 18.104267120361328, 18.769775390625, 19.435283660888672, 20.10079002380371, 20.766298294067383, 21.431806564331055, 22.097314834594727, 22.7628231048584, 23.42833137512207, 24.093839645385742, 24.759347915649414, 25.424854278564453, 26.090362548828125, 26.755870819091797, 27.42137908935547, 28.08688735961914, 28.752395629882812, 29.417903900146484, 30.083412170410156, 30.748918533325195, 31.414426803588867, 32.079933166503906, 32.74544143676758, 33.41094970703125, 34.07645797729492]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 9.0, 6.0, 14.0, 20.0, 16.0, 22.0, 31.0, 30.0, 40.0, 49.0, 54.0, 44.0, 61.0, 74.0, 68.0, 74.0, 71.0, 42.0, 55.0, 40.0, 32.0, 29.0, 26.0, 20.0, 15.0, 11.0, 16.0, 6.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.755620956420898, -9.486498832702637, -9.217377662658691, -8.94825553894043, -8.679133415222168, -8.410011291503906, -8.140890121459961, -7.871767997741699, -7.602646350860596, -7.333524703979492, -7.0644025802612305, -6.795280933380127, -6.526159286499023, -6.257037162780762, -5.987915515899658, -5.718793869018555, -5.449671745300293, -5.1805500984191895, -4.911427974700928, -4.642306327819824, -4.3731842041015625, -4.104062557220459, -3.8349409103393555, -3.565819025039673, -3.2966971397399902, -3.0275752544403076, -2.758453369140625, -2.4893317222595215, -2.220209836959839, -1.9510879516601562, -1.6819661855697632, -1.4128444194793701, -1.1437225341796875, -0.8746007084846497, -0.6054788827896118, -0.336357057094574, -0.06723523139953613, 0.20188665390014648, 0.47100841999053955, 0.7401301860809326, 1.0092520713806152, 1.2783739566802979, 1.547495722770691, 1.816617488861084, 2.0857393741607666, 2.354861259460449, 2.6239829063415527, 2.8931047916412354, 3.162226676940918, 3.4313485622406006, 3.700470447540283, 3.9695920944213867, 4.238714218139648, 4.507835865020752, 4.7769575119018555, 5.046079635620117, 5.315201282501221, 5.584322929382324, 5.853445053100586, 6.1225666999816895, 6.391688346862793, 6.660810470581055, 6.929932117462158, 7.199053764343262, 7.468175888061523]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 14.0, 19.0, 13.0, 30.0, 31.0, 61.0, 125.0, 253.0, 611.0, 1849.0, 10007.0, 254150.0, 3887113.0, 34383.0, 3945.0, 982.0, 305.0, 148.0, 96.0, 44.0, 25.0, 16.0, 17.0, 6.0, 13.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.2214813232421875, -1.166595458984375, -1.1117095947265625, -1.05682373046875, -1.0019378662109375, -0.947052001953125, -0.8921661376953125, -0.8372802734375, -0.7823944091796875, -0.727508544921875, -0.6726226806640625, -0.61773681640625, -0.5628509521484375, -0.507965087890625, -0.4530792236328125, -0.398193359375, -0.3433074951171875, -0.288421630859375, -0.2335357666015625, -0.17864990234375, -0.1237640380859375, -0.068878173828125, -0.0139923095703125, 0.0408935546875, 0.0957794189453125, 0.150665283203125, 0.2055511474609375, 0.26043701171875, 0.3153228759765625, 0.370208740234375, 0.4250946044921875, 0.47998046875, 0.5348663330078125, 0.589752197265625, 0.6446380615234375, 0.69952392578125, 0.7544097900390625, 0.809295654296875, 0.8641815185546875, 0.9190673828125, 0.9739532470703125, 1.028839111328125, 1.0837249755859375, 1.13861083984375, 1.1934967041015625, 1.248382568359375, 1.3032684326171875, 1.358154296875, 1.4130401611328125, 1.467926025390625, 1.5228118896484375, 1.57769775390625, 1.6325836181640625, 1.687469482421875, 1.7423553466796875, 1.7972412109375, 1.8521270751953125, 1.907012939453125, 1.9618988037109375, 2.01678466796875, 2.0716705322265625, 2.126556396484375, 2.1814422607421875, 2.236328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 7.0, 12.0, 4.0, 7.0, 13.0, 19.0, 32.0, 31.0, 31.0, 35.0, 51.0, 37.0, 49.0, 51.0, 67.0, 56.0, 61.0, 67.0, 45.0, 40.0, 43.0, 34.0, 33.0, 26.0, 31.0, 22.0, 20.0, 22.0, 13.0, 8.0, 10.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3716468811035156, -0.35730743408203125, -0.3429679870605469, -0.3286285400390625, -0.3142890930175781, -0.29994964599609375, -0.2856101989746094, -0.271270751953125, -0.2569313049316406, -0.24259185791015625, -0.22825241088867188, -0.2139129638671875, -0.19957351684570312, -0.18523406982421875, -0.17089462280273438, -0.15655517578125, -0.14221572875976562, -0.12787628173828125, -0.11353683471679688, -0.0991973876953125, -0.08485794067382812, -0.07051849365234375, -0.056179046630859375, -0.041839599609375, -0.027500152587890625, -0.01316070556640625, 0.001178741455078125, 0.0155181884765625, 0.029857635498046875, 0.04419708251953125, 0.058536529541015625, 0.0728759765625, 0.08721542358398438, 0.10155487060546875, 0.11589431762695312, 0.1302337646484375, 0.14457321166992188, 0.15891265869140625, 0.17325210571289062, 0.187591552734375, 0.20193099975585938, 0.21627044677734375, 0.23060989379882812, 0.2449493408203125, 0.2592887878417969, 0.27362823486328125, 0.2879676818847656, 0.30230712890625, 0.3166465759277344, 0.33098602294921875, 0.3453254699707031, 0.3596649169921875, 0.3740043640136719, 0.38834381103515625, 0.4026832580566406, 0.417022705078125, 0.4313621520996094, 0.44570159912109375, 0.4600410461425781, 0.4743804931640625, 0.4887199401855469, 0.5030593872070312, 0.5173988342285156, 0.53173828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 10.0, 19.0, 21.0, 37.0, 55.0, 90.0, 126.0, 237.0, 395.0, 915.0, 3320.0, 21215.0, 910249.0, 3219293.0, 32014.0, 4271.0, 1081.0, 404.0, 208.0, 113.0, 72.0, 54.0, 30.0, 16.0, 23.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5859375, -1.533233642578125, -1.48052978515625, -1.427825927734375, -1.3751220703125, -1.322418212890625, -1.26971435546875, -1.217010498046875, -1.164306640625, -1.111602783203125, -1.05889892578125, -1.006195068359375, -0.9534912109375, -0.900787353515625, -0.84808349609375, -0.795379638671875, -0.74267578125, -0.689971923828125, -0.63726806640625, -0.584564208984375, -0.5318603515625, -0.479156494140625, -0.42645263671875, -0.373748779296875, -0.321044921875, -0.268341064453125, -0.21563720703125, -0.162933349609375, -0.1102294921875, -0.057525634765625, -0.00482177734375, 0.047882080078125, 0.1005859375, 0.153289794921875, 0.20599365234375, 0.258697509765625, 0.3114013671875, 0.364105224609375, 0.41680908203125, 0.469512939453125, 0.522216796875, 0.574920654296875, 0.62762451171875, 0.680328369140625, 0.7330322265625, 0.785736083984375, 0.83843994140625, 0.891143798828125, 0.94384765625, 0.996551513671875, 1.04925537109375, 1.101959228515625, 1.1546630859375, 1.207366943359375, 1.26007080078125, 1.312774658203125, 1.365478515625, 1.418182373046875, 1.47088623046875, 1.523590087890625, 1.5762939453125, 1.628997802734375, 1.68170166015625, 1.734405517578125, 1.787109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 21.0, 16.0, 22.0, 34.0, 64.0, 168.0, 371.0, 1097.0, 1390.0, 478.0, 185.0, 99.0, 52.0, 20.0, 18.0, 5.0, 9.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.4787750244140625, -1.439971923828125, -1.4011688232421875, -1.36236572265625, -1.3235626220703125, -1.284759521484375, -1.2459564208984375, -1.2071533203125, -1.1683502197265625, -1.129547119140625, -1.0907440185546875, -1.05194091796875, -1.0131378173828125, -0.974334716796875, -0.9355316162109375, -0.896728515625, -0.8579254150390625, -0.819122314453125, -0.7803192138671875, -0.74151611328125, -0.7027130126953125, -0.663909912109375, -0.6251068115234375, -0.5863037109375, -0.5475006103515625, -0.508697509765625, -0.4698944091796875, -0.43109130859375, -0.3922882080078125, -0.353485107421875, -0.3146820068359375, -0.27587890625, -0.2370758056640625, -0.198272705078125, -0.1594696044921875, -0.12066650390625, -0.0818634033203125, -0.043060302734375, -0.0042572021484375, 0.0345458984375, 0.0733489990234375, 0.112152099609375, 0.1509552001953125, 0.18975830078125, 0.2285614013671875, 0.267364501953125, 0.3061676025390625, 0.344970703125, 0.3837738037109375, 0.422576904296875, 0.4613800048828125, 0.50018310546875, 0.5389862060546875, 0.577789306640625, 0.6165924072265625, 0.6553955078125, 0.6941986083984375, 0.733001708984375, 0.7718048095703125, 0.81060791015625, 0.8494110107421875, 0.888214111328125, 0.9270172119140625, 0.9658203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 17.0, 25.0, 59.0, 114.0, 210.0, 243.0, 172.0, 84.0, 34.0, 17.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.057815551757812, -11.742238998413086, -11.426661491394043, -11.111084938049316, -10.795507431030273, -10.479930877685547, -10.164353370666504, -9.848776817321777, -9.533199310302734, -9.217622756958008, -8.902045249938965, -8.586468696594238, -8.270891189575195, -7.955314636230469, -7.639737606048584, -7.324160575866699, -7.008584022521973, -6.693006992340088, -6.377429962158203, -6.061852931976318, -5.746275901794434, -5.430699348449707, -5.115122318267822, -4.7995452880859375, -4.483968257904053, -4.168391227722168, -3.852814197540283, -3.5372374057769775, -3.2216603755950928, -2.906083345413208, -2.5905065536499023, -2.2749295234680176, -1.9593524932861328, -1.643775463104248, -1.3281985521316528, -1.0126216411590576, -0.6970446109771729, -0.3814675807952881, -0.06589066982269287, 0.24968624114990234, 0.5652632713317871, 0.8808402419090271, 1.196417212486267, 1.5119941234588623, 1.827571153640747, 2.143148183822632, 2.4587249755859375, 2.7743020057678223, 3.089879035949707, 3.405456066131592, 3.7210330963134766, 4.036610126495361, 4.352187156677246, 4.667763710021973, 4.983340740203857, 5.298917770385742, 5.614494800567627, 5.930071830749512, 6.2456488609313965, 6.561225891113281, 6.876802444458008, 7.192379951477051, 7.507956504821777, 7.823533535003662, 8.139110565185547]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 4.0, 7.0, 15.0, 11.0, 7.0, 14.0, 15.0, 11.0, 24.0, 29.0, 23.0, 20.0, 37.0, 43.0, 36.0, 40.0, 52.0, 53.0, 49.0, 50.0, 47.0, 47.0, 33.0, 29.0, 38.0, 34.0, 34.0, 24.0, 28.0, 20.0, 16.0, 16.0, 14.0, 10.0, 13.0, 9.0, 5.0, 9.0, 10.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.42110013961792, -3.3187904357910156, -3.2164807319641113, -3.114171028137207, -3.0118613243103027, -2.9095516204833984, -2.807241678237915, -2.7049319744110107, -2.6026222705841064, -2.500312566757202, -2.398002862930298, -2.2956931591033936, -2.19338321685791, -2.091073513031006, -1.9887638092041016, -1.8864541053771973, -1.784144401550293, -1.6818346977233887, -1.5795249938964844, -1.4772151708602905, -1.3749054670333862, -1.272595763206482, -1.170285940170288, -1.0679762363433838, -0.9656665325164795, -0.8633568286895752, -0.7610470652580261, -0.658737301826477, -0.5564275979995728, -0.45411789417266846, -0.3518081307411194, -0.2494983673095703, -0.14718866348266602, -0.04487892985343933, 0.057430803775787354, 0.15974053740501404, 0.2620502710342407, 0.364359974861145, 0.4666697382926941, 0.5689795017242432, 0.6712892055511475, 0.7735989093780518, 0.8759086728096008, 0.9782184362411499, 1.0805281400680542, 1.1828378438949585, 1.2851476669311523, 1.3874573707580566, 1.489767074584961, 1.5920767784118652, 1.6943864822387695, 1.7966963052749634, 1.8990060091018677, 2.0013155937194824, 2.103625535964966, 2.20593523979187, 2.3082449436187744, 2.4105546474456787, 2.512864351272583, 2.6151740550994873, 2.7174839973449707, 2.819793701171875, 2.9221034049987793, 3.0244131088256836, 3.126722812652588]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 9.0, 10.0, 22.0, 32.0, 48.0, 74.0, 154.0, 266.0, 496.0, 1116.0, 2665.0, 6809.0, 19191.0, 58872.0, 204845.0, 468182.0, 198716.0, 56892.0, 18758.0, 6588.0, 2639.0, 1058.0, 545.0, 217.0, 117.0, 91.0, 48.0, 31.0, 16.0, 14.0, 10.0, 3.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7407455444335938, -0.7104949951171875, -0.6802444458007812, -0.649993896484375, -0.6197433471679688, -0.5894927978515625, -0.5592422485351562, -0.52899169921875, -0.49874114990234375, -0.4684906005859375, -0.43824005126953125, -0.407989501953125, -0.37773895263671875, -0.3474884033203125, -0.31723785400390625, -0.2869873046875, -0.25673675537109375, -0.2264862060546875, -0.19623565673828125, -0.165985107421875, -0.13573455810546875, -0.1054840087890625, -0.07523345947265625, -0.04498291015625, -0.01473236083984375, 0.0155181884765625, 0.04576873779296875, 0.076019287109375, 0.10626983642578125, 0.1365203857421875, 0.16677093505859375, 0.197021484375, 0.22727203369140625, 0.2575225830078125, 0.28777313232421875, 0.318023681640625, 0.34827423095703125, 0.3785247802734375, 0.40877532958984375, 0.43902587890625, 0.46927642822265625, 0.4995269775390625, 0.5297775268554688, 0.560028076171875, 0.5902786254882812, 0.6205291748046875, 0.6507797241210938, 0.6810302734375, 0.7112808227539062, 0.7415313720703125, 0.7717819213867188, 0.802032470703125, 0.8322830200195312, 0.8625335693359375, 0.8927841186523438, 0.92303466796875, 0.9532852172851562, 0.9835357666015625, 1.0137863159179688, 1.044036865234375, 1.0742874145507812, 1.1045379638671875, 1.1347885131835938, 1.1650390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 7.0, 3.0, 9.0, 16.0, 12.0, 17.0, 28.0, 12.0, 31.0, 41.0, 33.0, 41.0, 35.0, 41.0, 45.0, 54.0, 47.0, 53.0, 56.0, 57.0, 44.0, 42.0, 51.0, 31.0, 28.0, 29.0, 25.0, 21.0, 12.0, 21.0, 17.0, 11.0, 9.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.394287109375, -0.3812408447265625, -0.368194580078125, -0.3551483154296875, -0.34210205078125, -0.3290557861328125, -0.316009521484375, -0.3029632568359375, -0.2899169921875, -0.2768707275390625, -0.263824462890625, -0.2507781982421875, -0.23773193359375, -0.2246856689453125, -0.211639404296875, -0.1985931396484375, -0.185546875, -0.1725006103515625, -0.159454345703125, -0.1464080810546875, -0.13336181640625, -0.1203155517578125, -0.107269287109375, -0.0942230224609375, -0.0811767578125, -0.0681304931640625, -0.055084228515625, -0.0420379638671875, -0.02899169921875, -0.0159454345703125, -0.002899169921875, 0.0101470947265625, 0.023193359375, 0.0362396240234375, 0.049285888671875, 0.0623321533203125, 0.07537841796875, 0.0884246826171875, 0.101470947265625, 0.1145172119140625, 0.1275634765625, 0.1406097412109375, 0.153656005859375, 0.1667022705078125, 0.17974853515625, 0.1927947998046875, 0.205841064453125, 0.2188873291015625, 0.23193359375, 0.2449798583984375, 0.258026123046875, 0.2710723876953125, 0.28411865234375, 0.2971649169921875, 0.310211181640625, 0.3232574462890625, 0.3363037109375, 0.3493499755859375, 0.362396240234375, 0.3754425048828125, 0.38848876953125, 0.4015350341796875, 0.414581298828125, 0.4276275634765625, 0.440673828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 9.0, 1.0, 3.0, 8.0, 12.0, 15.0, 21.0, 31.0, 62.0, 80.0, 210.0, 451.0, 1264.0, 5083.0, 32209.0, 418737.0, 545315.0, 37234.0, 5477.0, 1387.0, 489.0, 215.0, 90.0, 47.0, 37.0, 16.0, 14.0, 18.0, 7.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.599609375, -1.540435791015625, -1.48126220703125, -1.422088623046875, -1.3629150390625, -1.303741455078125, -1.24456787109375, -1.185394287109375, -1.126220703125, -1.067047119140625, -1.00787353515625, -0.948699951171875, -0.8895263671875, -0.830352783203125, -0.77117919921875, -0.712005615234375, -0.65283203125, -0.593658447265625, -0.53448486328125, -0.475311279296875, -0.4161376953125, -0.356964111328125, -0.29779052734375, -0.238616943359375, -0.179443359375, -0.120269775390625, -0.06109619140625, -0.001922607421875, 0.0572509765625, 0.116424560546875, 0.17559814453125, 0.234771728515625, 0.2939453125, 0.353118896484375, 0.41229248046875, 0.471466064453125, 0.5306396484375, 0.589813232421875, 0.64898681640625, 0.708160400390625, 0.767333984375, 0.826507568359375, 0.88568115234375, 0.944854736328125, 1.0040283203125, 1.063201904296875, 1.12237548828125, 1.181549072265625, 1.24072265625, 1.299896240234375, 1.35906982421875, 1.418243408203125, 1.4774169921875, 1.536590576171875, 1.59576416015625, 1.654937744140625, 1.714111328125, 1.773284912109375, 1.83245849609375, 1.891632080078125, 1.9508056640625, 2.009979248046875, 2.06915283203125, 2.128326416015625, 2.1875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 12.0, 9.0, 5.0, 9.0, 17.0, 16.0, 14.0, 24.0, 16.0, 32.0, 28.0, 42.0, 52.0, 50.0, 47.0, 53.0, 58.0, 53.0, 51.0, 47.0, 47.0, 56.0, 25.0, 48.0, 29.0, 27.0, 22.0, 29.0, 23.0, 18.0, 14.0, 6.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3675384521484375, -1.319061279296875, -1.2705841064453125, -1.22210693359375, -1.1736297607421875, -1.125152587890625, -1.0766754150390625, -1.0281982421875, -0.9797210693359375, -0.931243896484375, -0.8827667236328125, -0.83428955078125, -0.7858123779296875, -0.737335205078125, -0.6888580322265625, -0.640380859375, -0.5919036865234375, -0.543426513671875, -0.4949493408203125, -0.44647216796875, -0.3979949951171875, -0.349517822265625, -0.3010406494140625, -0.2525634765625, -0.2040863037109375, -0.155609130859375, -0.1071319580078125, -0.05865478515625, -0.0101776123046875, 0.038299560546875, 0.0867767333984375, 0.13525390625, 0.1837310791015625, 0.232208251953125, 0.2806854248046875, 0.32916259765625, 0.3776397705078125, 0.426116943359375, 0.4745941162109375, 0.5230712890625, 0.5715484619140625, 0.620025634765625, 0.6685028076171875, 0.71697998046875, 0.7654571533203125, 0.813934326171875, 0.8624114990234375, 0.910888671875, 0.9593658447265625, 1.007843017578125, 1.0563201904296875, 1.10479736328125, 1.1532745361328125, 1.201751708984375, 1.2502288818359375, 1.2987060546875, 1.3471832275390625, 1.395660400390625, 1.4441375732421875, 1.49261474609375, 1.5410919189453125, 1.589569091796875, 1.6380462646484375, 1.6865234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 3.0, 8.0, 17.0, 19.0, 40.0, 67.0, 172.0, 445.0, 1498.0, 8096.0, 349877.0, 675328.0, 10378.0, 1803.0, 452.0, 158.0, 80.0, 46.0, 23.0, 18.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8837890625, -0.8498687744140625, -0.815948486328125, -0.7820281982421875, -0.74810791015625, -0.7141876220703125, -0.680267333984375, -0.6463470458984375, -0.6124267578125, -0.5785064697265625, -0.544586181640625, -0.5106658935546875, -0.47674560546875, -0.4428253173828125, -0.408905029296875, -0.3749847412109375, -0.341064453125, -0.3071441650390625, -0.273223876953125, -0.2393035888671875, -0.20538330078125, -0.1714630126953125, -0.137542724609375, -0.1036224365234375, -0.0697021484375, -0.0357818603515625, -0.001861572265625, 0.0320587158203125, 0.06597900390625, 0.0998992919921875, 0.133819580078125, 0.1677398681640625, 0.20166015625, 0.2355804443359375, 0.269500732421875, 0.3034210205078125, 0.33734130859375, 0.3712615966796875, 0.405181884765625, 0.4391021728515625, 0.4730224609375, 0.5069427490234375, 0.540863037109375, 0.5747833251953125, 0.60870361328125, 0.6426239013671875, 0.676544189453125, 0.7104644775390625, 0.744384765625, 0.7783050537109375, 0.812225341796875, 0.8461456298828125, 0.88006591796875, 0.9139862060546875, 0.947906494140625, 0.9818267822265625, 1.0157470703125, 1.0496673583984375, 1.083587646484375, 1.1175079345703125, 1.15142822265625, 1.1853485107421875, 1.219268798828125, 1.2531890869140625, 1.287109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 8.0, 12.0, 18.0, 32.0, 35.0, 69.0, 71.0, 120.0, 154.0, 161.0, 90.0, 70.0, 38.0, 35.0, 18.0, 14.0, 14.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.082389831542969e-05, -7.741153240203857e-05, -7.399916648864746e-05, -7.058680057525635e-05, -6.717443466186523e-05, -6.376206874847412e-05, -6.034970283508301e-05, -5.6937336921691895e-05, -5.352497100830078e-05, -5.011260509490967e-05, -4.6700239181518555e-05, -4.328787326812744e-05, -3.987550735473633e-05, -3.6463141441345215e-05, -3.30507755279541e-05, -2.9638409614562988e-05, -2.6226043701171875e-05, -2.2813677787780762e-05, -1.940131187438965e-05, -1.5988945960998535e-05, -1.2576580047607422e-05, -9.164214134216309e-06, -5.751848220825195e-06, -2.339482307434082e-06, 1.0728836059570312e-06, 4.4852495193481445e-06, 7.897615432739258e-06, 1.1309981346130371e-05, 1.4722347259521484e-05, 1.8134713172912598e-05, 2.154707908630371e-05, 2.4959444999694824e-05, 2.8371810913085938e-05, 3.178417682647705e-05, 3.5196542739868164e-05, 3.860890865325928e-05, 4.202127456665039e-05, 4.5433640480041504e-05, 4.884600639343262e-05, 5.225837230682373e-05, 5.5670738220214844e-05, 5.908310413360596e-05, 6.249547004699707e-05, 6.590783596038818e-05, 6.93202018737793e-05, 7.273256778717041e-05, 7.614493370056152e-05, 7.955729961395264e-05, 8.296966552734375e-05, 8.638203144073486e-05, 8.979439735412598e-05, 9.320676326751709e-05, 9.66191291809082e-05, 0.00010003149509429932, 0.00010344386100769043, 0.00010685622692108154, 0.00011026859283447266, 0.00011368095874786377, 0.00011709332466125488, 0.000120505690574646, 0.0001239180564880371, 0.00012733042240142822, 0.00013074278831481934, 0.00013415515422821045, 0.00013756752014160156]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 14.0, 17.0, 36.0, 58.0, 114.0, 232.0, 601.0, 2061.0, 13336.0, 607960.0, 409540.0, 11669.0, 1936.0, 528.0, 215.0, 113.0, 53.0, 21.0, 17.0, 12.0, 4.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7350845336914062, -0.7030792236328125, -0.6710739135742188, -0.639068603515625, -0.6070632934570312, -0.5750579833984375, -0.5430526733398438, -0.51104736328125, -0.47904205322265625, -0.4470367431640625, -0.41503143310546875, -0.383026123046875, -0.35102081298828125, -0.3190155029296875, -0.28701019287109375, -0.2550048828125, -0.22299957275390625, -0.1909942626953125, -0.15898895263671875, -0.126983642578125, -0.09497833251953125, -0.0629730224609375, -0.03096771240234375, 0.00103759765625, 0.03304290771484375, 0.0650482177734375, 0.09705352783203125, 0.129058837890625, 0.16106414794921875, 0.1930694580078125, 0.22507476806640625, 0.257080078125, 0.28908538818359375, 0.3210906982421875, 0.35309600830078125, 0.385101318359375, 0.41710662841796875, 0.4491119384765625, 0.48111724853515625, 0.51312255859375, 0.5451278686523438, 0.5771331787109375, 0.6091384887695312, 0.641143798828125, 0.6731491088867188, 0.7051544189453125, 0.7371597290039062, 0.7691650390625, 0.8011703491210938, 0.8331756591796875, 0.8651809692382812, 0.897186279296875, 0.9291915893554688, 0.9611968994140625, 0.9932022094726562, 1.02520751953125, 1.0572128295898438, 1.0892181396484375, 1.1212234497070312, 1.153228759765625, 1.1852340698242188, 1.2172393798828125, 1.2492446899414062, 1.28125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 8.0, 15.0, 16.0, 33.0, 51.0, 60.0, 93.0, 96.0, 105.0, 118.0, 113.0, 89.0, 65.0, 38.0, 25.0, 19.0, 10.0, 11.0, 6.0, 8.0, 6.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7431640625, -0.725494384765625, -0.70782470703125, -0.690155029296875, -0.6724853515625, -0.654815673828125, -0.63714599609375, -0.619476318359375, -0.601806640625, -0.584136962890625, -0.56646728515625, -0.548797607421875, -0.5311279296875, -0.513458251953125, -0.49578857421875, -0.478118896484375, -0.46044921875, -0.442779541015625, -0.42510986328125, -0.407440185546875, -0.3897705078125, -0.372100830078125, -0.35443115234375, -0.336761474609375, -0.319091796875, -0.301422119140625, -0.28375244140625, -0.266082763671875, -0.2484130859375, -0.230743408203125, -0.21307373046875, -0.195404052734375, -0.177734375, -0.160064697265625, -0.14239501953125, -0.124725341796875, -0.1070556640625, -0.089385986328125, -0.07171630859375, -0.054046630859375, -0.036376953125, -0.018707275390625, -0.00103759765625, 0.016632080078125, 0.0343017578125, 0.051971435546875, 0.06964111328125, 0.087310791015625, 0.10498046875, 0.122650146484375, 0.14031982421875, 0.157989501953125, 0.1756591796875, 0.193328857421875, 0.21099853515625, 0.228668212890625, 0.246337890625, 0.264007568359375, 0.28167724609375, 0.299346923828125, 0.3170166015625, 0.334686279296875, 0.35235595703125, 0.370025634765625, 0.3876953125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 9.0, 6.0, 18.0, 43.0, 112.0, 227.0, 265.0, 159.0, 97.0, 26.0, 15.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0981035232543945, -5.669137477874756, -5.240171432495117, -4.81120491027832, -4.382238864898682, -3.953272819519043, -3.524306535720825, -3.0953402519226074, -2.6663742065429688, -2.23740816116333, -1.8084418773651123, -1.379475712776184, -0.9505095481872559, -0.5215435028076172, -0.09257721900939941, 0.33638906478881836, 0.765355110168457, 1.1943212747573853, 1.6232874393463135, 2.0522537231445312, 2.48121976852417, 2.9101858139038086, 3.3391520977020264, 3.768118381500244, 4.197084426879883, 4.6260504722595215, 5.05501651763916, 5.483983039855957, 5.912949085235596, 6.341915130615234, 6.770881652832031, 7.19984769821167, 7.628814697265625, 8.057781219482422, 8.486746788024902, 8.9157133102417, 9.34467887878418, 9.773645401000977, 10.202611923217773, 10.63157844543457, 11.06054401397705, 11.489510536193848, 11.918476104736328, 12.347442626953125, 12.776409149169922, 13.205374717712402, 13.6343412399292, 14.06330680847168, 14.492273330688477, 14.921239852905273, 15.350205421447754, 15.77917194366455, 16.20813751220703, 16.637104034423828, 17.066070556640625, 17.495037078857422, 17.92400360107422, 18.352970123291016, 18.781936645507812, 19.210901260375977, 19.639867782592773, 20.06883430480957, 20.497800827026367, 20.926767349243164, 21.355731964111328]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 13.0, 19.0, 14.0, 14.0, 25.0, 26.0, 46.0, 33.0, 39.0, 43.0, 43.0, 64.0, 69.0, 86.0, 70.0, 63.0, 45.0, 43.0, 42.0, 31.0, 35.0, 34.0, 12.0, 19.0, 16.0, 15.0, 8.0, 7.0, 6.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.819536209106445, -9.577393531799316, -9.335250854492188, -9.093109130859375, -8.850966453552246, -8.608823776245117, -8.366681098937988, -8.12453842163086, -7.882396221160889, -7.64025354385376, -7.398111343383789, -7.15596866607666, -6.913825988769531, -6.6716837882995605, -6.429541110992432, -6.187398910522461, -5.945256233215332, -5.703113555908203, -5.460971355438232, -5.2188286781311035, -4.976686477661133, -4.734543800354004, -4.492401123046875, -4.250258445739746, -4.008116245269775, -3.7659738063812256, -3.523831367492676, -3.281688690185547, -3.039546251296997, -2.7974038124084473, -2.5552611351013184, -2.3131186962127686, -2.0709762573242188, -1.828833818435669, -1.5866912603378296, -1.3445487022399902, -1.1024062633514404, -0.8602638244628906, -0.6181212663650513, -0.3759787082672119, -0.1338362693786621, 0.10830622911453247, 0.35044872760772705, 0.5925912261009216, 0.8347337245941162, 1.076876163482666, 1.3190187215805054, 1.5611612796783447, 1.8033037185668945, 2.0454461574554443, 2.287588596343994, 2.529731273651123, 2.771873712539673, 3.0140161514282227, 3.2561588287353516, 3.4983012676239014, 3.740443706512451, 3.982586145401001, 4.224728584289551, 4.46687126159668, 4.709013938903809, 4.951156139373779, 5.193298816680908, 5.435441017150879, 5.677583694458008]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 11.0, 4.0, 15.0, 18.0, 26.0, 33.0, 44.0, 78.0, 130.0, 154.0, 269.0, 410.0, 705.0, 1235.0, 2233.0, 4747.0, 11479.0, 36479.0, 289872.0, 3278335.0, 491786.0, 50153.0, 14529.0, 5703.0, 2620.0, 1346.0, 707.0, 429.0, 255.0, 172.0, 99.0, 57.0, 47.0, 30.0, 17.0, 12.0, 11.0, 9.0, 4.0, 6.0, 1.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.77294921875, -0.7518234252929688, -0.7306976318359375, -0.7095718383789062, -0.688446044921875, -0.6673202514648438, -0.6461944580078125, -0.6250686645507812, -0.60394287109375, -0.5828170776367188, -0.5616912841796875, -0.5405654907226562, -0.519439697265625, -0.49831390380859375, -0.4771881103515625, -0.45606231689453125, -0.4349365234375, -0.41381072998046875, -0.3926849365234375, -0.37155914306640625, -0.350433349609375, -0.32930755615234375, -0.3081817626953125, -0.28705596923828125, -0.26593017578125, -0.24480438232421875, -0.2236785888671875, -0.20255279541015625, -0.181427001953125, -0.16030120849609375, -0.1391754150390625, -0.11804962158203125, -0.096923828125, -0.07579803466796875, -0.0546722412109375, -0.03354644775390625, -0.012420654296875, 0.00870513916015625, 0.0298309326171875, 0.05095672607421875, 0.07208251953125, 0.09320831298828125, 0.1143341064453125, 0.13545989990234375, 0.156585693359375, 0.17771148681640625, 0.1988372802734375, 0.21996307373046875, 0.2410888671875, 0.26221466064453125, 0.2833404541015625, 0.30446624755859375, 0.325592041015625, 0.34671783447265625, 0.3678436279296875, 0.38896942138671875, 0.41009521484375, 0.43122100830078125, 0.4523468017578125, 0.47347259521484375, 0.494598388671875, 0.5157241821289062, 0.5368499755859375, 0.5579757690429688, 0.5791015625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 19.0, 19.0, 36.0, 55.0, 50.0, 58.0, 72.0, 75.0, 72.0, 82.0, 84.0, 77.0, 65.0, 72.0, 37.0, 38.0, 26.0, 22.0, 9.0, 9.0, 10.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7684860229492188, -0.7493743896484375, -0.7302627563476562, -0.711151123046875, -0.6920394897460938, -0.6729278564453125, -0.6538162231445312, -0.63470458984375, -0.6155929565429688, -0.5964813232421875, -0.5773696899414062, -0.558258056640625, -0.5391464233398438, -0.5200347900390625, -0.5009231567382812, -0.4818115234375, -0.46269989013671875, -0.4435882568359375, -0.42447662353515625, -0.405364990234375, -0.38625335693359375, -0.3671417236328125, -0.34803009033203125, -0.32891845703125, -0.30980682373046875, -0.2906951904296875, -0.27158355712890625, -0.252471923828125, -0.23336029052734375, -0.2142486572265625, -0.19513702392578125, -0.176025390625, -0.15691375732421875, -0.1378021240234375, -0.11869049072265625, -0.099578857421875, -0.08046722412109375, -0.0613555908203125, -0.04224395751953125, -0.02313232421875, -0.00402069091796875, 0.0150909423828125, 0.03420257568359375, 0.053314208984375, 0.07242584228515625, 0.0915374755859375, 0.11064910888671875, 0.1297607421875, 0.14887237548828125, 0.1679840087890625, 0.18709564208984375, 0.206207275390625, 0.22531890869140625, 0.2444305419921875, 0.26354217529296875, 0.28265380859375, 0.30176544189453125, 0.3208770751953125, 0.33998870849609375, 0.359100341796875, 0.37821197509765625, 0.3973236083984375, 0.41643524169921875, 0.435546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 7.0, 12.0, 12.0, 20.0, 19.0, 24.0, 45.0, 49.0, 71.0, 126.0, 259.0, 502.0, 1046.0, 2944.0, 10228.0, 71769.0, 3724284.0, 351227.0, 23549.0, 5153.0, 1601.0, 635.0, 281.0, 142.0, 74.0, 49.0, 31.0, 30.0, 22.0, 17.0, 12.0, 10.0, 9.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5478515625, -1.5019683837890625, -1.456085205078125, -1.4102020263671875, -1.36431884765625, -1.3184356689453125, -1.272552490234375, -1.2266693115234375, -1.1807861328125, -1.1349029541015625, -1.089019775390625, -1.0431365966796875, -0.99725341796875, -0.9513702392578125, -0.905487060546875, -0.8596038818359375, -0.813720703125, -0.7678375244140625, -0.721954345703125, -0.6760711669921875, -0.63018798828125, -0.5843048095703125, -0.538421630859375, -0.4925384521484375, -0.4466552734375, -0.4007720947265625, -0.354888916015625, -0.3090057373046875, -0.26312255859375, -0.2172393798828125, -0.171356201171875, -0.1254730224609375, -0.07958984375, -0.0337066650390625, 0.012176513671875, 0.0580596923828125, 0.10394287109375, 0.1498260498046875, 0.195709228515625, 0.2415924072265625, 0.2874755859375, 0.3333587646484375, 0.379241943359375, 0.4251251220703125, 0.47100830078125, 0.5168914794921875, 0.562774658203125, 0.6086578369140625, 0.654541015625, 0.7004241943359375, 0.746307373046875, 0.7921905517578125, 0.83807373046875, 0.8839569091796875, 0.929840087890625, 0.9757232666015625, 1.0216064453125, 1.0674896240234375, 1.113372802734375, 1.1592559814453125, 1.20513916015625, 1.2510223388671875, 1.296905517578125, 1.3427886962890625, 1.388671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 3.0, 4.0, 4.0, 7.0, 4.0, 11.0, 23.0, 17.0, 37.0, 44.0, 60.0, 143.0, 221.0, 503.0, 994.0, 937.0, 447.0, 242.0, 97.0, 78.0, 41.0, 37.0, 22.0, 17.0, 22.0, 10.0, 10.0, 5.0, 5.0, 3.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0771484375, -1.0472259521484375, -1.017303466796875, -0.9873809814453125, -0.95745849609375, -0.9275360107421875, -0.897613525390625, -0.8676910400390625, -0.8377685546875, -0.8078460693359375, -0.777923583984375, -0.7480010986328125, -0.71807861328125, -0.6881561279296875, -0.658233642578125, -0.6283111572265625, -0.598388671875, -0.5684661865234375, -0.538543701171875, -0.5086212158203125, -0.47869873046875, -0.4487762451171875, -0.418853759765625, -0.3889312744140625, -0.3590087890625, -0.3290863037109375, -0.299163818359375, -0.2692413330078125, -0.23931884765625, -0.2093963623046875, -0.179473876953125, -0.1495513916015625, -0.11962890625, -0.0897064208984375, -0.059783935546875, -0.0298614501953125, 6.103515625e-05, 0.0299835205078125, 0.059906005859375, 0.0898284912109375, 0.1197509765625, 0.1496734619140625, 0.179595947265625, 0.2095184326171875, 0.23944091796875, 0.2693634033203125, 0.299285888671875, 0.3292083740234375, 0.359130859375, 0.3890533447265625, 0.418975830078125, 0.4488983154296875, 0.47882080078125, 0.5087432861328125, 0.538665771484375, 0.5685882568359375, 0.5985107421875, 0.6284332275390625, 0.658355712890625, 0.6882781982421875, 0.71820068359375, 0.7481231689453125, 0.778045654296875, 0.8079681396484375, 0.837890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 8.0, 7.0, 3.0, 5.0, 20.0, 29.0, 48.0, 72.0, 94.0, 136.0, 171.0, 141.0, 100.0, 55.0, 40.0, 20.0, 15.0, 14.0, 12.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.387801170349121, -8.15819263458252, -7.928584575653076, -7.698976039886475, -7.469367980957031, -7.23975944519043, -7.010150909423828, -6.780542373657227, -6.550934314727783, -6.321325778961182, -6.091717720031738, -5.862109184265137, -5.632500648498535, -5.402892589569092, -5.17328405380249, -4.943675994873047, -4.714067459106445, -4.484458923339844, -4.2548508644104, -4.025242328643799, -3.7956340312957764, -3.566025733947754, -3.3364171981811523, -3.10680890083313, -2.8772006034851074, -2.647592306137085, -2.4179840087890625, -2.188375473022461, -1.9587671756744385, -1.729158878326416, -1.499550461769104, -1.269942045211792, -1.0403342247009277, -0.8107258677482605, -0.5811175107955933, -0.351509153842926, -0.12190079689025879, 0.10770750045776367, 0.3373159170150757, 0.5669243335723877, 0.7965326309204102, 1.0261409282684326, 1.2557493448257446, 1.4853577613830566, 1.714966058731079, 1.9445743560791016, 2.174182891845703, 2.4037911891937256, 2.633399486541748, 2.8630077838897705, 3.092616081237793, 3.3222246170043945, 3.551832914352417, 3.7814412117004395, 4.011049747467041, 4.240657806396484, 4.470266342163086, 4.6998748779296875, 4.929482936859131, 5.159091472625732, 5.388699531555176, 5.618308067321777, 5.847916603088379, 6.0775251388549805, 6.307133197784424]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 2.0, 5.0, 4.0, 7.0, 8.0, 12.0, 18.0, 19.0, 21.0, 29.0, 29.0, 43.0, 45.0, 46.0, 66.0, 49.0, 70.0, 50.0, 36.0, 55.0, 55.0, 47.0, 45.0, 38.0, 29.0, 40.0, 37.0, 25.0, 20.0, 6.0, 9.0, 14.0, 9.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.767602443695068, -4.622891426086426, -4.478179931640625, -4.333468437194824, -4.188757419586182, -4.044046401977539, -3.8993349075317383, -3.7546236515045166, -3.609912395477295, -3.4652011394500732, -3.3204898834228516, -3.17577862739563, -3.031067371368408, -2.8863561153411865, -2.741644859313965, -2.596933603286743, -2.4522223472595215, -2.3075110912323, -2.162799835205078, -2.0180885791778564, -1.8733773231506348, -1.728666067123413, -1.5839548110961914, -1.4392435550689697, -1.294532299041748, -1.1498210430145264, -1.0051097869873047, -0.860398530960083, -0.7156872749328613, -0.5709760189056396, -0.42626476287841797, -0.2815535068511963, -0.1368427276611328, 0.007868528366088867, 0.15257978439331055, 0.2972910404205322, 0.4420022964477539, 0.5867135524749756, 0.7314248085021973, 0.876136064529419, 1.0208473205566406, 1.1655585765838623, 1.310269832611084, 1.4549810886383057, 1.5996923446655273, 1.744403600692749, 1.8891148567199707, 2.0338261127471924, 2.178537368774414, 2.3232486248016357, 2.4679598808288574, 2.612671136856079, 2.757382392883301, 2.9020936489105225, 3.046804904937744, 3.191516160964966, 3.3362274169921875, 3.480938673019409, 3.625649929046631, 3.7703611850738525, 3.915072441101074, 4.059783935546875, 4.204494953155518, 4.34920597076416, 4.493917465209961]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 6.0, 8.0, 17.0, 24.0, 43.0, 48.0, 97.0, 130.0, 236.0, 346.0, 603.0, 1068.0, 1985.0, 3701.0, 6956.0, 13960.0, 27959.0, 57732.0, 118948.0, 223376.0, 265488.0, 164389.0, 81892.0, 39552.0, 19119.0, 9691.0, 5086.0, 2630.0, 1438.0, 810.0, 461.0, 255.0, 170.0, 98.0, 73.0, 56.0, 30.0, 25.0, 19.0, 12.0, 5.0, 5.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.486297607421875, -0.46966552734375, -0.453033447265625, -0.4364013671875, -0.419769287109375, -0.40313720703125, -0.386505126953125, -0.369873046875, -0.353240966796875, -0.33660888671875, -0.319976806640625, -0.3033447265625, -0.286712646484375, -0.27008056640625, -0.253448486328125, -0.23681640625, -0.220184326171875, -0.20355224609375, -0.186920166015625, -0.1702880859375, -0.153656005859375, -0.13702392578125, -0.120391845703125, -0.103759765625, -0.087127685546875, -0.07049560546875, -0.053863525390625, -0.0372314453125, -0.020599365234375, -0.00396728515625, 0.012664794921875, 0.029296875, 0.045928955078125, 0.06256103515625, 0.079193115234375, 0.0958251953125, 0.112457275390625, 0.12908935546875, 0.145721435546875, 0.162353515625, 0.178985595703125, 0.19561767578125, 0.212249755859375, 0.2288818359375, 0.245513916015625, 0.26214599609375, 0.278778076171875, 0.29541015625, 0.312042236328125, 0.32867431640625, 0.345306396484375, 0.3619384765625, 0.378570556640625, 0.39520263671875, 0.411834716796875, 0.428466796875, 0.445098876953125, 0.46173095703125, 0.478363037109375, 0.4949951171875, 0.511627197265625, 0.52825927734375, 0.544891357421875, 0.5615234375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 11.0, 6.0, 16.0, 25.0, 24.0, 31.0, 38.0, 31.0, 41.0, 45.0, 65.0, 43.0, 52.0, 66.0, 51.0, 72.0, 61.0, 53.0, 40.0, 46.0, 39.0, 23.0, 26.0, 22.0, 19.0, 14.0, 6.0, 8.0, 5.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4150390625, -0.4020271301269531, -0.38901519775390625, -0.3760032653808594, -0.3629913330078125, -0.3499794006347656, -0.33696746826171875, -0.3239555358886719, -0.310943603515625, -0.2979316711425781, -0.28491973876953125, -0.2719078063964844, -0.2588958740234375, -0.24588394165039062, -0.23287200927734375, -0.21986007690429688, -0.20684814453125, -0.19383621215820312, -0.18082427978515625, -0.16781234741210938, -0.1548004150390625, -0.14178848266601562, -0.12877655029296875, -0.11576461791992188, -0.102752685546875, -0.08974075317382812, -0.07672882080078125, -0.06371688842773438, -0.0507049560546875, -0.037693023681640625, -0.02468109130859375, -0.011669158935546875, 0.0013427734375, 0.014354705810546875, 0.02736663818359375, 0.040378570556640625, 0.0533905029296875, 0.06640243530273438, 0.07941436767578125, 0.09242630004882812, 0.105438232421875, 0.11845016479492188, 0.13146209716796875, 0.14447402954101562, 0.1574859619140625, 0.17049789428710938, 0.18350982666015625, 0.19652175903320312, 0.20953369140625, 0.22254562377929688, 0.23555755615234375, 0.24856948852539062, 0.2615814208984375, 0.2745933532714844, 0.28760528564453125, 0.3006172180175781, 0.313629150390625, 0.3266410827636719, 0.33965301513671875, 0.3526649475097656, 0.3656768798828125, 0.3786888122558594, 0.39170074462890625, 0.4047126770019531, 0.417724609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 12.0, 16.0, 29.0, 41.0, 41.0, 107.0, 175.0, 214.0, 384.0, 577.0, 1092.0, 2079.0, 4677.0, 13554.0, 53247.0, 287779.0, 564821.0, 87189.0, 20186.0, 6488.0, 2594.0, 1291.0, 711.0, 400.0, 284.0, 166.0, 119.0, 102.0, 58.0, 32.0, 24.0, 17.0, 11.0, 14.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.9951629638671875, -0.961029052734375, -0.9268951416015625, -0.89276123046875, -0.8586273193359375, -0.824493408203125, -0.7903594970703125, -0.7562255859375, -0.7220916748046875, -0.687957763671875, -0.6538238525390625, -0.61968994140625, -0.5855560302734375, -0.551422119140625, -0.5172882080078125, -0.483154296875, -0.4490203857421875, -0.414886474609375, -0.3807525634765625, -0.34661865234375, -0.3124847412109375, -0.278350830078125, -0.2442169189453125, -0.2100830078125, -0.1759490966796875, -0.141815185546875, -0.1076812744140625, -0.07354736328125, -0.0394134521484375, -0.005279541015625, 0.0288543701171875, 0.06298828125, 0.0971221923828125, 0.131256103515625, 0.1653900146484375, 0.19952392578125, 0.2336578369140625, 0.267791748046875, 0.3019256591796875, 0.3360595703125, 0.3701934814453125, 0.404327392578125, 0.4384613037109375, 0.47259521484375, 0.5067291259765625, 0.540863037109375, 0.5749969482421875, 0.609130859375, 0.6432647705078125, 0.677398681640625, 0.7115325927734375, 0.74566650390625, 0.7798004150390625, 0.813934326171875, 0.8480682373046875, 0.8822021484375, 0.9163360595703125, 0.950469970703125, 0.9846038818359375, 1.01873779296875, 1.0528717041015625, 1.087005615234375, 1.1211395263671875, 1.1552734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 7.0, 5.0, 8.0, 8.0, 4.0, 3.0, 6.0, 3.0, 12.0, 7.0, 11.0, 13.0, 8.0, 21.0, 21.0, 19.0, 28.0, 19.0, 36.0, 28.0, 28.0, 32.0, 37.0, 43.0, 44.0, 41.0, 41.0, 42.0, 37.0, 33.0, 33.0, 31.0, 33.0, 39.0, 32.0, 31.0, 19.0, 14.0, 20.0, 19.0, 8.0, 18.0, 7.0, 6.0, 11.0, 4.0, 8.0, 8.0, 4.0, 6.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0], "bins": [-0.9970703125, -0.9640045166015625, -0.930938720703125, -0.8978729248046875, -0.86480712890625, -0.8317413330078125, -0.798675537109375, -0.7656097412109375, -0.7325439453125, -0.6994781494140625, -0.666412353515625, -0.6333465576171875, -0.60028076171875, -0.5672149658203125, -0.534149169921875, -0.5010833740234375, -0.468017578125, -0.4349517822265625, -0.401885986328125, -0.3688201904296875, -0.33575439453125, -0.3026885986328125, -0.269622802734375, -0.2365570068359375, -0.2034912109375, -0.1704254150390625, -0.137359619140625, -0.1042938232421875, -0.07122802734375, -0.0381622314453125, -0.005096435546875, 0.0279693603515625, 0.06103515625, 0.0941009521484375, 0.127166748046875, 0.1602325439453125, 0.19329833984375, 0.2263641357421875, 0.259429931640625, 0.2924957275390625, 0.3255615234375, 0.3586273193359375, 0.391693115234375, 0.4247589111328125, 0.45782470703125, 0.4908905029296875, 0.523956298828125, 0.5570220947265625, 0.590087890625, 0.6231536865234375, 0.656219482421875, 0.6892852783203125, 0.72235107421875, 0.7554168701171875, 0.788482666015625, 0.8215484619140625, 0.8546142578125, 0.8876800537109375, 0.920745849609375, 0.9538116455078125, 0.98687744140625, 1.0199432373046875, 1.053009033203125, 1.0860748291015625, 1.119140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 6.0, 9.0, 5.0, 15.0, 12.0, 20.0, 26.0, 35.0, 44.0, 69.0, 76.0, 113.0, 171.0, 286.0, 398.0, 656.0, 1203.0, 2344.0, 5142.0, 12914.0, 43020.0, 200103.0, 611143.0, 123892.0, 28902.0, 9510.0, 3962.0, 1844.0, 964.0, 550.0, 366.0, 190.0, 142.0, 105.0, 78.0, 52.0, 47.0, 26.0, 29.0, 13.0, 13.0, 9.0, 11.0, 3.0, 8.0, 0.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.268798828125, -0.26049041748046875, -0.2521820068359375, -0.24387359619140625, -0.235565185546875, -0.22725677490234375, -0.2189483642578125, -0.21063995361328125, -0.20233154296875, -0.19402313232421875, -0.1857147216796875, -0.17740631103515625, -0.169097900390625, -0.16078948974609375, -0.1524810791015625, -0.14417266845703125, -0.1358642578125, -0.12755584716796875, -0.1192474365234375, -0.11093902587890625, -0.102630615234375, -0.09432220458984375, -0.0860137939453125, -0.07770538330078125, -0.06939697265625, -0.06108856201171875, -0.0527801513671875, -0.04447174072265625, -0.036163330078125, -0.02785491943359375, -0.0195465087890625, -0.01123809814453125, -0.0029296875, 0.00537872314453125, 0.0136871337890625, 0.02199554443359375, 0.030303955078125, 0.03861236572265625, 0.0469207763671875, 0.05522918701171875, 0.06353759765625, 0.07184600830078125, 0.0801544189453125, 0.08846282958984375, 0.096771240234375, 0.10507965087890625, 0.1133880615234375, 0.12169647216796875, 0.1300048828125, 0.13831329345703125, 0.1466217041015625, 0.15493011474609375, 0.163238525390625, 0.17154693603515625, 0.1798553466796875, 0.18816375732421875, 0.19647216796875, 0.20478057861328125, 0.2130889892578125, 0.22139739990234375, 0.229705810546875, 0.23801422119140625, 0.2463226318359375, 0.25463104248046875, 0.262939453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 11.0, 20.0, 28.0, 36.0, 60.0, 81.0, 126.0, 128.0, 158.0, 89.0, 72.0, 53.0, 37.0, 24.0, 27.0, 13.0, 4.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010001659393310547, -9.644590318202972e-05, -9.287521243095398e-05, -8.930452167987823e-05, -8.573383092880249e-05, -8.216314017772675e-05, -7.8592449426651e-05, -7.502175867557526e-05, -7.145106792449951e-05, -6.788037717342377e-05, -6.430968642234802e-05, -6.073899567127228e-05, -5.716830492019653e-05, -5.359761416912079e-05, -5.0026923418045044e-05, -4.64562326669693e-05, -4.2885541915893555e-05, -3.931485116481781e-05, -3.5744160413742065e-05, -3.217346966266632e-05, -2.8602778911590576e-05, -2.503208816051483e-05, -2.1461397409439087e-05, -1.7890706658363342e-05, -1.4320015907287598e-05, -1.0749325156211853e-05, -7.178634405136108e-06, -3.6079436540603638e-06, -3.725290298461914e-08, 3.5334378480911255e-06, 7.10412859916687e-06, 1.0674819350242615e-05, 1.424551010131836e-05, 1.7816200852394104e-05, 2.138689160346985e-05, 2.4957582354545593e-05, 2.8528273105621338e-05, 3.209896385669708e-05, 3.566965460777283e-05, 3.924034535884857e-05, 4.2811036109924316e-05, 4.638172686100006e-05, 4.9952417612075806e-05, 5.352310836315155e-05, 5.7093799114227295e-05, 6.066448986530304e-05, 6.423518061637878e-05, 6.780587136745453e-05, 7.137656211853027e-05, 7.494725286960602e-05, 7.851794362068176e-05, 8.208863437175751e-05, 8.565932512283325e-05, 8.9230015873909e-05, 9.280070662498474e-05, 9.637139737606049e-05, 9.994208812713623e-05, 0.00010351277887821198, 0.00010708346962928772, 0.00011065416038036346, 0.00011422485113143921, 0.00011779554188251495, 0.0001213662326335907, 0.00012493692338466644, 0.0001285076141357422]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 9.0, 5.0, 6.0, 11.0, 11.0, 13.0, 23.0, 30.0, 51.0, 65.0, 108.0, 176.0, 304.0, 545.0, 1171.0, 2610.0, 7182.0, 24952.0, 144600.0, 708690.0, 124236.0, 22342.0, 6551.0, 2458.0, 1052.0, 550.0, 289.0, 180.0, 113.0, 61.0, 46.0, 26.0, 20.0, 18.0, 16.0, 12.0, 6.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.337890625, -0.326019287109375, -0.31414794921875, -0.302276611328125, -0.2904052734375, -0.278533935546875, -0.26666259765625, -0.254791259765625, -0.242919921875, -0.231048583984375, -0.21917724609375, -0.207305908203125, -0.1954345703125, -0.183563232421875, -0.17169189453125, -0.159820556640625, -0.14794921875, -0.136077880859375, -0.12420654296875, -0.112335205078125, -0.1004638671875, -0.088592529296875, -0.07672119140625, -0.064849853515625, -0.052978515625, -0.041107177734375, -0.02923583984375, -0.017364501953125, -0.0054931640625, 0.006378173828125, 0.01824951171875, 0.030120849609375, 0.0419921875, 0.053863525390625, 0.06573486328125, 0.077606201171875, 0.0894775390625, 0.101348876953125, 0.11322021484375, 0.125091552734375, 0.136962890625, 0.148834228515625, 0.16070556640625, 0.172576904296875, 0.1844482421875, 0.196319580078125, 0.20819091796875, 0.220062255859375, 0.23193359375, 0.243804931640625, 0.25567626953125, 0.267547607421875, 0.2794189453125, 0.291290283203125, 0.30316162109375, 0.315032958984375, 0.326904296875, 0.338775634765625, 0.35064697265625, 0.362518310546875, 0.3743896484375, 0.386260986328125, 0.39813232421875, 0.410003662109375, 0.421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 6.0, 17.0, 8.0, 8.0, 13.0, 24.0, 19.0, 25.0, 39.0, 46.0, 43.0, 68.0, 68.0, 64.0, 67.0, 71.0, 62.0, 52.0, 61.0, 38.0, 39.0, 36.0, 28.0, 20.0, 6.0, 8.0, 7.0, 11.0, 3.0, 8.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.295654296875, -0.2868232727050781, -0.27799224853515625, -0.2691612243652344, -0.2603302001953125, -0.2514991760253906, -0.24266815185546875, -0.23383712768554688, -0.225006103515625, -0.21617507934570312, -0.20734405517578125, -0.19851303100585938, -0.1896820068359375, -0.18085098266601562, -0.17201995849609375, -0.16318893432617188, -0.15435791015625, -0.14552688598632812, -0.13669586181640625, -0.12786483764648438, -0.1190338134765625, -0.11020278930664062, -0.10137176513671875, -0.09254074096679688, -0.083709716796875, -0.07487869262695312, -0.06604766845703125, -0.057216644287109375, -0.0483856201171875, -0.039554595947265625, -0.03072357177734375, -0.021892547607421875, -0.0130615234375, -0.004230499267578125, 0.00460052490234375, 0.013431549072265625, 0.0222625732421875, 0.031093597412109375, 0.03992462158203125, 0.048755645751953125, 0.057586669921875, 0.06641769409179688, 0.07524871826171875, 0.08407974243164062, 0.0929107666015625, 0.10174179077148438, 0.11057281494140625, 0.11940383911132812, 0.12823486328125, 0.13706588745117188, 0.14589691162109375, 0.15472793579101562, 0.1635589599609375, 0.17238998413085938, 0.18122100830078125, 0.19005203247070312, 0.198883056640625, 0.20771408081054688, 0.21654510498046875, 0.22537612915039062, 0.2342071533203125, 0.24303817749023438, 0.25186920166015625, 0.2607002258300781, 0.26953125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 11.0, 17.0, 27.0, 72.0, 157.0, 226.0, 221.0, 125.0, 55.0, 35.0, 15.0, 9.0, 12.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.688709259033203, -8.36483383178711, -8.0409574508667, -7.7170820236206055, -7.3932061195373535, -7.069330215454102, -6.745454788208008, -6.421578884124756, -6.097702980041504, -5.773827075958252, -5.449951171875, -5.126075744628906, -4.802199840545654, -4.478323936462402, -4.154448509216309, -3.8305726051330566, -3.5066967010498047, -3.1828207969665527, -2.85894513130188, -2.535069465637207, -2.211193561553955, -1.8873177766799927, -1.5634419918060303, -1.2395663261413574, -0.9156904220581055, -0.5918146371841431, -0.26793885231018066, 0.05593693256378174, 0.37981271743774414, 0.7036885023117065, 1.027564287185669, 1.3514399528503418, 1.6753149032592773, 1.9991906881332397, 2.323066473007202, 2.646942138671875, 2.970818042755127, 3.294693946838379, 3.6185696125030518, 3.9424452781677246, 4.266321182250977, 4.5901970863342285, 4.9140729904174805, 5.237948417663574, 5.561824321746826, 5.885700225830078, 6.209575653076172, 6.533451557159424, 6.857327461242676, 7.181203365325928, 7.50507926940918, 7.828954696655273, 8.152830123901367, 8.476706504821777, 8.800581932067871, 9.124458312988281, 9.448333740234375, 9.772209167480469, 10.096085548400879, 10.419960975646973, 10.743837356567383, 11.067712783813477, 11.39158821105957, 11.715463638305664, 12.039340019226074]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 7.0, 7.0, 8.0, 8.0, 13.0, 12.0, 11.0, 15.0, 18.0, 31.0, 31.0, 33.0, 23.0, 36.0, 27.0, 40.0, 50.0, 70.0, 74.0, 75.0, 51.0, 52.0, 29.0, 39.0, 32.0, 41.0, 28.0, 23.0, 18.0, 21.0, 12.0, 11.0, 9.0, 8.0, 9.0, 8.0, 3.0, 8.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.121819496154785, -4.968884468078613, -4.815949440002441, -4.663013935089111, -4.5100789070129395, -4.357143878936768, -4.204208850860596, -4.051273345947266, -3.8983383178710938, -3.745403289794922, -3.592468023300171, -3.439532995223999, -3.286597728729248, -3.133662700653076, -2.9807276725769043, -2.8277924060821533, -2.6748573780059814, -2.5219223499298096, -2.3689870834350586, -2.2160520553588867, -2.0631167888641357, -1.9101817607879639, -1.7572466135025024, -1.604311466217041, -1.4513763189315796, -1.2984411716461182, -1.1455060243606567, -0.9925709366798401, -0.8396357893943787, -0.6867006421089172, -0.5337655544281006, -0.38083040714263916, -0.22789525985717773, -0.0749601274728775, 0.07797500491142273, 0.23091012239456177, 0.3838452696800232, 0.5367804169654846, 0.6897155046463013, 0.8426506519317627, 0.9955857992172241, 1.1485209465026855, 1.301456093788147, 1.4543912410736084, 1.6073262691497803, 1.7602615356445312, 1.9131965637207031, 2.066131591796875, 2.219066858291626, 2.372001886367798, 2.524937152862549, 2.6778721809387207, 2.8308074474334717, 2.9837424755096436, 3.1366777420043945, 3.2896127700805664, 3.4425477981567383, 3.59548282623291, 3.748418092727661, 3.901353120803833, 4.054288387298584, 4.207223415374756, 4.360158443450928, 4.513093948364258, 4.66602897644043]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 1.0, 8.0, 10.0, 14.0, 30.0, 44.0, 42.0, 82.0, 117.0, 278.0, 378.0, 608.0, 1068.0, 2094.0, 3975.0, 9208.0, 27472.0, 157642.0, 2654060.0, 1218941.0, 84135.0, 19486.0, 7378.0, 3237.0, 1726.0, 940.0, 524.0, 291.0, 194.0, 117.0, 73.0, 39.0, 32.0, 14.0, 11.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5016555786132812, -0.4842681884765625, -0.46688079833984375, -0.449493408203125, -0.43210601806640625, -0.4147186279296875, -0.39733123779296875, -0.37994384765625, -0.36255645751953125, -0.3451690673828125, -0.32778167724609375, -0.310394287109375, -0.29300689697265625, -0.2756195068359375, -0.25823211669921875, -0.2408447265625, -0.22345733642578125, -0.2060699462890625, -0.18868255615234375, -0.171295166015625, -0.15390777587890625, -0.1365203857421875, -0.11913299560546875, -0.10174560546875, -0.08435821533203125, -0.0669708251953125, -0.04958343505859375, -0.032196044921875, -0.01480865478515625, 0.0025787353515625, 0.01996612548828125, 0.037353515625, 0.05474090576171875, 0.0721282958984375, 0.08951568603515625, 0.106903076171875, 0.12429046630859375, 0.1416778564453125, 0.15906524658203125, 0.17645263671875, 0.19384002685546875, 0.2112274169921875, 0.22861480712890625, 0.246002197265625, 0.26338958740234375, 0.2807769775390625, 0.29816436767578125, 0.3155517578125, 0.33293914794921875, 0.3503265380859375, 0.36771392822265625, 0.385101318359375, 0.40248870849609375, 0.4198760986328125, 0.43726348876953125, 0.45465087890625, 0.47203826904296875, 0.4894256591796875, 0.5068130493164062, 0.524200439453125, 0.5415878295898438, 0.5589752197265625, 0.5763626098632812, 0.59375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 16.0, 19.0, 23.0, 27.0, 31.0, 36.0, 45.0, 55.0, 64.0, 60.0, 42.0, 57.0, 59.0, 80.0, 66.0, 52.0, 44.0, 46.0, 38.0, 27.0, 25.0, 22.0, 11.0, 13.0, 6.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3923454284667969, -0.37917327880859375, -0.3660011291503906, -0.3528289794921875, -0.3396568298339844, -0.32648468017578125, -0.3133125305175781, -0.300140380859375, -0.2869682312011719, -0.27379608154296875, -0.2606239318847656, -0.2474517822265625, -0.23427963256835938, -0.22110748291015625, -0.20793533325195312, -0.19476318359375, -0.18159103393554688, -0.16841888427734375, -0.15524673461914062, -0.1420745849609375, -0.12890243530273438, -0.11573028564453125, -0.10255813598632812, -0.089385986328125, -0.07621383666992188, -0.06304168701171875, -0.049869537353515625, -0.0366973876953125, -0.023525238037109375, -0.01035308837890625, 0.002819061279296875, 0.0159912109375, 0.029163360595703125, 0.04233551025390625, 0.055507659912109375, 0.0686798095703125, 0.08185195922851562, 0.09502410888671875, 0.10819625854492188, 0.121368408203125, 0.13454055786132812, 0.14771270751953125, 0.16088485717773438, 0.1740570068359375, 0.18722915649414062, 0.20040130615234375, 0.21357345581054688, 0.22674560546875, 0.23991775512695312, 0.25308990478515625, 0.2662620544433594, 0.2794342041015625, 0.2926063537597656, 0.30577850341796875, 0.3189506530761719, 0.332122802734375, 0.3452949523925781, 0.35846710205078125, 0.3716392517089844, 0.3848114013671875, 0.3979835510253906, 0.41115570068359375, 0.4243278503417969, 0.4375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 9.0, 8.0, 15.0, 18.0, 31.0, 34.0, 53.0, 72.0, 128.0, 160.0, 303.0, 472.0, 880.0, 1570.0, 3246.0, 8236.0, 30177.0, 204948.0, 3611317.0, 279273.0, 36311.0, 10164.0, 3600.0, 1547.0, 749.0, 403.0, 219.0, 129.0, 64.0, 58.0, 21.0, 18.0, 16.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78466796875, -0.7589874267578125, -0.733306884765625, -0.7076263427734375, -0.68194580078125, -0.6562652587890625, -0.630584716796875, -0.6049041748046875, -0.5792236328125, -0.5535430908203125, -0.527862548828125, -0.5021820068359375, -0.47650146484375, -0.4508209228515625, -0.425140380859375, -0.3994598388671875, -0.373779296875, -0.3480987548828125, -0.322418212890625, -0.2967376708984375, -0.27105712890625, -0.2453765869140625, -0.219696044921875, -0.1940155029296875, -0.1683349609375, -0.1426544189453125, -0.116973876953125, -0.0912933349609375, -0.06561279296875, -0.0399322509765625, -0.014251708984375, 0.0114288330078125, 0.037109375, 0.0627899169921875, 0.088470458984375, 0.1141510009765625, 0.13983154296875, 0.1655120849609375, 0.191192626953125, 0.2168731689453125, 0.2425537109375, 0.2682342529296875, 0.293914794921875, 0.3195953369140625, 0.34527587890625, 0.3709564208984375, 0.396636962890625, 0.4223175048828125, 0.447998046875, 0.4736785888671875, 0.499359130859375, 0.5250396728515625, 0.55072021484375, 0.5764007568359375, 0.602081298828125, 0.6277618408203125, 0.6534423828125, 0.6791229248046875, 0.704803466796875, 0.7304840087890625, 0.75616455078125, 0.7818450927734375, 0.807525634765625, 0.8332061767578125, 0.85888671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 10.0, 8.0, 11.0, 11.0, 35.0, 55.0, 79.0, 156.0, 316.0, 854.0, 1311.0, 646.0, 267.0, 100.0, 67.0, 35.0, 34.0, 26.0, 10.0, 11.0, 8.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0576171875, -1.0268478393554688, -0.9960784912109375, -0.9653091430664062, -0.934539794921875, -0.9037704467773438, -0.8730010986328125, -0.8422317504882812, -0.81146240234375, -0.7806930541992188, -0.7499237060546875, -0.7191543579101562, -0.688385009765625, -0.6576156616210938, -0.6268463134765625, -0.5960769653320312, -0.5653076171875, -0.5345382690429688, -0.5037689208984375, -0.47299957275390625, -0.442230224609375, -0.41146087646484375, -0.3806915283203125, -0.34992218017578125, -0.31915283203125, -0.28838348388671875, -0.2576141357421875, -0.22684478759765625, -0.196075439453125, -0.16530609130859375, -0.1345367431640625, -0.10376739501953125, -0.072998046875, -0.04222869873046875, -0.0114593505859375, 0.01930999755859375, 0.050079345703125, 0.08084869384765625, 0.1116180419921875, 0.14238739013671875, 0.17315673828125, 0.20392608642578125, 0.2346954345703125, 0.26546478271484375, 0.296234130859375, 0.32700347900390625, 0.3577728271484375, 0.38854217529296875, 0.4193115234375, 0.45008087158203125, 0.4808502197265625, 0.5116195678710938, 0.542388916015625, 0.5731582641601562, 0.6039276123046875, 0.6346969604492188, 0.66546630859375, 0.6962356567382812, 0.7270050048828125, 0.7577743530273438, 0.788543701171875, 0.8193130493164062, 0.8500823974609375, 0.8808517456054688, 0.91162109375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 10.0, 17.0, 16.0, 47.0, 90.0, 132.0, 174.0, 188.0, 141.0, 78.0, 37.0, 25.0, 12.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.493501663208008, -7.279058456420898, -7.064615726470947, -6.850172519683838, -6.6357293128967285, -6.421286582946777, -6.206843376159668, -5.992400169372559, -5.777956962585449, -5.56351375579834, -5.349071025848389, -5.134627819061279, -4.92018461227417, -4.705741882324219, -4.491298675537109, -4.27685546875, -4.062412261962891, -3.8479692935943604, -3.633526086807251, -3.4190831184387207, -3.2046399116516113, -2.990196943283081, -2.775753974914551, -2.5613107681274414, -2.3468680381774902, -2.13242506980896, -1.9179818630218506, -1.7035388946533203, -1.489095687866211, -1.2746527194976807, -1.0602096319198608, -0.845766544342041, -0.6313233375549316, -0.4168802499771118, -0.20243719220161438, 0.012005865573883057, 0.22644895315170288, 0.44089198112487793, 0.6553350687026978, 0.8697781562805176, 1.0842212438583374, 1.2986643314361572, 1.513107419013977, 1.7275505065917969, 1.9419934749603271, 2.1564364433288574, 2.370879650115967, 2.585322856903076, 2.7997658252716064, 3.0142087936401367, 3.228652000427246, 3.4430949687957764, 3.6575381755828857, 3.871981143951416, 4.086424350738525, 4.300867080688477, 4.515310287475586, 4.729753494262695, 4.9441962242126465, 5.158639430999756, 5.373082637786865, 5.587525367736816, 5.801968574523926, 6.016411781311035, 6.2308549880981445]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 10.0, 12.0, 11.0, 27.0, 29.0, 37.0, 41.0, 56.0, 57.0, 69.0, 68.0, 72.0, 77.0, 71.0, 68.0, 57.0, 50.0, 52.0, 42.0, 22.0, 26.0, 13.0, 15.0, 5.0, 10.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2524070739746094, -3.106252431869507, -2.960097551345825, -2.8139429092407227, -2.667788028717041, -2.5216333866119385, -2.375478744506836, -2.2293238639831543, -2.0831689834594727, -1.9370142221450806, -1.7908594608306885, -1.644704818725586, -1.4985499382019043, -1.3523952960968018, -1.2062405347824097, -1.0600857734680176, -0.913931131362915, -0.767776370048523, -0.6216216087341309, -0.47546690702438354, -0.32931214570999146, -0.18315738439559937, -0.03700268268585205, 0.10915207862854004, 0.25530683994293213, 0.4014616012573242, 0.5476163625717163, 0.6937710642814636, 0.8399258255958557, 0.9860805869102478, 1.1322352886199951, 1.2783900499343872, 1.4245448112487793, 1.5706995725631714, 1.7168543338775635, 1.863008975982666, 2.0091638565063477, 2.15531849861145, 2.3014731407165527, 2.4476280212402344, 2.593782901763916, 2.7399375438690186, 2.8860924243927, 3.0322470664978027, 3.1784019470214844, 3.324556589126587, 3.4707112312316895, 3.616866111755371, 3.7630207538604736, 3.909175395965576, 4.055330276489258, 4.2014851570129395, 4.347639560699463, 4.4937944412231445, 4.639949321746826, 4.786104202270508, 4.932258605957031, 5.078413486480713, 5.224567890167236, 5.370722770690918, 5.5168776512146, 5.663032531738281, 5.809186935424805, 5.955341815948486, 6.101496696472168]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 7.0, 9.0, 9.0, 16.0, 16.0, 27.0, 31.0, 62.0, 76.0, 104.0, 128.0, 255.0, 382.0, 597.0, 1004.0, 1803.0, 3241.0, 6463.0, 12998.0, 29751.0, 71678.0, 185008.0, 372428.0, 214466.0, 83086.0, 34179.0, 14911.0, 7357.0, 3613.0, 1925.0, 1112.0, 662.0, 379.0, 250.0, 167.0, 103.0, 82.0, 47.0, 32.0, 21.0, 16.0, 14.0, 20.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.701171875, -0.6774673461914062, -0.6537628173828125, -0.6300582885742188, -0.606353759765625, -0.5826492309570312, -0.5589447021484375, -0.5352401733398438, -0.51153564453125, -0.48783111572265625, -0.4641265869140625, -0.44042205810546875, -0.416717529296875, -0.39301300048828125, -0.3693084716796875, -0.34560394287109375, -0.3218994140625, -0.29819488525390625, -0.2744903564453125, -0.25078582763671875, -0.227081298828125, -0.20337677001953125, -0.1796722412109375, -0.15596771240234375, -0.13226318359375, -0.10855865478515625, -0.0848541259765625, -0.06114959716796875, -0.037445068359375, -0.01374053955078125, 0.0099639892578125, 0.03366851806640625, 0.057373046875, 0.08107757568359375, 0.1047821044921875, 0.12848663330078125, 0.152191162109375, 0.17589569091796875, 0.1996002197265625, 0.22330474853515625, 0.24700927734375, 0.27071380615234375, 0.2944183349609375, 0.31812286376953125, 0.341827392578125, 0.36553192138671875, 0.3892364501953125, 0.41294097900390625, 0.4366455078125, 0.46035003662109375, 0.4840545654296875, 0.5077590942382812, 0.531463623046875, 0.5551681518554688, 0.5788726806640625, 0.6025772094726562, 0.62628173828125, 0.6499862670898438, 0.6736907958984375, 0.6973953247070312, 0.721099853515625, 0.7448043823242188, 0.7685089111328125, 0.7922134399414062, 0.81591796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 7.0, 12.0, 11.0, 21.0, 20.0, 20.0, 24.0, 34.0, 42.0, 35.0, 41.0, 55.0, 39.0, 41.0, 66.0, 72.0, 64.0, 55.0, 54.0, 45.0, 45.0, 36.0, 35.0, 24.0, 21.0, 20.0, 10.0, 15.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35986328125, -0.3478584289550781, -0.33585357666015625, -0.3238487243652344, -0.3118438720703125, -0.2998390197753906, -0.28783416748046875, -0.2758293151855469, -0.263824462890625, -0.2518196105957031, -0.23981475830078125, -0.22780990600585938, -0.2158050537109375, -0.20380020141601562, -0.19179534912109375, -0.17979049682617188, -0.16778564453125, -0.15578079223632812, -0.14377593994140625, -0.13177108764648438, -0.1197662353515625, -0.10776138305664062, -0.09575653076171875, -0.08375167846679688, -0.071746826171875, -0.059741973876953125, -0.04773712158203125, -0.035732269287109375, -0.0237274169921875, -0.011722564697265625, 0.00028228759765625, 0.012287139892578125, 0.0242919921875, 0.036296844482421875, 0.04830169677734375, 0.060306549072265625, 0.0723114013671875, 0.08431625366210938, 0.09632110595703125, 0.10832595825195312, 0.120330810546875, 0.13233566284179688, 0.14434051513671875, 0.15634536743164062, 0.1683502197265625, 0.18035507202148438, 0.19235992431640625, 0.20436477661132812, 0.21636962890625, 0.22837448120117188, 0.24037933349609375, 0.2523841857910156, 0.2643890380859375, 0.2763938903808594, 0.28839874267578125, 0.3004035949707031, 0.312408447265625, 0.3244132995605469, 0.33641815185546875, 0.3484230041503906, 0.3604278564453125, 0.3724327087402344, 0.38443756103515625, 0.3964424133300781, 0.408447265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 14.0, 14.0, 23.0, 32.0, 61.0, 78.0, 147.0, 258.0, 511.0, 1092.0, 2563.0, 6373.0, 18882.0, 66045.0, 313933.0, 523422.0, 80305.0, 22012.0, 7499.0, 2843.0, 1243.0, 549.0, 275.0, 148.0, 81.0, 55.0, 32.0, 19.0, 16.0, 9.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8855743408203125, -0.850250244140625, -0.8149261474609375, -0.77960205078125, -0.7442779541015625, -0.708953857421875, -0.6736297607421875, -0.6383056640625, -0.6029815673828125, -0.567657470703125, -0.5323333740234375, -0.49700927734375, -0.4616851806640625, -0.426361083984375, -0.3910369873046875, -0.355712890625, -0.3203887939453125, -0.285064697265625, -0.2497406005859375, -0.21441650390625, -0.1790924072265625, -0.143768310546875, -0.1084442138671875, -0.0731201171875, -0.0377960205078125, -0.002471923828125, 0.0328521728515625, 0.06817626953125, 0.1035003662109375, 0.138824462890625, 0.1741485595703125, 0.20947265625, 0.2447967529296875, 0.280120849609375, 0.3154449462890625, 0.35076904296875, 0.3860931396484375, 0.421417236328125, 0.4567413330078125, 0.4920654296875, 0.5273895263671875, 0.562713623046875, 0.5980377197265625, 0.63336181640625, 0.6686859130859375, 0.704010009765625, 0.7393341064453125, 0.774658203125, 0.8099822998046875, 0.845306396484375, 0.8806304931640625, 0.91595458984375, 0.9512786865234375, 0.986602783203125, 1.0219268798828125, 1.0572509765625, 1.0925750732421875, 1.127899169921875, 1.1632232666015625, 1.19854736328125, 1.2338714599609375, 1.269195556640625, 1.3045196533203125, 1.33984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 0.0, 7.0, 4.0, 6.0, 7.0, 10.0, 12.0, 12.0, 13.0, 15.0, 14.0, 24.0, 24.0, 25.0, 25.0, 26.0, 32.0, 33.0, 42.0, 46.0, 40.0, 43.0, 46.0, 51.0, 50.0, 44.0, 34.0, 51.0, 30.0, 32.0, 20.0, 32.0, 17.0, 17.0, 24.0, 21.0, 15.0, 8.0, 11.0, 8.0, 8.0, 3.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.046875, -1.0137481689453125, -0.980621337890625, -0.9474945068359375, -0.91436767578125, -0.8812408447265625, -0.848114013671875, -0.8149871826171875, -0.7818603515625, -0.7487335205078125, -0.715606689453125, -0.6824798583984375, -0.64935302734375, -0.6162261962890625, -0.583099365234375, -0.5499725341796875, -0.516845703125, -0.4837188720703125, -0.450592041015625, -0.4174652099609375, -0.38433837890625, -0.3512115478515625, -0.318084716796875, -0.2849578857421875, -0.2518310546875, -0.2187042236328125, -0.185577392578125, -0.1524505615234375, -0.11932373046875, -0.0861968994140625, -0.053070068359375, -0.0199432373046875, 0.01318359375, 0.0463104248046875, 0.079437255859375, 0.1125640869140625, 0.14569091796875, 0.1788177490234375, 0.211944580078125, 0.2450714111328125, 0.2781982421875, 0.3113250732421875, 0.344451904296875, 0.3775787353515625, 0.41070556640625, 0.4438323974609375, 0.476959228515625, 0.5100860595703125, 0.543212890625, 0.5763397216796875, 0.609466552734375, 0.6425933837890625, 0.67572021484375, 0.7088470458984375, 0.741973876953125, 0.7751007080078125, 0.8082275390625, 0.8413543701171875, 0.874481201171875, 0.9076080322265625, 0.94073486328125, 0.9738616943359375, 1.006988525390625, 1.0401153564453125, 1.0732421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 11.0, 12.0, 18.0, 24.0, 40.0, 63.0, 109.0, 287.0, 631.0, 2014.0, 8497.0, 74806.0, 849545.0, 98672.0, 10029.0, 2395.0, 750.0, 301.0, 111.0, 79.0, 46.0, 26.0, 16.0, 8.0, 10.0, 6.0, 7.0, 12.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5087890625, -0.49213409423828125, -0.4754791259765625, -0.45882415771484375, -0.442169189453125, -0.42551422119140625, -0.4088592529296875, -0.39220428466796875, -0.37554931640625, -0.35889434814453125, -0.3422393798828125, -0.32558441162109375, -0.308929443359375, -0.29227447509765625, -0.2756195068359375, -0.25896453857421875, -0.2423095703125, -0.22565460205078125, -0.2089996337890625, -0.19234466552734375, -0.175689697265625, -0.15903472900390625, -0.1423797607421875, -0.12572479248046875, -0.10906982421875, -0.09241485595703125, -0.0757598876953125, -0.05910491943359375, -0.042449951171875, -0.02579498291015625, -0.0091400146484375, 0.00751495361328125, 0.024169921875, 0.04082489013671875, 0.0574798583984375, 0.07413482666015625, 0.090789794921875, 0.10744476318359375, 0.1240997314453125, 0.14075469970703125, 0.15740966796875, 0.17406463623046875, 0.1907196044921875, 0.20737457275390625, 0.224029541015625, 0.24068450927734375, 0.2573394775390625, 0.27399444580078125, 0.2906494140625, 0.30730438232421875, 0.3239593505859375, 0.34061431884765625, 0.357269287109375, 0.37392425537109375, 0.3905792236328125, 0.40723419189453125, 0.42388916015625, 0.44054412841796875, 0.4571990966796875, 0.47385406494140625, 0.490509033203125, 0.5071640014648438, 0.5238189697265625, 0.5404739379882812, 0.55712890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 4.0, 8.0, 10.0, 4.0, 12.0, 14.0, 23.0, 19.0, 28.0, 42.0, 79.0, 121.0, 145.0, 146.0, 107.0, 51.0, 57.0, 27.0, 20.0, 14.0, 12.0, 11.0, 8.0, 10.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010776519775390625, -0.00010438170284032822, -0.00010099820792675018, -9.761471301317215e-05, -9.423121809959412e-05, -9.084772318601608e-05, -8.746422827243805e-05, -8.408073335886002e-05, -8.069723844528198e-05, -7.731374353170395e-05, -7.393024861812592e-05, -7.054675370454788e-05, -6.716325879096985e-05, -6.377976387739182e-05, -6.039626896381378e-05, -5.701277405023575e-05, -5.3629279136657715e-05, -5.024578422307968e-05, -4.686228930950165e-05, -4.3478794395923615e-05, -4.009529948234558e-05, -3.671180456876755e-05, -3.3328309655189514e-05, -2.994481474161148e-05, -2.6561319828033447e-05, -2.3177824914455414e-05, -1.979433000087738e-05, -1.6410835087299347e-05, -1.3027340173721313e-05, -9.64384526014328e-06, -6.260350346565247e-06, -2.876855432987213e-06, 5.066394805908203e-07, 3.890134394168854e-06, 7.273629307746887e-06, 1.065712422132492e-05, 1.4040619134902954e-05, 1.7424114048480988e-05, 2.080760896205902e-05, 2.4191103875637054e-05, 2.7574598789215088e-05, 3.095809370279312e-05, 3.4341588616371155e-05, 3.772508352994919e-05, 4.110857844352722e-05, 4.4492073357105255e-05, 4.787556827068329e-05, 5.125906318426132e-05, 5.4642558097839355e-05, 5.802605301141739e-05, 6.140954792499542e-05, 6.479304283857346e-05, 6.817653775215149e-05, 7.156003266572952e-05, 7.494352757930756e-05, 7.832702249288559e-05, 8.171051740646362e-05, 8.509401232004166e-05, 8.847750723361969e-05, 9.186100214719772e-05, 9.524449706077576e-05, 9.862799197435379e-05, 0.00010201148688793182, 0.00010539498180150986, 0.00010877847671508789]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 1.0, 7.0, 5.0, 6.0, 9.0, 17.0, 24.0, 32.0, 49.0, 74.0, 146.0, 187.0, 358.0, 589.0, 1173.0, 2392.0, 5471.0, 14793.0, 51012.0, 257192.0, 588715.0, 89330.0, 22548.0, 7709.0, 3338.0, 1525.0, 732.0, 447.0, 259.0, 139.0, 86.0, 57.0, 42.0, 22.0, 25.0, 9.0, 18.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.266357421875, -0.2575340270996094, -0.24871063232421875, -0.23988723754882812, -0.2310638427734375, -0.22224044799804688, -0.21341705322265625, -0.20459365844726562, -0.195770263671875, -0.18694686889648438, -0.17812347412109375, -0.16930007934570312, -0.1604766845703125, -0.15165328979492188, -0.14282989501953125, -0.13400650024414062, -0.12518310546875, -0.11635971069335938, -0.10753631591796875, -0.09871292114257812, -0.0898895263671875, -0.08106613159179688, -0.07224273681640625, -0.06341934204101562, -0.054595947265625, -0.045772552490234375, -0.03694915771484375, -0.028125762939453125, -0.0193023681640625, -0.010478973388671875, -0.00165557861328125, 0.007167816162109375, 0.0159912109375, 0.024814605712890625, 0.03363800048828125, 0.042461395263671875, 0.0512847900390625, 0.060108184814453125, 0.06893157958984375, 0.07775497436523438, 0.086578369140625, 0.09540176391601562, 0.10422515869140625, 0.11304855346679688, 0.1218719482421875, 0.13069534301757812, 0.13951873779296875, 0.14834213256835938, 0.15716552734375, 0.16598892211914062, 0.17481231689453125, 0.18363571166992188, 0.1924591064453125, 0.20128250122070312, 0.21010589599609375, 0.21892929077148438, 0.227752685546875, 0.23657608032226562, 0.24539947509765625, 0.2542228698730469, 0.2630462646484375, 0.2718696594238281, 0.28069305419921875, 0.2895164489746094, 0.29833984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 6.0, 7.0, 8.0, 11.0, 9.0, 16.0, 24.0, 38.0, 36.0, 51.0, 76.0, 79.0, 90.0, 95.0, 100.0, 80.0, 62.0, 53.0, 30.0, 27.0, 25.0, 23.0, 10.0, 6.0, 10.0, 6.0, 7.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24578857421875, -0.2364501953125, -0.22711181640625, -0.2177734375, -0.20843505859375, -0.1990966796875, -0.18975830078125, -0.180419921875, -0.17108154296875, -0.1617431640625, -0.15240478515625, -0.14306640625, -0.13372802734375, -0.1243896484375, -0.11505126953125, -0.105712890625, -0.09637451171875, -0.0870361328125, -0.07769775390625, -0.068359375, -0.05902099609375, -0.0496826171875, -0.04034423828125, -0.031005859375, -0.02166748046875, -0.0123291015625, -0.00299072265625, 0.00634765625, 0.01568603515625, 0.0250244140625, 0.03436279296875, 0.043701171875, 0.05303955078125, 0.0623779296875, 0.07171630859375, 0.0810546875, 0.09039306640625, 0.0997314453125, 0.10906982421875, 0.118408203125, 0.12774658203125, 0.1370849609375, 0.14642333984375, 0.15576171875, 0.16510009765625, 0.1744384765625, 0.18377685546875, 0.193115234375, 0.20245361328125, 0.2117919921875, 0.22113037109375, 0.23046875, 0.23980712890625, 0.2491455078125, 0.25848388671875, 0.267822265625, 0.27716064453125, 0.2864990234375, 0.29583740234375, 0.30517578125, 0.31451416015625, 0.3238525390625, 0.33319091796875, 0.342529296875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 7.0, 15.0, 33.0, 82.0, 138.0, 322.0, 195.0, 90.0, 58.0, 26.0, 8.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.334053039550781, -7.981848239898682, -7.629642963409424, -7.277438163757324, -6.925232887268066, -6.573028087615967, -6.220823287963867, -5.868618011474609, -5.51641321182251, -5.16420841217041, -4.812003135681152, -4.459798336029053, -4.107593536376953, -3.7553882598876953, -3.4031834602355957, -3.050978422164917, -2.6987733840942383, -2.3465683460235596, -1.9943634271621704, -1.6421585083007812, -1.2899534702301025, -0.9377484321594238, -0.5855436325073242, -0.2333385944366455, 0.1188664436340332, 0.47107142210006714, 0.8232764005661011, 1.1754813194274902, 1.527686357498169, 1.8798913955688477, 2.2320961952209473, 2.584301233291626, 2.9365062713623047, 3.2887113094329834, 3.640916347503662, 3.9931211471557617, 4.3453264236450195, 4.697531223297119, 5.049736022949219, 5.401941299438477, 5.754146099090576, 6.106350898742676, 6.458556175231934, 6.810760974884033, 7.162965774536133, 7.515171051025391, 7.86737585067749, 8.21958065032959, 8.571785926818848, 8.923991203308105, 9.276195526123047, 9.628400802612305, 9.980606079101562, 10.33281135559082, 10.685015678405762, 11.03722095489502, 11.389425277709961, 11.741630554199219, 12.09383487701416, 12.446040153503418, 12.798245429992676, 13.150449752807617, 13.502655029296875, 13.854860305786133, 14.20706558227539]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 10.0, 10.0, 4.0, 11.0, 8.0, 10.0, 9.0, 12.0, 24.0, 17.0, 23.0, 12.0, 24.0, 28.0, 25.0, 32.0, 29.0, 39.0, 57.0, 59.0, 75.0, 59.0, 56.0, 40.0, 34.0, 40.0, 34.0, 37.0, 28.0, 14.0, 19.0, 23.0, 17.0, 12.0, 12.0, 12.0, 8.0, 4.0, 8.0, 4.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-5.045686721801758, -4.908112049102783, -4.770537376403809, -4.632962226867676, -4.495387554168701, -4.357812881469727, -4.220238208770752, -4.082663536071777, -3.9450886249542236, -3.807513952255249, -3.6699390411376953, -3.5323643684387207, -3.394789695739746, -3.2572147846221924, -3.1196401119232178, -2.982065200805664, -2.8444905281066895, -2.706915855407715, -2.569340944290161, -2.4317662715911865, -2.294191360473633, -2.156616687774658, -2.0190420150756836, -1.8814672231674194, -1.7438924312591553, -1.6063176393508911, -1.468742847442627, -1.3311681747436523, -1.1935933828353882, -1.056018590927124, -0.9184438586235046, -0.7808691263198853, -0.643294095993042, -0.5057193040847778, -0.36814457178115845, -0.23056980967521667, -0.0929950475692749, 0.04457974433898926, 0.18215447664260864, 0.319729208946228, 0.4573040008544922, 0.5948787927627563, 0.7324535250663757, 0.8700282573699951, 1.0076030492782593, 1.1451778411865234, 1.282752513885498, 1.4203273057937622, 1.5579020977020264, 1.6954768896102905, 1.8330516815185547, 1.9706263542175293, 2.108201026916504, 2.2457759380340576, 2.3833506107330322, 2.520925521850586, 2.6585001945495605, 2.796074867248535, 2.933649778366089, 3.0712244510650635, 3.208799362182617, 3.346374034881592, 3.4839487075805664, 3.621523380279541, 3.7590982913970947]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 7.0, 13.0, 17.0, 28.0, 34.0, 44.0, 63.0, 91.0, 146.0, 239.0, 374.0, 619.0, 1037.0, 1941.0, 4067.0, 10070.0, 35942.0, 238264.0, 2518564.0, 1230014.0, 115488.0, 22558.0, 7382.0, 3239.0, 1631.0, 886.0, 586.0, 346.0, 219.0, 138.0, 78.0, 66.0, 33.0, 20.0, 15.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.347808837890625, -0.33380126953125, -0.319793701171875, -0.3057861328125, -0.291778564453125, -0.27777099609375, -0.263763427734375, -0.249755859375, -0.235748291015625, -0.22174072265625, -0.207733154296875, -0.1937255859375, -0.179718017578125, -0.16571044921875, -0.151702880859375, -0.1376953125, -0.123687744140625, -0.10968017578125, -0.095672607421875, -0.0816650390625, -0.067657470703125, -0.05364990234375, -0.039642333984375, -0.025634765625, -0.011627197265625, 0.00238037109375, 0.016387939453125, 0.0303955078125, 0.044403076171875, 0.05841064453125, 0.072418212890625, 0.08642578125, 0.100433349609375, 0.11444091796875, 0.128448486328125, 0.1424560546875, 0.156463623046875, 0.17047119140625, 0.184478759765625, 0.198486328125, 0.212493896484375, 0.22650146484375, 0.240509033203125, 0.2545166015625, 0.268524169921875, 0.28253173828125, 0.296539306640625, 0.310546875, 0.324554443359375, 0.33856201171875, 0.352569580078125, 0.3665771484375, 0.380584716796875, 0.39459228515625, 0.408599853515625, 0.422607421875, 0.436614990234375, 0.45062255859375, 0.464630126953125, 0.4786376953125, 0.492645263671875, 0.50665283203125, 0.520660400390625, 0.53466796875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 6.0, 10.0, 16.0, 19.0, 20.0, 33.0, 33.0, 27.0, 31.0, 46.0, 47.0, 57.0, 55.0, 68.0, 67.0, 65.0, 51.0, 51.0, 41.0, 52.0, 37.0, 35.0, 22.0, 23.0, 20.0, 9.0, 15.0, 9.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.332275390625, -0.32083892822265625, -0.3094024658203125, -0.29796600341796875, -0.286529541015625, -0.27509307861328125, -0.2636566162109375, -0.25222015380859375, -0.24078369140625, -0.22934722900390625, -0.2179107666015625, -0.20647430419921875, -0.195037841796875, -0.18360137939453125, -0.1721649169921875, -0.16072845458984375, -0.1492919921875, -0.13785552978515625, -0.1264190673828125, -0.11498260498046875, -0.103546142578125, -0.09210968017578125, -0.0806732177734375, -0.06923675537109375, -0.05780029296875, -0.04636383056640625, -0.0349273681640625, -0.02349090576171875, -0.012054443359375, -0.00061798095703125, 0.0108184814453125, 0.02225494384765625, 0.03369140625, 0.04512786865234375, 0.0565643310546875, 0.06800079345703125, 0.079437255859375, 0.09087371826171875, 0.1023101806640625, 0.11374664306640625, 0.12518310546875, 0.13661956787109375, 0.1480560302734375, 0.15949249267578125, 0.170928955078125, 0.18236541748046875, 0.1938018798828125, 0.20523834228515625, 0.2166748046875, 0.22811126708984375, 0.2395477294921875, 0.25098419189453125, 0.262420654296875, 0.27385711669921875, 0.2852935791015625, 0.29673004150390625, 0.30816650390625, 0.31960296630859375, 0.3310394287109375, 0.34247589111328125, 0.353912353515625, 0.36534881591796875, 0.3767852783203125, 0.38822174072265625, 0.399658203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 10.0, 14.0, 19.0, 32.0, 51.0, 91.0, 99.0, 217.0, 377.0, 655.0, 1254.0, 2707.0, 6799.0, 20575.0, 107569.0, 2747142.0, 1211830.0, 69878.0, 15491.0, 5266.0, 2047.0, 964.0, 514.0, 267.0, 135.0, 96.0, 43.0, 40.0, 27.0, 22.0, 9.0, 12.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7422561645507812, -0.7203521728515625, -0.6984481811523438, -0.676544189453125, -0.6546401977539062, -0.6327362060546875, -0.6108322143554688, -0.58892822265625, -0.5670242309570312, -0.5451202392578125, -0.5232162475585938, -0.501312255859375, -0.47940826416015625, -0.4575042724609375, -0.43560028076171875, -0.4136962890625, -0.39179229736328125, -0.3698883056640625, -0.34798431396484375, -0.326080322265625, -0.30417633056640625, -0.2822723388671875, -0.26036834716796875, -0.23846435546875, -0.21656036376953125, -0.1946563720703125, -0.17275238037109375, -0.150848388671875, -0.12894439697265625, -0.1070404052734375, -0.08513641357421875, -0.063232421875, -0.04132843017578125, -0.0194244384765625, 0.00247955322265625, 0.024383544921875, 0.04628753662109375, 0.0681915283203125, 0.09009552001953125, 0.11199951171875, 0.13390350341796875, 0.1558074951171875, 0.17771148681640625, 0.199615478515625, 0.22151947021484375, 0.2434234619140625, 0.26532745361328125, 0.2872314453125, 0.30913543701171875, 0.3310394287109375, 0.35294342041015625, 0.374847412109375, 0.39675140380859375, 0.4186553955078125, 0.44055938720703125, 0.46246337890625, 0.48436737060546875, 0.5062713623046875, 0.5281753540039062, 0.550079345703125, 0.5719833374023438, 0.5938873291015625, 0.6157913208007812, 0.6376953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 2.0, 7.0, 9.0, 6.0, 11.0, 24.0, 38.0, 43.0, 73.0, 130.0, 274.0, 598.0, 1041.0, 862.0, 428.0, 218.0, 109.0, 65.0, 49.0, 27.0, 16.0, 14.0, 7.0, 4.0, 4.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75927734375, -0.7353897094726562, -0.7115020751953125, -0.6876144409179688, -0.663726806640625, -0.6398391723632812, -0.6159515380859375, -0.5920639038085938, -0.56817626953125, -0.5442886352539062, -0.5204010009765625, -0.49651336669921875, -0.472625732421875, -0.44873809814453125, -0.4248504638671875, -0.40096282958984375, -0.3770751953125, -0.35318756103515625, -0.3292999267578125, -0.30541229248046875, -0.281524658203125, -0.25763702392578125, -0.2337493896484375, -0.20986175537109375, -0.18597412109375, -0.16208648681640625, -0.1381988525390625, -0.11431121826171875, -0.090423583984375, -0.06653594970703125, -0.0426483154296875, -0.01876068115234375, 0.005126953125, 0.02901458740234375, 0.0529022216796875, 0.07678985595703125, 0.100677490234375, 0.12456512451171875, 0.1484527587890625, 0.17234039306640625, 0.19622802734375, 0.22011566162109375, 0.2440032958984375, 0.26789093017578125, 0.291778564453125, 0.31566619873046875, 0.3395538330078125, 0.36344146728515625, 0.3873291015625, 0.41121673583984375, 0.4351043701171875, 0.45899200439453125, 0.482879638671875, 0.5067672729492188, 0.5306549072265625, 0.5545425415039062, 0.57843017578125, 0.6023178100585938, 0.6262054443359375, 0.6500930786132812, 0.673980712890625, 0.6978683471679688, 0.7217559814453125, 0.7456436157226562, 0.76953125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 12.0, 37.0, 108.0, 235.0, 339.0, 168.0, 61.0, 15.0, 7.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.616809844970703, -16.29242515563965, -15.96804141998291, -15.643656730651855, -15.319272994995117, -14.994888305664062, -14.670503616333008, -14.346118927001953, -14.021735191345215, -13.69735050201416, -13.372966766357422, -13.048582077026367, -12.724197387695312, -12.399813652038574, -12.07542896270752, -11.751045227050781, -11.426660537719727, -11.102275848388672, -10.777892112731934, -10.453507423400879, -10.12912368774414, -9.804738998413086, -9.480354309082031, -9.155969619750977, -8.831585884094238, -8.507201194763184, -8.182817459106445, -7.858432769775391, -7.534048557281494, -7.209664344787598, -6.885279655456543, -6.5608954429626465, -6.23651123046875, -5.9121270179748535, -5.587742805480957, -5.263358116149902, -4.938973903656006, -4.614589691162109, -4.290205001831055, -3.965820789337158, -3.6414365768432617, -3.3170523643493652, -2.9926679134368896, -2.668283462524414, -2.3438992500305176, -2.019515037536621, -1.6951305866241455, -1.37074613571167, -1.0463619232177734, -0.7219775915145874, -0.39759325981140137, -0.07320892810821533, 0.2511754035949707, 0.5755597352981567, 0.8999440670013428, 1.2243285179138184, 1.5487127304077148, 1.8730970621109009, 2.197481393814087, 2.5218658447265625, 2.846250057220459, 3.1706342697143555, 3.495018720626831, 3.8194031715393066, 4.143787384033203]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 9.0, 10.0, 16.0, 16.0, 17.0, 31.0, 29.0, 34.0, 37.0, 30.0, 42.0, 42.0, 47.0, 55.0, 50.0, 66.0, 56.0, 47.0, 41.0, 43.0, 40.0, 32.0, 31.0, 26.0, 31.0, 22.0, 16.0, 18.0, 12.0, 8.0, 10.0, 8.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.011326789855957, -1.9330666065216064, -1.8548064231872559, -1.7765462398529053, -1.6982859373092651, -1.6200257539749146, -1.541765570640564, -1.4635052680969238, -1.3852450847625732, -1.3069849014282227, -1.228724718093872, -1.1504645347595215, -1.0722042322158813, -0.9939440488815308, -0.9156838655471802, -0.8374236226081848, -0.759163498878479, -0.6809033155441284, -0.6026430726051331, -0.5243828892707825, -0.4461226761341095, -0.3678624629974365, -0.28960227966308594, -0.21134203672409058, -0.13308185338974, -0.054821647703647614, 0.023438557982444763, 0.10169875621795654, 0.17995896935462952, 0.2582191824913025, 0.3364793658256531, 0.41473960876464844, 0.492999792098999, 0.5712599754333496, 0.649520218372345, 0.7277804017066956, 0.8060406446456909, 0.8843008279800415, 0.9625610113143921, 1.0408213138580322, 1.1190814971923828, 1.1973416805267334, 1.275601863861084, 1.3538620471954346, 1.4321223497390747, 1.5103825330734253, 1.5886427164077759, 1.666903018951416, 1.745163083076477, 1.8234232664108276, 1.9016834497451782, 1.9799437522888184, 2.058203935623169, 2.1364641189575195, 2.21472430229187, 2.2929844856262207, 2.3712446689605713, 2.449504852294922, 2.5277650356292725, 2.606025218963623, 2.6842854022979736, 2.762545585632324, 2.840806007385254, 2.9190661907196045, 2.997326374053955]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 2.0, 6.0, 9.0, 5.0, 22.0, 22.0, 37.0, 48.0, 73.0, 127.0, 170.0, 260.0, 446.0, 672.0, 1129.0, 1850.0, 3333.0, 6286.0, 13227.0, 33351.0, 104588.0, 407204.0, 337347.0, 85486.0, 28139.0, 11690.0, 5532.0, 3065.0, 1667.0, 1012.0, 594.0, 388.0, 259.0, 175.0, 95.0, 77.0, 51.0, 40.0, 20.0, 15.0, 11.0, 7.0, 9.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1728515625, -1.1372222900390625, -1.101593017578125, -1.0659637451171875, -1.03033447265625, -0.9947052001953125, -0.959075927734375, -0.9234466552734375, -0.8878173828125, -0.8521881103515625, -0.816558837890625, -0.7809295654296875, -0.74530029296875, -0.7096710205078125, -0.674041748046875, -0.6384124755859375, -0.602783203125, -0.5671539306640625, -0.531524658203125, -0.4958953857421875, -0.46026611328125, -0.4246368408203125, -0.389007568359375, -0.3533782958984375, -0.3177490234375, -0.2821197509765625, -0.246490478515625, -0.2108612060546875, -0.17523193359375, -0.1396026611328125, -0.103973388671875, -0.0683441162109375, -0.03271484375, 0.0029144287109375, 0.038543701171875, 0.0741729736328125, 0.10980224609375, 0.1454315185546875, 0.181060791015625, 0.2166900634765625, 0.2523193359375, 0.2879486083984375, 0.323577880859375, 0.3592071533203125, 0.39483642578125, 0.4304656982421875, 0.466094970703125, 0.5017242431640625, 0.537353515625, 0.5729827880859375, 0.608612060546875, 0.6442413330078125, 0.67987060546875, 0.7154998779296875, 0.751129150390625, 0.7867584228515625, 0.8223876953125, 0.8580169677734375, 0.893646240234375, 0.9292755126953125, 0.96490478515625, 1.0005340576171875, 1.036163330078125, 1.0717926025390625, 1.107421875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 1.0, 3.0, 4.0, 3.0, 13.0, 5.0, 13.0, 20.0, 23.0, 28.0, 24.0, 23.0, 26.0, 44.0, 47.0, 41.0, 45.0, 52.0, 72.0, 68.0, 52.0, 50.0, 43.0, 61.0, 35.0, 41.0, 36.0, 34.0, 17.0, 20.0, 16.0, 9.0, 9.0, 7.0, 8.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.3280754089355469, -0.31679534912109375, -0.3055152893066406, -0.2942352294921875, -0.2829551696777344, -0.27167510986328125, -0.2603950500488281, -0.249114990234375, -0.23783493041992188, -0.22655487060546875, -0.21527481079101562, -0.2039947509765625, -0.19271469116210938, -0.18143463134765625, -0.17015457153320312, -0.15887451171875, -0.14759445190429688, -0.13631439208984375, -0.12503433227539062, -0.1137542724609375, -0.10247421264648438, -0.09119415283203125, -0.07991409301757812, -0.068634033203125, -0.057353973388671875, -0.04607391357421875, -0.034793853759765625, -0.0235137939453125, -0.012233734130859375, -0.00095367431640625, 0.010326385498046875, 0.0216064453125, 0.032886505126953125, 0.04416656494140625, 0.055446624755859375, 0.0667266845703125, 0.07800674438476562, 0.08928680419921875, 0.10056686401367188, 0.111846923828125, 0.12312698364257812, 0.13440704345703125, 0.14568710327148438, 0.1569671630859375, 0.16824722290039062, 0.17952728271484375, 0.19080734252929688, 0.20208740234375, 0.21336746215820312, 0.22464752197265625, 0.23592758178710938, 0.2472076416015625, 0.2584877014160156, 0.26976776123046875, 0.2810478210449219, 0.292327880859375, 0.3036079406738281, 0.31488800048828125, 0.3261680603027344, 0.3374481201171875, 0.3487281799316406, 0.36000823974609375, 0.3712882995605469, 0.382568359375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 6.0, 11.0, 12.0, 17.0, 30.0, 36.0, 66.0, 104.0, 159.0, 297.0, 534.0, 947.0, 1922.0, 3929.0, 8836.0, 22284.0, 70780.0, 306272.0, 507415.0, 81552.0, 25013.0, 9620.0, 4166.0, 2064.0, 1023.0, 584.0, 334.0, 187.0, 114.0, 76.0, 46.0, 31.0, 20.0, 14.0, 17.0, 4.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.78662109375, -0.7575454711914062, -0.7284698486328125, -0.6993942260742188, -0.670318603515625, -0.6412429809570312, -0.6121673583984375, -0.5830917358398438, -0.55401611328125, -0.5249404907226562, -0.4958648681640625, -0.46678924560546875, -0.437713623046875, -0.40863800048828125, -0.3795623779296875, -0.35048675537109375, -0.3214111328125, -0.29233551025390625, -0.2632598876953125, -0.23418426513671875, -0.205108642578125, -0.17603302001953125, -0.1469573974609375, -0.11788177490234375, -0.08880615234375, -0.05973052978515625, -0.0306549072265625, -0.00157928466796875, 0.027496337890625, 0.05657196044921875, 0.0856475830078125, 0.11472320556640625, 0.143798828125, 0.17287445068359375, 0.2019500732421875, 0.23102569580078125, 0.260101318359375, 0.28917694091796875, 0.3182525634765625, 0.34732818603515625, 0.37640380859375, 0.40547943115234375, 0.4345550537109375, 0.46363067626953125, 0.492706298828125, 0.5217819213867188, 0.5508575439453125, 0.5799331665039062, 0.6090087890625, 0.6380844116210938, 0.6671600341796875, 0.6962356567382812, 0.725311279296875, 0.7543869018554688, 0.7834625244140625, 0.8125381469726562, 0.84161376953125, 0.8706893920898438, 0.8997650146484375, 0.9288406372070312, 0.957916259765625, 0.9869918823242188, 1.0160675048828125, 1.0451431274414062, 1.07421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 5.0, 10.0, 13.0, 15.0, 15.0, 25.0, 13.0, 23.0, 29.0, 42.0, 30.0, 42.0, 53.0, 44.0, 54.0, 36.0, 43.0, 54.0, 49.0, 54.0, 46.0, 48.0, 29.0, 42.0, 23.0, 19.0, 19.0, 21.0, 20.0, 16.0, 10.0, 3.0, 8.0, 10.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94580078125, -0.9135360717773438, -0.8812713623046875, -0.8490066528320312, -0.816741943359375, -0.7844772338867188, -0.7522125244140625, -0.7199478149414062, -0.68768310546875, -0.6554183959960938, -0.6231536865234375, -0.5908889770507812, -0.558624267578125, -0.5263595581054688, -0.4940948486328125, -0.46183013916015625, -0.4295654296875, -0.39730072021484375, -0.3650360107421875, -0.33277130126953125, -0.300506591796875, -0.26824188232421875, -0.2359771728515625, -0.20371246337890625, -0.17144775390625, -0.13918304443359375, -0.1069183349609375, -0.07465362548828125, -0.042388916015625, -0.01012420654296875, 0.0221405029296875, 0.05440521240234375, 0.086669921875, 0.11893463134765625, 0.1511993408203125, 0.18346405029296875, 0.215728759765625, 0.24799346923828125, 0.2802581787109375, 0.31252288818359375, 0.34478759765625, 0.37705230712890625, 0.4093170166015625, 0.44158172607421875, 0.473846435546875, 0.5061111450195312, 0.5383758544921875, 0.5706405639648438, 0.6029052734375, 0.6351699829101562, 0.6674346923828125, 0.6996994018554688, 0.731964111328125, 0.7642288208007812, 0.7964935302734375, 0.8287582397460938, 0.86102294921875, 0.8932876586914062, 0.9255523681640625, 0.9578170776367188, 0.990081787109375, 1.0223464965820312, 1.0546112060546875, 1.0868759155273438, 1.119140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 21.0, 30.0, 67.0, 119.0, 324.0, 782.0, 2422.0, 12862.0, 185455.0, 803920.0, 35640.0, 4784.0, 1264.0, 432.0, 183.0, 100.0, 42.0, 31.0, 13.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.69482421875, -0.6756439208984375, -0.656463623046875, -0.6372833251953125, -0.61810302734375, -0.5989227294921875, -0.579742431640625, -0.5605621337890625, -0.5413818359375, -0.5222015380859375, -0.503021240234375, -0.4838409423828125, -0.46466064453125, -0.4454803466796875, -0.426300048828125, -0.4071197509765625, -0.387939453125, -0.3687591552734375, -0.349578857421875, -0.3303985595703125, -0.31121826171875, -0.2920379638671875, -0.272857666015625, -0.2536773681640625, -0.2344970703125, -0.2153167724609375, -0.196136474609375, -0.1769561767578125, -0.15777587890625, -0.1385955810546875, -0.119415283203125, -0.1002349853515625, -0.0810546875, -0.0618743896484375, -0.042694091796875, -0.0235137939453125, -0.00433349609375, 0.0148468017578125, 0.034027099609375, 0.0532073974609375, 0.0723876953125, 0.0915679931640625, 0.110748291015625, 0.1299285888671875, 0.14910888671875, 0.1682891845703125, 0.187469482421875, 0.2066497802734375, 0.225830078125, 0.2450103759765625, 0.264190673828125, 0.2833709716796875, 0.30255126953125, 0.3217315673828125, 0.340911865234375, 0.3600921630859375, 0.3792724609375, 0.3984527587890625, 0.417633056640625, 0.4368133544921875, 0.45599365234375, 0.4751739501953125, 0.494354248046875, 0.5135345458984375, 0.53271484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 17.0, 24.0, 41.0, 83.0, 118.0, 180.0, 179.0, 148.0, 74.0, 47.0, 30.0, 23.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012767314910888672, -0.00012314878404140472, -0.00011862441897392273, -0.00011410005390644073, -0.00010957568883895874, -0.00010505132377147675, -0.00010052695870399475, -9.600259363651276e-05, -9.147822856903076e-05, -8.695386350154877e-05, -8.242949843406677e-05, -7.790513336658478e-05, -7.338076829910278e-05, -6.885640323162079e-05, -6.43320381641388e-05, -5.98076730966568e-05, -5.5283308029174805e-05, -5.075894296169281e-05, -4.6234577894210815e-05, -4.171021282672882e-05, -3.7185847759246826e-05, -3.266148269176483e-05, -2.8137117624282837e-05, -2.3612752556800842e-05, -1.9088387489318848e-05, -1.4564022421836853e-05, -1.0039657354354858e-05, -5.515292286872864e-06, -9.909272193908691e-07, 3.5334378480911255e-06, 8.05780291557312e-06, 1.2582167983055115e-05, 1.710653305053711e-05, 2.1630898118019104e-05, 2.61552631855011e-05, 3.067962825298309e-05, 3.520399332046509e-05, 3.972835838794708e-05, 4.425272345542908e-05, 4.877708852291107e-05, 5.3301453590393066e-05, 5.782581865787506e-05, 6.235018372535706e-05, 6.687454879283905e-05, 7.139891386032104e-05, 7.592327892780304e-05, 8.044764399528503e-05, 8.497200906276703e-05, 8.949637413024902e-05, 9.402073919773102e-05, 9.854510426521301e-05, 0.00010306946933269501, 0.000107593834400177, 0.000112118199467659, 0.00011664256453514099, 0.00012116692960262299, 0.00012569129467010498, 0.00013021565973758698, 0.00013474002480506897, 0.00013926438987255096, 0.00014378875494003296, 0.00014831312000751495, 0.00015283748507499695, 0.00015736185014247894, 0.00016188621520996094]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 8.0, 12.0, 16.0, 33.0, 74.0, 105.0, 168.0, 392.0, 858.0, 2126.0, 6610.0, 28692.0, 218383.0, 700778.0, 71190.0, 13091.0, 3598.0, 1250.0, 550.0, 288.0, 140.0, 80.0, 47.0, 22.0, 13.0, 10.0, 9.0, 4.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322998046875, -0.31069183349609375, -0.2983856201171875, -0.28607940673828125, -0.273773193359375, -0.26146697998046875, -0.2491607666015625, -0.23685455322265625, -0.22454833984375, -0.21224212646484375, -0.1999359130859375, -0.18762969970703125, -0.175323486328125, -0.16301727294921875, -0.1507110595703125, -0.13840484619140625, -0.1260986328125, -0.11379241943359375, -0.1014862060546875, -0.08917999267578125, -0.076873779296875, -0.06456756591796875, -0.0522613525390625, -0.03995513916015625, -0.02764892578125, -0.01534271240234375, -0.0030364990234375, 0.00926971435546875, 0.021575927734375, 0.03388214111328125, 0.0461883544921875, 0.05849456787109375, 0.07080078125, 0.08310699462890625, 0.0954132080078125, 0.10771942138671875, 0.120025634765625, 0.13233184814453125, 0.1446380615234375, 0.15694427490234375, 0.16925048828125, 0.18155670166015625, 0.1938629150390625, 0.20616912841796875, 0.218475341796875, 0.23078155517578125, 0.2430877685546875, 0.25539398193359375, 0.2677001953125, 0.28000640869140625, 0.2923126220703125, 0.30461883544921875, 0.316925048828125, 0.32923126220703125, 0.3415374755859375, 0.35384368896484375, 0.36614990234375, 0.37845611572265625, 0.3907623291015625, 0.40306854248046875, 0.415374755859375, 0.42768096923828125, 0.4399871826171875, 0.45229339599609375, 0.464599609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 7.0, 12.0, 13.0, 12.0, 17.0, 34.0, 46.0, 71.0, 77.0, 89.0, 101.0, 115.0, 87.0, 91.0, 52.0, 45.0, 29.0, 20.0, 24.0, 14.0, 7.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.288818359375, -0.2798004150390625, -0.270782470703125, -0.2617645263671875, -0.25274658203125, -0.2437286376953125, -0.234710693359375, -0.2256927490234375, -0.2166748046875, -0.2076568603515625, -0.198638916015625, -0.1896209716796875, -0.18060302734375, -0.1715850830078125, -0.162567138671875, -0.1535491943359375, -0.14453125, -0.1355133056640625, -0.126495361328125, -0.1174774169921875, -0.10845947265625, -0.0994415283203125, -0.090423583984375, -0.0814056396484375, -0.0723876953125, -0.0633697509765625, -0.054351806640625, -0.0453338623046875, -0.03631591796875, -0.0272979736328125, -0.018280029296875, -0.0092620849609375, -0.000244140625, 0.0087738037109375, 0.017791748046875, 0.0268096923828125, 0.03582763671875, 0.0448455810546875, 0.053863525390625, 0.0628814697265625, 0.0718994140625, 0.0809173583984375, 0.089935302734375, 0.0989532470703125, 0.10797119140625, 0.1169891357421875, 0.126007080078125, 0.1350250244140625, 0.14404296875, 0.1530609130859375, 0.162078857421875, 0.1710968017578125, 0.18011474609375, 0.1891326904296875, 0.198150634765625, 0.2071685791015625, 0.2161865234375, 0.2252044677734375, 0.234222412109375, 0.2432403564453125, 0.25225830078125, 0.2612762451171875, 0.270294189453125, 0.2793121337890625, 0.288330078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 20.0, 24.0, 57.0, 66.0, 184.0, 258.0, 137.0, 80.0, 69.0, 36.0, 27.0, 10.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.147005081176758, -6.918535232543945, -6.690065383911133, -6.4615960121154785, -6.233126163482666, -6.0046563148498535, -5.776186943054199, -5.547717094421387, -5.319247245788574, -5.090777397155762, -4.862307548522949, -4.633838176727295, -4.405368328094482, -4.17689847946167, -3.9484288692474365, -3.719959259033203, -3.4914894104003906, -3.263019561767578, -3.0345499515533447, -2.8060803413391113, -2.577610492706299, -2.3491406440734863, -2.120671033859253, -1.89220130443573, -1.663731575012207, -1.435261845588684, -1.2067921161651611, -0.9783223867416382, -0.7498526573181152, -0.5213829278945923, -0.29291319847106934, -0.06444346904754639, 0.16402673721313477, 0.3924964666366577, 0.6209661960601807, 0.8494359254837036, 1.0779056549072266, 1.3063753843307495, 1.5348451137542725, 1.7633148431777954, 1.9917845726013184, 2.220254421234131, 2.4487240314483643, 2.6771936416625977, 2.90566349029541, 3.1341333389282227, 3.362602949142456, 3.5910725593566895, 3.819542407989502, 4.0480122566223145, 4.276481628417969, 4.504951477050781, 4.733421325683594, 4.961891174316406, 5.190361022949219, 5.418830394744873, 5.6473002433776855, 5.875770092010498, 6.104239463806152, 6.332709312438965, 6.561179161071777, 6.78964900970459, 7.018118858337402, 7.246588230133057, 7.475058078765869]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 11.0, 3.0, 9.0, 5.0, 11.0, 13.0, 17.0, 16.0, 11.0, 17.0, 25.0, 23.0, 24.0, 21.0, 27.0, 33.0, 40.0, 41.0, 56.0, 69.0, 81.0, 65.0, 52.0, 39.0, 45.0, 34.0, 23.0, 29.0, 23.0, 26.0, 26.0, 8.0, 11.0, 13.0, 11.0, 8.0, 6.0, 7.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.6752586364746094, -3.5616910457611084, -3.4481232166290283, -3.3345556259155273, -3.2209877967834473, -3.1074202060699463, -2.9938526153564453, -2.8802847862243652, -2.7667171955108643, -2.6531496047973633, -2.539581775665283, -2.4260141849517822, -2.312446355819702, -2.198878765106201, -2.085310935974121, -1.9717433452606201, -1.8581756353378296, -1.744607925415039, -1.6310402154922485, -1.517472505569458, -1.403904914855957, -1.2903372049331665, -1.176769495010376, -1.063201904296875, -0.9496341347694397, -0.8360664248466492, -0.7224987745285034, -0.6089310646057129, -0.49536338448524475, -0.3817957043647766, -0.2682279944419861, -0.15466034412384033, -0.041092634201049805, 0.07247505336999893, 0.18604274094104767, 0.299610435962677, 0.41317811608314514, 0.5267457962036133, 0.6403135061264038, 0.7538811564445496, 0.8674488663673401, 0.9810165762901306, 1.0945842266082764, 1.208151936531067, 1.3217196464538574, 1.4352872371673584, 1.5488550662994385, 1.6624226570129395, 1.77599036693573, 1.8895580768585205, 2.0031256675720215, 2.1166934967041016, 2.2302610874176025, 2.3438286781311035, 2.4573965072631836, 2.5709640979766846, 2.6845319271087646, 2.7980995178222656, 2.9116673469543457, 3.0252349376678467, 3.1388027667999268, 3.2523703575134277, 3.365938186645508, 3.479505777359009, 3.5930733680725098]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 4.0, 3.0, 5.0, 11.0, 8.0, 9.0, 14.0, 21.0, 16.0, 14.0, 26.0, 26.0, 53.0, 55.0, 69.0, 84.0, 82.0, 145.0, 174.0, 303.0, 447.0, 832.0, 1904.0, 8558.0, 3216510.0, 954989.0, 6057.0, 1602.0, 776.0, 432.0, 266.0, 140.0, 120.0, 88.0, 93.0, 61.0, 41.0, 55.0, 38.0, 29.0, 24.0, 20.0, 15.0, 17.0, 18.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 4.0], "bins": [-2.234375, -2.1685028076171875, -2.102630615234375, -2.0367584228515625, -1.97088623046875, -1.9050140380859375, -1.839141845703125, -1.7732696533203125, -1.7073974609375, -1.6415252685546875, -1.575653076171875, -1.5097808837890625, -1.44390869140625, -1.3780364990234375, -1.312164306640625, -1.2462921142578125, -1.180419921875, -1.1145477294921875, -1.048675537109375, -0.9828033447265625, -0.91693115234375, -0.8510589599609375, -0.785186767578125, -0.7193145751953125, -0.6534423828125, -0.5875701904296875, -0.521697998046875, -0.4558258056640625, -0.38995361328125, -0.3240814208984375, -0.258209228515625, -0.1923370361328125, -0.12646484375, -0.0605926513671875, 0.005279541015625, 0.0711517333984375, 0.13702392578125, 0.2028961181640625, 0.268768310546875, 0.3346405029296875, 0.4005126953125, 0.4663848876953125, 0.532257080078125, 0.5981292724609375, 0.66400146484375, 0.7298736572265625, 0.795745849609375, 0.8616180419921875, 0.927490234375, 0.9933624267578125, 1.059234619140625, 1.1251068115234375, 1.19097900390625, 1.2568511962890625, 1.322723388671875, 1.3885955810546875, 1.4544677734375, 1.5203399658203125, 1.586212158203125, 1.6520843505859375, 1.71795654296875, 1.7838287353515625, 1.849700927734375, 1.9155731201171875, 1.9814453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 14.0, 14.0, 13.0, 22.0, 26.0, 26.0, 37.0, 50.0, 38.0, 45.0, 51.0, 51.0, 79.0, 53.0, 52.0, 60.0, 57.0, 44.0, 60.0, 35.0, 33.0, 30.0, 28.0, 16.0, 14.0, 20.0, 3.0, 6.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.346923828125, -0.3351325988769531, -0.32334136962890625, -0.3115501403808594, -0.2997589111328125, -0.2879676818847656, -0.27617645263671875, -0.2643852233886719, -0.252593994140625, -0.24080276489257812, -0.22901153564453125, -0.21722030639648438, -0.2054290771484375, -0.19363784790039062, -0.18184661865234375, -0.17005538940429688, -0.15826416015625, -0.14647293090820312, -0.13468170166015625, -0.12289047241210938, -0.1110992431640625, -0.09930801391601562, -0.08751678466796875, -0.07572555541992188, -0.063934326171875, -0.052143096923828125, -0.04035186767578125, -0.028560638427734375, -0.0167694091796875, -0.004978179931640625, 0.00681304931640625, 0.018604278564453125, 0.0303955078125, 0.042186737060546875, 0.05397796630859375, 0.06576919555664062, 0.0775604248046875, 0.08935165405273438, 0.10114288330078125, 0.11293411254882812, 0.124725341796875, 0.13651657104492188, 0.14830780029296875, 0.16009902954101562, 0.1718902587890625, 0.18368148803710938, 0.19547271728515625, 0.20726394653320312, 0.21905517578125, 0.23084640502929688, 0.24263763427734375, 0.2544288635253906, 0.2662200927734375, 0.2780113220214844, 0.28980255126953125, 0.3015937805175781, 0.313385009765625, 0.3251762390136719, 0.33696746826171875, 0.3487586975097656, 0.3605499267578125, 0.3723411560058594, 0.38413238525390625, 0.3959236145019531, 0.40771484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 5.0, 7.0, 11.0, 31.0, 58.0, 125.0, 253.0, 663.0, 1996.0, 19219.0, 4120966.0, 47242.0, 2440.0, 707.0, 311.0, 131.0, 56.0, 23.0, 14.0, 3.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763671875, -2.673370361328125, -2.58306884765625, -2.492767333984375, -2.4024658203125, -2.312164306640625, -2.22186279296875, -2.131561279296875, -2.041259765625, -1.950958251953125, -1.86065673828125, -1.770355224609375, -1.6800537109375, -1.589752197265625, -1.49945068359375, -1.409149169921875, -1.31884765625, -1.228546142578125, -1.13824462890625, -1.047943115234375, -0.9576416015625, -0.867340087890625, -0.77703857421875, -0.686737060546875, -0.596435546875, -0.506134033203125, -0.41583251953125, -0.325531005859375, -0.2352294921875, -0.144927978515625, -0.05462646484375, 0.035675048828125, 0.1259765625, 0.216278076171875, 0.30657958984375, 0.396881103515625, 0.4871826171875, 0.577484130859375, 0.66778564453125, 0.758087158203125, 0.848388671875, 0.938690185546875, 1.02899169921875, 1.119293212890625, 1.2095947265625, 1.299896240234375, 1.39019775390625, 1.480499267578125, 1.57080078125, 1.661102294921875, 1.75140380859375, 1.841705322265625, 1.9320068359375, 2.022308349609375, 2.11260986328125, 2.202911376953125, 2.293212890625, 2.383514404296875, 2.47381591796875, 2.564117431640625, 2.6544189453125, 2.744720458984375, 2.83502197265625, 2.925323486328125, 3.015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 10.0, 20.0, 30.0, 50.0, 114.0, 345.0, 1354.0, 1480.0, 442.0, 115.0, 65.0, 22.0, 11.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8603515625, -1.8087310791015625, -1.757110595703125, -1.7054901123046875, -1.65386962890625, -1.6022491455078125, -1.550628662109375, -1.4990081787109375, -1.4473876953125, -1.3957672119140625, -1.344146728515625, -1.2925262451171875, -1.24090576171875, -1.1892852783203125, -1.137664794921875, -1.0860443115234375, -1.034423828125, -0.9828033447265625, -0.931182861328125, -0.8795623779296875, -0.82794189453125, -0.7763214111328125, -0.724700927734375, -0.6730804443359375, -0.6214599609375, -0.5698394775390625, -0.518218994140625, -0.4665985107421875, -0.41497802734375, -0.3633575439453125, -0.311737060546875, -0.2601165771484375, -0.20849609375, -0.1568756103515625, -0.105255126953125, -0.0536346435546875, -0.00201416015625, 0.0496063232421875, 0.101226806640625, 0.1528472900390625, 0.2044677734375, 0.2560882568359375, 0.307708740234375, 0.3593292236328125, 0.41094970703125, 0.4625701904296875, 0.514190673828125, 0.5658111572265625, 0.617431640625, 0.6690521240234375, 0.720672607421875, 0.7722930908203125, 0.82391357421875, 0.8755340576171875, 0.927154541015625, 0.9787750244140625, 1.0303955078125, 1.0820159912109375, 1.133636474609375, 1.1852569580078125, 1.23687744140625, 1.2884979248046875, 1.340118408203125, 1.3917388916015625, 1.443359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 15.0, 20.0, 41.0, 71.0, 131.0, 196.0, 221.0, 163.0, 73.0, 28.0, 8.0, 7.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.95085620880127, -13.605608940124512, -13.260361671447754, -12.915114402770996, -12.569867134094238, -12.22461986541748, -11.879372596740723, -11.534125328063965, -11.188878059387207, -10.84363079071045, -10.498383522033691, -10.153136253356934, -9.807888984680176, -9.462641716003418, -9.11739444732666, -8.772147178649902, -8.426899909973145, -8.081652641296387, -7.736405372619629, -7.391158103942871, -7.045910835266113, -6.7006635665893555, -6.355416297912598, -6.01016902923584, -5.664921760559082, -5.319674491882324, -4.974427223205566, -4.629179954528809, -4.283932685852051, -3.938685417175293, -3.593438148498535, -3.2481908798217773, -2.9029436111450195, -2.5576963424682617, -2.212449073791504, -1.867201805114746, -1.5219545364379883, -1.1767072677612305, -0.8314599990844727, -0.48621273040771484, -0.14096546173095703, 0.20428180694580078, 0.5495290756225586, 0.8947763442993164, 1.2400236129760742, 1.585270881652832, 1.9305181503295898, 2.2757654190063477, 2.6210126876831055, 2.9662599563598633, 3.311507225036621, 3.656754493713379, 4.002001762390137, 4.3472490310668945, 4.692496299743652, 5.03774356842041, 5.382990837097168, 5.728238105773926, 6.073485374450684, 6.418732643127441, 6.763979911804199, 7.109227180480957, 7.454474449157715, 7.799721717834473, 8.14496898651123]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 3.0, 3.0, 11.0, 7.0, 14.0, 12.0, 20.0, 27.0, 20.0, 28.0, 40.0, 30.0, 31.0, 33.0, 41.0, 41.0, 60.0, 49.0, 38.0, 39.0, 34.0, 41.0, 56.0, 38.0, 40.0, 37.0, 38.0, 28.0, 20.0, 22.0, 18.0, 14.0, 14.0, 14.0, 6.0, 9.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4690582752227783, -3.3464033603668213, -3.2237484455108643, -3.1010935306549072, -2.97843861579895, -2.855783700942993, -2.733128547668457, -2.6104736328125, -2.487818717956543, -2.365163803100586, -2.242508888244629, -2.119853973388672, -1.9971990585327148, -1.8745441436767578, -1.7518891096115112, -1.6292341947555542, -1.5065793991088867, -1.3839244842529297, -1.2612695693969727, -1.1386146545410156, -1.0159597396850586, -0.8933047652244568, -0.770649790763855, -0.647994875907898, -0.5253399610519409, -0.4026850461959839, -0.28003010153770447, -0.15737515687942505, -0.03472024202346802, 0.08793467283248901, 0.21058964729309082, 0.33324456214904785, 0.4558992385864258, 0.5785541534423828, 0.7012090682983398, 0.8238640427589417, 0.9465189576148987, 1.069173812866211, 1.1918288469314575, 1.3144837617874146, 1.4371386766433716, 1.5597935914993286, 1.6824485063552856, 1.8051035404205322, 1.9277584552764893, 2.0504133701324463, 2.1730682849884033, 2.2957231998443604, 2.4183781147003174, 2.5410330295562744, 2.6636879444122314, 2.7863428592681885, 2.9089977741241455, 3.0316526889801025, 3.1543078422546387, 3.2769627571105957, 3.3996176719665527, 3.5222725868225098, 3.644927501678467, 3.767582416534424, 3.890237331390381, 4.012892246246338, 4.135547161102295, 4.258202075958252, 4.380856990814209]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 7.0, 5.0, 14.0, 8.0, 17.0, 28.0, 39.0, 67.0, 74.0, 123.0, 200.0, 284.0, 407.0, 613.0, 957.0, 1611.0, 2766.0, 4785.0, 8634.0, 16518.0, 34073.0, 77404.0, 199343.0, 366065.0, 191739.0, 73736.0, 32943.0, 16079.0, 8366.0, 4613.0, 2671.0, 1507.0, 979.0, 632.0, 427.0, 236.0, 172.0, 128.0, 81.0, 58.0, 39.0, 35.0, 24.0, 16.0, 9.0, 6.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.6226654052734375, -0.600799560546875, -0.5789337158203125, -0.55706787109375, -0.5352020263671875, -0.513336181640625, -0.4914703369140625, -0.4696044921875, -0.4477386474609375, -0.425872802734375, -0.4040069580078125, -0.38214111328125, -0.3602752685546875, -0.338409423828125, -0.3165435791015625, -0.294677734375, -0.2728118896484375, -0.250946044921875, -0.2290802001953125, -0.20721435546875, -0.1853485107421875, -0.163482666015625, -0.1416168212890625, -0.1197509765625, -0.0978851318359375, -0.076019287109375, -0.0541534423828125, -0.03228759765625, -0.0104217529296875, 0.011444091796875, 0.0333099365234375, 0.05517578125, 0.0770416259765625, 0.098907470703125, 0.1207733154296875, 0.14263916015625, 0.1645050048828125, 0.186370849609375, 0.2082366943359375, 0.2301025390625, 0.2519683837890625, 0.273834228515625, 0.2957000732421875, 0.31756591796875, 0.3394317626953125, 0.361297607421875, 0.3831634521484375, 0.405029296875, 0.4268951416015625, 0.448760986328125, 0.4706268310546875, 0.49249267578125, 0.5143585205078125, 0.536224365234375, 0.5580902099609375, 0.5799560546875, 0.6018218994140625, 0.623687744140625, 0.6455535888671875, 0.66741943359375, 0.6892852783203125, 0.711151123046875, 0.7330169677734375, 0.7548828125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 8.0, 8.0, 2.0, 8.0, 17.0, 11.0, 14.0, 14.0, 21.0, 27.0, 28.0, 22.0, 35.0, 48.0, 43.0, 50.0, 30.0, 52.0, 36.0, 54.0, 46.0, 47.0, 46.0, 41.0, 40.0, 35.0, 35.0, 30.0, 20.0, 23.0, 38.0, 17.0, 16.0, 4.0, 7.0, 7.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2647056579589844, -0.25426483154296875, -0.24382400512695312, -0.2333831787109375, -0.22294235229492188, -0.21250152587890625, -0.20206069946289062, -0.191619873046875, -0.18117904663085938, -0.17073822021484375, -0.16029739379882812, -0.1498565673828125, -0.13941574096679688, -0.12897491455078125, -0.11853408813476562, -0.10809326171875, -0.09765243530273438, -0.08721160888671875, -0.07677078247070312, -0.0663299560546875, -0.055889129638671875, -0.04544830322265625, -0.035007476806640625, -0.024566650390625, -0.014125823974609375, -0.00368499755859375, 0.006755828857421875, 0.0171966552734375, 0.027637481689453125, 0.03807830810546875, 0.048519134521484375, 0.0589599609375, 0.06940078735351562, 0.07984161376953125, 0.09028244018554688, 0.1007232666015625, 0.11116409301757812, 0.12160491943359375, 0.13204574584960938, 0.142486572265625, 0.15292739868164062, 0.16336822509765625, 0.17380905151367188, 0.1842498779296875, 0.19469070434570312, 0.20513153076171875, 0.21557235717773438, 0.22601318359375, 0.23645401000976562, 0.24689483642578125, 0.2573356628417969, 0.2677764892578125, 0.2782173156738281, 0.28865814208984375, 0.2990989685058594, 0.309539794921875, 0.3199806213378906, 0.33042144775390625, 0.3408622741699219, 0.3513031005859375, 0.3617439270019531, 0.37218475341796875, 0.3826255798339844, 0.39306640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 8.0, 11.0, 12.0, 10.0, 22.0, 46.0, 45.0, 62.0, 106.0, 157.0, 310.0, 533.0, 1011.0, 2209.0, 5308.0, 15795.0, 64993.0, 587393.0, 298599.0, 50408.0, 13073.0, 4465.0, 1853.0, 960.0, 445.0, 279.0, 132.0, 102.0, 62.0, 42.0, 30.0, 17.0, 18.0, 11.0, 8.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.90643310546875, -0.8714599609375, -0.83648681640625, -0.801513671875, -0.76654052734375, -0.7315673828125, -0.69659423828125, -0.66162109375, -0.62664794921875, -0.5916748046875, -0.55670166015625, -0.521728515625, -0.48675537109375, -0.4517822265625, -0.41680908203125, -0.3818359375, -0.34686279296875, -0.3118896484375, -0.27691650390625, -0.241943359375, -0.20697021484375, -0.1719970703125, -0.13702392578125, -0.10205078125, -0.06707763671875, -0.0321044921875, 0.00286865234375, 0.037841796875, 0.07281494140625, 0.1077880859375, 0.14276123046875, 0.177734375, 0.21270751953125, 0.2476806640625, 0.28265380859375, 0.317626953125, 0.35260009765625, 0.3875732421875, 0.42254638671875, 0.45751953125, 0.49249267578125, 0.5274658203125, 0.56243896484375, 0.597412109375, 0.63238525390625, 0.6673583984375, 0.70233154296875, 0.7373046875, 0.77227783203125, 0.8072509765625, 0.84222412109375, 0.877197265625, 0.91217041015625, 0.9471435546875, 0.98211669921875, 1.01708984375, 1.05206298828125, 1.0870361328125, 1.12200927734375, 1.156982421875, 1.19195556640625, 1.2269287109375, 1.26190185546875, 1.296875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 4.0, 11.0, 10.0, 7.0, 7.0, 15.0, 14.0, 18.0, 26.0, 34.0, 28.0, 37.0, 39.0, 43.0, 45.0, 60.0, 52.0, 52.0, 51.0, 55.0, 57.0, 46.0, 46.0, 44.0, 27.0, 17.0, 21.0, 24.0, 17.0, 19.0, 15.0, 8.0, 9.0, 7.0, 5.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.3046875, -1.264190673828125, -1.22369384765625, -1.183197021484375, -1.1427001953125, -1.102203369140625, -1.06170654296875, -1.021209716796875, -0.980712890625, -0.940216064453125, -0.89971923828125, -0.859222412109375, -0.8187255859375, -0.778228759765625, -0.73773193359375, -0.697235107421875, -0.65673828125, -0.616241455078125, -0.57574462890625, -0.535247802734375, -0.4947509765625, -0.454254150390625, -0.41375732421875, -0.373260498046875, -0.332763671875, -0.292266845703125, -0.25177001953125, -0.211273193359375, -0.1707763671875, -0.130279541015625, -0.08978271484375, -0.049285888671875, -0.0087890625, 0.031707763671875, 0.07220458984375, 0.112701416015625, 0.1531982421875, 0.193695068359375, 0.23419189453125, 0.274688720703125, 0.315185546875, 0.355682373046875, 0.39617919921875, 0.436676025390625, 0.4771728515625, 0.517669677734375, 0.55816650390625, 0.598663330078125, 0.63916015625, 0.679656982421875, 0.72015380859375, 0.760650634765625, 0.8011474609375, 0.841644287109375, 0.88214111328125, 0.922637939453125, 0.963134765625, 1.003631591796875, 1.04412841796875, 1.084625244140625, 1.1251220703125, 1.165618896484375, 1.20611572265625, 1.246612548828125, 1.287109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 12.0, 14.0, 16.0, 36.0, 42.0, 68.0, 107.0, 174.0, 306.0, 536.0, 1007.0, 2282.0, 6852.0, 36011.0, 740626.0, 230986.0, 20898.0, 4747.0, 1803.0, 857.0, 449.0, 265.0, 162.0, 99.0, 56.0, 40.0, 21.0, 17.0, 13.0, 3.0, 4.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.55322265625, -0.535858154296875, -0.51849365234375, -0.501129150390625, -0.4837646484375, -0.466400146484375, -0.44903564453125, -0.431671142578125, -0.414306640625, -0.396942138671875, -0.37957763671875, -0.362213134765625, -0.3448486328125, -0.327484130859375, -0.31011962890625, -0.292755126953125, -0.275390625, -0.258026123046875, -0.24066162109375, -0.223297119140625, -0.2059326171875, -0.188568115234375, -0.17120361328125, -0.153839111328125, -0.136474609375, -0.119110107421875, -0.10174560546875, -0.084381103515625, -0.0670166015625, -0.049652099609375, -0.03228759765625, -0.014923095703125, 0.00244140625, 0.019805908203125, 0.03717041015625, 0.054534912109375, 0.0718994140625, 0.089263916015625, 0.10662841796875, 0.123992919921875, 0.141357421875, 0.158721923828125, 0.17608642578125, 0.193450927734375, 0.2108154296875, 0.228179931640625, 0.24554443359375, 0.262908935546875, 0.2802734375, 0.297637939453125, 0.31500244140625, 0.332366943359375, 0.3497314453125, 0.367095947265625, 0.38446044921875, 0.401824951171875, 0.419189453125, 0.436553955078125, 0.45391845703125, 0.471282958984375, 0.4886474609375, 0.506011962890625, 0.52337646484375, 0.540740966796875, 0.55810546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 9.0, 10.0, 15.0, 16.0, 26.0, 37.0, 38.0, 67.0, 112.0, 162.0, 162.0, 102.0, 61.0, 52.0, 28.0, 16.0, 19.0, 8.0, 10.0, 8.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0001169443130493164, -0.0001135868951678276, -0.0001102294772863388, -0.00010687205940485, -0.0001035146415233612, -0.0001001572236418724, -9.67998057603836e-05, -9.34423878788948e-05, -9.0084969997406e-05, -8.67275521159172e-05, -8.33701342344284e-05, -8.00127163529396e-05, -7.66552984714508e-05, -7.3297880589962e-05, -6.99404627084732e-05, -6.65830448269844e-05, -6.32256269454956e-05, -5.9868209064006805e-05, -5.6510791182518005e-05, -5.3153373301029205e-05, -4.9795955419540405e-05, -4.6438537538051605e-05, -4.3081119656562805e-05, -3.9723701775074005e-05, -3.6366283893585205e-05, -3.3008866012096405e-05, -2.9651448130607605e-05, -2.6294030249118805e-05, -2.2936612367630005e-05, -1.9579194486141205e-05, -1.6221776604652405e-05, -1.2864358723163605e-05, -9.506940841674805e-06, -6.149522960186005e-06, -2.7921050786972046e-06, 5.653128027915955e-07, 3.9227306842803955e-06, 7.2801485657691956e-06, 1.0637566447257996e-05, 1.3994984328746796e-05, 1.7352402210235596e-05, 2.0709820091724396e-05, 2.4067237973213196e-05, 2.7424655854701996e-05, 3.0782073736190796e-05, 3.4139491617679596e-05, 3.7496909499168396e-05, 4.0854327380657196e-05, 4.4211745262145996e-05, 4.7569163143634796e-05, 5.0926581025123596e-05, 5.4283998906612396e-05, 5.7641416788101196e-05, 6.0998834669589996e-05, 6.43562525510788e-05, 6.77136704325676e-05, 7.10710883140564e-05, 7.44285061955452e-05, 7.7785924077034e-05, 8.11433419585228e-05, 8.45007598400116e-05, 8.78581777215004e-05, 9.12155956029892e-05, 9.4573013484478e-05, 9.79304313659668e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 3.0, 7.0, 11.0, 20.0, 17.0, 40.0, 46.0, 100.0, 177.0, 291.0, 606.0, 1295.0, 3454.0, 14307.0, 137348.0, 826779.0, 51986.0, 7886.0, 2265.0, 898.0, 426.0, 228.0, 129.0, 86.0, 43.0, 30.0, 21.0, 8.0, 13.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.47119140625, -0.45328521728515625, -0.4353790283203125, -0.41747283935546875, -0.399566650390625, -0.38166046142578125, -0.3637542724609375, -0.34584808349609375, -0.32794189453125, -0.31003570556640625, -0.2921295166015625, -0.27422332763671875, -0.256317138671875, -0.23841094970703125, -0.2205047607421875, -0.20259857177734375, -0.1846923828125, -0.16678619384765625, -0.1488800048828125, -0.13097381591796875, -0.113067626953125, -0.09516143798828125, -0.0772552490234375, -0.05934906005859375, -0.04144287109375, -0.02353668212890625, -0.0056304931640625, 0.01227569580078125, 0.030181884765625, 0.04808807373046875, 0.0659942626953125, 0.08390045166015625, 0.101806640625, 0.11971282958984375, 0.1376190185546875, 0.15552520751953125, 0.173431396484375, 0.19133758544921875, 0.2092437744140625, 0.22714996337890625, 0.24505615234375, 0.26296234130859375, 0.2808685302734375, 0.29877471923828125, 0.316680908203125, 0.33458709716796875, 0.3524932861328125, 0.37039947509765625, 0.3883056640625, 0.40621185302734375, 0.4241180419921875, 0.44202423095703125, 0.459930419921875, 0.47783660888671875, 0.4957427978515625, 0.5136489868164062, 0.53155517578125, 0.5494613647460938, 0.5673675537109375, 0.5852737426757812, 0.603179931640625, 0.6210861206054688, 0.6389923095703125, 0.6568984985351562, 0.6748046875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 1.0, 8.0, 11.0, 16.0, 17.0, 32.0, 52.0, 78.0, 99.0, 157.0, 170.0, 121.0, 82.0, 56.0, 35.0, 22.0, 20.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46044921875, -0.44362640380859375, -0.4268035888671875, -0.40998077392578125, -0.393157958984375, -0.37633514404296875, -0.3595123291015625, -0.34268951416015625, -0.32586669921875, -0.30904388427734375, -0.2922210693359375, -0.27539825439453125, -0.258575439453125, -0.24175262451171875, -0.2249298095703125, -0.20810699462890625, -0.1912841796875, -0.17446136474609375, -0.1576385498046875, -0.14081573486328125, -0.123992919921875, -0.10717010498046875, -0.0903472900390625, -0.07352447509765625, -0.05670166015625, -0.03987884521484375, -0.0230560302734375, -0.00623321533203125, 0.010589599609375, 0.02741241455078125, 0.0442352294921875, 0.06105804443359375, 0.077880859375, 0.09470367431640625, 0.1115264892578125, 0.12834930419921875, 0.145172119140625, 0.16199493408203125, 0.1788177490234375, 0.19564056396484375, 0.21246337890625, 0.22928619384765625, 0.2461090087890625, 0.26293182373046875, 0.279754638671875, 0.29657745361328125, 0.3134002685546875, 0.33022308349609375, 0.3470458984375, 0.36386871337890625, 0.3806915283203125, 0.39751434326171875, 0.414337158203125, 0.43115997314453125, 0.4479827880859375, 0.46480560302734375, 0.48162841796875, 0.49845123291015625, 0.5152740478515625, 0.5320968627929688, 0.548919677734375, 0.5657424926757812, 0.5825653076171875, 0.5993881225585938, 0.6162109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 16.0, 38.0, 67.0, 208.0, 508.0, 122.0, 22.0, 9.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.81678771972656, -36.1271858215332, -35.43758773803711, -34.74798583984375, -34.058387756347656, -33.3687858581543, -32.6791877746582, -31.989585876464844, -31.299985885620117, -30.61038589477539, -29.920785903930664, -29.231185913085938, -28.54158592224121, -27.851985931396484, -27.162384033203125, -26.4727840423584, -25.783184051513672, -25.093584060668945, -24.40398406982422, -23.714384078979492, -23.024784088134766, -22.335182189941406, -21.645584106445312, -20.955982208251953, -20.26638412475586, -19.576784133911133, -18.887184143066406, -18.19758415222168, -17.507984161376953, -16.818382263183594, -16.1287841796875, -15.43918228149414, -14.749581336975098, -14.059981346130371, -13.370381355285645, -12.680780410766602, -11.991180419921875, -11.301580429077148, -10.611980438232422, -9.922380447387695, -9.232780456542969, -8.543180465698242, -7.853579998016357, -7.163980007171631, -6.474379539489746, -5.7847795486450195, -5.095179557800293, -4.405579090118408, -3.7159786224365234, -3.0263783931732178, -2.336778163909912, -1.6471781730651855, -0.9575779438018799, -0.2679777145385742, 0.42162227630615234, 1.111222743988037, 1.8008227348327637, 2.4904229640960693, 3.180023193359375, 3.8696231842041016, 4.559223175048828, 5.248823642730713, 5.9384236335754395, 6.628024101257324, 7.317624092102051]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 8.0, 4.0, 7.0, 11.0, 12.0, 14.0, 14.0, 24.0, 19.0, 29.0, 25.0, 40.0, 42.0, 27.0, 48.0, 66.0, 108.0, 89.0, 81.0, 35.0, 34.0, 31.0, 38.0, 25.0, 14.0, 17.0, 20.0, 12.0, 16.0, 14.0, 14.0, 8.0, 8.0, 11.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.840521812438965, -4.6782732009887695, -4.516025066375732, -4.353776454925537, -4.191527843475342, -4.029279708862305, -3.8670310974121094, -3.704782485961914, -3.542534112930298, -3.3802857398986816, -3.2180371284484863, -3.05578875541687, -2.893540382385254, -2.7312917709350586, -2.5690433979034424, -2.406795024871826, -2.244546413421631, -2.0822980403900146, -1.9200494289398193, -1.7578010559082031, -1.5955525636672974, -1.4333040714263916, -1.2710556983947754, -1.1088072061538696, -0.9465587139129639, -0.7843102216720581, -0.6220617890357971, -0.45981332659721375, -0.29756486415863037, -0.1353163719177246, 0.026932060718536377, 0.18918049335479736, 0.3514285087585449, 0.5136770009994507, 0.6759254336357117, 0.8381738662719727, 1.0004223585128784, 1.1626708507537842, 1.3249192237854004, 1.4871677160263062, 1.649416208267212, 1.8116647005081177, 1.9739131927490234, 2.1361615657806396, 2.298409938812256, 2.460658550262451, 2.6229069232940674, 2.7851552963256836, 2.947403907775879, 3.109652280807495, 3.2719008922576904, 3.4341492652893066, 3.596397876739502, 3.758646249771118, 3.9208946228027344, 4.08314323425293, 4.245391845703125, 4.40764045715332, 4.569888591766357, 4.732137203216553, 4.894385814666748, 5.056633949279785, 5.2188825607299805, 5.381131172180176, 5.543379306793213]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 9.0, 14.0, 12.0, 22.0, 22.0, 42.0, 84.0, 97.0, 150.0, 304.0, 495.0, 969.0, 2000.0, 4362.0, 12032.0, 60338.0, 902658.0, 2878471.0, 288597.0, 29642.0, 7738.0, 3042.0, 1467.0, 723.0, 378.0, 228.0, 135.0, 72.0, 63.0, 44.0, 18.0, 16.0, 12.0, 5.0, 6.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58349609375, -0.561309814453125, -0.53912353515625, -0.516937255859375, -0.4947509765625, -0.472564697265625, -0.45037841796875, -0.428192138671875, -0.406005859375, -0.383819580078125, -0.36163330078125, -0.339447021484375, -0.3172607421875, -0.295074462890625, -0.27288818359375, -0.250701904296875, -0.228515625, -0.206329345703125, -0.18414306640625, -0.161956787109375, -0.1397705078125, -0.117584228515625, -0.09539794921875, -0.073211669921875, -0.051025390625, -0.028839111328125, -0.00665283203125, 0.015533447265625, 0.0377197265625, 0.059906005859375, 0.08209228515625, 0.104278564453125, 0.12646484375, 0.148651123046875, 0.17083740234375, 0.193023681640625, 0.2152099609375, 0.237396240234375, 0.25958251953125, 0.281768798828125, 0.303955078125, 0.326141357421875, 0.34832763671875, 0.370513916015625, 0.3927001953125, 0.414886474609375, 0.43707275390625, 0.459259033203125, 0.4814453125, 0.503631591796875, 0.52581787109375, 0.548004150390625, 0.5701904296875, 0.592376708984375, 0.61456298828125, 0.636749267578125, 0.658935546875, 0.681121826171875, 0.70330810546875, 0.725494384765625, 0.7476806640625, 0.769866943359375, 0.79205322265625, 0.814239501953125, 0.83642578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 6.0, 10.0, 6.0, 15.0, 10.0, 21.0, 18.0, 33.0, 38.0, 32.0, 35.0, 50.0, 30.0, 51.0, 36.0, 46.0, 58.0, 42.0, 53.0, 49.0, 48.0, 49.0, 42.0, 36.0, 29.0, 35.0, 28.0, 20.0, 13.0, 12.0, 9.0, 8.0, 5.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3609886169433594, -0.34917449951171875, -0.3373603820800781, -0.3255462646484375, -0.3137321472167969, -0.30191802978515625, -0.2901039123535156, -0.278289794921875, -0.2664756774902344, -0.25466156005859375, -0.24284744262695312, -0.2310333251953125, -0.21921920776367188, -0.20740509033203125, -0.19559097290039062, -0.18377685546875, -0.17196273803710938, -0.16014862060546875, -0.14833450317382812, -0.1365203857421875, -0.12470626831054688, -0.11289215087890625, -0.10107803344726562, -0.089263916015625, -0.07744979858398438, -0.06563568115234375, -0.053821563720703125, -0.0420074462890625, -0.030193328857421875, -0.01837921142578125, -0.006565093994140625, 0.0052490234375, 0.017063140869140625, 0.02887725830078125, 0.040691375732421875, 0.0525054931640625, 0.06431961059570312, 0.07613372802734375, 0.08794784545898438, 0.099761962890625, 0.11157608032226562, 0.12339019775390625, 0.13520431518554688, 0.1470184326171875, 0.15883255004882812, 0.17064666748046875, 0.18246078491210938, 0.19427490234375, 0.20608901977539062, 0.21790313720703125, 0.22971725463867188, 0.2415313720703125, 0.2533454895019531, 0.26515960693359375, 0.2769737243652344, 0.288787841796875, 0.3006019592285156, 0.31241607666015625, 0.3242301940917969, 0.3360443115234375, 0.3478584289550781, 0.35967254638671875, 0.3714866638183594, 0.38330078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 5.0, 11.0, 22.0, 50.0, 94.0, 213.0, 624.0, 3487.0, 217516.0, 3959905.0, 10818.0, 966.0, 339.0, 125.0, 60.0, 21.0, 16.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.501953125, -2.4132080078125, -2.324462890625, -2.2357177734375, -2.14697265625, -2.0582275390625, -1.969482421875, -1.8807373046875, -1.7919921875, -1.7032470703125, -1.614501953125, -1.5257568359375, -1.43701171875, -1.3482666015625, -1.259521484375, -1.1707763671875, -1.08203125, -0.9932861328125, -0.904541015625, -0.8157958984375, -0.72705078125, -0.6383056640625, -0.549560546875, -0.4608154296875, -0.3720703125, -0.2833251953125, -0.194580078125, -0.1058349609375, -0.01708984375, 0.0716552734375, 0.160400390625, 0.2491455078125, 0.337890625, 0.4266357421875, 0.515380859375, 0.6041259765625, 0.69287109375, 0.7816162109375, 0.870361328125, 0.9591064453125, 1.0478515625, 1.1365966796875, 1.225341796875, 1.3140869140625, 1.40283203125, 1.4915771484375, 1.580322265625, 1.6690673828125, 1.7578125, 1.8465576171875, 1.935302734375, 2.0240478515625, 2.11279296875, 2.2015380859375, 2.290283203125, 2.3790283203125, 2.4677734375, 2.5565185546875, 2.645263671875, 2.7340087890625, 2.82275390625, 2.9114990234375, 3.000244140625, 3.0889892578125, 3.177734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 4.0, 18.0, 18.0, 35.0, 61.0, 146.0, 356.0, 959.0, 1330.0, 665.0, 228.0, 112.0, 61.0, 33.0, 17.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.046875, -1.997344970703125, -1.94781494140625, -1.898284912109375, -1.8487548828125, -1.799224853515625, -1.74969482421875, -1.700164794921875, -1.650634765625, -1.601104736328125, -1.55157470703125, -1.502044677734375, -1.4525146484375, -1.402984619140625, -1.35345458984375, -1.303924560546875, -1.25439453125, -1.204864501953125, -1.15533447265625, -1.105804443359375, -1.0562744140625, -1.006744384765625, -0.95721435546875, -0.907684326171875, -0.858154296875, -0.808624267578125, -0.75909423828125, -0.709564208984375, -0.6600341796875, -0.610504150390625, -0.56097412109375, -0.511444091796875, -0.4619140625, -0.412384033203125, -0.36285400390625, -0.313323974609375, -0.2637939453125, -0.214263916015625, -0.16473388671875, -0.115203857421875, -0.065673828125, -0.016143798828125, 0.03338623046875, 0.082916259765625, 0.1324462890625, 0.181976318359375, 0.23150634765625, 0.281036376953125, 0.33056640625, 0.380096435546875, 0.42962646484375, 0.479156494140625, 0.5286865234375, 0.578216552734375, 0.62774658203125, 0.677276611328125, 0.726806640625, 0.776336669921875, 0.82586669921875, 0.875396728515625, 0.9249267578125, 0.974456787109375, 1.02398681640625, 1.073516845703125, 1.123046875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 13.0, 34.0, 135.0, 394.0, 306.0, 82.0, 24.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.721954345703125, -13.120304107666016, -12.518653869628906, -11.917003631591797, -11.315353393554688, -10.713703155517578, -10.112052917480469, -9.51040267944336, -8.90875244140625, -8.30710220336914, -7.705451965332031, -7.103801727294922, -6.5021514892578125, -5.900501251220703, -5.298851013183594, -4.697200775146484, -4.095550537109375, -3.4939002990722656, -2.8922500610351562, -2.290599822998047, -1.6889495849609375, -1.0872993469238281, -0.48564910888671875, 0.11600112915039062, 0.7176513671875, 1.3193016052246094, 1.9209518432617188, 2.522602081298828, 3.1242523193359375, 3.725902557373047, 4.327552795410156, 4.929203033447266, 5.530853271484375, 6.132503509521484, 6.734153747558594, 7.335803985595703, 7.9374542236328125, 8.539104461669922, 9.140754699707031, 9.74240493774414, 10.34405517578125, 10.94570541381836, 11.547355651855469, 12.149005889892578, 12.750656127929688, 13.352306365966797, 13.953956604003906, 14.555606842041016, 15.157257080078125, 15.758907318115234, 16.360557556152344, 16.962207794189453, 17.563858032226562, 18.165508270263672, 18.76715850830078, 19.36880874633789, 19.970458984375, 20.57210922241211, 21.17375946044922, 21.775409698486328, 22.377059936523438, 22.978710174560547, 23.580360412597656, 24.182010650634766, 24.783660888671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 9.0, 6.0, 13.0, 16.0, 20.0, 24.0, 29.0, 27.0, 29.0, 42.0, 30.0, 43.0, 40.0, 53.0, 58.0, 55.0, 47.0, 64.0, 52.0, 35.0, 35.0, 44.0, 29.0, 32.0, 20.0, 23.0, 16.0, 22.0, 22.0, 11.0, 9.0, 5.0, 6.0, 3.0, 2.0, 11.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.170454502105713, -4.041761875152588, -3.913069248199463, -3.784376382827759, -3.655683755874634, -3.526991128921509, -3.3982982635498047, -3.2696056365966797, -3.1409130096435547, -3.0122203826904297, -2.8835277557373047, -2.7548348903656006, -2.6261422634124756, -2.4974496364593506, -2.3687567710876465, -2.2400641441345215, -2.1113715171813965, -1.9826788902282715, -1.853986144065857, -1.7252933979034424, -1.5966007709503174, -1.4679081439971924, -1.3392153978347778, -1.2105226516723633, -1.0818300247192383, -0.9531373381614685, -0.8244446516036987, -0.695751965045929, -0.5670592784881592, -0.4383665919303894, -0.30967390537261963, -0.18098121881484985, -0.05228900909423828, 0.0764036774635315, 0.20509636402130127, 0.33378905057907104, 0.4624817371368408, 0.5911744236946106, 0.7198671102523804, 0.8485597968101501, 0.9772524833679199, 1.105945110321045, 1.2346378564834595, 1.363330602645874, 1.492023229598999, 1.620715856552124, 1.7494086027145386, 1.8781013488769531, 2.006793975830078, 2.135486602783203, 2.264179229736328, 2.3928720951080322, 2.5215647220611572, 2.6502573490142822, 2.7789502143859863, 2.9076428413391113, 3.0363354682922363, 3.1650280952453613, 3.2937207221984863, 3.4224135875701904, 3.5511062145233154, 3.6797988414764404, 3.8084917068481445, 3.9371843338012695, 4.0658769607543945]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 5.0, 5.0, 7.0, 6.0, 24.0, 18.0, 35.0, 40.0, 75.0, 108.0, 176.0, 239.0, 469.0, 752.0, 1282.0, 2448.0, 4962.0, 10619.0, 25634.0, 71388.0, 234828.0, 444235.0, 162498.0, 52126.0, 19453.0, 8423.0, 3901.0, 2024.0, 1146.0, 560.0, 385.0, 218.0, 147.0, 98.0, 48.0, 48.0, 39.0, 24.0, 23.0, 14.0, 4.0, 7.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8310546875, -0.8061370849609375, -0.781219482421875, -0.7563018798828125, -0.73138427734375, -0.7064666748046875, -0.681549072265625, -0.6566314697265625, -0.6317138671875, -0.6067962646484375, -0.581878662109375, -0.5569610595703125, -0.53204345703125, -0.5071258544921875, -0.482208251953125, -0.4572906494140625, -0.432373046875, -0.4074554443359375, -0.382537841796875, -0.3576202392578125, -0.33270263671875, -0.3077850341796875, -0.282867431640625, -0.2579498291015625, -0.2330322265625, -0.2081146240234375, -0.183197021484375, -0.1582794189453125, -0.13336181640625, -0.1084442138671875, -0.083526611328125, -0.0586090087890625, -0.03369140625, -0.0087738037109375, 0.016143798828125, 0.0410614013671875, 0.06597900390625, 0.0908966064453125, 0.115814208984375, 0.1407318115234375, 0.1656494140625, 0.1905670166015625, 0.215484619140625, 0.2404022216796875, 0.26531982421875, 0.2902374267578125, 0.315155029296875, 0.3400726318359375, 0.364990234375, 0.3899078369140625, 0.414825439453125, 0.4397430419921875, 0.46466064453125, 0.4895782470703125, 0.514495849609375, 0.5394134521484375, 0.5643310546875, 0.5892486572265625, 0.614166259765625, 0.6390838623046875, 0.66400146484375, 0.6889190673828125, 0.713836669921875, 0.7387542724609375, 0.763671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 9.0, 7.0, 6.0, 5.0, 13.0, 13.0, 19.0, 21.0, 17.0, 22.0, 17.0, 33.0, 34.0, 38.0, 40.0, 37.0, 52.0, 47.0, 41.0, 42.0, 44.0, 50.0, 47.0, 49.0, 42.0, 31.0, 32.0, 23.0, 29.0, 23.0, 18.0, 20.0, 14.0, 14.0, 10.0, 7.0, 9.0, 6.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.39208984375, -0.3799552917480469, -0.36782073974609375, -0.3556861877441406, -0.3435516357421875, -0.3314170837402344, -0.31928253173828125, -0.3071479797363281, -0.295013427734375, -0.2828788757324219, -0.27074432373046875, -0.2586097717285156, -0.2464752197265625, -0.23434066772460938, -0.22220611572265625, -0.21007156372070312, -0.19793701171875, -0.18580245971679688, -0.17366790771484375, -0.16153335571289062, -0.1493988037109375, -0.13726425170898438, -0.12512969970703125, -0.11299514770507812, -0.100860595703125, -0.08872604370117188, -0.07659149169921875, -0.06445693969726562, -0.0523223876953125, -0.040187835693359375, -0.02805328369140625, -0.015918731689453125, -0.0037841796875, 0.008350372314453125, 0.02048492431640625, 0.032619476318359375, 0.0447540283203125, 0.056888580322265625, 0.06902313232421875, 0.08115768432617188, 0.093292236328125, 0.10542678833007812, 0.11756134033203125, 0.12969589233398438, 0.1418304443359375, 0.15396499633789062, 0.16609954833984375, 0.17823410034179688, 0.19036865234375, 0.20250320434570312, 0.21463775634765625, 0.22677230834960938, 0.2389068603515625, 0.2510414123535156, 0.26317596435546875, 0.2753105163574219, 0.287445068359375, 0.2995796203613281, 0.31171417236328125, 0.3238487243652344, 0.3359832763671875, 0.3481178283691406, 0.36025238037109375, 0.3723869323730469, 0.384521484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 15.0, 15.0, 21.0, 37.0, 37.0, 72.0, 93.0, 144.0, 201.0, 338.0, 560.0, 1182.0, 3243.0, 14931.0, 181810.0, 799960.0, 36517.0, 5680.0, 1697.0, 760.0, 422.0, 286.0, 167.0, 110.0, 70.0, 46.0, 41.0, 14.0, 20.0, 11.0, 9.0, 14.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.642578125, -1.5899505615234375, -1.537322998046875, -1.4846954345703125, -1.43206787109375, -1.3794403076171875, -1.326812744140625, -1.2741851806640625, -1.2215576171875, -1.1689300537109375, -1.116302490234375, -1.0636749267578125, -1.01104736328125, -0.9584197998046875, -0.905792236328125, -0.8531646728515625, -0.800537109375, -0.7479095458984375, -0.695281982421875, -0.6426544189453125, -0.59002685546875, -0.5373992919921875, -0.484771728515625, -0.4321441650390625, -0.3795166015625, -0.3268890380859375, -0.274261474609375, -0.2216339111328125, -0.16900634765625, -0.1163787841796875, -0.063751220703125, -0.0111236572265625, 0.04150390625, 0.0941314697265625, 0.146759033203125, 0.1993865966796875, 0.25201416015625, 0.3046417236328125, 0.357269287109375, 0.4098968505859375, 0.4625244140625, 0.5151519775390625, 0.567779541015625, 0.6204071044921875, 0.67303466796875, 0.7256622314453125, 0.778289794921875, 0.8309173583984375, 0.883544921875, 0.9361724853515625, 0.988800048828125, 1.0414276123046875, 1.09405517578125, 1.1466827392578125, 1.199310302734375, 1.2519378662109375, 1.3045654296875, 1.3571929931640625, 1.409820556640625, 1.4624481201171875, 1.51507568359375, 1.5677032470703125, 1.620330810546875, 1.6729583740234375, 1.7255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 9.0, 17.0, 26.0, 19.0, 44.0, 36.0, 53.0, 49.0, 71.0, 51.0, 74.0, 75.0, 71.0, 69.0, 61.0, 56.0, 43.0, 30.0, 21.0, 19.0, 25.0, 16.0, 10.0, 14.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.310546875, -2.244537353515625, -2.17852783203125, -2.112518310546875, -2.0465087890625, -1.980499267578125, -1.91448974609375, -1.848480224609375, -1.782470703125, -1.716461181640625, -1.65045166015625, -1.584442138671875, -1.5184326171875, -1.452423095703125, -1.38641357421875, -1.320404052734375, -1.25439453125, -1.188385009765625, -1.12237548828125, -1.056365966796875, -0.9903564453125, -0.924346923828125, -0.85833740234375, -0.792327880859375, -0.726318359375, -0.660308837890625, -0.59429931640625, -0.528289794921875, -0.4622802734375, -0.396270751953125, -0.33026123046875, -0.264251708984375, -0.1982421875, -0.132232666015625, -0.06622314453125, -0.000213623046875, 0.0657958984375, 0.131805419921875, 0.19781494140625, 0.263824462890625, 0.329833984375, 0.395843505859375, 0.46185302734375, 0.527862548828125, 0.5938720703125, 0.659881591796875, 0.72589111328125, 0.791900634765625, 0.85791015625, 0.923919677734375, 0.98992919921875, 1.055938720703125, 1.1219482421875, 1.187957763671875, 1.25396728515625, 1.319976806640625, 1.385986328125, 1.451995849609375, 1.51800537109375, 1.584014892578125, 1.6500244140625, 1.716033935546875, 1.78204345703125, 1.848052978515625, 1.9140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 9.0, 14.0, 17.0, 20.0, 24.0, 36.0, 41.0, 83.0, 118.0, 186.0, 375.0, 781.0, 1650.0, 4599.0, 16054.0, 94716.0, 814050.0, 92018.0, 15731.0, 4682.0, 1688.0, 772.0, 360.0, 189.0, 107.0, 55.0, 40.0, 38.0, 19.0, 14.0, 11.0, 16.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.366943359375, -0.355987548828125, -0.34503173828125, -0.334075927734375, -0.3231201171875, -0.312164306640625, -0.30120849609375, -0.290252685546875, -0.279296875, -0.268341064453125, -0.25738525390625, -0.246429443359375, -0.2354736328125, -0.224517822265625, -0.21356201171875, -0.202606201171875, -0.191650390625, -0.180694580078125, -0.16973876953125, -0.158782958984375, -0.1478271484375, -0.136871337890625, -0.12591552734375, -0.114959716796875, -0.10400390625, -0.093048095703125, -0.08209228515625, -0.071136474609375, -0.0601806640625, -0.049224853515625, -0.03826904296875, -0.027313232421875, -0.016357421875, -0.005401611328125, 0.00555419921875, 0.016510009765625, 0.0274658203125, 0.038421630859375, 0.04937744140625, 0.060333251953125, 0.0712890625, 0.082244873046875, 0.09320068359375, 0.104156494140625, 0.1151123046875, 0.126068115234375, 0.13702392578125, 0.147979736328125, 0.158935546875, 0.169891357421875, 0.18084716796875, 0.191802978515625, 0.2027587890625, 0.213714599609375, 0.22467041015625, 0.235626220703125, 0.24658203125, 0.257537841796875, 0.26849365234375, 0.279449462890625, 0.2904052734375, 0.301361083984375, 0.31231689453125, 0.323272705078125, 0.334228515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 9.0, 10.0, 16.0, 12.0, 15.0, 23.0, 29.0, 42.0, 65.0, 86.0, 126.0, 119.0, 110.0, 90.0, 56.0, 42.0, 30.0, 23.0, 19.0, 13.0, 11.0, 12.0, 7.0, 6.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.671117782592773e-05, -7.435865700244904e-05, -7.200613617897034e-05, -6.965361535549164e-05, -6.730109453201294e-05, -6.494857370853424e-05, -6.259605288505554e-05, -6.024353206157684e-05, -5.7891011238098145e-05, -5.5538490414619446e-05, -5.318596959114075e-05, -5.083344876766205e-05, -4.848092794418335e-05, -4.612840712070465e-05, -4.377588629722595e-05, -4.1423365473747253e-05, -3.9070844650268555e-05, -3.6718323826789856e-05, -3.436580300331116e-05, -3.201328217983246e-05, -2.966076135635376e-05, -2.730824053287506e-05, -2.4955719709396362e-05, -2.2603198885917664e-05, -2.0250678062438965e-05, -1.7898157238960266e-05, -1.5545636415481567e-05, -1.3193115592002869e-05, -1.084059476852417e-05, -8.488073945045471e-06, -6.1355531215667725e-06, -3.7830322980880737e-06, -1.430511474609375e-06, 9.220093488693237e-07, 3.2745301723480225e-06, 5.627050995826721e-06, 7.97957181930542e-06, 1.0332092642784119e-05, 1.2684613466262817e-05, 1.5037134289741516e-05, 1.7389655113220215e-05, 1.9742175936698914e-05, 2.2094696760177612e-05, 2.444721758365631e-05, 2.679973840713501e-05, 2.915225923061371e-05, 3.150478005409241e-05, 3.3857300877571106e-05, 3.6209821701049805e-05, 3.8562342524528503e-05, 4.09148633480072e-05, 4.32673841714859e-05, 4.56199049949646e-05, 4.79724258184433e-05, 5.0324946641922e-05, 5.2677467465400696e-05, 5.5029988288879395e-05, 5.738250911235809e-05, 5.973502993583679e-05, 6.208755075931549e-05, 6.444007158279419e-05, 6.679259240627289e-05, 6.914511322975159e-05, 7.149763405323029e-05, 7.385015487670898e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 16.0, 23.0, 65.0, 93.0, 186.0, 438.0, 1053.0, 4061.0, 34537.0, 863753.0, 132624.0, 8717.0, 1804.0, 626.0, 256.0, 143.0, 60.0, 44.0, 22.0, 5.0, 5.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52734375, -0.5117034912109375, -0.496063232421875, -0.4804229736328125, -0.46478271484375, -0.4491424560546875, -0.433502197265625, -0.4178619384765625, -0.4022216796875, -0.3865814208984375, -0.370941162109375, -0.3553009033203125, -0.33966064453125, -0.3240203857421875, -0.308380126953125, -0.2927398681640625, -0.277099609375, -0.2614593505859375, -0.245819091796875, -0.2301788330078125, -0.21453857421875, -0.1988983154296875, -0.183258056640625, -0.1676177978515625, -0.1519775390625, -0.1363372802734375, -0.120697021484375, -0.1050567626953125, -0.08941650390625, -0.0737762451171875, -0.058135986328125, -0.0424957275390625, -0.02685546875, -0.0112152099609375, 0.004425048828125, 0.0200653076171875, 0.03570556640625, 0.0513458251953125, 0.066986083984375, 0.0826263427734375, 0.0982666015625, 0.1139068603515625, 0.129547119140625, 0.1451873779296875, 0.16082763671875, 0.1764678955078125, 0.192108154296875, 0.2077484130859375, 0.223388671875, 0.2390289306640625, 0.254669189453125, 0.2703094482421875, 0.28594970703125, 0.3015899658203125, 0.317230224609375, 0.3328704833984375, 0.3485107421875, 0.3641510009765625, 0.379791259765625, 0.3954315185546875, 0.41107177734375, 0.4267120361328125, 0.442352294921875, 0.4579925537109375, 0.4736328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 10.0, 7.0, 13.0, 10.0, 22.0, 21.0, 35.0, 31.0, 56.0, 42.0, 58.0, 68.0, 82.0, 94.0, 91.0, 65.0, 52.0, 47.0, 38.0, 22.0, 26.0, 24.0, 16.0, 9.0, 10.0, 8.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.279052734375, -0.2700996398925781, -0.26114654541015625, -0.2521934509277344, -0.2432403564453125, -0.23428726196289062, -0.22533416748046875, -0.21638107299804688, -0.207427978515625, -0.19847488403320312, -0.18952178955078125, -0.18056869506835938, -0.1716156005859375, -0.16266250610351562, -0.15370941162109375, -0.14475631713867188, -0.13580322265625, -0.12685012817382812, -0.11789703369140625, -0.10894393920898438, -0.0999908447265625, -0.09103775024414062, -0.08208465576171875, -0.07313156127929688, -0.064178466796875, -0.055225372314453125, -0.04627227783203125, -0.037319183349609375, -0.0283660888671875, -0.019412994384765625, -0.01045989990234375, -0.001506805419921875, 0.0074462890625, 0.016399383544921875, 0.02535247802734375, 0.034305572509765625, 0.0432586669921875, 0.052211761474609375, 0.06116485595703125, 0.07011795043945312, 0.079071044921875, 0.08802413940429688, 0.09697723388671875, 0.10593032836914062, 0.1148834228515625, 0.12383651733398438, 0.13278961181640625, 0.14174270629882812, 0.15069580078125, 0.15964889526367188, 0.16860198974609375, 0.17755508422851562, 0.1865081787109375, 0.19546127319335938, 0.20441436767578125, 0.21336746215820312, 0.222320556640625, 0.23127365112304688, 0.24022674560546875, 0.24917984008789062, 0.2581329345703125, 0.2670860290527344, 0.27603912353515625, 0.2849922180175781, 0.2939453125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 7.0, 13.0, 36.0, 74.0, 234.0, 495.0, 98.0, 32.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.056167602539062, -17.497779846191406, -16.939390182495117, -16.38100242614746, -15.822614669799805, -15.264225959777832, -14.70583724975586, -14.147449493408203, -13.589061737060547, -13.030673027038574, -12.472285270690918, -11.913896560668945, -11.355508804321289, -10.797120094299316, -10.238731384277344, -9.680343627929688, -9.121954917907715, -8.563566207885742, -8.005178451538086, -7.446789741516113, -6.888401985168457, -6.330013275146484, -5.77162504196167, -5.2132368087768555, -4.654848575592041, -4.096460342407227, -3.538072109222412, -2.9796836376190186, -2.421295404434204, -1.8629071712493896, -1.304518699645996, -0.7461304664611816, -0.1877422332763672, 0.37064605951309204, 0.9290343523025513, 1.4874227046966553, 2.0458109378814697, 2.604199171066284, 3.1625876426696777, 3.720975875854492, 4.279364109039307, 4.837752342224121, 5.3961405754089355, 5.95452880859375, 6.512917518615723, 7.071305274963379, 7.629693984985352, 8.188081741333008, 8.74647045135498, 9.304859161376953, 9.86324691772461, 10.421635627746582, 10.980023384094238, 11.538412094116211, 12.096799850463867, 12.65518856048584, 13.213577270507812, 13.771965980529785, 14.330353736877441, 14.888742446899414, 15.44713020324707, 16.005517959594727, 16.563907623291016, 17.122295379638672, 17.680683135986328]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 2.0, 8.0, 7.0, 10.0, 7.0, 10.0, 11.0, 7.0, 20.0, 27.0, 24.0, 21.0, 23.0, 27.0, 43.0, 49.0, 78.0, 119.0, 103.0, 62.0, 42.0, 29.0, 40.0, 27.0, 21.0, 23.0, 16.0, 15.0, 20.0, 8.0, 14.0, 14.0, 5.0, 6.0, 6.0, 16.0, 3.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.256782531738281, -6.059810638427734, -5.862838268280029, -5.665866374969482, -5.468894004821777, -5.2719221115112305, -5.074950218200684, -4.8779778480529785, -4.681005954742432, -4.484034061431885, -4.28706169128418, -4.090089797973633, -3.893117666244507, -3.696145534515381, -3.499173402786255, -3.302201271057129, -3.105229139328003, -2.908257007598877, -2.711284875869751, -2.514312744140625, -2.317340850830078, -2.120368719100952, -1.9233965873718262, -1.7264245748519897, -1.5294524431228638, -1.3324803113937378, -1.1355082988739014, -0.9385361671447754, -0.7415640950202942, -0.544592022895813, -0.347619891166687, -0.15064787864685059, 0.04632425308227539, 0.24329634010791779, 0.4402684271335602, 0.6372405290603638, 0.834212601184845, 1.0311846733093262, 1.2281568050384521, 1.4251288175582886, 1.6221009492874146, 1.8190730810165405, 2.016045093536377, 2.213017225265503, 2.409989356994629, 2.606961250305176, 2.803933620452881, 3.0009055137634277, 3.1978776454925537, 3.3948497772216797, 3.5918219089508057, 3.7887940406799316, 3.9857659339904785, 4.182738304138184, 4.3797101974487305, 4.576682090759277, 4.773654460906982, 4.970626354217529, 5.167598724365234, 5.364570617675781, 5.561542987823486, 5.758514881134033, 5.955487251281738, 6.152459144592285, 6.349431037902832]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 8.0, 13.0, 10.0, 15.0, 21.0, 41.0, 53.0, 81.0, 109.0, 197.0, 306.0, 472.0, 802.0, 1305.0, 2279.0, 4301.0, 8690.0, 21904.0, 72343.0, 313818.0, 1159578.0, 1735770.0, 649837.0, 155152.0, 39654.0, 13952.0, 6168.0, 3118.0, 1724.0, 988.0, 604.0, 342.0, 233.0, 131.0, 79.0, 64.0, 46.0, 22.0, 17.0, 15.0, 10.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.52392578125, -0.5086326599121094, -0.49333953857421875, -0.4780464172363281, -0.4627532958984375, -0.4474601745605469, -0.43216705322265625, -0.4168739318847656, -0.401580810546875, -0.3862876892089844, -0.37099456787109375, -0.3557014465332031, -0.3404083251953125, -0.3251152038574219, -0.30982208251953125, -0.2945289611816406, -0.27923583984375, -0.2639427185058594, -0.24864959716796875, -0.23335647583007812, -0.2180633544921875, -0.20277023315429688, -0.18747711181640625, -0.17218399047851562, -0.156890869140625, -0.14159774780273438, -0.12630462646484375, -0.11101150512695312, -0.0957183837890625, -0.08042526245117188, -0.06513214111328125, -0.049839019775390625, -0.0345458984375, -0.019252777099609375, -0.00395965576171875, 0.011333465576171875, 0.0266265869140625, 0.041919708251953125, 0.05721282958984375, 0.07250595092773438, 0.087799072265625, 0.10309219360351562, 0.11838531494140625, 0.13367843627929688, 0.1489715576171875, 0.16426467895507812, 0.17955780029296875, 0.19485092163085938, 0.21014404296875, 0.22543716430664062, 0.24073028564453125, 0.2560234069824219, 0.2713165283203125, 0.2866096496582031, 0.30190277099609375, 0.3171958923339844, 0.332489013671875, 0.3477821350097656, 0.36307525634765625, 0.3783683776855469, 0.3936614990234375, 0.4089546203613281, 0.42424774169921875, 0.4395408630371094, 0.454833984375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 7.0, 9.0, 14.0, 14.0, 15.0, 13.0, 24.0, 19.0, 30.0, 33.0, 34.0, 31.0, 55.0, 43.0, 58.0, 60.0, 57.0, 43.0, 53.0, 64.0, 48.0, 35.0, 39.0, 32.0, 24.0, 25.0, 29.0, 17.0, 16.0, 14.0, 8.0, 11.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4033203125, -0.3900871276855469, -0.37685394287109375, -0.3636207580566406, -0.3503875732421875, -0.3371543884277344, -0.32392120361328125, -0.3106880187988281, -0.297454833984375, -0.2842216491699219, -0.27098846435546875, -0.2577552795410156, -0.2445220947265625, -0.23128890991210938, -0.21805572509765625, -0.20482254028320312, -0.19158935546875, -0.17835617065429688, -0.16512298583984375, -0.15188980102539062, -0.1386566162109375, -0.12542343139648438, -0.11219024658203125, -0.09895706176757812, -0.085723876953125, -0.07249069213867188, -0.05925750732421875, -0.046024322509765625, -0.0327911376953125, -0.019557952880859375, -0.00632476806640625, 0.006908416748046875, 0.0201416015625, 0.033374786376953125, 0.04660797119140625, 0.059841156005859375, 0.0730743408203125, 0.08630752563476562, 0.09954071044921875, 0.11277389526367188, 0.126007080078125, 0.13924026489257812, 0.15247344970703125, 0.16570663452148438, 0.1789398193359375, 0.19217300415039062, 0.20540618896484375, 0.21863937377929688, 0.23187255859375, 0.24510574340820312, 0.25833892822265625, 0.2715721130371094, 0.2848052978515625, 0.2980384826660156, 0.31127166748046875, 0.3245048522949219, 0.337738037109375, 0.3509712219238281, 0.36420440673828125, 0.3774375915527344, 0.3906707763671875, 0.4039039611816406, 0.41713714599609375, 0.4303703308105469, 0.443603515625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 3.0, 12.0, 12.0, 16.0, 20.0, 28.0, 61.0, 100.0, 199.0, 468.0, 1171.0, 4712.0, 81662.0, 4062770.0, 37373.0, 3714.0, 1044.0, 453.0, 210.0, 82.0, 74.0, 38.0, 24.0, 10.0, 5.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48828125, -2.403656005859375, -2.31903076171875, -2.234405517578125, -2.1497802734375, -2.065155029296875, -1.98052978515625, -1.895904541015625, -1.811279296875, -1.726654052734375, -1.64202880859375, -1.557403564453125, -1.4727783203125, -1.388153076171875, -1.30352783203125, -1.218902587890625, -1.13427734375, -1.049652099609375, -0.96502685546875, -0.880401611328125, -0.7957763671875, -0.711151123046875, -0.62652587890625, -0.541900634765625, -0.457275390625, -0.372650146484375, -0.28802490234375, -0.203399658203125, -0.1187744140625, -0.034149169921875, 0.05047607421875, 0.135101318359375, 0.2197265625, 0.304351806640625, 0.38897705078125, 0.473602294921875, 0.5582275390625, 0.642852783203125, 0.72747802734375, 0.812103271484375, 0.896728515625, 0.981353759765625, 1.06597900390625, 1.150604248046875, 1.2352294921875, 1.319854736328125, 1.40447998046875, 1.489105224609375, 1.57373046875, 1.658355712890625, 1.74298095703125, 1.827606201171875, 1.9122314453125, 1.996856689453125, 2.08148193359375, 2.166107177734375, 2.250732421875, 2.335357666015625, 2.41998291015625, 2.504608154296875, 2.5892333984375, 2.673858642578125, 2.75848388671875, 2.843109130859375, 2.927734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 11.0, 16.0, 21.0, 60.0, 93.0, 161.0, 281.0, 535.0, 846.0, 848.0, 513.0, 285.0, 154.0, 99.0, 53.0, 35.0, 19.0, 12.0, 4.0, 6.0, 8.0, 7.0, 1.0, 3.0, 3.0, 2.0], "bins": [-2.6875, -2.6300811767578125, -2.572662353515625, -2.5152435302734375, -2.45782470703125, -2.4004058837890625, -2.342987060546875, -2.2855682373046875, -2.2281494140625, -2.1707305908203125, -2.113311767578125, -2.0558929443359375, -1.99847412109375, -1.9410552978515625, -1.883636474609375, -1.8262176513671875, -1.768798828125, -1.7113800048828125, -1.653961181640625, -1.5965423583984375, -1.53912353515625, -1.4817047119140625, -1.424285888671875, -1.3668670654296875, -1.3094482421875, -1.2520294189453125, -1.194610595703125, -1.1371917724609375, -1.07977294921875, -1.0223541259765625, -0.964935302734375, -0.9075164794921875, -0.85009765625, -0.7926788330078125, -0.735260009765625, -0.6778411865234375, -0.62042236328125, -0.5630035400390625, -0.505584716796875, -0.4481658935546875, -0.3907470703125, -0.3333282470703125, -0.275909423828125, -0.2184906005859375, -0.16107177734375, -0.1036529541015625, -0.046234130859375, 0.0111846923828125, 0.068603515625, 0.1260223388671875, 0.183441162109375, 0.2408599853515625, 0.29827880859375, 0.3556976318359375, 0.413116455078125, 0.4705352783203125, 0.5279541015625, 0.5853729248046875, 0.642791748046875, 0.7002105712890625, 0.75762939453125, 0.8150482177734375, 0.872467041015625, 0.9298858642578125, 0.9873046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 10.0, 9.0, 16.0, 35.0, 44.0, 72.0, 170.0, 219.0, 170.0, 108.0, 57.0, 28.0, 15.0, 9.0, 12.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.74794864654541, -11.288476943969727, -10.829004287719727, -10.369531631469727, -9.910059928894043, -9.45058822631836, -8.99111557006836, -8.53164291381836, -8.072171211242676, -7.612699031829834, -7.153226852416992, -6.69375467300415, -6.234282493591309, -5.774810314178467, -5.315338134765625, -4.855865955352783, -4.396393775939941, -3.9369215965270996, -3.477449417114258, -3.017977237701416, -2.558505058288574, -2.0990328788757324, -1.6395606994628906, -1.1800885200500488, -0.720616340637207, -0.26114416122436523, 0.19832801818847656, 0.6578001976013184, 1.1172723770141602, 1.576744556427002, 2.0362167358398438, 2.4956889152526855, 2.955160140991211, 3.4146323204040527, 3.8741044998168945, 4.333576679229736, 4.793048858642578, 5.25252103805542, 5.711993217468262, 6.1714653968811035, 6.630937576293945, 7.090409755706787, 7.549881935119629, 8.009353637695312, 8.468826293945312, 8.928298950195312, 9.387770652770996, 9.84724235534668, 10.30671501159668, 10.76618766784668, 11.225659370422363, 11.685131072998047, 12.144603729248047, 12.604076385498047, 13.06354808807373, 13.523019790649414, 13.982492446899414, 14.441965103149414, 14.901436805725098, 15.360908508300781, 15.820381164550781, 16.27985382080078, 16.73932647705078, 17.19879722595215, 17.65826988220215]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 12.0, 9.0, 14.0, 16.0, 9.0, 20.0, 24.0, 36.0, 32.0, 40.0, 46.0, 59.0, 38.0, 57.0, 46.0, 75.0, 80.0, 60.0, 57.0, 40.0, 46.0, 39.0, 36.0, 18.0, 17.0, 16.0, 14.0, 10.0, 4.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.849696159362793, -8.571756362915039, -8.293816566467285, -8.015877723693848, -7.737937927246094, -7.45999813079834, -7.182058334350586, -6.904118537902832, -6.626179218292236, -6.348239421844482, -6.070300102233887, -5.792360305786133, -5.514420509338379, -5.236481189727783, -4.958541393280029, -4.680602073669434, -4.40266227722168, -4.124722480773926, -3.84678316116333, -3.568843364715576, -3.2909038066864014, -3.0129642486572266, -2.7350244522094727, -2.457084894180298, -2.179145336151123, -1.9012057781219482, -1.6232661008834839, -1.3453264236450195, -1.0673868656158447, -0.7894473075866699, -0.5115076303482056, -0.2335679531097412, 0.04437065124511719, 0.32231026887893677, 0.6002498865127563, 0.8781895041465759, 1.1561291217803955, 1.4340686798095703, 1.7120083570480347, 1.989948034286499, 2.267887592315674, 2.5458271503448486, 2.8237667083740234, 3.1017065048217773, 3.379646062850952, 3.657585620880127, 3.935525417327881, 4.213464736938477, 4.4914045333862305, 4.769344329833984, 5.04728364944458, 5.325223445892334, 5.60316276550293, 5.881102561950684, 6.1590423583984375, 6.436982154846191, 6.714921474456787, 6.992861270904541, 7.270800590515137, 7.548740386962891, 7.8266801834106445, 8.104619979858398, 8.382558822631836, 8.66049861907959, 8.938438415527344]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 10.0, 10.0, 13.0, 18.0, 26.0, 65.0, 92.0, 198.0, 364.0, 897.0, 2307.0, 7551.0, 38909.0, 609468.0, 349376.0, 29433.0, 6296.0, 2030.0, 774.0, 369.0, 158.0, 80.0, 48.0, 23.0, 16.0, 5.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.40997314453125, -1.3707275390625, -1.33148193359375, -1.292236328125, -1.25299072265625, -1.2137451171875, -1.17449951171875, -1.13525390625, -1.09600830078125, -1.0567626953125, -1.01751708984375, -0.978271484375, -0.93902587890625, -0.8997802734375, -0.86053466796875, -0.8212890625, -0.78204345703125, -0.7427978515625, -0.70355224609375, -0.664306640625, -0.62506103515625, -0.5858154296875, -0.54656982421875, -0.50732421875, -0.46807861328125, -0.4288330078125, -0.38958740234375, -0.350341796875, -0.31109619140625, -0.2718505859375, -0.23260498046875, -0.193359375, -0.15411376953125, -0.1148681640625, -0.07562255859375, -0.036376953125, 0.00286865234375, 0.0421142578125, 0.08135986328125, 0.12060546875, 0.15985107421875, 0.1990966796875, 0.23834228515625, 0.277587890625, 0.31683349609375, 0.3560791015625, 0.39532470703125, 0.4345703125, 0.47381591796875, 0.5130615234375, 0.55230712890625, 0.591552734375, 0.63079833984375, 0.6700439453125, 0.70928955078125, 0.74853515625, 0.78778076171875, 0.8270263671875, 0.86627197265625, 0.905517578125, 0.94476318359375, 0.9840087890625, 1.02325439453125, 1.0625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 7.0, 12.0, 6.0, 21.0, 22.0, 28.0, 40.0, 30.0, 70.0, 51.0, 60.0, 92.0, 75.0, 71.0, 87.0, 65.0, 63.0, 55.0, 33.0, 31.0, 34.0, 18.0, 12.0, 13.0, 9.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86669921875, -0.842559814453125, -0.81842041015625, -0.794281005859375, -0.7701416015625, -0.746002197265625, -0.72186279296875, -0.697723388671875, -0.673583984375, -0.649444580078125, -0.62530517578125, -0.601165771484375, -0.5770263671875, -0.552886962890625, -0.52874755859375, -0.504608154296875, -0.48046875, -0.456329345703125, -0.43218994140625, -0.408050537109375, -0.3839111328125, -0.359771728515625, -0.33563232421875, -0.311492919921875, -0.287353515625, -0.263214111328125, -0.23907470703125, -0.214935302734375, -0.1907958984375, -0.166656494140625, -0.14251708984375, -0.118377685546875, -0.09423828125, -0.070098876953125, -0.04595947265625, -0.021820068359375, 0.0023193359375, 0.026458740234375, 0.05059814453125, 0.074737548828125, 0.098876953125, 0.123016357421875, 0.14715576171875, 0.171295166015625, 0.1954345703125, 0.219573974609375, 0.24371337890625, 0.267852783203125, 0.2919921875, 0.316131591796875, 0.34027099609375, 0.364410400390625, 0.3885498046875, 0.412689208984375, 0.43682861328125, 0.460968017578125, 0.485107421875, 0.509246826171875, 0.53338623046875, 0.557525634765625, 0.5816650390625, 0.605804443359375, 0.62994384765625, 0.654083251953125, 0.67822265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 9.0, 10.0, 7.0, 10.0, 12.0, 18.0, 18.0, 26.0, 38.0, 40.0, 68.0, 93.0, 129.0, 185.0, 288.0, 521.0, 1002.0, 2605.0, 10061.0, 69589.0, 904951.0, 46807.0, 7559.0, 2286.0, 883.0, 446.0, 263.0, 156.0, 120.0, 85.0, 73.0, 36.0, 40.0, 34.0, 18.0, 16.0, 17.0, 10.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.9829864501953125, -0.948394775390625, -0.9138031005859375, -0.87921142578125, -0.8446197509765625, -0.810028076171875, -0.7754364013671875, -0.7408447265625, -0.7062530517578125, -0.671661376953125, -0.6370697021484375, -0.60247802734375, -0.5678863525390625, -0.533294677734375, -0.4987030029296875, -0.464111328125, -0.4295196533203125, -0.394927978515625, -0.3603363037109375, -0.32574462890625, -0.2911529541015625, -0.256561279296875, -0.2219696044921875, -0.1873779296875, -0.1527862548828125, -0.118194580078125, -0.0836029052734375, -0.04901123046875, -0.0144195556640625, 0.020172119140625, 0.0547637939453125, 0.08935546875, 0.1239471435546875, 0.158538818359375, 0.1931304931640625, 0.22772216796875, 0.2623138427734375, 0.296905517578125, 0.3314971923828125, 0.3660888671875, 0.4006805419921875, 0.435272216796875, 0.4698638916015625, 0.50445556640625, 0.5390472412109375, 0.573638916015625, 0.6082305908203125, 0.642822265625, 0.6774139404296875, 0.712005615234375, 0.7465972900390625, 0.78118896484375, 0.8157806396484375, 0.850372314453125, 0.8849639892578125, 0.9195556640625, 0.9541473388671875, 0.988739013671875, 1.0233306884765625, 1.05792236328125, 1.0925140380859375, 1.127105712890625, 1.1616973876953125, 1.1962890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 3.0, 10.0, 6.0, 8.0, 10.0, 11.0, 9.0, 13.0, 16.0, 18.0, 18.0, 20.0, 15.0, 29.0, 41.0, 41.0, 56.0, 72.0, 67.0, 82.0, 64.0, 62.0, 66.0, 32.0, 35.0, 21.0, 24.0, 21.0, 18.0, 12.0, 8.0, 13.0, 9.0, 8.0, 3.0, 7.0, 7.0, 5.0, 6.0, 5.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-1.9619140625, -1.904754638671875, -1.84759521484375, -1.790435791015625, -1.7332763671875, -1.676116943359375, -1.61895751953125, -1.561798095703125, -1.504638671875, -1.447479248046875, -1.39031982421875, -1.333160400390625, -1.2760009765625, -1.218841552734375, -1.16168212890625, -1.104522705078125, -1.04736328125, -0.990203857421875, -0.93304443359375, -0.875885009765625, -0.8187255859375, -0.761566162109375, -0.70440673828125, -0.647247314453125, -0.590087890625, -0.532928466796875, -0.47576904296875, -0.418609619140625, -0.3614501953125, -0.304290771484375, -0.24713134765625, -0.189971923828125, -0.1328125, -0.075653076171875, -0.01849365234375, 0.038665771484375, 0.0958251953125, 0.152984619140625, 0.21014404296875, 0.267303466796875, 0.324462890625, 0.381622314453125, 0.43878173828125, 0.495941162109375, 0.5531005859375, 0.610260009765625, 0.66741943359375, 0.724578857421875, 0.78173828125, 0.838897705078125, 0.89605712890625, 0.953216552734375, 1.0103759765625, 1.067535400390625, 1.12469482421875, 1.181854248046875, 1.239013671875, 1.296173095703125, 1.35333251953125, 1.410491943359375, 1.4676513671875, 1.524810791015625, 1.58197021484375, 1.639129638671875, 1.6962890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 9.0, 5.0, 9.0, 16.0, 15.0, 35.0, 45.0, 76.0, 100.0, 211.0, 462.0, 1046.0, 3372.0, 23245.0, 963104.0, 49095.0, 5235.0, 1321.0, 540.0, 250.0, 144.0, 69.0, 48.0, 16.0, 16.0, 16.0, 7.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.377197265625, -0.3648834228515625, -0.352569580078125, -0.3402557373046875, -0.32794189453125, -0.3156280517578125, -0.303314208984375, -0.2910003662109375, -0.2786865234375, -0.2663726806640625, -0.254058837890625, -0.2417449951171875, -0.22943115234375, -0.2171173095703125, -0.204803466796875, -0.1924896240234375, -0.18017578125, -0.1678619384765625, -0.155548095703125, -0.1432342529296875, -0.13092041015625, -0.1186065673828125, -0.106292724609375, -0.0939788818359375, -0.0816650390625, -0.0693511962890625, -0.057037353515625, -0.0447235107421875, -0.03240966796875, -0.0200958251953125, -0.007781982421875, 0.0045318603515625, 0.016845703125, 0.0291595458984375, 0.041473388671875, 0.0537872314453125, 0.06610107421875, 0.0784149169921875, 0.090728759765625, 0.1030426025390625, 0.1153564453125, 0.1276702880859375, 0.139984130859375, 0.1522979736328125, 0.16461181640625, 0.1769256591796875, 0.189239501953125, 0.2015533447265625, 0.2138671875, 0.2261810302734375, 0.238494873046875, 0.2508087158203125, 0.26312255859375, 0.2754364013671875, 0.287750244140625, 0.3000640869140625, 0.3123779296875, 0.3246917724609375, 0.337005615234375, 0.3493194580078125, 0.36163330078125, 0.3739471435546875, 0.386260986328125, 0.3985748291015625, 0.410888671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 11.0, 27.0, 52.0, 117.0, 374.0, 248.0, 76.0, 45.0, 19.0, 16.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022208690643310547, -0.00021635927259922028, -0.00021063163876533508, -0.0002049040049314499, -0.0001991763710975647, -0.0001934487372636795, -0.0001877211034297943, -0.00018199346959590912, -0.00017626583576202393, -0.00017053820192813873, -0.00016481056809425354, -0.00015908293426036835, -0.00015335530042648315, -0.00014762766659259796, -0.00014190003275871277, -0.00013617239892482758, -0.00013044476509094238, -0.0001247171312570572, -0.000118989497423172, -0.0001132618635892868, -0.00010753422975540161, -0.00010180659592151642, -9.607896208763123e-05, -9.035132825374603e-05, -8.462369441986084e-05, -7.889606058597565e-05, -7.316842675209045e-05, -6.744079291820526e-05, -6.171315908432007e-05, -5.5985525250434875e-05, -5.025789141654968e-05, -4.453025758266449e-05, -3.88026237487793e-05, -3.3074989914894104e-05, -2.734735608100891e-05, -2.1619722247123718e-05, -1.5892088413238525e-05, -1.0164454579353333e-05, -4.43682074546814e-06, 1.2908130884170532e-06, 7.018446922302246e-06, 1.2746080756187439e-05, 1.8473714590072632e-05, 2.4201348423957825e-05, 2.9928982257843018e-05, 3.565661609172821e-05, 4.13842499256134e-05, 4.7111883759498596e-05, 5.283951759338379e-05, 5.856715142726898e-05, 6.429478526115417e-05, 7.002241909503937e-05, 7.575005292892456e-05, 8.147768676280975e-05, 8.720532059669495e-05, 9.293295443058014e-05, 9.866058826446533e-05, 0.00010438822209835052, 0.00011011585593223572, 0.00011584348976612091, 0.0001215711236000061, 0.0001272987574338913, 0.0001330263912677765, 0.00013875402510166168, 0.00014448165893554688]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 4.0, 6.0, 13.0, 18.0, 19.0, 33.0, 40.0, 77.0, 96.0, 167.0, 216.0, 430.0, 803.0, 1607.0, 4027.0, 13147.0, 75470.0, 888538.0, 47590.0, 9852.0, 3298.0, 1367.0, 684.0, 383.0, 222.0, 123.0, 97.0, 69.0, 45.0, 25.0, 21.0, 16.0, 7.0, 7.0, 11.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18359375, -0.17712783813476562, -0.17066192626953125, -0.16419601440429688, -0.1577301025390625, -0.15126419067382812, -0.14479827880859375, -0.13833236694335938, -0.131866455078125, -0.12540054321289062, -0.11893463134765625, -0.11246871948242188, -0.1060028076171875, -0.09953689575195312, -0.09307098388671875, -0.08660507202148438, -0.08013916015625, -0.07367324829101562, -0.06720733642578125, -0.060741424560546875, -0.0542755126953125, -0.047809600830078125, -0.04134368896484375, -0.034877777099609375, -0.028411865234375, -0.021945953369140625, -0.01548004150390625, -0.009014129638671875, -0.0025482177734375, 0.003917694091796875, 0.01038360595703125, 0.016849517822265625, 0.0233154296875, 0.029781341552734375, 0.03624725341796875, 0.042713165283203125, 0.0491790771484375, 0.055644989013671875, 0.06211090087890625, 0.06857681274414062, 0.075042724609375, 0.08150863647460938, 0.08797454833984375, 0.09444046020507812, 0.1009063720703125, 0.10737228393554688, 0.11383819580078125, 0.12030410766601562, 0.12677001953125, 0.13323593139648438, 0.13970184326171875, 0.14616775512695312, 0.1526336669921875, 0.15909957885742188, 0.16556549072265625, 0.17203140258789062, 0.178497314453125, 0.18496322631835938, 0.19142913818359375, 0.19789505004882812, 0.2043609619140625, 0.21082687377929688, 0.21729278564453125, 0.22375869750976562, 0.230224609375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 7.0, 11.0, 14.0, 19.0, 17.0, 29.0, 27.0, 42.0, 60.0, 134.0, 164.0, 149.0, 71.0, 63.0, 52.0, 30.0, 24.0, 15.0, 16.0, 6.0, 7.0, 2.0, 5.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23486328125, -0.22696685791015625, -0.2190704345703125, -0.21117401123046875, -0.203277587890625, -0.19538116455078125, -0.1874847412109375, -0.17958831787109375, -0.17169189453125, -0.16379547119140625, -0.1558990478515625, -0.14800262451171875, -0.140106201171875, -0.13220977783203125, -0.1243133544921875, -0.11641693115234375, -0.1085205078125, -0.10062408447265625, -0.0927276611328125, -0.08483123779296875, -0.076934814453125, -0.06903839111328125, -0.0611419677734375, -0.05324554443359375, -0.04534912109375, -0.03745269775390625, -0.0295562744140625, -0.02165985107421875, -0.013763427734375, -0.00586700439453125, 0.0020294189453125, 0.00992584228515625, 0.017822265625, 0.02571868896484375, 0.0336151123046875, 0.04151153564453125, 0.049407958984375, 0.05730438232421875, 0.0652008056640625, 0.07309722900390625, 0.08099365234375, 0.08889007568359375, 0.0967864990234375, 0.10468292236328125, 0.112579345703125, 0.12047576904296875, 0.1283721923828125, 0.13626861572265625, 0.1441650390625, 0.15206146240234375, 0.1599578857421875, 0.16785430908203125, 0.175750732421875, 0.18364715576171875, 0.1915435791015625, 0.19944000244140625, 0.20733642578125, 0.21523284912109375, 0.2231292724609375, 0.23102569580078125, 0.238922119140625, 0.24681854248046875, 0.2547149658203125, 0.26261138916015625, 0.2705078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 12.0, 17.0, 29.0, 75.0, 458.0, 230.0, 75.0, 48.0, 21.0, 9.0, 12.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2812445163726807, -2.948821544647217, -2.616398334503174, -2.28397536277771, -1.9515522718429565, -1.6191291809082031, -1.2867062091827393, -0.9542829990386963, -0.6218600273132324, -0.2894369661808014, 0.04298609495162964, 0.3754091262817383, 0.7078322172164917, 1.0402553081512451, 1.372678279876709, 1.705101490020752, 2.037524461746216, 2.3699474334716797, 2.7023706436157227, 3.0347936153411865, 3.3672165870666504, 3.6996397972106934, 4.032062530517578, 4.364485740661621, 4.696908950805664, 5.029332160949707, 5.361754894256592, 5.694178104400635, 6.026601314544678, 6.3590240478515625, 6.6914472579956055, 7.023870468139648, 7.356293678283691, 7.688716888427734, 8.021140098571777, 8.35356330871582, 8.685985565185547, 9.01840877532959, 9.350831985473633, 9.683255195617676, 10.015678405761719, 10.348101615905762, 10.680524826049805, 11.012947082519531, 11.345370292663574, 11.677793502807617, 12.01021671295166, 12.342639923095703, 12.67506217956543, 13.007485389709473, 13.339908599853516, 13.672330856323242, 14.004754066467285, 14.337177276611328, 14.669600486755371, 15.002023696899414, 15.334446907043457, 15.6668701171875, 15.999293327331543, 16.331716537475586, 16.664138793945312, 16.996562957763672, 17.3289852142334, 17.661407470703125, 17.993831634521484]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 9.0, 4.0, 6.0, 4.0, 7.0, 10.0, 13.0, 10.0, 22.0, 19.0, 15.0, 16.0, 26.0, 22.0, 24.0, 51.0, 200.0, 202.0, 85.0, 38.0, 28.0, 23.0, 24.0, 18.0, 14.0, 15.0, 19.0, 12.0, 6.0, 5.0, 6.0, 4.0, 7.0, 2.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0], "bins": [-5.5023298263549805, -5.335952281951904, -5.169575214385986, -5.00319766998291, -4.836820125579834, -4.670442581176758, -4.50406551361084, -4.337687969207764, -4.1713104248046875, -4.004932880401611, -3.8385555744171143, -3.672178268432617, -3.505800724029541, -3.339423418045044, -3.173046112060547, -3.0066685676574707, -2.8402915000915527, -2.6739141941070557, -2.5075366497039795, -2.3411593437194824, -2.1747817993164062, -2.008404493331909, -1.842027187347412, -1.6756497621536255, -1.5092723369598389, -1.3428949117660522, -1.1765174865722656, -1.0101401805877686, -0.8437627553939819, -0.6773853302001953, -0.5110079646110535, -0.3446305990219116, -0.178253173828125, -0.011875778436660767, 0.15450161695480347, 0.3208790123462677, 0.48725640773773193, 0.6536338329315186, 0.8200111985206604, 0.9863885641098022, 1.1527659893035889, 1.3191434144973755, 1.485520839691162, 1.6518981456756592, 1.8182755708694458, 1.9846529960632324, 2.1510303020477295, 2.3174076080322266, 2.4837851524353027, 2.6501624584198, 2.816540002822876, 2.982917308807373, 3.149294853210449, 3.3156721591949463, 3.4820494651794434, 3.6484270095825195, 3.8148043155670166, 3.9811816215515137, 4.14755916595459, 4.313936710357666, 4.480313777923584, 4.64669132232666, 4.813068866729736, 4.979445934295654, 5.1458234786987305]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 14.0, 10.0, 9.0, 8.0, 10.0, 15.0, 21.0, 25.0, 17.0, 20.0, 27.0, 28.0, 47.0, 82.0, 226.0, 118.0, 57.0, 30.0, 35.0, 32.0, 25.0, 14.0, 16.0, 17.0, 13.0, 14.0, 6.0, 14.0, 4.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.35546875, -0.3431510925292969, -0.33083343505859375, -0.3185157775878906, -0.3061981201171875, -0.2938804626464844, -0.28156280517578125, -0.2692451477050781, -0.256927490234375, -0.24460983276367188, -0.23229217529296875, -0.21997451782226562, -0.2076568603515625, -0.19533920288085938, -0.18302154541015625, -0.17070388793945312, -0.15838623046875, -0.14606857299804688, -0.13375091552734375, -0.12143325805664062, -0.1091156005859375, -0.09679794311523438, -0.08448028564453125, -0.07216262817382812, -0.059844970703125, -0.047527313232421875, -0.03520965576171875, -0.022891998291015625, -0.0105743408203125, 0.001743316650390625, 0.01406097412109375, 0.026378631591796875, 0.0386962890625, 0.051013946533203125, 0.06333160400390625, 0.07564926147460938, 0.0879669189453125, 0.10028457641601562, 0.11260223388671875, 0.12491989135742188, 0.137237548828125, 0.14955520629882812, 0.16187286376953125, 0.17419052124023438, 0.1865081787109375, 0.19882583618164062, 0.21114349365234375, 0.22346115112304688, 0.23577880859375, 0.24809646606445312, 0.26041412353515625, 0.2727317810058594, 0.2850494384765625, 0.2973670959472656, 0.30968475341796875, 0.3220024108886719, 0.334320068359375, 0.3466377258300781, 0.35895538330078125, 0.3712730407714844, 0.3835906982421875, 0.3959083557128906, 0.40822601318359375, 0.4205436706542969, 0.432861328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 14.0, 28.0, 33.0, 50.0, 117.0, 279.0, 1053.0, 8757.0, 8367406.0, 9316.0, 983.0, 263.0, 111.0, 66.0, 22.0, 16.0, 16.0, 12.0, 3.0, 1.0, 2.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-7.506015777587891, -7.294615745544434, -7.083215236663818, -6.871815204620361, -6.660415172576904, -6.449014663696289, -6.237614631652832, -6.026214599609375, -5.814814567565918, -5.603414535522461, -5.392014026641846, -5.180613994598389, -4.969213962554932, -4.757813453674316, -4.546413421630859, -4.335013389587402, -4.123613357543945, -3.912213087081909, -3.700813055038452, -3.489412784576416, -3.278012752532959, -3.066612482070923, -2.8552122116088867, -2.6438121795654297, -2.4324116706848145, -2.2210114002227783, -2.0096113681793213, -1.7982110977172852, -1.5868110656738281, -1.375410795211792, -1.1640106439590454, -0.9526104927062988, -0.7412104606628418, -0.5298103094100952, -0.31841012835502625, -0.10700994729995728, 0.1043902039527893, 0.31579041481018066, 0.5271905660629272, 0.7385907173156738, 0.9499908685684204, 1.161391019821167, 1.3727911710739136, 1.5841913223266602, 1.7955915927886963, 2.0069918632507324, 2.2183918952941895, 2.4297919273376465, 2.6411921977996826, 2.8525924682617188, 3.063992500305176, 3.275392770767212, 3.486792802810669, 3.698193073272705, 3.909593105316162, 4.120993614196777, 4.332393646240234, 4.543793678283691, 4.755194187164307, 4.966594219207764, 5.177994251251221, 5.389394760131836, 5.600794792175293, 5.81219482421875, 6.023594856262207]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 6.0, 1.0, 3.0, 2.0, 3.0, 8.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.252260684967041, -2.1556754112243652, -2.0590901374816895, -1.9625048637390137, -1.865919589996338, -1.769334316253662, -1.6727490425109863, -1.5761637687683105, -1.4795784950256348, -1.382993221282959, -1.2864079475402832, -1.1898226737976074, -1.0932374000549316, -0.9966521263122559, -0.9000668525695801, -0.8034815788269043, -0.7068963050842285, -0.6103110313415527, -0.513725757598877, -0.41714048385620117, -0.3205552101135254, -0.2239699363708496, -0.12738466262817383, -0.030799388885498047, 0.06578588485717773, 0.16237115859985352, 0.2589564323425293, 0.3555417060852051, 0.45212697982788086, 0.5487122535705566, 0.6452975273132324, 0.7418828010559082, 0.8384678363800049, 0.9350531101226807, 1.0316383838653564, 1.1282236576080322, 1.224808931350708, 1.3213942050933838, 1.4179794788360596, 1.5145647525787354, 1.6111500263214111, 1.707735300064087, 1.8043205738067627, 1.9009058475494385, 1.9974911212921143, 2.09407639503479, 2.190661668777466, 2.2872469425201416, 2.3838322162628174, 2.480417490005493, 2.577002763748169, 2.6735880374908447, 2.7701733112335205, 2.8667585849761963, 2.963343858718872, 3.059929132461548, 3.1565144062042236, 3.2530996799468994, 3.349684953689575, 3.446270227432251, 3.5428555011749268, 3.6394407749176025, 3.7360260486602783, 3.832611322402954, 3.92919659614563]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 16.0, 11.0, 25.0, 29.0, 49.0, 68.0, 127.0, 204.0, 431.0, 987.0, 3027.0, 13494.0, 78107.0, 306516.0, 98754.0, 16142.0, 3847.0, 1291.0, 471.0, 259.0, 132.0, 104.0, 54.0, 28.0, 24.0, 22.0, 9.0, 7.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.8515625, -5.69580078125, -5.5400390625, -5.38427734375, -5.228515625, -5.07275390625, -4.9169921875, -4.76123046875, -4.60546875, -4.44970703125, -4.2939453125, -4.13818359375, -3.982421875, -3.82666015625, -3.6708984375, -3.51513671875, -3.359375, -3.20361328125, -3.0478515625, -2.89208984375, -2.736328125, -2.58056640625, -2.4248046875, -2.26904296875, -2.11328125, -1.95751953125, -1.8017578125, -1.64599609375, -1.490234375, -1.33447265625, -1.1787109375, -1.02294921875, -0.8671875, -0.71142578125, -0.5556640625, -0.39990234375, -0.244140625, -0.08837890625, 0.0673828125, 0.22314453125, 0.37890625, 0.53466796875, 0.6904296875, 0.84619140625, 1.001953125, 1.15771484375, 1.3134765625, 1.46923828125, 1.625, 1.78076171875, 1.9365234375, 2.09228515625, 2.248046875, 2.40380859375, 2.5595703125, 2.71533203125, 2.87109375, 3.02685546875, 3.1826171875, 3.33837890625, 3.494140625, 3.64990234375, 3.8056640625, 3.96142578125, 4.1171875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 7.0, 18.0, 23.0, 40.0, 47.0, 58.0, 62.0, 90.0, 114.0, 89.0, 109.0, 73.0, 70.0, 49.0, 38.0, 22.0, 28.0, 16.0, 14.0, 8.0, 7.0, 7.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90087890625, -0.8756332397460938, -0.8503875732421875, -0.8251419067382812, -0.799896240234375, -0.7746505737304688, -0.7494049072265625, -0.7241592407226562, -0.69891357421875, -0.6736679077148438, -0.6484222412109375, -0.6231765747070312, -0.597930908203125, -0.5726852416992188, -0.5474395751953125, -0.5221939086914062, -0.4969482421875, -0.47170257568359375, -0.4464569091796875, -0.42121124267578125, -0.395965576171875, -0.37071990966796875, -0.3454742431640625, -0.32022857666015625, -0.29498291015625, -0.26973724365234375, -0.2444915771484375, -0.21924591064453125, -0.194000244140625, -0.16875457763671875, -0.1435089111328125, -0.11826324462890625, -0.093017578125, -0.06777191162109375, -0.0425262451171875, -0.01728057861328125, 0.007965087890625, 0.03321075439453125, 0.0584564208984375, 0.08370208740234375, 0.10894775390625, 0.13419342041015625, 0.1594390869140625, 0.18468475341796875, 0.209930419921875, 0.23517608642578125, 0.2604217529296875, 0.28566741943359375, 0.3109130859375, 0.33615875244140625, 0.3614044189453125, 0.38665008544921875, 0.411895751953125, 0.43714141845703125, 0.4623870849609375, 0.48763275146484375, 0.51287841796875, 0.5381240844726562, 0.5633697509765625, 0.5886154174804688, 0.613861083984375, 0.6391067504882812, 0.6643524169921875, 0.6895980834960938, 0.71484375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 13.0, 17.0, 18.0, 28.0, 60.0, 56.0, 73.0, 65.0, 51.0, 25.0, 16.0, 10.0, 11.0, 7.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.363767385482788, -2.2669224739074707, -2.170077323913574, -2.073232412338257, -1.97638738155365, -1.879542350769043, -1.7826974391937256, -1.6858524084091187, -1.5890073776245117, -1.4921623468399048, -1.3953173160552979, -1.2984724044799805, -1.2016273736953735, -1.1047823429107666, -1.0079374313354492, -0.9110924005508423, -0.8142473697662354, -0.7174023389816284, -0.6205573678016663, -0.5237123966217041, -0.42686736583709717, -0.3300223648548126, -0.23317736387252808, -0.13633239269256592, -0.039487361907958984, 0.05735763907432556, 0.1542026400566101, 0.25104764103889465, 0.3478926420211792, 0.44473764300346375, 0.5415826439857483, 0.6384276151657104, 0.7352724075317383, 0.8321174383163452, 0.9289624094963074, 1.0258073806762695, 1.1226524114608765, 1.2194974422454834, 1.3163423538208008, 1.4131873846054077, 1.5100324153900146, 1.6068774461746216, 1.7037224769592285, 1.800567388534546, 1.8974124193191528, 1.9942574501037598, 2.091102361679077, 2.1879472732543945, 2.284792423248291, 2.3816373348236084, 2.478482484817505, 2.5753273963928223, 2.6721725463867188, 2.769017457962036, 2.8658623695373535, 2.96270751953125, 3.0595524311065674, 3.1563973426818848, 3.2532424926757812, 3.3500874042510986, 3.446932315826416, 3.5437774658203125, 3.64062237739563, 3.7374672889709473, 3.8343124389648438]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 11.0, 32.0, 54.0, 83.0, 84.0, 74.0, 31.0, 22.0, 13.0, 11.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3969743251800537, -3.293792247772217, -3.190609931945801, -3.087427854537964, -2.984245538711548, -2.881063461303711, -2.777881145477295, -2.674699068069458, -2.571516990661621, -2.468334913253784, -2.365152597427368, -2.2619705200195312, -2.1587882041931152, -2.0556061267852783, -1.9524239301681519, -1.8492417335510254, -1.7460594177246094, -1.642877221107483, -1.5396950244903564, -1.4365129470825195, -1.3333306312561035, -1.2301485538482666, -1.1269663572311401, -1.0237841606140137, -0.9206019639968872, -0.8174197673797607, -0.7142375707626343, -0.6110554337501526, -0.5078732371330261, -0.40469104051589966, -0.30150890350341797, -0.1983267068862915, -0.09514427185058594, 0.008037909865379333, 0.1112200915813446, 0.21440225839614868, 0.31758445501327515, 0.4207666516304016, 0.5239487886428833, 0.6271309852600098, 0.7303131818771362, 0.8334953784942627, 0.9366775751113892, 1.0398597717285156, 1.1430418491363525, 1.2462241649627686, 1.3494062423706055, 1.452588438987732, 1.5557706356048584, 1.6589528322219849, 1.7621350288391113, 1.8653171062469482, 1.9684994220733643, 2.071681499481201, 2.174863815307617, 2.278045892715454, 2.381227970123291, 2.484410047531128, 2.587592363357544, 2.690774440765381, 2.793956756591797, 2.897138833999634, 3.0003209114074707, 3.1035032272338867, 3.2066855430603027]}, "train/train_runtime": 5087.4578, "train/train_samples_per_second": 5.609, "train/train_steps_per_second": 0.088, "train/total_flos": 0.0, "train/train_loss": 4.256010225535508, "eval/loss": 4.295446395874023, "eval/wer": 2.317671558905196, "eval/runtime": 1115.1949, "eval/samples_per_second": 2.369, "eval/steps_per_second": 0.297} \ No newline at end of file +{"train/loss": 4.1867, "train/learning_rate": 8.88e-05, "train/epoch": 1.0, "train/global_step": 446, "_runtime": 6494, "_timestamp": 1646179246, "_step": 447, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 33.0, 233.0, 533.0, 191.0, 23.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.007577896118164, -19.918153762817383, -16.828731536865234, -13.739307403564453, -10.649883270263672, -7.560459136962891, -4.471036911010742, -1.381612777709961, 1.7078113555908203, 4.797235012054443, 7.886658668518066, 10.976081848144531, 14.065505981445312, 17.154930114746094, 20.244352340698242, 23.333776473999023, 26.423200607299805, 29.512624740600586, 32.602046966552734, 35.691471099853516, 38.7808952331543, 41.87031936645508, 44.959739685058594, 48.049163818359375, 51.138587951660156, 54.22801208496094, 57.31743621826172, 60.4068603515625, 63.49628448486328, 66.58570861816406, 69.67512512207031, 72.76455688476562, 75.85397338867188, 78.94339752197266, 82.03282165527344, 85.12224578857422, 88.211669921875, 91.30109405517578, 94.39051818847656, 97.47993469238281, 100.56936645507812, 103.6587905883789, 106.74821472167969, 109.83763885498047, 112.92706298828125, 116.01648712158203, 119.10591125488281, 122.19532775878906, 125.28475189208984, 128.37417602539062, 131.46359252929688, 134.5530242919922, 137.64244079589844, 140.73187255859375, 143.8212890625, 146.9107208251953, 150.00013732910156, 153.0895538330078, 156.17898559570312, 159.26840209960938, 162.3578338623047, 165.44725036621094, 168.53668212890625, 171.6260986328125, 174.7155303955078]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 1.0, 7.0, 7.0, 6.0, 5.0, 9.0, 12.0, 13.0, 9.0, 11.0, 29.0, 28.0, 28.0, 23.0, 25.0, 31.0, 32.0, 39.0, 41.0, 36.0, 49.0, 50.0, 49.0, 33.0, 39.0, 37.0, 42.0, 40.0, 34.0, 35.0, 17.0, 40.0, 22.0, 24.0, 15.0, 14.0, 14.0, 12.0, 14.0, 11.0, 8.0, 8.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.05972671508789, -29.033992767333984, -28.00826072692871, -26.982526779174805, -25.9567928314209, -24.931060791015625, -23.90532684326172, -22.879592895507812, -21.853858947753906, -20.828125, -19.802392959594727, -18.77665901184082, -17.750925064086914, -16.72519302368164, -15.699459075927734, -14.673725128173828, -13.647993087768555, -12.622260093688965, -11.596526145935059, -10.570793151855469, -9.545059204101562, -8.519326210021973, -7.493593215942383, -6.467859745025635, -5.442126274108887, -4.416392803192139, -3.3906595706939697, -2.364926338195801, -1.3391928672790527, -0.3134593963623047, 0.7122735977172852, 1.7380070686340332, 2.7637405395507812, 3.7894740104675293, 4.815207481384277, 5.840940475463867, 6.866673946380615, 7.892407417297363, 8.918140411376953, 9.94387435913086, 10.96960735321045, 11.995340347290039, 13.021074295043945, 14.046807289123535, 15.072540283203125, 16.09827423095703, 17.124008178710938, 18.14974021911621, 19.175474166870117, 20.201208114624023, 21.226940155029297, 22.252674102783203, 23.27840805053711, 24.304141998291016, 25.32987403869629, 26.355607986450195, 27.38134002685547, 28.407073974609375, 29.43280601501465, 30.458539962768555, 31.48427391052246, 32.510005950927734, 33.53573989868164, 34.56147384643555, 35.58720779418945]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 11.0, 4.0, 6.0, 4.0, 15.0, 12.0, 17.0, 11.0, 23.0, 31.0, 27.0, 27.0, 18.0, 38.0, 39.0, 34.0, 30.0, 42.0, 37.0, 47.0, 56.0, 40.0, 34.0, 43.0, 30.0, 38.0, 51.0, 29.0, 26.0, 28.0, 28.0, 22.0, 20.0, 12.0, 10.0, 15.0, 15.0, 9.0, 11.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3164215087890625, -1.271514892578125, -1.2266082763671875, -1.18170166015625, -1.1367950439453125, -1.091888427734375, -1.0469818115234375, -1.0020751953125, -0.9571685791015625, -0.912261962890625, -0.8673553466796875, -0.82244873046875, -0.7775421142578125, -0.732635498046875, -0.6877288818359375, -0.642822265625, -0.5979156494140625, -0.553009033203125, -0.5081024169921875, -0.46319580078125, -0.4182891845703125, -0.373382568359375, -0.3284759521484375, -0.2835693359375, -0.2386627197265625, -0.193756103515625, -0.1488494873046875, -0.10394287109375, -0.0590362548828125, -0.014129638671875, 0.0307769775390625, 0.07568359375, 0.1205902099609375, 0.165496826171875, 0.2104034423828125, 0.25531005859375, 0.3002166748046875, 0.345123291015625, 0.3900299072265625, 0.4349365234375, 0.4798431396484375, 0.524749755859375, 0.5696563720703125, 0.61456298828125, 0.6594696044921875, 0.704376220703125, 0.7492828369140625, 0.794189453125, 0.8390960693359375, 0.884002685546875, 0.9289093017578125, 0.97381591796875, 1.0187225341796875, 1.063629150390625, 1.1085357666015625, 1.1534423828125, 1.1983489990234375, 1.243255615234375, 1.2881622314453125, 1.33306884765625, 1.3779754638671875, 1.422882080078125, 1.4677886962890625, 1.5126953125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 10.0, 9.0, 13.0, 16.0, 17.0, 23.0, 27.0, 44.0, 60.0, 73.0, 99.0, 120.0, 208.0, 281.0, 446.0, 643.0, 1085.0, 1817.0, 3753.0, 9070.0, 28623.0, 141013.0, 1479029.0, 2245036.0, 222844.0, 38747.0, 11184.0, 4406.0, 2179.0, 1165.0, 751.0, 445.0, 298.0, 193.0, 142.0, 107.0, 84.0, 55.0, 45.0, 35.0, 25.0, 20.0, 11.0, 11.0, 5.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.1875, -5.020751953125, -4.85400390625, -4.687255859375, -4.5205078125, -4.353759765625, -4.18701171875, -4.020263671875, -3.853515625, -3.686767578125, -3.52001953125, -3.353271484375, -3.1865234375, -3.019775390625, -2.85302734375, -2.686279296875, -2.51953125, -2.352783203125, -2.18603515625, -2.019287109375, -1.8525390625, -1.685791015625, -1.51904296875, -1.352294921875, -1.185546875, -1.018798828125, -0.85205078125, -0.685302734375, -0.5185546875, -0.351806640625, -0.18505859375, -0.018310546875, 0.1484375, 0.315185546875, 0.48193359375, 0.648681640625, 0.8154296875, 0.982177734375, 1.14892578125, 1.315673828125, 1.482421875, 1.649169921875, 1.81591796875, 1.982666015625, 2.1494140625, 2.316162109375, 2.48291015625, 2.649658203125, 2.81640625, 2.983154296875, 3.14990234375, 3.316650390625, 3.4833984375, 3.650146484375, 3.81689453125, 3.983642578125, 4.150390625, 4.317138671875, 4.48388671875, 4.650634765625, 4.8173828125, 4.984130859375, 5.15087890625, 5.317626953125, 5.484375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 16.0, 30.0, 66.0, 173.0, 441.0, 1089.0, 1279.0, 557.0, 238.0, 87.0, 49.0, 17.0, 11.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3359375, -12.8775634765625, -12.419189453125, -11.9608154296875, -11.50244140625, -11.0440673828125, -10.585693359375, -10.1273193359375, -9.6689453125, -9.2105712890625, -8.752197265625, -8.2938232421875, -7.83544921875, -7.3770751953125, -6.918701171875, -6.4603271484375, -6.001953125, -5.5435791015625, -5.085205078125, -4.6268310546875, -4.16845703125, -3.7100830078125, -3.251708984375, -2.7933349609375, -2.3349609375, -1.8765869140625, -1.418212890625, -0.9598388671875, -0.50146484375, -0.0430908203125, 0.415283203125, 0.8736572265625, 1.33203125, 1.7904052734375, 2.248779296875, 2.7071533203125, 3.16552734375, 3.6239013671875, 4.082275390625, 4.5406494140625, 4.9990234375, 5.4573974609375, 5.915771484375, 6.3741455078125, 6.83251953125, 7.2908935546875, 7.749267578125, 8.2076416015625, 8.666015625, 9.1243896484375, 9.582763671875, 10.0411376953125, 10.49951171875, 10.9578857421875, 11.416259765625, 11.8746337890625, 12.3330078125, 12.7913818359375, 13.249755859375, 13.7081298828125, 14.16650390625, 14.6248779296875, 15.083251953125, 15.5416259765625, 16.0]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 5.0, 3.0, 11.0, 10.0, 12.0, 40.0, 71.0, 194.0, 502.0, 2078.0, 27085.0, 4147883.0, 13883.0, 1694.0, 479.0, 175.0, 71.0, 36.0, 11.0, 13.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.8125, -41.40576171875, -39.9990234375, -38.59228515625, -37.185546875, -35.77880859375, -34.3720703125, -32.96533203125, -31.55859375, -30.15185546875, -28.7451171875, -27.33837890625, -25.931640625, -24.52490234375, -23.1181640625, -21.71142578125, -20.3046875, -18.89794921875, -17.4912109375, -16.08447265625, -14.677734375, -13.27099609375, -11.8642578125, -10.45751953125, -9.05078125, -7.64404296875, -6.2373046875, -4.83056640625, -3.423828125, -2.01708984375, -0.6103515625, 0.79638671875, 2.203125, 3.60986328125, 5.0166015625, 6.42333984375, 7.830078125, 9.23681640625, 10.6435546875, 12.05029296875, 13.45703125, 14.86376953125, 16.2705078125, 17.67724609375, 19.083984375, 20.49072265625, 21.8974609375, 23.30419921875, 24.7109375, 26.11767578125, 27.5244140625, 28.93115234375, 30.337890625, 31.74462890625, 33.1513671875, 34.55810546875, 35.96484375, 37.37158203125, 38.7783203125, 40.18505859375, 41.591796875, 42.99853515625, 44.4052734375, 45.81201171875, 47.21875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 61.0, 348.0, 424.0, 158.0, 14.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.08546447753906, -98.74624633789062, -96.40702056884766, -94.06779479980469, -91.72857666015625, -89.38935852050781, -87.05013275146484, -84.71090698242188, -82.37168884277344, -80.032470703125, -77.69324493408203, -75.35401916503906, -73.01480102539062, -70.67558288574219, -68.33635711669922, -65.99713134765625, -63.65791320800781, -61.31869125366211, -58.979469299316406, -56.6402473449707, -54.301025390625, -51.9618034362793, -49.622581481933594, -47.28335952758789, -44.94413757324219, -42.604915618896484, -40.26569366455078, -37.92647171020508, -35.587249755859375, -33.24802780151367, -30.90880584716797, -28.569583892822266, -26.230358123779297, -23.891136169433594, -21.55191421508789, -19.212692260742188, -16.873470306396484, -14.534248352050781, -12.195026397705078, -9.855804443359375, -7.516582489013672, -5.177360534667969, -2.8381385803222656, -0.4989166259765625, 1.8403053283691406, 4.179527282714844, 6.518749237060547, 8.85797119140625, 11.197193145751953, 13.536415100097656, 15.87563705444336, 18.214859008789062, 20.554080963134766, 22.89330291748047, 25.232524871826172, 27.571746826171875, 29.910968780517578, 32.25019073486328, 34.589412689208984, 36.92863464355469, 39.26785659790039, 41.607078552246094, 43.9463005065918, 46.2855224609375, 48.6247444152832]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 10.0, 14.0, 14.0, 13.0, 17.0, 27.0, 28.0, 26.0, 32.0, 35.0, 41.0, 36.0, 45.0, 42.0, 49.0, 39.0, 46.0, 34.0, 29.0, 42.0, 39.0, 35.0, 38.0, 35.0, 37.0, 29.0, 25.0, 19.0, 18.0, 13.0, 16.0, 18.0, 8.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.333791732788086, -19.734371185302734, -19.134950637817383, -18.53553009033203, -17.93610954284668, -17.336688995361328, -16.737268447875977, -16.137847900390625, -15.53842830657959, -14.939007759094238, -14.339587211608887, -13.740166664123535, -13.1407470703125, -12.541326522827148, -11.941905975341797, -11.342485427856445, -10.743064880371094, -10.143644332885742, -9.54422378540039, -8.944803237915039, -8.345382690429688, -7.745962619781494, -7.146542549133301, -6.547122001647949, -5.947701454162598, -5.348280906677246, -4.7488603591918945, -4.149440288543701, -3.5500197410583496, -2.950599193572998, -2.3511788845062256, -1.7517585754394531, -1.1523361206054688, -0.5529156923294067, 0.04650473594665527, 0.6459251642227173, 1.2453455924987793, 1.8447661399841309, 2.4441864490509033, 3.043606758117676, 3.6430273056030273, 4.242447853088379, 4.8418684005737305, 5.441288471221924, 6.040709018707275, 6.640129566192627, 7.23954963684082, 7.838970184326172, 8.438390731811523, 9.037811279296875, 9.637231826782227, 10.236652374267578, 10.83607292175293, 11.435493469238281, 12.034913063049316, 12.634333610534668, 13.23375415802002, 13.833174705505371, 14.432595252990723, 15.032015800476074, 15.63143539428711, 16.23085594177246, 16.830276489257812, 17.429697036743164, 18.029117584228516]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 3.0, 4.0, 7.0, 4.0, 13.0, 15.0, 7.0, 13.0, 23.0, 24.0, 27.0, 24.0, 32.0, 37.0, 46.0, 30.0, 27.0, 30.0, 42.0, 28.0, 50.0, 31.0, 50.0, 59.0, 36.0, 36.0, 41.0, 23.0, 34.0, 25.0, 25.0, 24.0, 26.0, 17.0, 21.0, 12.0, 11.0, 12.0, 13.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2374725341796875, -1.194671630859375, -1.1518707275390625, -1.10906982421875, -1.0662689208984375, -1.023468017578125, -0.9806671142578125, -0.9378662109375, -0.8950653076171875, -0.852264404296875, -0.8094635009765625, -0.76666259765625, -0.7238616943359375, -0.681060791015625, -0.6382598876953125, -0.595458984375, -0.5526580810546875, -0.509857177734375, -0.4670562744140625, -0.42425537109375, -0.3814544677734375, -0.338653564453125, -0.2958526611328125, -0.2530517578125, -0.2102508544921875, -0.167449951171875, -0.1246490478515625, -0.08184814453125, -0.0390472412109375, 0.003753662109375, 0.0465545654296875, 0.08935546875, 0.1321563720703125, 0.174957275390625, 0.2177581787109375, 0.26055908203125, 0.3033599853515625, 0.346160888671875, 0.3889617919921875, 0.4317626953125, 0.4745635986328125, 0.517364501953125, 0.5601654052734375, 0.60296630859375, 0.6457672119140625, 0.688568115234375, 0.7313690185546875, 0.774169921875, 0.8169708251953125, 0.859771728515625, 0.9025726318359375, 0.94537353515625, 0.9881744384765625, 1.030975341796875, 1.0737762451171875, 1.1165771484375, 1.1593780517578125, 1.202178955078125, 1.2449798583984375, 1.28778076171875, 1.3305816650390625, 1.373382568359375, 1.4161834716796875, 1.458984375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 5.0, 4.0, 7.0, 16.0, 23.0, 34.0, 35.0, 44.0, 76.0, 116.0, 159.0, 205.0, 313.0, 456.0, 657.0, 903.0, 1365.0, 2004.0, 2786.0, 4326.0, 6342.0, 9706.0, 15099.0, 24082.0, 38808.0, 62878.0, 102220.0, 160843.0, 201921.0, 154341.0, 96196.0, 59854.0, 36798.0, 22723.0, 14654.0, 9423.0, 6188.0, 4123.0, 2645.0, 1901.0, 1255.0, 939.0, 618.0, 463.0, 295.0, 210.0, 164.0, 99.0, 72.0, 47.0, 36.0, 35.0, 22.0, 14.0, 5.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0], "bins": [-0.1319580078125, -0.1277618408203125, -0.123565673828125, -0.1193695068359375, -0.11517333984375, -0.1109771728515625, -0.106781005859375, -0.1025848388671875, -0.098388671875, -0.0941925048828125, -0.089996337890625, -0.0858001708984375, -0.08160400390625, -0.0774078369140625, -0.073211669921875, -0.0690155029296875, -0.0648193359375, -0.0606231689453125, -0.056427001953125, -0.0522308349609375, -0.04803466796875, -0.0438385009765625, -0.039642333984375, -0.0354461669921875, -0.03125, -0.0270538330078125, -0.022857666015625, -0.0186614990234375, -0.01446533203125, -0.0102691650390625, -0.006072998046875, -0.0018768310546875, 0.0023193359375, 0.0065155029296875, 0.010711669921875, 0.0149078369140625, 0.01910400390625, 0.0233001708984375, 0.027496337890625, 0.0316925048828125, 0.035888671875, 0.0400848388671875, 0.044281005859375, 0.0484771728515625, 0.05267333984375, 0.0568695068359375, 0.061065673828125, 0.0652618408203125, 0.0694580078125, 0.0736541748046875, 0.077850341796875, 0.0820465087890625, 0.08624267578125, 0.0904388427734375, 0.094635009765625, 0.0988311767578125, 0.10302734375, 0.1072235107421875, 0.111419677734375, 0.1156158447265625, 0.11981201171875, 0.1240081787109375, 0.128204345703125, 0.1324005126953125, 0.1365966796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 10.0, 4.0, 7.0, 18.0, 19.0, 14.0, 28.0, 19.0, 19.0, 27.0, 33.0, 35.0, 35.0, 34.0, 46.0, 41.0, 38.0, 38.0, 36.0, 1067.0, 34.0, 42.0, 37.0, 32.0, 39.0, 35.0, 31.0, 19.0, 27.0, 27.0, 21.0, 17.0, 15.0, 14.0, 9.0, 11.0, 11.0, 4.0, 8.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.853515625, -0.8255844116210938, -0.7976531982421875, -0.7697219848632812, -0.741790771484375, -0.7138595581054688, -0.6859283447265625, -0.6579971313476562, -0.63006591796875, -0.6021347045898438, -0.5742034912109375, -0.5462722778320312, -0.518341064453125, -0.49040985107421875, -0.4624786376953125, -0.43454742431640625, -0.4066162109375, -0.37868499755859375, -0.3507537841796875, -0.32282257080078125, -0.294891357421875, -0.26696014404296875, -0.2390289306640625, -0.21109771728515625, -0.18316650390625, -0.15523529052734375, -0.1273040771484375, -0.09937286376953125, -0.071441650390625, -0.04351043701171875, -0.0155792236328125, 0.01235198974609375, 0.040283203125, 0.06821441650390625, 0.0961456298828125, 0.12407684326171875, 0.152008056640625, 0.17993927001953125, 0.2078704833984375, 0.23580169677734375, 0.26373291015625, 0.29166412353515625, 0.3195953369140625, 0.34752655029296875, 0.375457763671875, 0.40338897705078125, 0.4313201904296875, 0.45925140380859375, 0.4871826171875, 0.5151138305664062, 0.5430450439453125, 0.5709762573242188, 0.598907470703125, 0.6268386840820312, 0.6547698974609375, 0.6827011108398438, 0.71063232421875, 0.7385635375976562, 0.7664947509765625, 0.7944259643554688, 0.822357177734375, 0.8502883911132812, 0.8782196044921875, 0.9061508178710938, 0.93408203125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 12.0, 7.0, 11.0, 18.0, 23.0, 57.0, 86.0, 115.0, 192.0, 275.0, 425.0, 592.0, 915.0, 1328.0, 1945.0, 2987.0, 4519.0, 6730.0, 10386.0, 15985.0, 24496.0, 37138.0, 55596.0, 83013.0, 117803.0, 384885.0, 967776.0, 122802.0, 85998.0, 58316.0, 38728.0, 25601.0, 16326.0, 11024.0, 7007.0, 4668.0, 3155.0, 2079.0, 1359.0, 893.0, 631.0, 431.0, 268.0, 190.0, 112.0, 74.0, 49.0, 40.0, 20.0, 15.0, 15.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-0.08612060546875, -0.0834341049194336, -0.08074760437011719, -0.07806110382080078, -0.07537460327148438, -0.07268810272216797, -0.07000160217285156, -0.06731510162353516, -0.06462860107421875, -0.061942100524902344, -0.05925559997558594, -0.05656909942626953, -0.053882598876953125, -0.05119609832763672, -0.04850959777832031, -0.045823097229003906, -0.0431365966796875, -0.040450096130371094, -0.03776359558105469, -0.03507709503173828, -0.032390594482421875, -0.02970409393310547, -0.027017593383789062, -0.024331092834472656, -0.02164459228515625, -0.018958091735839844, -0.016271591186523438, -0.013585090637207031, -0.010898590087890625, -0.008212089538574219, -0.0055255889892578125, -0.0028390884399414062, -0.000152587890625, 0.0025339126586914062, 0.0052204132080078125, 0.007906913757324219, 0.010593414306640625, 0.013279914855957031, 0.015966415405273438, 0.018652915954589844, 0.02133941650390625, 0.024025917053222656, 0.026712417602539062, 0.02939891815185547, 0.032085418701171875, 0.03477191925048828, 0.03745841979980469, 0.040144920349121094, 0.0428314208984375, 0.045517921447753906, 0.04820442199707031, 0.05089092254638672, 0.053577423095703125, 0.05626392364501953, 0.05895042419433594, 0.061636924743652344, 0.06432342529296875, 0.06700992584228516, 0.06969642639160156, 0.07238292694091797, 0.07506942749023438, 0.07775592803955078, 0.08044242858886719, 0.0831289291381836, 0.0858154296875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 2.0, 2.0, 8.0, 4.0, 3.0, 10.0, 9.0, 6.0, 16.0, 9.0, 9.0, 14.0, 10.0, 24.0, 23.0, 30.0, 39.0, 46.0, 39.0, 71.0, 44.0, 78.0, 70.0, 75.0, 56.0, 43.0, 37.0, 30.0, 18.0, 16.0, 22.0, 19.0, 16.0, 9.0, 11.0, 12.0, 14.0, 5.0, 6.0, 5.0, 5.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0017910003662109375, -0.0017289519309997559, -0.0016669034957885742, -0.0016048550605773926, -0.001542806625366211, -0.0014807581901550293, -0.0014187097549438477, -0.001356661319732666, -0.0012946128845214844, -0.0012325644493103027, -0.001170516014099121, -0.0011084675788879395, -0.0010464191436767578, -0.0009843707084655762, -0.0009223222732543945, -0.0008602738380432129, -0.0007982254028320312, -0.0007361769676208496, -0.000674128532409668, -0.0006120800971984863, -0.0005500316619873047, -0.00048798322677612305, -0.0004259347915649414, -0.00036388635635375977, -0.0003018379211425781, -0.00023978948593139648, -0.00017774105072021484, -0.0001156926155090332, -5.364418029785156e-05, 8.404254913330078e-06, 7.045269012451172e-05, 0.00013250112533569336, 0.000194549560546875, 0.00025659799575805664, 0.0003186464309692383, 0.0003806948661804199, 0.00044274330139160156, 0.0005047917366027832, 0.0005668401718139648, 0.0006288886070251465, 0.0006909370422363281, 0.0007529854774475098, 0.0008150339126586914, 0.000877082347869873, 0.0009391307830810547, 0.0010011792182922363, 0.001063227653503418, 0.0011252760887145996, 0.0011873245239257812, 0.0012493729591369629, 0.0013114213943481445, 0.0013734698295593262, 0.0014355182647705078, 0.0014975666999816895, 0.001559615135192871, 0.0016216635704040527, 0.0016837120056152344, 0.001745760440826416, 0.0018078088760375977, 0.0018698573112487793, 0.001931905746459961, 0.0019939541816711426, 0.0020560026168823242, 0.002118051052093506, 0.0021800994873046875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 10.0, 4.0, 6.0, 15.0, 12.0, 16.0, 21.0, 13.0, 15.0, 23.0, 24.0, 35.0, 40.0, 39.0, 39.0, 58.0, 74.0, 84.0, 113.0, 154.0, 220.0, 269.0, 639.0, 8303.0, 1029566.0, 6862.0, 621.0, 305.0, 187.0, 140.0, 95.0, 93.0, 65.0, 59.0, 56.0, 37.0, 50.0, 42.0, 17.0, 16.0, 11.0, 21.0, 25.0, 14.0, 10.0, 7.0, 4.0, 12.0, 8.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0], "bins": [-0.03857421875, -0.03742218017578125, -0.0362701416015625, -0.03511810302734375, -0.033966064453125, -0.03281402587890625, -0.0316619873046875, -0.03050994873046875, -0.02935791015625, -0.02820587158203125, -0.0270538330078125, -0.02590179443359375, -0.024749755859375, -0.02359771728515625, -0.0224456787109375, -0.02129364013671875, -0.0201416015625, -0.01898956298828125, -0.0178375244140625, -0.01668548583984375, -0.015533447265625, -0.01438140869140625, -0.0132293701171875, -0.01207733154296875, -0.01092529296875, -0.00977325439453125, -0.0086212158203125, -0.00746917724609375, -0.006317138671875, -0.00516510009765625, -0.0040130615234375, -0.00286102294921875, -0.001708984375, -0.00055694580078125, 0.0005950927734375, 0.00174713134765625, 0.002899169921875, 0.00405120849609375, 0.0052032470703125, 0.00635528564453125, 0.00750732421875, 0.00865936279296875, 0.0098114013671875, 0.01096343994140625, 0.012115478515625, 0.01326751708984375, 0.0144195556640625, 0.01557159423828125, 0.0167236328125, 0.01787567138671875, 0.0190277099609375, 0.02017974853515625, 0.021331787109375, 0.02248382568359375, 0.0236358642578125, 0.02478790283203125, 0.02593994140625, 0.02709197998046875, 0.0282440185546875, 0.02939605712890625, 0.030548095703125, 0.03170013427734375, 0.0328521728515625, 0.03400421142578125, 0.03515625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 975.0, 39.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035568419843912125, -0.03475503996014595, -0.033941660076379776, -0.0331282801926136, -0.03231490030884743, -0.03150152042508125, -0.03068814054131508, -0.029874760657548904, -0.02906138077378273, -0.028248000890016556, -0.02743462100625038, -0.026621241122484207, -0.025807861238718033, -0.02499448135495186, -0.024181101471185684, -0.02336772158741951, -0.022554343566298485, -0.02174096368253231, -0.020927583798766136, -0.020114203914999962, -0.019300824031233788, -0.018487444147467613, -0.017674066126346588, -0.016860686242580414, -0.01604730635881424, -0.015233926475048065, -0.014420546591281891, -0.013607166707515717, -0.012793786823749542, -0.011980406939983368, -0.011167027987539768, -0.010353648103773594, -0.009540269151329994, -0.00872688926756382, -0.007913509383797646, -0.0071001299656927586, -0.006286750081926584, -0.00547337019816041, -0.004659990780055523, -0.0038466108962893486, -0.0030332310125231743, -0.002219851128757, -0.0014064714778214693, -0.0005930918268859386, 0.00022028805688023567, 0.00103366794064641, 0.001847047358751297, 0.0026604272425174713, 0.0034738071262836456, 0.00428718701004982, 0.005100566893815994, 0.005913946311920881, 0.006727326195687056, 0.00754070607945323, 0.008354085497558117, 0.009167465381324291, 0.009980845265090466, 0.01079422514885664, 0.011607605032622814, 0.012420983985066414, 0.013234363868832588, 0.014047743752598763, 0.014861123636364937, 0.01567450352013111, 0.016487883403897285]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 10.0, 6.0, 19.0, 18.0, 25.0, 33.0, 39.0, 55.0, 47.0, 69.0, 66.0, 63.0, 73.0, 68.0, 70.0, 66.0, 40.0, 50.0, 46.0, 29.0, 37.0, 28.0, 16.0, 11.0, 9.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0030336976051330566, -0.002960260957479477, -0.002886824309825897, -0.0028133876621723175, -0.002739951014518738, -0.002666514366865158, -0.0025930777192115784, -0.0025196410715579987, -0.002446204423904419, -0.0023727677762508392, -0.0022993311285972595, -0.00222589448094368, -0.0021524578332901, -0.0020790211856365204, -0.0020055845379829407, -0.001932147890329361, -0.0018587112426757812, -0.0017852745950222015, -0.0017118379473686218, -0.0016384012997150421, -0.0015649646520614624, -0.0014915280044078827, -0.001418091356754303, -0.0013446547091007233, -0.0012712180614471436, -0.0011977814137935638, -0.0011243447661399841, -0.0010509081184864044, -0.0009774714708328247, -0.000904034823179245, -0.0008305981755256653, -0.0007571615278720856, -0.0006837248802185059, -0.0006102882325649261, -0.0005368515849113464, -0.0004634149372577667, -0.000389978289604187, -0.0003165416419506073, -0.0002431049942970276, -0.00016966834664344788, -9.623169898986816e-05, -2.2795051336288452e-05, 5.064159631729126e-05, 0.00012407824397087097, 0.00019751489162445068, 0.0002709515392780304, 0.0003443881869316101, 0.0004178248345851898, 0.0004912614822387695, 0.0005646981298923492, 0.000638134777545929, 0.0007115714251995087, 0.0007850080728530884, 0.0008584447205066681, 0.0009318813681602478, 0.0010053180158138275, 0.0010787546634674072, 0.001152191311120987, 0.0012256279587745667, 0.0012990646064281464, 0.001372501254081726, 0.0014459379017353058, 0.0015193745493888855, 0.0015928111970424652, 0.001666247844696045]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 3.0, 4.0, 7.0, 4.0, 13.0, 15.0, 7.0, 13.0, 23.0, 24.0, 27.0, 24.0, 32.0, 38.0, 45.0, 30.0, 27.0, 30.0, 42.0, 28.0, 50.0, 31.0, 50.0, 59.0, 36.0, 36.0, 41.0, 23.0, 34.0, 25.0, 25.0, 24.0, 25.0, 18.0, 21.0, 12.0, 11.0, 12.0, 13.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2374725341796875, -1.194671630859375, -1.1518707275390625, -1.10906982421875, -1.0662689208984375, -1.023468017578125, -0.9806671142578125, -0.9378662109375, -0.8950653076171875, -0.852264404296875, -0.8094635009765625, -0.76666259765625, -0.7238616943359375, -0.681060791015625, -0.6382598876953125, -0.595458984375, -0.5526580810546875, -0.509857177734375, -0.4670562744140625, -0.42425537109375, -0.3814544677734375, -0.338653564453125, -0.2958526611328125, -0.2530517578125, -0.2102508544921875, -0.167449951171875, -0.1246490478515625, -0.08184814453125, -0.0390472412109375, 0.003753662109375, 0.0465545654296875, 0.08935546875, 0.1321563720703125, 0.174957275390625, 0.2177581787109375, 0.26055908203125, 0.3033599853515625, 0.346160888671875, 0.3889617919921875, 0.4317626953125, 0.4745635986328125, 0.517364501953125, 0.5601654052734375, 0.60296630859375, 0.6457672119140625, 0.688568115234375, 0.7313690185546875, 0.774169921875, 0.8169708251953125, 0.859771728515625, 0.9025726318359375, 0.94537353515625, 0.9881744384765625, 1.030975341796875, 1.0737762451171875, 1.1165771484375, 1.1593780517578125, 1.202178955078125, 1.2449798583984375, 1.28778076171875, 1.3305816650390625, 1.373382568359375, 1.4161834716796875, 1.458984375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 10.0, 7.0, 12.0, 24.0, 27.0, 30.0, 50.0, 67.0, 88.0, 122.0, 178.0, 252.0, 394.0, 512.0, 732.0, 1014.0, 1403.0, 2021.0, 3081.0, 4473.0, 7115.0, 12091.0, 23005.0, 56048.0, 176401.0, 415922.0, 214602.0, 66111.0, 26219.0, 13281.0, 7815.0, 4876.0, 3190.0, 2130.0, 1538.0, 1099.0, 725.0, 567.0, 398.0, 250.0, 194.0, 132.0, 122.0, 86.0, 48.0, 38.0, 28.0, 15.0, 8.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.20806884765625, -3.0958251953125, -2.98358154296875, -2.871337890625, -2.75909423828125, -2.6468505859375, -2.53460693359375, -2.42236328125, -2.31011962890625, -2.1978759765625, -2.08563232421875, -1.973388671875, -1.86114501953125, -1.7489013671875, -1.63665771484375, -1.5244140625, -1.41217041015625, -1.2999267578125, -1.18768310546875, -1.075439453125, -0.96319580078125, -0.8509521484375, -0.73870849609375, -0.62646484375, -0.51422119140625, -0.4019775390625, -0.28973388671875, -0.177490234375, -0.06524658203125, 0.0469970703125, 0.15924072265625, 0.271484375, 0.38372802734375, 0.4959716796875, 0.60821533203125, 0.720458984375, 0.83270263671875, 0.9449462890625, 1.05718994140625, 1.16943359375, 1.28167724609375, 1.3939208984375, 1.50616455078125, 1.618408203125, 1.73065185546875, 1.8428955078125, 1.95513916015625, 2.0673828125, 2.17962646484375, 2.2918701171875, 2.40411376953125, 2.516357421875, 2.62860107421875, 2.7408447265625, 2.85308837890625, 2.96533203125, 3.07757568359375, 3.1898193359375, 3.30206298828125, 3.414306640625, 3.52655029296875, 3.6387939453125, 3.75103759765625, 3.86328125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 5.0, 10.0, 8.0, 6.0, 16.0, 16.0, 18.0, 28.0, 35.0, 34.0, 32.0, 39.0, 52.0, 60.0, 54.0, 90.0, 130.0, 188.0, 1297.0, 214.0, 137.0, 107.0, 68.0, 59.0, 51.0, 42.0, 28.0, 27.0, 29.0, 26.0, 23.0, 19.0, 10.0, 23.0, 10.0, 9.0, 2.0, 7.0, 5.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.6846923828125, -3.560791015625, -3.4368896484375, -3.31298828125, -3.1890869140625, -3.065185546875, -2.9412841796875, -2.8173828125, -2.6934814453125, -2.569580078125, -2.4456787109375, -2.32177734375, -2.1978759765625, -2.073974609375, -1.9500732421875, -1.826171875, -1.7022705078125, -1.578369140625, -1.4544677734375, -1.33056640625, -1.2066650390625, -1.082763671875, -0.9588623046875, -0.8349609375, -0.7110595703125, -0.587158203125, -0.4632568359375, -0.33935546875, -0.2154541015625, -0.091552734375, 0.0323486328125, 0.15625, 0.2801513671875, 0.404052734375, 0.5279541015625, 0.65185546875, 0.7757568359375, 0.899658203125, 1.0235595703125, 1.1474609375, 1.2713623046875, 1.395263671875, 1.5191650390625, 1.64306640625, 1.7669677734375, 1.890869140625, 2.0147705078125, 2.138671875, 2.2625732421875, 2.386474609375, 2.5103759765625, 2.63427734375, 2.7581787109375, 2.882080078125, 3.0059814453125, 3.1298828125, 3.2537841796875, 3.377685546875, 3.5015869140625, 3.62548828125, 3.7493896484375, 3.873291015625, 3.9971923828125, 4.12109375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 6.0, 9.0, 8.0, 10.0, 19.0, 14.0, 19.0, 23.0, 25.0, 32.0, 27.0, 48.0, 69.0, 111.0, 269.0, 692.0, 2343.0, 55197.0, 3047795.0, 35702.0, 1959.0, 612.0, 242.0, 121.0, 67.0, 52.0, 40.0, 28.0, 24.0, 25.0, 20.0, 21.0, 10.0, 10.0, 9.0, 6.0, 11.0, 2.0, 5.0, 1.0, 0.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-17.53125, -17.036865234375, -16.54248046875, -16.048095703125, -15.5537109375, -15.059326171875, -14.56494140625, -14.070556640625, -13.576171875, -13.081787109375, -12.58740234375, -12.093017578125, -11.5986328125, -11.104248046875, -10.60986328125, -10.115478515625, -9.62109375, -9.126708984375, -8.63232421875, -8.137939453125, -7.6435546875, -7.149169921875, -6.65478515625, -6.160400390625, -5.666015625, -5.171630859375, -4.67724609375, -4.182861328125, -3.6884765625, -3.194091796875, -2.69970703125, -2.205322265625, -1.7109375, -1.216552734375, -0.72216796875, -0.227783203125, 0.2666015625, 0.760986328125, 1.25537109375, 1.749755859375, 2.244140625, 2.738525390625, 3.23291015625, 3.727294921875, 4.2216796875, 4.716064453125, 5.21044921875, 5.704833984375, 6.19921875, 6.693603515625, 7.18798828125, 7.682373046875, 8.1767578125, 8.671142578125, 9.16552734375, 9.659912109375, 10.154296875, 10.648681640625, 11.14306640625, 11.637451171875, 12.1318359375, 12.626220703125, 13.12060546875, 13.614990234375, 14.109375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 31.0, 564.0, 406.0, 9.0, 0.0, 1.0], "bins": [-97.55330657958984, -95.92345428466797, -94.29360961914062, -92.66375732421875, -91.03390502929688, -89.404052734375, -87.77420806884766, -86.14435577392578, -84.5145034790039, -82.88465118408203, -81.25480651855469, -79.62495422363281, -77.99510192871094, -76.36524963378906, -74.73540496826172, -73.10555267333984, -71.4757080078125, -69.84585571289062, -68.21601104736328, -66.5861587524414, -64.95630645751953, -63.32645797729492, -61.69660949707031, -60.06675720214844, -58.43690490722656, -56.80705642700195, -55.17720413208008, -53.54735565185547, -51.917503356933594, -50.287654876708984, -48.657806396484375, -47.0279541015625, -45.39810562133789, -43.76825714111328, -42.138404846191406, -40.5085563659668, -38.87870407104492, -37.24885559082031, -35.61900329589844, -33.98915481567383, -32.35930633544922, -30.729455947875977, -29.099605560302734, -27.469757080078125, -25.839906692504883, -24.21005630493164, -22.5802059173584, -20.950355529785156, -19.32050323486328, -17.69065284729004, -16.060802459716797, -14.430953025817871, -12.801103591918945, -11.171253204345703, -9.541402816772461, -7.911553382873535, -6.281703948974609, -4.651854038238525, -3.0220038890838623, -1.3921537399291992, 0.23769617080688477, 1.8675460815429688, 3.497396469116211, 5.127245903015137, 6.757096290588379]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 14.0, 9.0, 5.0, 8.0, 9.0, 12.0, 11.0, 12.0, 18.0, 12.0, 27.0, 35.0, 24.0, 28.0, 33.0, 44.0, 40.0, 37.0, 39.0, 32.0, 55.0, 41.0, 36.0, 41.0, 31.0, 40.0, 29.0, 29.0, 36.0, 26.0, 21.0, 32.0, 22.0, 25.0, 19.0, 9.0, 11.0, 9.0, 10.0, 3.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.687631607055664, -12.281689643859863, -11.875746726989746, -11.469804763793945, -11.063861846923828, -10.657919883728027, -10.251977920532227, -9.84603500366211, -9.440092086791992, -9.034150123596191, -8.628207206726074, -8.222265243530273, -7.816322326660156, -7.4103803634643555, -7.0044379234313965, -6.5984954833984375, -6.192553520202637, -5.786611080169678, -5.380668640136719, -4.974726676940918, -4.568783760070801, -4.162841796875, -3.756899356842041, -3.350956916809082, -2.945014476776123, -2.539072036743164, -2.133129596710205, -1.7271873950958252, -1.3212449550628662, -0.9153025150299072, -0.5093603134155273, -0.10341787338256836, 0.3025245666503906, 0.7084669470787048, 1.114409327507019, 1.5203516483306885, 1.9262940883636475, 2.3322365283966064, 2.7381787300109863, 3.1441211700439453, 3.5500636100769043, 3.9560060501098633, 4.361948490142822, 4.767890930175781, 5.173832893371582, 5.579775810241699, 5.9857177734375, 6.391660213470459, 6.797602653503418, 7.203545093536377, 7.609487533569336, 8.015429496765137, 8.421372413635254, 8.827314376831055, 9.233257293701172, 9.639199256896973, 10.045141220092773, 10.451083183288574, 10.857026100158691, 11.262968063354492, 11.66891098022461, 12.07485294342041, 12.480794906616211, 12.886737823486328, 13.292680740356445]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 6.0, 5.0, 8.0, 13.0, 10.0, 15.0, 9.0, 12.0, 22.0, 28.0, 23.0, 26.0, 30.0, 37.0, 36.0, 24.0, 33.0, 40.0, 23.0, 41.0, 30.0, 46.0, 42.0, 48.0, 47.0, 27.0, 36.0, 30.0, 29.0, 26.0, 21.0, 27.0, 24.0, 21.0, 19.0, 9.0, 13.0, 12.0, 13.0, 8.0, 10.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.281524658203125, -1.23883056640625, -1.196136474609375, -1.1534423828125, -1.110748291015625, -1.06805419921875, -1.025360107421875, -0.982666015625, -0.939971923828125, -0.89727783203125, -0.854583740234375, -0.8118896484375, -0.769195556640625, -0.72650146484375, -0.683807373046875, -0.64111328125, -0.598419189453125, -0.55572509765625, -0.513031005859375, -0.4703369140625, -0.427642822265625, -0.38494873046875, -0.342254638671875, -0.299560546875, -0.256866455078125, -0.21417236328125, -0.171478271484375, -0.1287841796875, -0.086090087890625, -0.04339599609375, -0.000701904296875, 0.0419921875, 0.084686279296875, 0.12738037109375, 0.170074462890625, 0.2127685546875, 0.255462646484375, 0.29815673828125, 0.340850830078125, 0.383544921875, 0.426239013671875, 0.46893310546875, 0.511627197265625, 0.5543212890625, 0.597015380859375, 0.63970947265625, 0.682403564453125, 0.72509765625, 0.767791748046875, 0.81048583984375, 0.853179931640625, 0.8958740234375, 0.938568115234375, 0.98126220703125, 1.023956298828125, 1.066650390625, 1.109344482421875, 1.15203857421875, 1.194732666015625, 1.2374267578125, 1.280120849609375, 1.32281494140625, 1.365509033203125, 1.408203125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 13.0, 8.0, 11.0, 20.0, 25.0, 38.0, 36.0, 63.0, 75.0, 111.0, 148.0, 219.0, 353.0, 518.0, 949.0, 2206.0, 6326.0, 24251.0, 130270.0, 1386823.0, 2361295.0, 230112.0, 36187.0, 8553.0, 2788.0, 1133.0, 590.0, 347.0, 218.0, 161.0, 123.0, 76.0, 67.0, 40.0, 23.0, 23.0, 24.0, 14.0, 8.0, 9.0, 10.0, 3.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2734375, -6.08966064453125, -5.9058837890625, -5.72210693359375, -5.538330078125, -5.35455322265625, -5.1707763671875, -4.98699951171875, -4.80322265625, -4.61944580078125, -4.4356689453125, -4.25189208984375, -4.068115234375, -3.88433837890625, -3.7005615234375, -3.51678466796875, -3.3330078125, -3.14923095703125, -2.9654541015625, -2.78167724609375, -2.597900390625, -2.41412353515625, -2.2303466796875, -2.04656982421875, -1.86279296875, -1.67901611328125, -1.4952392578125, -1.31146240234375, -1.127685546875, -0.94390869140625, -0.7601318359375, -0.57635498046875, -0.392578125, -0.20880126953125, -0.0250244140625, 0.15875244140625, 0.342529296875, 0.52630615234375, 0.7100830078125, 0.89385986328125, 1.07763671875, 1.26141357421875, 1.4451904296875, 1.62896728515625, 1.812744140625, 1.99652099609375, 2.1802978515625, 2.36407470703125, 2.5478515625, 2.73162841796875, 2.9154052734375, 3.09918212890625, 3.282958984375, 3.46673583984375, 3.6505126953125, 3.83428955078125, 4.01806640625, 4.20184326171875, 4.3856201171875, 4.56939697265625, 4.753173828125, 4.93695068359375, 5.1207275390625, 5.30450439453125, 5.48828125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 17.0, 26.0, 46.0, 73.0, 103.0, 208.0, 328.0, 599.0, 808.0, 717.0, 473.0, 259.0, 162.0, 94.0, 61.0, 40.0, 21.0, 16.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.6328125, -11.3543701171875, -11.075927734375, -10.7974853515625, -10.51904296875, -10.2406005859375, -9.962158203125, -9.6837158203125, -9.4052734375, -9.1268310546875, -8.848388671875, -8.5699462890625, -8.29150390625, -8.0130615234375, -7.734619140625, -7.4561767578125, -7.177734375, -6.8992919921875, -6.620849609375, -6.3424072265625, -6.06396484375, -5.7855224609375, -5.507080078125, -5.2286376953125, -4.9501953125, -4.6717529296875, -4.393310546875, -4.1148681640625, -3.83642578125, -3.5579833984375, -3.279541015625, -3.0010986328125, -2.72265625, -2.4442138671875, -2.165771484375, -1.8873291015625, -1.60888671875, -1.3304443359375, -1.052001953125, -0.7735595703125, -0.4951171875, -0.2166748046875, 0.061767578125, 0.3402099609375, 0.61865234375, 0.8970947265625, 1.175537109375, 1.4539794921875, 1.732421875, 2.0108642578125, 2.289306640625, 2.5677490234375, 2.84619140625, 3.1246337890625, 3.403076171875, 3.6815185546875, 3.9599609375, 4.2384033203125, 4.516845703125, 4.7952880859375, 5.07373046875, 5.3521728515625, 5.630615234375, 5.9090576171875, 6.1875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 10.0, 21.0, 20.0, 19.0, 41.0, 52.0, 72.0, 148.0, 208.0, 397.0, 724.0, 1564.0, 5098.0, 43986.0, 1423298.0, 2628709.0, 79317.0, 6811.0, 1908.0, 755.0, 457.0, 224.0, 142.0, 91.0, 67.0, 45.0, 33.0, 18.0, 14.0, 9.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.8671875, -13.4212646484375, -12.975341796875, -12.5294189453125, -12.08349609375, -11.6375732421875, -11.191650390625, -10.7457275390625, -10.2998046875, -9.8538818359375, -9.407958984375, -8.9620361328125, -8.51611328125, -8.0701904296875, -7.624267578125, -7.1783447265625, -6.732421875, -6.2864990234375, -5.840576171875, -5.3946533203125, -4.94873046875, -4.5028076171875, -4.056884765625, -3.6109619140625, -3.1650390625, -2.7191162109375, -2.273193359375, -1.8272705078125, -1.38134765625, -0.9354248046875, -0.489501953125, -0.0435791015625, 0.40234375, 0.8482666015625, 1.294189453125, 1.7401123046875, 2.18603515625, 2.6319580078125, 3.077880859375, 3.5238037109375, 3.9697265625, 4.4156494140625, 4.861572265625, 5.3074951171875, 5.75341796875, 6.1993408203125, 6.645263671875, 7.0911865234375, 7.537109375, 7.9830322265625, 8.428955078125, 8.8748779296875, 9.32080078125, 9.7667236328125, 10.212646484375, 10.6585693359375, 11.1044921875, 11.5504150390625, 11.996337890625, 12.4422607421875, 12.88818359375, 13.3341064453125, 13.780029296875, 14.2259521484375, 14.671875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 12.0, 52.0, 146.0, 293.0, 260.0, 169.0, 66.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.969112396240234, -52.470314025878906, -50.971519470214844, -49.472721099853516, -47.97392654418945, -46.475128173828125, -44.97633361816406, -43.477535247802734, -41.978736877441406, -40.47993850708008, -38.981143951416016, -37.48234558105469, -35.983551025390625, -34.4847526550293, -32.98595428466797, -31.487159729003906, -29.98836326599121, -28.489566802978516, -26.99077033996582, -25.491973876953125, -23.993175506591797, -22.4943790435791, -20.995582580566406, -19.496784210205078, -17.997989654541016, -16.49919319152832, -15.000395774841309, -13.501599311828613, -12.002801895141602, -10.504005432128906, -9.005208969116211, -7.506411552429199, -6.0076141357421875, -4.508817195892334, -3.0100204944610596, -1.5112237930297852, -0.01242685317993164, 1.4863700866699219, 2.985166549682617, 4.483963966369629, 5.982760429382324, 7.481557369232178, 8.980354309082031, 10.479150772094727, 11.977947235107422, 13.476744651794434, 14.975541114807129, 16.47433853149414, 17.973134994506836, 19.47193145751953, 20.970727920532227, 22.469524383544922, 23.96832275390625, 25.467119216918945, 26.96591567993164, 28.46471405029297, 29.96350860595703, 31.462305068969727, 32.96110153198242, 34.45989990234375, 35.95869445800781, 37.45749282836914, 38.95629119873047, 40.45508575439453, 41.95388412475586]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 7.0, 9.0, 13.0, 13.0, 12.0, 17.0, 25.0, 13.0, 19.0, 31.0, 21.0, 34.0, 24.0, 29.0, 30.0, 32.0, 41.0, 38.0, 51.0, 23.0, 45.0, 36.0, 46.0, 32.0, 46.0, 32.0, 29.0, 41.0, 29.0, 20.0, 24.0, 17.0, 20.0, 16.0, 16.0, 7.0, 12.0, 10.0, 6.0, 6.0, 8.0, 4.0, 1.0, 5.0, 6.0, 1.0, 2.0, 1.0], "bins": [-17.54867935180664, -17.057861328125, -16.56704330444336, -16.07622528076172, -15.585408210754395, -15.09459114074707, -14.60377311706543, -14.112955093383789, -13.622137069702148, -13.131319046020508, -12.640501976013184, -12.149683952331543, -11.658865928649902, -11.168048858642578, -10.677230834960938, -10.186412811279297, -9.695595741271973, -9.204777717590332, -8.713960647583008, -8.223142623901367, -7.732324600219727, -7.241507053375244, -6.750689506530762, -6.259871482849121, -5.769053936004639, -5.278236389160156, -4.787418365478516, -4.296600818634033, -3.8057830333709717, -3.31496524810791, -2.8241477012634277, -2.333329916000366, -1.8425121307373047, -1.3516943454742432, -0.8608766794204712, -0.3700590133666992, 0.1207587718963623, 0.6115765571594238, 1.1023941040039062, 1.5932118892669678, 2.0840296745300293, 2.574847459793091, 3.0656652450561523, 3.5564827919006348, 4.047300338745117, 4.538118362426758, 5.02893590927124, 5.519753456115723, 6.010571479797363, 6.501389026641846, 6.992207050323486, 7.483024597167969, 7.973842620849609, 8.46466064453125, 8.955477714538574, 9.446295738220215, 9.937112808227539, 10.42793083190918, 10.918747901916504, 11.409565925598145, 11.900383949279785, 12.39120101928711, 12.88201904296875, 13.37283706665039, 13.863655090332031]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 10.0, 7.0, 12.0, 10.0, 16.0, 21.0, 20.0, 24.0, 28.0, 24.0, 27.0, 43.0, 27.0, 36.0, 36.0, 31.0, 48.0, 34.0, 52.0, 44.0, 41.0, 37.0, 43.0, 35.0, 33.0, 30.0, 25.0, 18.0, 18.0, 24.0, 22.0, 23.0, 13.0, 17.0, 9.0, 8.0, 11.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.24969482421875, -1.2054443359375, -1.16119384765625, -1.116943359375, -1.07269287109375, -1.0284423828125, -0.98419189453125, -0.93994140625, -0.89569091796875, -0.8514404296875, -0.80718994140625, -0.762939453125, -0.71868896484375, -0.6744384765625, -0.63018798828125, -0.5859375, -0.54168701171875, -0.4974365234375, -0.45318603515625, -0.408935546875, -0.36468505859375, -0.3204345703125, -0.27618408203125, -0.23193359375, -0.18768310546875, -0.1434326171875, -0.09918212890625, -0.054931640625, -0.01068115234375, 0.0335693359375, 0.07781982421875, 0.1220703125, 0.16632080078125, 0.2105712890625, 0.25482177734375, 0.299072265625, 0.34332275390625, 0.3875732421875, 0.43182373046875, 0.47607421875, 0.52032470703125, 0.5645751953125, 0.60882568359375, 0.653076171875, 0.69732666015625, 0.7415771484375, 0.78582763671875, 0.830078125, 0.87432861328125, 0.9185791015625, 0.96282958984375, 1.007080078125, 1.05133056640625, 1.0955810546875, 1.13983154296875, 1.18408203125, 1.22833251953125, 1.2725830078125, 1.31683349609375, 1.361083984375, 1.40533447265625, 1.4495849609375, 1.49383544921875, 1.5380859375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 1.0, 2.0, 7.0, 9.0, 13.0, 27.0, 27.0, 40.0, 47.0, 68.0, 143.0, 146.0, 207.0, 374.0, 504.0, 716.0, 1049.0, 1474.0, 2217.0, 3233.0, 4704.0, 6934.0, 10458.0, 15503.0, 24281.0, 37826.0, 60425.0, 95854.0, 143698.0, 188373.0, 156106.0, 105713.0, 66819.0, 42024.0, 26817.0, 17351.0, 11506.0, 7581.0, 5109.0, 3415.0, 2406.0, 1661.0, 1151.0, 790.0, 529.0, 345.0, 272.0, 196.0, 137.0, 78.0, 56.0, 48.0, 28.0, 26.0, 10.0, 12.0, 6.0, 6.0, 2.0, 4.0, 4.0], "bins": [-0.1363525390625, -0.132171630859375, -0.12799072265625, -0.123809814453125, -0.11962890625, -0.115447998046875, -0.11126708984375, -0.107086181640625, -0.1029052734375, -0.098724365234375, -0.09454345703125, -0.090362548828125, -0.086181640625, -0.082000732421875, -0.07781982421875, -0.073638916015625, -0.0694580078125, -0.065277099609375, -0.06109619140625, -0.056915283203125, -0.052734375, -0.048553466796875, -0.04437255859375, -0.040191650390625, -0.0360107421875, -0.031829833984375, -0.02764892578125, -0.023468017578125, -0.019287109375, -0.015106201171875, -0.01092529296875, -0.006744384765625, -0.0025634765625, 0.001617431640625, 0.00579833984375, 0.009979248046875, 0.01416015625, 0.018341064453125, 0.02252197265625, 0.026702880859375, 0.0308837890625, 0.035064697265625, 0.03924560546875, 0.043426513671875, 0.047607421875, 0.051788330078125, 0.05596923828125, 0.060150146484375, 0.0643310546875, 0.068511962890625, 0.07269287109375, 0.076873779296875, 0.0810546875, 0.085235595703125, 0.08941650390625, 0.093597412109375, 0.0977783203125, 0.101959228515625, 0.10614013671875, 0.110321044921875, 0.114501953125, 0.118682861328125, 0.12286376953125, 0.127044677734375, 0.1312255859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 5.0, 8.0, 8.0, 8.0, 5.0, 14.0, 16.0, 8.0, 20.0, 20.0, 22.0, 21.0, 35.0, 35.0, 34.0, 49.0, 27.0, 32.0, 30.0, 36.0, 34.0, 1060.0, 36.0, 39.0, 44.0, 35.0, 20.0, 38.0, 34.0, 24.0, 25.0, 24.0, 24.0, 22.0, 23.0, 14.0, 15.0, 12.0, 9.0, 11.0, 14.0, 5.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.87060546875, -0.8441162109375, -0.817626953125, -0.7911376953125, -0.7646484375, -0.7381591796875, -0.711669921875, -0.6851806640625, -0.65869140625, -0.6322021484375, -0.605712890625, -0.5792236328125, -0.552734375, -0.5262451171875, -0.499755859375, -0.4732666015625, -0.44677734375, -0.4202880859375, -0.393798828125, -0.3673095703125, -0.3408203125, -0.3143310546875, -0.287841796875, -0.2613525390625, -0.23486328125, -0.2083740234375, -0.181884765625, -0.1553955078125, -0.12890625, -0.1024169921875, -0.075927734375, -0.0494384765625, -0.02294921875, 0.0035400390625, 0.030029296875, 0.0565185546875, 0.0830078125, 0.1094970703125, 0.135986328125, 0.1624755859375, 0.18896484375, 0.2154541015625, 0.241943359375, 0.2684326171875, 0.294921875, 0.3214111328125, 0.347900390625, 0.3743896484375, 0.40087890625, 0.4273681640625, 0.453857421875, 0.4803466796875, 0.5068359375, 0.5333251953125, 0.559814453125, 0.5863037109375, 0.61279296875, 0.6392822265625, 0.665771484375, 0.6922607421875, 0.71875, 0.7452392578125, 0.771728515625, 0.7982177734375, 0.82470703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 5.0, 14.0, 12.0, 16.0, 30.0, 45.0, 69.0, 109.0, 140.0, 238.0, 333.0, 491.0, 700.0, 1079.0, 1672.0, 2328.0, 3594.0, 5436.0, 8056.0, 12188.0, 18467.0, 27712.0, 41645.0, 62317.0, 91831.0, 127587.0, 1164733.0, 179094.0, 111715.0, 77961.0, 52939.0, 34688.0, 23624.0, 15489.0, 10287.0, 6712.0, 4539.0, 3035.0, 2013.0, 1343.0, 927.0, 614.0, 436.0, 298.0, 195.0, 138.0, 82.0, 59.0, 29.0, 20.0, 28.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08331298828125, -0.08060646057128906, -0.07789993286132812, -0.07519340515136719, -0.07248687744140625, -0.06978034973144531, -0.06707382202148438, -0.06436729431152344, -0.0616607666015625, -0.05895423889160156, -0.056247711181640625, -0.05354118347167969, -0.05083465576171875, -0.04812812805175781, -0.045421600341796875, -0.04271507263183594, -0.040008544921875, -0.03730201721191406, -0.034595489501953125, -0.03188896179199219, -0.02918243408203125, -0.026475906372070312, -0.023769378662109375, -0.021062850952148438, -0.0183563232421875, -0.015649795532226562, -0.012943267822265625, -0.010236740112304688, -0.00753021240234375, -0.0048236846923828125, -0.002117156982421875, 0.0005893707275390625, 0.0032958984375, 0.0060024261474609375, 0.008708953857421875, 0.011415481567382812, 0.01412200927734375, 0.016828536987304688, 0.019535064697265625, 0.022241592407226562, 0.0249481201171875, 0.027654647827148438, 0.030361175537109375, 0.03306770324707031, 0.03577423095703125, 0.03848075866699219, 0.041187286376953125, 0.04389381408691406, 0.046600341796875, 0.04930686950683594, 0.052013397216796875, 0.05471992492675781, 0.05742645263671875, 0.06013298034667969, 0.06283950805664062, 0.06554603576660156, 0.0682525634765625, 0.07095909118652344, 0.07366561889648438, 0.07637214660644531, 0.07907867431640625, 0.08178520202636719, 0.08449172973632812, 0.08719825744628906, 0.08990478515625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 3.0, 6.0, 2.0, 14.0, 10.0, 13.0, 17.0, 21.0, 19.0, 47.0, 53.0, 70.0, 55.0, 71.0, 100.0, 82.0, 82.0, 48.0, 61.0, 42.0, 40.0, 35.0, 20.0, 9.0, 14.0, 11.0, 13.0, 9.0, 8.0, 8.0, 9.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0033817291259765625, -0.0032904446125030518, -0.003199160099029541, -0.0031078755855560303, -0.0030165910720825195, -0.002925306558609009, -0.002834022045135498, -0.0027427375316619873, -0.0026514530181884766, -0.002560168504714966, -0.002468883991241455, -0.0023775994777679443, -0.0022863149642944336, -0.002195030450820923, -0.002103745937347412, -0.0020124614238739014, -0.0019211769104003906, -0.0018298923969268799, -0.0017386078834533691, -0.0016473233699798584, -0.0015560388565063477, -0.001464754343032837, -0.0013734698295593262, -0.0012821853160858154, -0.0011909008026123047, -0.001099616289138794, -0.0010083317756652832, -0.0009170472621917725, -0.0008257627487182617, -0.000734478235244751, -0.0006431937217712402, -0.0005519092082977295, -0.00046062469482421875, -0.000369340181350708, -0.00027805566787719727, -0.00018677115440368652, -9.548664093017578e-05, -4.202127456665039e-06, 8.70823860168457e-05, 0.00017836689949035645, 0.0002696514129638672, 0.00036093592643737793, 0.00045222043991088867, 0.0005435049533843994, 0.0006347894668579102, 0.0007260739803314209, 0.0008173584938049316, 0.0009086430072784424, 0.0009999275207519531, 0.0010912120342254639, 0.0011824965476989746, 0.0012737810611724854, 0.001365065574645996, 0.0014563500881195068, 0.0015476346015930176, 0.0016389191150665283, 0.001730203628540039, 0.0018214881420135498, 0.0019127726554870605, 0.0020040571689605713, 0.002095341682434082, 0.0021866261959075928, 0.0022779107093811035, 0.0023691952228546143, 0.002460479736328125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 8.0, 23.0, 18.0, 20.0, 28.0, 39.0, 54.0, 62.0, 98.0, 160.0, 217.0, 354.0, 639.0, 14074.0, 1025454.0, 5693.0, 548.0, 294.0, 220.0, 148.0, 85.0, 69.0, 43.0, 38.0, 24.0, 41.0, 19.0, 27.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05126953125, -0.049637794494628906, -0.04800605773925781, -0.04637432098388672, -0.044742584228515625, -0.04311084747314453, -0.04147911071777344, -0.039847373962402344, -0.03821563720703125, -0.036583900451660156, -0.03495216369628906, -0.03332042694091797, -0.031688690185546875, -0.03005695343017578, -0.028425216674804688, -0.026793479919433594, -0.0251617431640625, -0.023530006408691406, -0.021898269653320312, -0.02026653289794922, -0.018634796142578125, -0.01700305938720703, -0.015371322631835938, -0.013739585876464844, -0.01210784912109375, -0.010476112365722656, -0.008844375610351562, -0.007212638854980469, -0.005580902099609375, -0.003949165344238281, -0.0023174285888671875, -0.0006856918334960938, 0.000946044921875, 0.0025777816772460938, 0.0042095184326171875, 0.005841255187988281, 0.007472991943359375, 0.009104728698730469, 0.010736465454101562, 0.012368202209472656, 0.01399993896484375, 0.015631675720214844, 0.017263412475585938, 0.01889514923095703, 0.020526885986328125, 0.02215862274169922, 0.023790359497070312, 0.025422096252441406, 0.0270538330078125, 0.028685569763183594, 0.030317306518554688, 0.03194904327392578, 0.033580780029296875, 0.03521251678466797, 0.03684425354003906, 0.038475990295410156, 0.04010772705078125, 0.041739463806152344, 0.04337120056152344, 0.04500293731689453, 0.046634674072265625, 0.04826641082763672, 0.04989814758300781, 0.051529884338378906, 0.05316162109375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 748.0, 266.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05945118889212608, -0.05809766799211502, -0.05674414709210396, -0.055390626192092896, -0.05403710529208183, -0.05268358439207077, -0.051330067217350006, -0.049976546317338943, -0.04862302541732788, -0.04726950451731682, -0.045915983617305756, -0.04456246271729469, -0.04320894181728363, -0.041855424642562866, -0.040501900017261505, -0.03914838284254074, -0.03779485821723938, -0.03644133731722832, -0.035087816417217255, -0.03373429551720619, -0.03238077461719513, -0.031027255579829216, -0.029673734679818153, -0.02832021564245224, -0.026966694742441177, -0.025613173842430115, -0.024259652942419052, -0.02290613204240799, -0.021552613005042076, -0.020199092105031013, -0.01884557120501995, -0.017492052167654037, -0.016138533130288124, -0.014785012230277061, -0.013431492261588573, -0.01207797136157751, -0.010724451392889023, -0.00937093049287796, -0.008017409592866898, -0.00666388962417841, -0.005310368724167347, -0.003956848289817572, -0.0026033276226371527, -0.0012498069554567337, 0.00010371347889304161, 0.001457233913242817, 0.0028107548132538795, 0.0041642747819423676, 0.00551779568195343, 0.0068713161163032055, 0.00822483655065298, 0.009578357450664043, 0.010931877419352531, 0.012285398319363594, 0.013638919219374657, 0.014992439188063145, 0.016345959156751633, 0.017699480056762695, 0.019053000956773758, 0.02040652185678482, 0.021760040894150734, 0.023113561794161797, 0.02446708269417286, 0.025820601731538773, 0.027174124494194984]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 13.0, 22.0, 27.0, 47.0, 38.0, 77.0, 68.0, 77.0, 90.0, 99.0, 91.0, 65.0, 71.0, 50.0, 51.0, 37.0, 29.0, 22.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004184544086456299, -0.004071698524057865, -0.0039588529616594315, -0.0038460073992609978, -0.003733161836862564, -0.0036203162744641304, -0.0035074707120656967, -0.003394625149667263, -0.0032817795872688293, -0.0031689340248703957, -0.003056088462471962, -0.0029432429000735283, -0.0028303973376750946, -0.002717551775276661, -0.0026047062128782272, -0.0024918606504797935, -0.00237901508808136, -0.002266169525682926, -0.0021533239632844925, -0.002040478400886059, -0.0019276328384876251, -0.0018147872760891914, -0.0017019417136907578, -0.001589096151292324, -0.0014762505888938904, -0.0013634050264954567, -0.001250559464097023, -0.0011377139016985893, -0.0010248683393001556, -0.000912022776901722, -0.0007991772145032883, -0.0006863316521048546, -0.0005734860897064209, -0.0004606405273079872, -0.00034779496490955353, -0.00023494940251111984, -0.00012210384011268616, -9.258277714252472e-06, 0.00010358728468418121, 0.0002164328470826149, 0.0003292784094810486, 0.00044212397187948227, 0.000554969534277916, 0.0006678150966763496, 0.0007806606590747833, 0.000893506221473217, 0.0010063517838716507, 0.0011191973462700844, 0.001232042908668518, 0.0013448884710669518, 0.0014577340334653854, 0.0015705795958638191, 0.0016834251582622528, 0.0017962707206606865, 0.0019091162830591202, 0.002021961845457554, 0.0021348074078559875, 0.0022476529702544212, 0.002360498532652855, 0.0024733440950512886, 0.0025861896574497223, 0.002699035219848156, 0.0028118807822465897, 0.0029247263446450233, 0.003037571907043457]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 10.0, 7.0, 12.0, 10.0, 16.0, 21.0, 20.0, 24.0, 28.0, 24.0, 27.0, 43.0, 27.0, 36.0, 36.0, 31.0, 48.0, 34.0, 52.0, 44.0, 41.0, 37.0, 43.0, 34.0, 34.0, 30.0, 25.0, 18.0, 18.0, 24.0, 22.0, 23.0, 13.0, 17.0, 9.0, 8.0, 11.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.24969482421875, -1.2054443359375, -1.16119384765625, -1.116943359375, -1.07269287109375, -1.0284423828125, -0.98419189453125, -0.93994140625, -0.89569091796875, -0.8514404296875, -0.80718994140625, -0.762939453125, -0.71868896484375, -0.6744384765625, -0.63018798828125, -0.5859375, -0.54168701171875, -0.4974365234375, -0.45318603515625, -0.408935546875, -0.36468505859375, -0.3204345703125, -0.27618408203125, -0.23193359375, -0.18768310546875, -0.1434326171875, -0.09918212890625, -0.054931640625, -0.01068115234375, 0.0335693359375, 0.07781982421875, 0.1220703125, 0.16632080078125, 0.2105712890625, 0.25482177734375, 0.299072265625, 0.34332275390625, 0.3875732421875, 0.43182373046875, 0.47607421875, 0.52032470703125, 0.5645751953125, 0.60882568359375, 0.653076171875, 0.69732666015625, 0.7415771484375, 0.78582763671875, 0.830078125, 0.87432861328125, 0.9185791015625, 0.96282958984375, 1.007080078125, 1.05133056640625, 1.0955810546875, 1.13983154296875, 1.18408203125, 1.22833251953125, 1.2725830078125, 1.31683349609375, 1.361083984375, 1.40533447265625, 1.4495849609375, 1.49383544921875, 1.5380859375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 1.0, 5.0, 13.0, 14.0, 22.0, 24.0, 43.0, 62.0, 90.0, 149.0, 220.0, 320.0, 591.0, 983.0, 1945.0, 4007.0, 9508.0, 25588.0, 71569.0, 193299.0, 359060.0, 236210.0, 91118.0, 31986.0, 11819.0, 4791.0, 2220.0, 1161.0, 647.0, 386.0, 250.0, 166.0, 91.0, 63.0, 47.0, 32.0, 20.0, 18.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8876953125, -1.8260345458984375, -1.764373779296875, -1.7027130126953125, -1.64105224609375, -1.5793914794921875, -1.517730712890625, -1.4560699462890625, -1.3944091796875, -1.3327484130859375, -1.271087646484375, -1.2094268798828125, -1.14776611328125, -1.0861053466796875, -1.024444580078125, -0.9627838134765625, -0.901123046875, -0.8394622802734375, -0.777801513671875, -0.7161407470703125, -0.65447998046875, -0.5928192138671875, -0.531158447265625, -0.4694976806640625, -0.4078369140625, -0.3461761474609375, -0.284515380859375, -0.2228546142578125, -0.16119384765625, -0.0995330810546875, -0.037872314453125, 0.0237884521484375, 0.08544921875, 0.1471099853515625, 0.208770751953125, 0.2704315185546875, 0.33209228515625, 0.3937530517578125, 0.455413818359375, 0.5170745849609375, 0.5787353515625, 0.6403961181640625, 0.702056884765625, 0.7637176513671875, 0.82537841796875, 0.8870391845703125, 0.948699951171875, 1.0103607177734375, 1.072021484375, 1.1336822509765625, 1.195343017578125, 1.2570037841796875, 1.31866455078125, 1.3803253173828125, 1.441986083984375, 1.5036468505859375, 1.5653076171875, 1.6269683837890625, 1.688629150390625, 1.7502899169921875, 1.81195068359375, 1.8736114501953125, 1.935272216796875, 1.9969329833984375, 2.05859375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 11.0, 9.0, 18.0, 14.0, 20.0, 13.0, 35.0, 23.0, 26.0, 35.0, 51.0, 44.0, 42.0, 53.0, 80.0, 155.0, 360.0, 1396.0, 149.0, 96.0, 50.0, 53.0, 46.0, 40.0, 31.0, 29.0, 24.0, 22.0, 18.0, 14.0, 9.0, 14.0, 18.0, 7.0, 3.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.28515625, -5.12506103515625, -4.9649658203125, -4.80487060546875, -4.644775390625, -4.48468017578125, -4.3245849609375, -4.16448974609375, -4.00439453125, -3.84429931640625, -3.6842041015625, -3.52410888671875, -3.364013671875, -3.20391845703125, -3.0438232421875, -2.88372802734375, -2.7236328125, -2.56353759765625, -2.4034423828125, -2.24334716796875, -2.083251953125, -1.92315673828125, -1.7630615234375, -1.60296630859375, -1.44287109375, -1.28277587890625, -1.1226806640625, -0.96258544921875, -0.802490234375, -0.64239501953125, -0.4822998046875, -0.32220458984375, -0.162109375, -0.00201416015625, 0.1580810546875, 0.31817626953125, 0.478271484375, 0.63836669921875, 0.7984619140625, 0.95855712890625, 1.11865234375, 1.27874755859375, 1.4388427734375, 1.59893798828125, 1.759033203125, 1.91912841796875, 2.0792236328125, 2.23931884765625, 2.3994140625, 2.55950927734375, 2.7196044921875, 2.87969970703125, 3.039794921875, 3.19989013671875, 3.3599853515625, 3.52008056640625, 3.68017578125, 3.84027099609375, 4.0003662109375, 4.16046142578125, 4.320556640625, 4.48065185546875, 4.6407470703125, 4.80084228515625, 4.9609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 16.0, 7.0, 16.0, 13.0, 12.0, 13.0, 21.0, 20.0, 30.0, 46.0, 57.0, 67.0, 107.0, 230.0, 506.0, 1474.0, 15366.0, 2257505.0, 859310.0, 8627.0, 1216.0, 393.0, 187.0, 114.0, 63.0, 55.0, 33.0, 35.0, 27.0, 23.0, 20.0, 13.0, 22.0, 11.0, 8.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0625, -9.7369384765625, -9.411376953125, -9.0858154296875, -8.76025390625, -8.4346923828125, -8.109130859375, -7.7835693359375, -7.4580078125, -7.1324462890625, -6.806884765625, -6.4813232421875, -6.15576171875, -5.8302001953125, -5.504638671875, -5.1790771484375, -4.853515625, -4.5279541015625, -4.202392578125, -3.8768310546875, -3.55126953125, -3.2257080078125, -2.900146484375, -2.5745849609375, -2.2490234375, -1.9234619140625, -1.597900390625, -1.2723388671875, -0.94677734375, -0.6212158203125, -0.295654296875, 0.0299072265625, 0.35546875, 0.6810302734375, 1.006591796875, 1.3321533203125, 1.65771484375, 1.9832763671875, 2.308837890625, 2.6343994140625, 2.9599609375, 3.2855224609375, 3.611083984375, 3.9366455078125, 4.26220703125, 4.5877685546875, 4.913330078125, 5.2388916015625, 5.564453125, 5.8900146484375, 6.215576171875, 6.5411376953125, 6.86669921875, 7.1922607421875, 7.517822265625, 7.8433837890625, 8.1689453125, 8.4945068359375, 8.820068359375, 9.1456298828125, 9.47119140625, 9.7967529296875, 10.122314453125, 10.4478759765625, 10.7734375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 9.0, 38.0, 242.0, 463.0, 225.0, 32.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.20339584350586, -45.353675842285156, -44.50395202636719, -43.654232025146484, -42.80451202392578, -41.95479202270508, -41.105072021484375, -40.255348205566406, -39.4056282043457, -38.555908203125, -37.70618438720703, -36.85646438598633, -36.006744384765625, -35.15702438354492, -34.30730438232422, -33.45758056640625, -32.60786056518555, -31.758140563964844, -30.908418655395508, -30.058696746826172, -29.20897674560547, -28.359256744384766, -27.50953483581543, -26.659812927246094, -25.81009292602539, -24.960372924804688, -24.11065101623535, -23.260929107666016, -22.411209106445312, -21.56148910522461, -20.711767196655273, -19.862045288085938, -19.012327194213867, -18.16260528564453, -17.312885284423828, -16.463165283203125, -15.613443374633789, -14.76372241973877, -13.91400146484375, -13.06428050994873, -12.214559555053711, -11.364838600158691, -10.515117645263672, -9.665396690368652, -8.815675735473633, -7.965954780578613, -7.116233825683594, -6.266512870788574, -5.416791915893555, -4.567070960998535, -3.7173500061035156, -2.867629051208496, -2.0179080963134766, -1.168187141418457, -0.3184661865234375, 0.531254768371582, 1.3809757232666016, 2.230696678161621, 3.0804176330566406, 3.93013858795166, 4.77985954284668, 5.629580497741699, 6.479301452636719, 7.329022407531738, 8.178743362426758]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 14.0, 12.0, 13.0, 11.0, 15.0, 20.0, 27.0, 25.0, 23.0, 25.0, 26.0, 30.0, 26.0, 35.0, 39.0, 41.0, 45.0, 31.0, 39.0, 43.0, 38.0, 34.0, 34.0, 40.0, 23.0, 28.0, 23.0, 30.0, 34.0, 24.0, 19.0, 23.0, 16.0, 7.0, 10.0, 15.0, 8.0, 3.0, 6.0, 7.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 4.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.750160217285156, -13.298480987548828, -12.846802711486816, -12.395123481750488, -11.943445205688477, -11.491765975952148, -11.04008674621582, -10.588407516479492, -10.13672924041748, -9.685050010681152, -9.23337173461914, -8.781692504882812, -8.330013275146484, -7.878334999084473, -7.4266557693481445, -6.974977016448975, -6.523298263549805, -6.071619510650635, -5.619940757751465, -5.168261528015137, -4.716582775115967, -4.264904022216797, -3.813225030899048, -3.361546039581299, -2.909867286682129, -2.458188533782959, -2.00650954246521, -1.5548306703567505, -1.103151798248291, -0.6514730453491211, -0.19979405403137207, 0.25188493728637695, 0.7035636901855469, 1.1552425622940063, 1.6069214344024658, 2.058600425720215, 2.5102791786193848, 2.9619579315185547, 3.4136369228363037, 3.8653159141540527, 4.316994667053223, 4.768673419952393, 5.2203521728515625, 5.672031402587891, 6.1237101554870605, 6.5753889083862305, 7.027068138122559, 7.4787468910217285, 7.930425643920898, 8.382104873657227, 8.833783149719238, 9.285462379455566, 9.737140655517578, 10.188819885253906, 10.640499114990234, 11.092178344726562, 11.543856620788574, 11.995535850524902, 12.447214126586914, 12.898893356323242, 13.35057258605957, 13.802250862121582, 14.25393009185791, 14.705608367919922, 15.15728759765625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 10.0, 6.0, 3.0, 8.0, 11.0, 13.0, 18.0, 9.0, 31.0, 25.0, 19.0, 26.0, 24.0, 42.0, 24.0, 36.0, 37.0, 42.0, 36.0, 54.0, 31.0, 55.0, 30.0, 48.0, 37.0, 27.0, 39.0, 29.0, 29.0, 19.0, 24.0, 23.0, 20.0, 19.0, 20.0, 14.0, 11.0, 10.0, 8.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3076171875, -1.2619171142578125, -1.216217041015625, -1.1705169677734375, -1.12481689453125, -1.0791168212890625, -1.033416748046875, -0.9877166748046875, -0.9420166015625, -0.8963165283203125, -0.850616455078125, -0.8049163818359375, -0.75921630859375, -0.7135162353515625, -0.667816162109375, -0.6221160888671875, -0.576416015625, -0.5307159423828125, -0.485015869140625, -0.4393157958984375, -0.39361572265625, -0.3479156494140625, -0.302215576171875, -0.2565155029296875, -0.2108154296875, -0.1651153564453125, -0.119415283203125, -0.0737152099609375, -0.02801513671875, 0.0176849365234375, 0.063385009765625, 0.1090850830078125, 0.15478515625, 0.2004852294921875, 0.246185302734375, 0.2918853759765625, 0.33758544921875, 0.3832855224609375, 0.428985595703125, 0.4746856689453125, 0.5203857421875, 0.5660858154296875, 0.611785888671875, 0.6574859619140625, 0.70318603515625, 0.7488861083984375, 0.794586181640625, 0.8402862548828125, 0.885986328125, 0.9316864013671875, 0.977386474609375, 1.0230865478515625, 1.06878662109375, 1.1144866943359375, 1.160186767578125, 1.2058868408203125, 1.2515869140625, 1.2972869873046875, 1.342987060546875, 1.3886871337890625, 1.43438720703125, 1.4800872802734375, 1.525787353515625, 1.5714874267578125, 1.6171875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 5.0, 13.0, 8.0, 12.0, 32.0, 21.0, 26.0, 35.0, 45.0, 52.0, 91.0, 122.0, 197.0, 365.0, 783.0, 1912.0, 5794.0, 21884.0, 111629.0, 898405.0, 2619273.0, 447425.0, 65387.0, 14003.0, 3978.0, 1323.0, 538.0, 333.0, 175.0, 107.0, 60.0, 50.0, 34.0, 43.0, 26.0, 16.0, 14.0, 21.0, 9.0, 8.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.078125, -4.92584228515625, -4.7735595703125, -4.62127685546875, -4.468994140625, -4.31671142578125, -4.1644287109375, -4.01214599609375, -3.85986328125, -3.70758056640625, -3.5552978515625, -3.40301513671875, -3.250732421875, -3.09844970703125, -2.9461669921875, -2.79388427734375, -2.6416015625, -2.48931884765625, -2.3370361328125, -2.18475341796875, -2.032470703125, -1.88018798828125, -1.7279052734375, -1.57562255859375, -1.42333984375, -1.27105712890625, -1.1187744140625, -0.96649169921875, -0.814208984375, -0.66192626953125, -0.5096435546875, -0.35736083984375, -0.205078125, -0.05279541015625, 0.0994873046875, 0.25177001953125, 0.404052734375, 0.55633544921875, 0.7086181640625, 0.86090087890625, 1.01318359375, 1.16546630859375, 1.3177490234375, 1.47003173828125, 1.622314453125, 1.77459716796875, 1.9268798828125, 2.07916259765625, 2.2314453125, 2.38372802734375, 2.5360107421875, 2.68829345703125, 2.840576171875, 2.99285888671875, 3.1451416015625, 3.29742431640625, 3.44970703125, 3.60198974609375, 3.7542724609375, 3.90655517578125, 4.058837890625, 4.21112060546875, 4.3634033203125, 4.51568603515625, 4.66796875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 8.0, 14.0, 13.0, 19.0, 23.0, 29.0, 52.0, 67.0, 87.0, 103.0, 190.0, 251.0, 362.0, 432.0, 483.0, 569.0, 354.0, 310.0, 192.0, 131.0, 100.0, 88.0, 58.0, 35.0, 34.0, 17.0, 18.0, 7.0, 11.0, 12.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.44140625, -6.26611328125, -6.0908203125, -5.91552734375, -5.740234375, -5.56494140625, -5.3896484375, -5.21435546875, -5.0390625, -4.86376953125, -4.6884765625, -4.51318359375, -4.337890625, -4.16259765625, -3.9873046875, -3.81201171875, -3.63671875, -3.46142578125, -3.2861328125, -3.11083984375, -2.935546875, -2.76025390625, -2.5849609375, -2.40966796875, -2.234375, -2.05908203125, -1.8837890625, -1.70849609375, -1.533203125, -1.35791015625, -1.1826171875, -1.00732421875, -0.83203125, -0.65673828125, -0.4814453125, -0.30615234375, -0.130859375, 0.04443359375, 0.2197265625, 0.39501953125, 0.5703125, 0.74560546875, 0.9208984375, 1.09619140625, 1.271484375, 1.44677734375, 1.6220703125, 1.79736328125, 1.97265625, 2.14794921875, 2.3232421875, 2.49853515625, 2.673828125, 2.84912109375, 3.0244140625, 3.19970703125, 3.375, 3.55029296875, 3.7255859375, 3.90087890625, 4.076171875, 4.25146484375, 4.4267578125, 4.60205078125, 4.77734375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 12.0, 7.0, 13.0, 22.0, 23.0, 38.0, 68.0, 85.0, 155.0, 233.0, 403.0, 671.0, 1463.0, 3540.0, 12252.0, 60184.0, 388282.0, 2429711.0, 1107988.0, 151855.0, 26409.0, 6319.0, 2177.0, 944.0, 536.0, 323.0, 199.0, 112.0, 84.0, 52.0, 37.0, 26.0, 19.0, 8.0, 5.0, 10.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.369873046875, -6.12255859375, -5.875244140625, -5.6279296875, -5.380615234375, -5.13330078125, -4.885986328125, -4.638671875, -4.391357421875, -4.14404296875, -3.896728515625, -3.6494140625, -3.402099609375, -3.15478515625, -2.907470703125, -2.66015625, -2.412841796875, -2.16552734375, -1.918212890625, -1.6708984375, -1.423583984375, -1.17626953125, -0.928955078125, -0.681640625, -0.434326171875, -0.18701171875, 0.060302734375, 0.3076171875, 0.554931640625, 0.80224609375, 1.049560546875, 1.296875, 1.544189453125, 1.79150390625, 2.038818359375, 2.2861328125, 2.533447265625, 2.78076171875, 3.028076171875, 3.275390625, 3.522705078125, 3.77001953125, 4.017333984375, 4.2646484375, 4.511962890625, 4.75927734375, 5.006591796875, 5.25390625, 5.501220703125, 5.74853515625, 5.995849609375, 6.2431640625, 6.490478515625, 6.73779296875, 6.985107421875, 7.232421875, 7.479736328125, 7.72705078125, 7.974365234375, 8.2216796875, 8.468994140625, 8.71630859375, 8.963623046875, 9.2109375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 20.0, 36.0, 78.0, 156.0, 168.0, 209.0, 163.0, 100.0, 47.0, 18.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.31755828857422, -49.15058517456055, -47.983612060546875, -46.81663513183594, -45.649662017822266, -44.482688903808594, -43.315711975097656, -42.148738861083984, -40.98176574707031, -39.81479263305664, -38.64781951904297, -37.48084259033203, -36.31386947631836, -35.14689636230469, -33.97991943359375, -32.81294631958008, -31.645973205566406, -30.479000091552734, -29.31202507019043, -28.145050048828125, -26.978076934814453, -25.81110382080078, -24.644128799438477, -23.477153778076172, -22.3101806640625, -21.143207550048828, -19.976232528686523, -18.80925750732422, -17.642284393310547, -16.475311279296875, -15.30833625793457, -14.141362190246582, -12.97439193725586, -11.807417869567871, -10.640443801879883, -9.473469734191895, -8.306495666503906, -7.139521598815918, -5.97254753112793, -4.805573463439941, -3.638599395751953, -2.471625328063965, -1.3046512603759766, -0.13767719268798828, 1.029296875, 2.1962709426879883, 3.3632450103759766, 4.530219078063965, 5.697193145751953, 6.864167213439941, 8.03114128112793, 9.198115348815918, 10.365089416503906, 11.532063484191895, 12.699037551879883, 13.866011619567871, 15.03298568725586, 16.19995880126953, 17.366933822631836, 18.53390884399414, 19.700881958007812, 20.867855072021484, 22.03483009338379, 23.201805114746094, 24.368778228759766]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 7.0, 10.0, 22.0, 22.0, 19.0, 17.0, 19.0, 18.0, 27.0, 40.0, 42.0, 31.0, 44.0, 38.0, 39.0, 47.0, 42.0, 45.0, 44.0, 37.0, 42.0, 35.0, 36.0, 42.0, 32.0, 24.0, 25.0, 20.0, 16.0, 20.0, 9.0, 28.0, 11.0, 10.0, 9.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.64270782470703, -16.109790802001953, -15.576874732971191, -15.043957710266113, -14.511041641235352, -13.978124618530273, -13.445207595825195, -12.912291526794434, -12.379375457763672, -11.846458435058594, -11.313542366027832, -10.780625343322754, -10.247709274291992, -9.714792251586914, -9.181875228881836, -8.648959159851074, -8.116042137145996, -7.583125591278076, -7.050209045410156, -6.517292022705078, -5.984375953674316, -5.451458930969238, -4.918542385101318, -4.385625839233398, -3.8527092933654785, -3.3197927474975586, -2.7868762016296387, -2.2539594173431396, -1.7210428714752197, -1.1881263256072998, -0.6552095413208008, -0.12229299545288086, 0.41062355041503906, 0.9435401558876038, 1.4764567613601685, 2.009373426437378, 2.542289972305298, 3.0752065181732178, 3.608123302459717, 4.141039848327637, 4.673956394195557, 5.206872940063477, 5.7397894859313965, 6.272706031799316, 6.8056230545043945, 7.338539123535156, 7.871456146240234, 8.404373168945312, 8.937289237976074, 9.470206260681152, 10.003122329711914, 10.536039352416992, 11.068955421447754, 11.601872444152832, 12.134788513183594, 12.667705535888672, 13.20062255859375, 13.733539581298828, 14.26645565032959, 14.799372673034668, 15.33228874206543, 15.865205764770508, 16.398122787475586, 16.93103790283203, 17.46395492553711]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 5.0, 5.0, 5.0, 5.0, 7.0, 12.0, 14.0, 16.0, 24.0, 22.0, 14.0, 21.0, 26.0, 26.0, 24.0, 34.0, 28.0, 34.0, 31.0, 49.0, 39.0, 55.0, 44.0, 36.0, 36.0, 38.0, 24.0, 42.0, 34.0, 32.0, 28.0, 31.0, 28.0, 17.0, 14.0, 10.0, 12.0, 21.0, 11.0, 15.0, 4.0, 8.0, 6.0, 11.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.3777618408203125, -1.330718994140625, -1.2836761474609375, -1.23663330078125, -1.1895904541015625, -1.142547607421875, -1.0955047607421875, -1.0484619140625, -1.0014190673828125, -0.954376220703125, -0.9073333740234375, -0.86029052734375, -0.8132476806640625, -0.766204833984375, -0.7191619873046875, -0.672119140625, -0.6250762939453125, -0.578033447265625, -0.5309906005859375, -0.48394775390625, -0.4369049072265625, -0.389862060546875, -0.3428192138671875, -0.2957763671875, -0.2487335205078125, -0.201690673828125, -0.1546478271484375, -0.10760498046875, -0.0605621337890625, -0.013519287109375, 0.0335235595703125, 0.08056640625, 0.1276092529296875, 0.174652099609375, 0.2216949462890625, 0.26873779296875, 0.3157806396484375, 0.362823486328125, 0.4098663330078125, 0.4569091796875, 0.5039520263671875, 0.550994873046875, 0.5980377197265625, 0.64508056640625, 0.6921234130859375, 0.739166259765625, 0.7862091064453125, 0.833251953125, 0.8802947998046875, 0.927337646484375, 0.9743804931640625, 1.02142333984375, 1.0684661865234375, 1.115509033203125, 1.1625518798828125, 1.2095947265625, 1.2566375732421875, 1.303680419921875, 1.3507232666015625, 1.39776611328125, 1.4448089599609375, 1.491851806640625, 1.5388946533203125, 1.5859375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 8.0, 7.0, 13.0, 16.0, 42.0, 37.0, 61.0, 91.0, 123.0, 196.0, 280.0, 353.0, 560.0, 743.0, 991.0, 1435.0, 2051.0, 2979.0, 4150.0, 5890.0, 8596.0, 12222.0, 18308.0, 26642.0, 40241.0, 60836.0, 92807.0, 139895.0, 181206.0, 148258.0, 99341.0, 65721.0, 43090.0, 28613.0, 19327.0, 13192.0, 9143.0, 6346.0, 4265.0, 3126.0, 2112.0, 1509.0, 1084.0, 809.0, 548.0, 383.0, 261.0, 226.0, 138.0, 105.0, 56.0, 53.0, 27.0, 26.0, 10.0, 8.0, 5.0, 5.0, 1.0, 3.0], "bins": [-0.1434326171875, -0.13903045654296875, -0.1346282958984375, -0.13022613525390625, -0.125823974609375, -0.12142181396484375, -0.1170196533203125, -0.11261749267578125, -0.10821533203125, -0.10381317138671875, -0.0994110107421875, -0.09500885009765625, -0.090606689453125, -0.08620452880859375, -0.0818023681640625, -0.07740020751953125, -0.072998046875, -0.06859588623046875, -0.0641937255859375, -0.05979156494140625, -0.055389404296875, -0.05098724365234375, -0.0465850830078125, -0.04218292236328125, -0.03778076171875, -0.03337860107421875, -0.0289764404296875, -0.02457427978515625, -0.020172119140625, -0.01576995849609375, -0.0113677978515625, -0.00696563720703125, -0.0025634765625, 0.00183868408203125, 0.0062408447265625, 0.01064300537109375, 0.015045166015625, 0.01944732666015625, 0.0238494873046875, 0.02825164794921875, 0.03265380859375, 0.03705596923828125, 0.0414581298828125, 0.04586029052734375, 0.050262451171875, 0.05466461181640625, 0.0590667724609375, 0.06346893310546875, 0.06787109375, 0.07227325439453125, 0.0766754150390625, 0.08107757568359375, 0.085479736328125, 0.08988189697265625, 0.0942840576171875, 0.09868621826171875, 0.10308837890625, 0.10749053955078125, 0.1118927001953125, 0.11629486083984375, 0.120697021484375, 0.12509918212890625, 0.1295013427734375, 0.13390350341796875, 0.1383056640625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 4.0, 2.0, 5.0, 9.0, 2.0, 6.0, 9.0, 13.0, 8.0, 8.0, 8.0, 21.0, 21.0, 16.0, 20.0, 29.0, 19.0, 31.0, 44.0, 29.0, 36.0, 38.0, 29.0, 29.0, 43.0, 1060.0, 37.0, 32.0, 33.0, 38.0, 40.0, 35.0, 26.0, 35.0, 22.0, 27.0, 29.0, 24.0, 26.0, 21.0, 9.0, 10.0, 13.0, 8.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.93896484375, -0.9089736938476562, -0.8789825439453125, -0.8489913940429688, -0.819000244140625, -0.7890090942382812, -0.7590179443359375, -0.7290267944335938, -0.69903564453125, -0.6690444946289062, -0.6390533447265625, -0.6090621948242188, -0.579071044921875, -0.5490798950195312, -0.5190887451171875, -0.48909759521484375, -0.4591064453125, -0.42911529541015625, -0.3991241455078125, -0.36913299560546875, -0.339141845703125, -0.30915069580078125, -0.2791595458984375, -0.24916839599609375, -0.21917724609375, -0.18918609619140625, -0.1591949462890625, -0.12920379638671875, -0.099212646484375, -0.06922149658203125, -0.0392303466796875, -0.00923919677734375, 0.020751953125, 0.05074310302734375, 0.0807342529296875, 0.11072540283203125, 0.140716552734375, 0.17070770263671875, 0.2006988525390625, 0.23069000244140625, 0.26068115234375, 0.29067230224609375, 0.3206634521484375, 0.35065460205078125, 0.380645751953125, 0.41063690185546875, 0.4406280517578125, 0.47061920166015625, 0.5006103515625, 0.5306015014648438, 0.5605926513671875, 0.5905838012695312, 0.620574951171875, 0.6505661010742188, 0.6805572509765625, 0.7105484008789062, 0.74053955078125, 0.7705307006835938, 0.8005218505859375, 0.8305130004882812, 0.860504150390625, 0.8904953002929688, 0.9204864501953125, 0.9504776000976562, 0.98046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 9.0, 13.0, 13.0, 14.0, 27.0, 32.0, 50.0, 82.0, 93.0, 171.0, 243.0, 342.0, 507.0, 716.0, 1052.0, 1567.0, 2227.0, 3355.0, 4675.0, 6818.0, 10218.0, 14783.0, 22013.0, 32023.0, 46690.0, 67936.0, 96290.0, 132028.0, 1181904.0, 142236.0, 101067.0, 71899.0, 49483.0, 33867.0, 23021.0, 15485.0, 10769.0, 7244.0, 5092.0, 3521.0, 2401.0, 1632.0, 1090.0, 754.0, 528.0, 353.0, 247.0, 166.0, 117.0, 68.0, 69.0, 47.0, 30.0, 16.0, 21.0, 10.0, 7.0, 3.0, 5.0, 0.0, 3.0], "bins": [-0.0882568359375, -0.08546161651611328, -0.08266639709472656, -0.07987117767333984, -0.07707595825195312, -0.0742807388305664, -0.07148551940917969, -0.06869029998779297, -0.06589508056640625, -0.06309986114501953, -0.06030464172363281, -0.057509422302246094, -0.054714202880859375, -0.051918983459472656, -0.04912376403808594, -0.04632854461669922, -0.0435333251953125, -0.04073810577392578, -0.03794288635253906, -0.035147666931152344, -0.032352447509765625, -0.029557228088378906, -0.026762008666992188, -0.02396678924560547, -0.02117156982421875, -0.01837635040283203, -0.015581130981445312, -0.012785911560058594, -0.009990692138671875, -0.007195472717285156, -0.0044002532958984375, -0.0016050338745117188, 0.001190185546875, 0.003985404968261719, 0.0067806243896484375, 0.009575843811035156, 0.012371063232421875, 0.015166282653808594, 0.017961502075195312, 0.02075672149658203, 0.02355194091796875, 0.02634716033935547, 0.029142379760742188, 0.031937599182128906, 0.034732818603515625, 0.037528038024902344, 0.04032325744628906, 0.04311847686767578, 0.0459136962890625, 0.04870891571044922, 0.05150413513183594, 0.054299354553222656, 0.057094573974609375, 0.059889793395996094, 0.06268501281738281, 0.06548023223876953, 0.06827545166015625, 0.07107067108154297, 0.07386589050292969, 0.0766611099243164, 0.07945632934570312, 0.08225154876708984, 0.08504676818847656, 0.08784198760986328, 0.09063720703125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 7.0, 6.0, 10.0, 15.0, 16.0, 12.0, 20.0, 28.0, 27.0, 32.0, 40.0, 45.0, 33.0, 43.0, 56.0, 31.0, 63.0, 57.0, 59.0, 55.0, 39.0, 43.0, 36.0, 35.0, 38.0, 28.0, 24.0, 18.0, 16.0, 20.0, 8.0, 9.0, 4.0, 4.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.002971649169921875, -0.0028788745403289795, -0.002786099910736084, -0.0026933252811431885, -0.002600550651550293, -0.0025077760219573975, -0.002415001392364502, -0.0023222267627716064, -0.002229452133178711, -0.0021366775035858154, -0.00204390287399292, -0.0019511282444000244, -0.001858353614807129, -0.0017655789852142334, -0.0016728043556213379, -0.0015800297260284424, -0.0014872550964355469, -0.0013944804668426514, -0.0013017058372497559, -0.0012089312076568604, -0.0011161565780639648, -0.0010233819484710693, -0.0009306073188781738, -0.0008378326892852783, -0.0007450580596923828, -0.0006522834300994873, -0.0005595088005065918, -0.0004667341709136963, -0.0003739595413208008, -0.0002811849117279053, -0.00018841028213500977, -9.563565254211426e-05, -2.86102294921875e-06, 8.991360664367676e-05, 0.00018268823623657227, 0.0002754628658294678, 0.0003682374954223633, 0.0004610121250152588, 0.0005537867546081543, 0.0006465613842010498, 0.0007393360137939453, 0.0008321106433868408, 0.0009248852729797363, 0.0010176599025726318, 0.0011104345321655273, 0.0012032091617584229, 0.0012959837913513184, 0.0013887584209442139, 0.0014815330505371094, 0.0015743076801300049, 0.0016670823097229004, 0.001759856939315796, 0.0018526315689086914, 0.001945406198501587, 0.0020381808280944824, 0.002130955457687378, 0.0022237300872802734, 0.002316504716873169, 0.0024092793464660645, 0.00250205397605896, 0.0025948286056518555, 0.002687603235244751, 0.0027803778648376465, 0.002873152494430542, 0.0029659271240234375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 4.0, 13.0, 12.0, 20.0, 30.0, 26.0, 34.0, 55.0, 67.0, 78.0, 103.0, 127.0, 156.0, 228.0, 343.0, 850.0, 16819.0, 1006927.0, 20412.0, 864.0, 373.0, 248.0, 189.0, 117.0, 97.0, 82.0, 69.0, 46.0, 39.0, 27.0, 25.0, 19.0, 13.0, 4.0, 10.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0496826171875, -0.04805469512939453, -0.04642677307128906, -0.044798851013183594, -0.043170928955078125, -0.041543006896972656, -0.03991508483886719, -0.03828716278076172, -0.03665924072265625, -0.03503131866455078, -0.03340339660644531, -0.031775474548339844, -0.030147552490234375, -0.028519630432128906, -0.026891708374023438, -0.02526378631591797, -0.0236358642578125, -0.02200794219970703, -0.020380020141601562, -0.018752098083496094, -0.017124176025390625, -0.015496253967285156, -0.013868331909179688, -0.012240409851074219, -0.01061248779296875, -0.008984565734863281, -0.0073566436767578125, -0.005728721618652344, -0.004100799560546875, -0.0024728775024414062, -0.0008449554443359375, 0.0007829666137695312, 0.002410888671875, 0.004038810729980469, 0.0056667327880859375, 0.007294654846191406, 0.008922576904296875, 0.010550498962402344, 0.012178421020507812, 0.013806343078613281, 0.01543426513671875, 0.01706218719482422, 0.018690109252929688, 0.020318031311035156, 0.021945953369140625, 0.023573875427246094, 0.025201797485351562, 0.02682971954345703, 0.0284576416015625, 0.03008556365966797, 0.03171348571777344, 0.033341407775878906, 0.034969329833984375, 0.036597251892089844, 0.03822517395019531, 0.03985309600830078, 0.04148101806640625, 0.04310894012451172, 0.04473686218261719, 0.046364784240722656, 0.047992706298828125, 0.049620628356933594, 0.05124855041503906, 0.05287647247314453, 0.05450439453125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 993.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04610783979296684, -0.044237278401851654, -0.04236671328544617, -0.04049615189433098, -0.03862559050321579, -0.0367550291121006, -0.03488446772098541, -0.033013902604579926, -0.031143341213464737, -0.02927277982234955, -0.02740221656858921, -0.025531653314828873, -0.023661091923713684, -0.021790530532598495, -0.019919967278838158, -0.01804940402507782, -0.01617884263396263, -0.014308280311524868, -0.012437717989087105, -0.010567155666649342, -0.008696593344211578, -0.006826031021773815, -0.004955468699336052, -0.0030849063768982887, -0.0012143440544605255, 0.0006562182679772377, 0.002526780590415001, 0.004397342912852764, 0.006267905235290527, 0.00813846755772829, 0.010009029880166054, 0.011879592202603817, 0.013750158250331879, 0.015620720572769642, 0.017491282895207405, 0.019361846148967743, 0.02123240754008293, 0.02310296893119812, 0.024973532184958458, 0.026844095438718796, 0.028714656829833984, 0.030585218220949173, 0.03245577961206436, 0.03432634472846985, 0.03619690611958504, 0.038067467510700226, 0.03993803262710571, 0.0418085940182209, 0.04367915540933609, 0.04554971680045128, 0.04742027819156647, 0.049290843307971954, 0.05116140469908714, 0.05303196609020233, 0.05490253120660782, 0.05677309259772301, 0.058643653988838196, 0.060514215379953384, 0.06238477677106857, 0.06425534188747406, 0.06612589955329895, 0.06799646466970444, 0.06986702978610992, 0.07173758745193481, 0.0736081525683403]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 7.0, 12.0, 23.0, 30.0, 27.0, 47.0, 38.0, 44.0, 59.0, 59.0, 58.0, 72.0, 87.0, 68.0, 62.0, 56.0, 63.0, 37.0, 37.0, 35.0, 21.0, 21.0, 16.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004634082317352295, -0.004500299692153931, -0.004366517066955566, -0.004232734441757202, -0.004098951816558838, -0.003965169191360474, -0.0038313865661621094, -0.003697603940963745, -0.003563821315765381, -0.0034300386905670166, -0.0032962560653686523, -0.003162473440170288, -0.003028690814971924, -0.0028949081897735596, -0.0027611255645751953, -0.002627342939376831, -0.002493560314178467, -0.0023597776889801025, -0.0022259950637817383, -0.002092212438583374, -0.0019584298133850098, -0.0018246471881866455, -0.0016908645629882812, -0.001557081937789917, -0.0014232993125915527, -0.0012895166873931885, -0.0011557340621948242, -0.00102195143699646, -0.0008881688117980957, -0.0007543861865997314, -0.0006206035614013672, -0.00048682093620300293, -0.00035303831100463867, -0.00021925568580627441, -8.547306060791016e-05, 4.83095645904541e-05, 0.00018209218978881836, 0.0003158748149871826, 0.0004496574401855469, 0.0005834400653839111, 0.0007172226905822754, 0.0008510053157806396, 0.000984787940979004, 0.0011185705661773682, 0.0012523531913757324, 0.0013861358165740967, 0.001519918441772461, 0.0016537010669708252, 0.0017874836921691895, 0.0019212663173675537, 0.002055048942565918, 0.0021888315677642822, 0.0023226141929626465, 0.0024563968181610107, 0.002590179443359375, 0.0027239620685577393, 0.0028577446937561035, 0.0029915273189544678, 0.003125309944152832, 0.0032590925693511963, 0.0033928751945495605, 0.003526657819747925, 0.003660440444946289, 0.0037942230701446533, 0.003928005695343018]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 5.0, 5.0, 5.0, 5.0, 7.0, 12.0, 14.0, 16.0, 24.0, 22.0, 14.0, 21.0, 26.0, 26.0, 24.0, 34.0, 28.0, 34.0, 31.0, 49.0, 39.0, 55.0, 44.0, 36.0, 36.0, 38.0, 24.0, 42.0, 34.0, 32.0, 28.0, 31.0, 28.0, 17.0, 14.0, 10.0, 12.0, 21.0, 11.0, 15.0, 4.0, 8.0, 6.0, 11.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.3777618408203125, -1.330718994140625, -1.2836761474609375, -1.23663330078125, -1.1895904541015625, -1.142547607421875, -1.0955047607421875, -1.0484619140625, -1.0014190673828125, -0.954376220703125, -0.9073333740234375, -0.86029052734375, -0.8132476806640625, -0.766204833984375, -0.7191619873046875, -0.672119140625, -0.6250762939453125, -0.578033447265625, -0.5309906005859375, -0.48394775390625, -0.4369049072265625, -0.389862060546875, -0.3428192138671875, -0.2957763671875, -0.2487335205078125, -0.201690673828125, -0.1546478271484375, -0.10760498046875, -0.0605621337890625, -0.013519287109375, 0.0335235595703125, 0.08056640625, 0.1276092529296875, 0.174652099609375, 0.2216949462890625, 0.26873779296875, 0.3157806396484375, 0.362823486328125, 0.4098663330078125, 0.4569091796875, 0.5039520263671875, 0.550994873046875, 0.5980377197265625, 0.64508056640625, 0.6921234130859375, 0.739166259765625, 0.7862091064453125, 0.833251953125, 0.8802947998046875, 0.927337646484375, 0.9743804931640625, 1.02142333984375, 1.0684661865234375, 1.115509033203125, 1.1625518798828125, 1.2095947265625, 1.2566375732421875, 1.303680419921875, 1.3507232666015625, 1.39776611328125, 1.4448089599609375, 1.491851806640625, 1.5388946533203125, 1.5859375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 9.0, 15.0, 24.0, 35.0, 41.0, 70.0, 99.0, 122.0, 184.0, 258.0, 364.0, 559.0, 839.0, 1330.0, 2037.0, 3436.0, 5957.0, 10727.0, 20590.0, 45167.0, 118016.0, 329459.0, 310801.0, 110705.0, 42935.0, 19582.0, 10178.0, 5697.0, 3376.0, 2018.0, 1316.0, 812.0, 543.0, 391.0, 254.0, 188.0, 122.0, 96.0, 48.0, 43.0, 27.0, 24.0, 14.0, 14.0, 9.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.9267578125, -1.8716583251953125, -1.816558837890625, -1.7614593505859375, -1.70635986328125, -1.6512603759765625, -1.596160888671875, -1.5410614013671875, -1.4859619140625, -1.4308624267578125, -1.375762939453125, -1.3206634521484375, -1.26556396484375, -1.2104644775390625, -1.155364990234375, -1.1002655029296875, -1.045166015625, -0.9900665283203125, -0.934967041015625, -0.8798675537109375, -0.82476806640625, -0.7696685791015625, -0.714569091796875, -0.6594696044921875, -0.6043701171875, -0.5492706298828125, -0.494171142578125, -0.4390716552734375, -0.38397216796875, -0.3288726806640625, -0.273773193359375, -0.2186737060546875, -0.16357421875, -0.1084747314453125, -0.053375244140625, 0.0017242431640625, 0.05682373046875, 0.1119232177734375, 0.167022705078125, 0.2221221923828125, 0.2772216796875, 0.3323211669921875, 0.387420654296875, 0.4425201416015625, 0.49761962890625, 0.5527191162109375, 0.607818603515625, 0.6629180908203125, 0.718017578125, 0.7731170654296875, 0.828216552734375, 0.8833160400390625, 0.93841552734375, 0.9935150146484375, 1.048614501953125, 1.1037139892578125, 1.1588134765625, 1.2139129638671875, 1.269012451171875, 1.3241119384765625, 1.37921142578125, 1.4343109130859375, 1.489410400390625, 1.5445098876953125, 1.599609375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 6.0, 3.0, 4.0, 7.0, 9.0, 13.0, 10.0, 13.0, 16.0, 26.0, 20.0, 38.0, 30.0, 34.0, 36.0, 49.0, 52.0, 67.0, 129.0, 324.0, 1511.0, 173.0, 68.0, 48.0, 58.0, 43.0, 52.0, 43.0, 21.0, 16.0, 23.0, 21.0, 14.0, 17.0, 13.0, 13.0, 8.0, 9.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.70703125, -5.52392578125, -5.3408203125, -5.15771484375, -4.974609375, -4.79150390625, -4.6083984375, -4.42529296875, -4.2421875, -4.05908203125, -3.8759765625, -3.69287109375, -3.509765625, -3.32666015625, -3.1435546875, -2.96044921875, -2.77734375, -2.59423828125, -2.4111328125, -2.22802734375, -2.044921875, -1.86181640625, -1.6787109375, -1.49560546875, -1.3125, -1.12939453125, -0.9462890625, -0.76318359375, -0.580078125, -0.39697265625, -0.2138671875, -0.03076171875, 0.15234375, 0.33544921875, 0.5185546875, 0.70166015625, 0.884765625, 1.06787109375, 1.2509765625, 1.43408203125, 1.6171875, 1.80029296875, 1.9833984375, 2.16650390625, 2.349609375, 2.53271484375, 2.7158203125, 2.89892578125, 3.08203125, 3.26513671875, 3.4482421875, 3.63134765625, 3.814453125, 3.99755859375, 4.1806640625, 4.36376953125, 4.546875, 4.72998046875, 4.9130859375, 5.09619140625, 5.279296875, 5.46240234375, 5.6455078125, 5.82861328125, 6.01171875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 10.0, 9.0, 13.0, 27.0, 25.0, 30.0, 33.0, 44.0, 56.0, 77.0, 132.0, 209.0, 412.0, 1115.0, 7168.0, 133711.0, 2918552.0, 77087.0, 5026.0, 983.0, 343.0, 214.0, 108.0, 71.0, 59.0, 44.0, 22.0, 19.0, 18.0, 15.0, 16.0, 11.0, 7.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.767333984375, -9.45654296875, -9.145751953125, -8.8349609375, -8.524169921875, -8.21337890625, -7.902587890625, -7.591796875, -7.281005859375, -6.97021484375, -6.659423828125, -6.3486328125, -6.037841796875, -5.72705078125, -5.416259765625, -5.10546875, -4.794677734375, -4.48388671875, -4.173095703125, -3.8623046875, -3.551513671875, -3.24072265625, -2.929931640625, -2.619140625, -2.308349609375, -1.99755859375, -1.686767578125, -1.3759765625, -1.065185546875, -0.75439453125, -0.443603515625, -0.1328125, 0.177978515625, 0.48876953125, 0.799560546875, 1.1103515625, 1.421142578125, 1.73193359375, 2.042724609375, 2.353515625, 2.664306640625, 2.97509765625, 3.285888671875, 3.5966796875, 3.907470703125, 4.21826171875, 4.529052734375, 4.83984375, 5.150634765625, 5.46142578125, 5.772216796875, 6.0830078125, 6.393798828125, 6.70458984375, 7.015380859375, 7.326171875, 7.636962890625, 7.94775390625, 8.258544921875, 8.5693359375, 8.880126953125, 9.19091796875, 9.501708984375, 9.8125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 36.0, 512.0, 446.0, 22.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.72103118896484, -82.98821258544922, -81.25540161132812, -79.5225830078125, -77.78976440429688, -76.05694580078125, -74.32413482666016, -72.59131622314453, -70.85850524902344, -69.12568664550781, -67.39287567138672, -65.6600570678711, -63.92723846435547, -62.19442367553711, -60.46160888671875, -58.728790283203125, -56.9959716796875, -55.26315689086914, -53.530338287353516, -51.797523498535156, -50.06470489501953, -48.33189010620117, -46.59907531738281, -44.86625671386719, -43.13344192504883, -41.40062713623047, -39.667808532714844, -37.934993743896484, -36.202178955078125, -34.4693603515625, -32.73654556274414, -31.00372886657715, -29.27090835571289, -27.5380916595459, -25.805274963378906, -24.072460174560547, -22.339643478393555, -20.606826782226562, -18.874011993408203, -17.14119529724121, -15.408378601074219, -13.675561904907227, -11.94274616241455, -10.209930419921875, -8.477113723754883, -6.744297027587891, -5.011481285095215, -3.278665542602539, -1.5458488464355469, 0.1869673728942871, 1.919783592224121, 3.652599811553955, 5.385416030883789, 7.118232727050781, 8.851048469543457, 10.583864212036133, 12.316680908203125, 14.049497604370117, 15.782313346862793, 17.51512908935547, 19.24794578552246, 20.980762481689453, 22.713577270507812, 24.446393966674805, 26.179210662841797]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 4.0, 4.0, 5.0, 8.0, 6.0, 5.0, 12.0, 12.0, 11.0, 12.0, 13.0, 24.0, 23.0, 22.0, 26.0, 38.0, 34.0, 44.0, 34.0, 26.0, 46.0, 37.0, 39.0, 40.0, 42.0, 32.0, 35.0, 33.0, 41.0, 25.0, 26.0, 24.0, 22.0, 29.0, 30.0, 15.0, 15.0, 22.0, 12.0, 13.0, 16.0, 9.0, 10.0, 3.0, 6.0, 8.0, 7.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-16.52822494506836, -16.022205352783203, -15.516183853149414, -15.010163307189941, -14.504142761230469, -13.998122215270996, -13.492101669311523, -12.98608112335205, -12.480060577392578, -11.974040031433105, -11.468019485473633, -10.96199893951416, -10.455978393554688, -9.949957847595215, -9.443937301635742, -8.93791675567627, -8.431896209716797, -7.925875663757324, -7.419855117797852, -6.913834571838379, -6.407814025878906, -5.901793479919434, -5.395772933959961, -4.889752388000488, -4.383731842041016, -3.877711296081543, -3.3716907501220703, -2.8656702041625977, -2.359649658203125, -1.8536291122436523, -1.3476085662841797, -0.841588020324707, -0.33556556701660156, 0.1704549789428711, 0.6764755249023438, 1.1824960708618164, 1.688516616821289, 2.1945371627807617, 2.7005577087402344, 3.206578254699707, 3.7125988006591797, 4.218619346618652, 4.724639892578125, 5.230660438537598, 5.73668098449707, 6.242701530456543, 6.748722076416016, 7.254742622375488, 7.760763168334961, 8.266783714294434, 8.772804260253906, 9.278824806213379, 9.784845352172852, 10.290865898132324, 10.796886444091797, 11.30290699005127, 11.808927536010742, 12.314948081970215, 12.820968627929688, 13.32698917388916, 13.833009719848633, 14.339030265808105, 14.845050811767578, 15.35107135772705, 15.857091903686523]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 12.0, 7.0, 18.0, 20.0, 16.0, 24.0, 18.0, 21.0, 25.0, 23.0, 34.0, 31.0, 28.0, 35.0, 34.0, 47.0, 51.0, 51.0, 42.0, 36.0, 32.0, 33.0, 26.0, 32.0, 39.0, 27.0, 27.0, 32.0, 24.0, 12.0, 18.0, 8.0, 20.0, 14.0, 12.0, 18.0, 5.0, 4.0, 8.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4541015625, -1.4054107666015625, -1.356719970703125, -1.3080291748046875, -1.25933837890625, -1.2106475830078125, -1.161956787109375, -1.1132659912109375, -1.0645751953125, -1.0158843994140625, -0.967193603515625, -0.9185028076171875, -0.86981201171875, -0.8211212158203125, -0.772430419921875, -0.7237396240234375, -0.675048828125, -0.6263580322265625, -0.577667236328125, -0.5289764404296875, -0.48028564453125, -0.4315948486328125, -0.382904052734375, -0.3342132568359375, -0.2855224609375, -0.2368316650390625, -0.188140869140625, -0.1394500732421875, -0.09075927734375, -0.0420684814453125, 0.006622314453125, 0.0553131103515625, 0.10400390625, 0.1526947021484375, 0.201385498046875, 0.2500762939453125, 0.29876708984375, 0.3474578857421875, 0.396148681640625, 0.4448394775390625, 0.4935302734375, 0.5422210693359375, 0.590911865234375, 0.6396026611328125, 0.68829345703125, 0.7369842529296875, 0.785675048828125, 0.8343658447265625, 0.883056640625, 0.9317474365234375, 0.980438232421875, 1.0291290283203125, 1.07781982421875, 1.1265106201171875, 1.175201416015625, 1.2238922119140625, 1.2725830078125, 1.3212738037109375, 1.369964599609375, 1.4186553955078125, 1.46734619140625, 1.5160369873046875, 1.564727783203125, 1.6134185791015625, 1.662109375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 1.0, 4.0, 5.0, 9.0, 9.0, 8.0, 9.0, 19.0, 24.0, 25.0, 23.0, 32.0, 35.0, 59.0, 70.0, 125.0, 249.0, 614.0, 1748.0, 7267.0, 45179.0, 456328.0, 2999825.0, 614261.0, 56342.0, 8637.0, 2004.0, 628.0, 248.0, 141.0, 87.0, 53.0, 53.0, 29.0, 23.0, 19.0, 13.0, 17.0, 15.0, 5.0, 6.0, 11.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.08203125, -5.8892822265625, -5.696533203125, -5.5037841796875, -5.31103515625, -5.1182861328125, -4.925537109375, -4.7327880859375, -4.5400390625, -4.3472900390625, -4.154541015625, -3.9617919921875, -3.76904296875, -3.5762939453125, -3.383544921875, -3.1907958984375, -2.998046875, -2.8052978515625, -2.612548828125, -2.4197998046875, -2.22705078125, -2.0343017578125, -1.841552734375, -1.6488037109375, -1.4560546875, -1.2633056640625, -1.070556640625, -0.8778076171875, -0.68505859375, -0.4923095703125, -0.299560546875, -0.1068115234375, 0.0859375, 0.2786865234375, 0.471435546875, 0.6641845703125, 0.85693359375, 1.0496826171875, 1.242431640625, 1.4351806640625, 1.6279296875, 1.8206787109375, 2.013427734375, 2.2061767578125, 2.39892578125, 2.5916748046875, 2.784423828125, 2.9771728515625, 3.169921875, 3.3626708984375, 3.555419921875, 3.7481689453125, 3.94091796875, 4.1336669921875, 4.326416015625, 4.5191650390625, 4.7119140625, 4.9046630859375, 5.097412109375, 5.2901611328125, 5.48291015625, 5.6756591796875, 5.868408203125, 6.0611572265625, 6.25390625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 10.0, 12.0, 6.0, 10.0, 13.0, 20.0, 31.0, 45.0, 51.0, 65.0, 76.0, 98.0, 131.0, 165.0, 222.0, 287.0, 366.0, 394.0, 434.0, 383.0, 271.0, 246.0, 195.0, 132.0, 105.0, 73.0, 41.0, 49.0, 33.0, 26.0, 16.0, 13.0, 12.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.19140625, -4.0518798828125, -3.912353515625, -3.7728271484375, -3.63330078125, -3.4937744140625, -3.354248046875, -3.2147216796875, -3.0751953125, -2.9356689453125, -2.796142578125, -2.6566162109375, -2.51708984375, -2.3775634765625, -2.238037109375, -2.0985107421875, -1.958984375, -1.8194580078125, -1.679931640625, -1.5404052734375, -1.40087890625, -1.2613525390625, -1.121826171875, -0.9822998046875, -0.8427734375, -0.7032470703125, -0.563720703125, -0.4241943359375, -0.28466796875, -0.1451416015625, -0.005615234375, 0.1339111328125, 0.2734375, 0.4129638671875, 0.552490234375, 0.6920166015625, 0.83154296875, 0.9710693359375, 1.110595703125, 1.2501220703125, 1.3896484375, 1.5291748046875, 1.668701171875, 1.8082275390625, 1.94775390625, 2.0872802734375, 2.226806640625, 2.3663330078125, 2.505859375, 2.6453857421875, 2.784912109375, 2.9244384765625, 3.06396484375, 3.2034912109375, 3.343017578125, 3.4825439453125, 3.6220703125, 3.7615966796875, 3.901123046875, 4.0406494140625, 4.18017578125, 4.3197021484375, 4.459228515625, 4.5987548828125, 4.73828125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 7.0, 6.0, 9.0, 18.0, 17.0, 32.0, 37.0, 57.0, 97.0, 145.0, 183.0, 395.0, 871.0, 2225.0, 8003.0, 43844.0, 374338.0, 2710307.0, 935685.0, 97555.0, 14470.0, 3484.0, 1160.0, 500.0, 279.0, 176.0, 117.0, 66.0, 45.0, 34.0, 29.0, 20.0, 16.0, 13.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.052978515625, -7.76220703125, -7.471435546875, -7.1806640625, -6.889892578125, -6.59912109375, -6.308349609375, -6.017578125, -5.726806640625, -5.43603515625, -5.145263671875, -4.8544921875, -4.563720703125, -4.27294921875, -3.982177734375, -3.69140625, -3.400634765625, -3.10986328125, -2.819091796875, -2.5283203125, -2.237548828125, -1.94677734375, -1.656005859375, -1.365234375, -1.074462890625, -0.78369140625, -0.492919921875, -0.2021484375, 0.088623046875, 0.37939453125, 0.670166015625, 0.9609375, 1.251708984375, 1.54248046875, 1.833251953125, 2.1240234375, 2.414794921875, 2.70556640625, 2.996337890625, 3.287109375, 3.577880859375, 3.86865234375, 4.159423828125, 4.4501953125, 4.740966796875, 5.03173828125, 5.322509765625, 5.61328125, 5.904052734375, 6.19482421875, 6.485595703125, 6.7763671875, 7.067138671875, 7.35791015625, 7.648681640625, 7.939453125, 8.230224609375, 8.52099609375, 8.811767578125, 9.1025390625, 9.393310546875, 9.68408203125, 9.974853515625, 10.265625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 14.0, 20.0, 24.0, 29.0, 49.0, 74.0, 104.0, 109.0, 112.0, 104.0, 109.0, 81.0, 52.0, 37.0, 31.0, 23.0, 18.0, 9.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.6882381439209, -18.952835083007812, -18.21743392944336, -17.482030868530273, -16.746627807617188, -16.011226654052734, -15.275823593139648, -14.540421485900879, -13.80501937866211, -13.06961727142334, -12.33421516418457, -11.598812103271484, -10.863409996032715, -10.128007888793945, -9.39260482788086, -8.65720272064209, -7.92180061340332, -7.186398506164551, -6.450995922088623, -5.715593338012695, -4.980191230773926, -4.244789123535156, -3.5093865394592285, -2.773983955383301, -2.0385818481445312, -1.3031795024871826, -0.567777156829834, 0.16762518882751465, 0.9030275344848633, 1.638429880142212, 2.3738322257995605, 3.1092348098754883, 3.844635009765625, 4.5800371170043945, 5.315439701080322, 6.05084228515625, 6.7862443923950195, 7.521646499633789, 8.257049560546875, 8.992451667785645, 9.727853775024414, 10.463255882263184, 11.198657989501953, 11.934061050415039, 12.669463157653809, 13.404865264892578, 14.140268325805664, 14.875670433044434, 15.611072540283203, 16.34647560119629, 17.081876754760742, 17.817279815673828, 18.55268096923828, 19.288084030151367, 20.023487091064453, 20.758888244628906, 21.494291305541992, 22.229694366455078, 22.96509552001953, 23.700498580932617, 24.435901641845703, 25.171302795410156, 25.906705856323242, 26.642108917236328, 27.37751007080078]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 4.0, 9.0, 6.0, 6.0, 4.0, 7.0, 13.0, 8.0, 10.0, 17.0, 18.0, 15.0, 15.0, 23.0, 25.0, 23.0, 29.0, 28.0, 31.0, 35.0, 33.0, 39.0, 28.0, 42.0, 31.0, 35.0, 40.0, 40.0, 32.0, 26.0, 42.0, 43.0, 26.0, 35.0, 19.0, 28.0, 21.0, 19.0, 13.0, 16.0, 7.0, 18.0, 9.0, 11.0, 7.0, 6.0, 3.0, 5.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.579944610595703, -13.124553680419922, -12.669161796569824, -12.213770866394043, -11.758379936218262, -11.302988052368164, -10.847597122192383, -10.392206192016602, -9.936814308166504, -9.481423377990723, -9.026031494140625, -8.570640563964844, -8.115249633789062, -7.659857749938965, -7.204466819763184, -6.749075412750244, -6.293684482574463, -5.838293075561523, -5.382902145385742, -4.927510738372803, -4.472119331359863, -4.016728401184082, -3.5613369941711426, -3.105945587158203, -2.6505544185638428, -2.1951632499694824, -1.739771842956543, -1.2843806743621826, -0.8289893865585327, -0.3735980987548828, 0.08179306983947754, 0.537184476852417, 0.9925756454467773, 1.4479669332504272, 1.9033582210540771, 2.3587493896484375, 2.814140796661377, 3.2695319652557373, 3.7249231338500977, 4.180314540863037, 4.635705947875977, 5.091097354888916, 5.546488285064697, 6.001879692077637, 6.457271099090576, 6.912662506103516, 7.368053436279297, 7.823444843292236, 8.27883529663086, 8.73422622680664, 9.189618110656738, 9.64500904083252, 10.1003999710083, 10.555791854858398, 11.01118278503418, 11.466573715209961, 11.921965599060059, 12.37735652923584, 12.832748413085938, 13.288139343261719, 13.7435302734375, 14.198922157287598, 14.654313087463379, 15.109704971313477, 15.565095901489258]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 11.0, 1.0, 10.0, 9.0, 7.0, 8.0, 11.0, 14.0, 16.0, 23.0, 18.0, 23.0, 22.0, 23.0, 33.0, 33.0, 34.0, 34.0, 50.0, 41.0, 27.0, 44.0, 45.0, 40.0, 25.0, 32.0, 28.0, 36.0, 37.0, 19.0, 26.0, 25.0, 23.0, 24.0, 18.0, 20.0, 14.0, 17.0, 7.0, 15.0, 9.0, 9.0, 5.0, 9.0, 7.0, 5.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.509765625, -1.463134765625, -1.41650390625, -1.369873046875, -1.3232421875, -1.276611328125, -1.22998046875, -1.183349609375, -1.13671875, -1.090087890625, -1.04345703125, -0.996826171875, -0.9501953125, -0.903564453125, -0.85693359375, -0.810302734375, -0.763671875, -0.717041015625, -0.67041015625, -0.623779296875, -0.5771484375, -0.530517578125, -0.48388671875, -0.437255859375, -0.390625, -0.343994140625, -0.29736328125, -0.250732421875, -0.2041015625, -0.157470703125, -0.11083984375, -0.064208984375, -0.017578125, 0.029052734375, 0.07568359375, 0.122314453125, 0.1689453125, 0.215576171875, 0.26220703125, 0.308837890625, 0.35546875, 0.402099609375, 0.44873046875, 0.495361328125, 0.5419921875, 0.588623046875, 0.63525390625, 0.681884765625, 0.728515625, 0.775146484375, 0.82177734375, 0.868408203125, 0.9150390625, 0.961669921875, 1.00830078125, 1.054931640625, 1.1015625, 1.148193359375, 1.19482421875, 1.241455078125, 1.2880859375, 1.334716796875, 1.38134765625, 1.427978515625, 1.474609375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 5.0, 4.0, 4.0, 9.0, 17.0, 13.0, 21.0, 37.0, 36.0, 58.0, 77.0, 106.0, 163.0, 246.0, 335.0, 486.0, 725.0, 1045.0, 1560.0, 2322.0, 3359.0, 5089.0, 7542.0, 11598.0, 17925.0, 28348.0, 44976.0, 73098.0, 117032.0, 171461.0, 186180.0, 136682.0, 88167.0, 53771.0, 33723.0, 21182.0, 13805.0, 9049.0, 5935.0, 3978.0, 2656.0, 1813.0, 1232.0, 783.0, 579.0, 409.0, 266.0, 200.0, 132.0, 80.0, 68.0, 59.0, 41.0, 25.0, 16.0, 15.0, 3.0, 5.0, 6.0, 4.0, 5.0, 2.0, 2.0], "bins": [-0.159912109375, -0.15478515625, -0.149658203125, -0.14453125, -0.139404296875, -0.13427734375, -0.129150390625, -0.1240234375, -0.118896484375, -0.11376953125, -0.108642578125, -0.103515625, -0.098388671875, -0.09326171875, -0.088134765625, -0.0830078125, -0.077880859375, -0.07275390625, -0.067626953125, -0.0625, -0.057373046875, -0.05224609375, -0.047119140625, -0.0419921875, -0.036865234375, -0.03173828125, -0.026611328125, -0.021484375, -0.016357421875, -0.01123046875, -0.006103515625, -0.0009765625, 0.004150390625, 0.00927734375, 0.014404296875, 0.01953125, 0.024658203125, 0.02978515625, 0.034912109375, 0.0400390625, 0.045166015625, 0.05029296875, 0.055419921875, 0.060546875, 0.065673828125, 0.07080078125, 0.075927734375, 0.0810546875, 0.086181640625, 0.09130859375, 0.096435546875, 0.1015625, 0.106689453125, 0.11181640625, 0.116943359375, 0.1220703125, 0.127197265625, 0.13232421875, 0.137451171875, 0.142578125, 0.147705078125, 0.15283203125, 0.157958984375, 0.1630859375, 0.168212890625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 11.0, 7.0, 7.0, 12.0, 17.0, 21.0, 20.0, 17.0, 22.0, 33.0, 36.0, 35.0, 29.0, 40.0, 46.0, 30.0, 32.0, 42.0, 40.0, 1062.0, 40.0, 39.0, 45.0, 33.0, 33.0, 33.0, 31.0, 30.0, 21.0, 17.0, 20.0, 16.0, 13.0, 16.0, 17.0, 12.0, 9.0, 8.0, 3.0, 1.0, 3.0, 7.0, 4.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.99560546875, -0.9640121459960938, -0.9324188232421875, -0.9008255004882812, -0.869232177734375, -0.8376388549804688, -0.8060455322265625, -0.7744522094726562, -0.74285888671875, -0.7112655639648438, -0.6796722412109375, -0.6480789184570312, -0.616485595703125, -0.5848922729492188, -0.5532989501953125, -0.5217056274414062, -0.4901123046875, -0.45851898193359375, -0.4269256591796875, -0.39533233642578125, -0.363739013671875, -0.33214569091796875, -0.3005523681640625, -0.26895904541015625, -0.23736572265625, -0.20577239990234375, -0.1741790771484375, -0.14258575439453125, -0.110992431640625, -0.07939910888671875, -0.0478057861328125, -0.01621246337890625, 0.015380859375, 0.04697418212890625, 0.0785675048828125, 0.11016082763671875, 0.141754150390625, 0.17334747314453125, 0.2049407958984375, 0.23653411865234375, 0.26812744140625, 0.29972076416015625, 0.3313140869140625, 0.36290740966796875, 0.394500732421875, 0.42609405517578125, 0.4576873779296875, 0.48928070068359375, 0.5208740234375, 0.5524673461914062, 0.5840606689453125, 0.6156539916992188, 0.647247314453125, 0.6788406372070312, 0.7104339599609375, 0.7420272827148438, 0.77362060546875, 0.8052139282226562, 0.8368072509765625, 0.8684005737304688, 0.899993896484375, 0.9315872192382812, 0.9631805419921875, 0.9947738647460938, 1.0263671875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 4.0, 14.0, 17.0, 24.0, 60.0, 76.0, 118.0, 172.0, 255.0, 395.0, 613.0, 932.0, 1466.0, 2232.0, 3379.0, 5308.0, 8297.0, 12762.0, 20416.0, 31888.0, 49070.0, 74900.0, 112699.0, 167548.0, 1206192.0, 135046.0, 92339.0, 60707.0, 39714.0, 25641.0, 16001.0, 10371.0, 6550.0, 4152.0, 2648.0, 1734.0, 1204.0, 762.0, 485.0, 300.0, 232.0, 150.0, 107.0, 49.0, 39.0, 26.0, 11.0, 5.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.11090087890625, -0.10746192932128906, -0.10402297973632812, -0.10058403015136719, -0.09714508056640625, -0.09370613098144531, -0.09026718139648438, -0.08682823181152344, -0.0833892822265625, -0.07995033264160156, -0.07651138305664062, -0.07307243347167969, -0.06963348388671875, -0.06619453430175781, -0.06275558471679688, -0.05931663513183594, -0.055877685546875, -0.05243873596191406, -0.048999786376953125, -0.04556083679199219, -0.04212188720703125, -0.03868293762207031, -0.035243988037109375, -0.03180503845214844, -0.0283660888671875, -0.024927139282226562, -0.021488189697265625, -0.018049240112304688, -0.01461029052734375, -0.011171340942382812, -0.007732391357421875, -0.0042934417724609375, -0.0008544921875, 0.0025844573974609375, 0.006023406982421875, 0.009462356567382812, 0.01290130615234375, 0.016340255737304688, 0.019779205322265625, 0.023218154907226562, 0.0266571044921875, 0.030096054077148438, 0.033535003662109375, 0.03697395324707031, 0.04041290283203125, 0.04385185241699219, 0.047290802001953125, 0.05072975158691406, 0.054168701171875, 0.05760765075683594, 0.061046600341796875, 0.06448554992675781, 0.06792449951171875, 0.07136344909667969, 0.07480239868164062, 0.07824134826660156, 0.0816802978515625, 0.08511924743652344, 0.08855819702148438, 0.09199714660644531, 0.09543609619140625, 0.09887504577636719, 0.10231399536132812, 0.10575294494628906, 0.10919189453125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 0.0, 4.0, 5.0, 7.0, 11.0, 20.0, 37.0, 38.0, 61.0, 81.0, 107.0, 134.0, 132.0, 106.0, 75.0, 57.0, 35.0, 15.0, 14.0, 14.0, 9.0, 8.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003635406494140625, -0.003517657518386841, -0.0033999085426330566, -0.0032821595668792725, -0.0031644105911254883, -0.003046661615371704, -0.00292891263961792, -0.0028111636638641357, -0.0026934146881103516, -0.0025756657123565674, -0.002457916736602783, -0.002340167760848999, -0.002222418785095215, -0.0021046698093414307, -0.0019869208335876465, -0.0018691718578338623, -0.0017514228820800781, -0.001633673906326294, -0.0015159249305725098, -0.0013981759548187256, -0.0012804269790649414, -0.0011626780033111572, -0.001044929027557373, -0.0009271800518035889, -0.0008094310760498047, -0.0006916821002960205, -0.0005739331245422363, -0.00045618414878845215, -0.00033843517303466797, -0.0002206861972808838, -0.00010293722152709961, 1.481175422668457e-05, 0.00013256072998046875, 0.00025030970573425293, 0.0003680586814880371, 0.0004858076572418213, 0.0006035566329956055, 0.0007213056087493896, 0.0008390545845031738, 0.000956803560256958, 0.0010745525360107422, 0.0011923015117645264, 0.0013100504875183105, 0.0014277994632720947, 0.001545548439025879, 0.001663297414779663, 0.0017810463905334473, 0.0018987953662872314, 0.0020165443420410156, 0.0021342933177948, 0.002252042293548584, 0.002369791269302368, 0.0024875402450561523, 0.0026052892208099365, 0.0027230381965637207, 0.002840787172317505, 0.002958536148071289, 0.0030762851238250732, 0.0031940340995788574, 0.0033117830753326416, 0.0034295320510864258, 0.00354728102684021, 0.003665030002593994, 0.0037827789783477783, 0.0039005279541015625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 10.0, 12.0, 26.0, 18.0, 34.0, 22.0, 35.0, 74.0, 152.0, 298.0, 971.0, 198370.0, 846218.0, 1554.0, 318.0, 153.0, 98.0, 49.0, 43.0, 21.0, 17.0, 5.0, 9.0, 11.0, 2.0, 5.0, 3.0, 7.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07318115234375, -0.0709695816040039, -0.06875801086425781, -0.06654644012451172, -0.06433486938476562, -0.06212329864501953, -0.05991172790527344, -0.057700157165527344, -0.05548858642578125, -0.053277015686035156, -0.05106544494628906, -0.04885387420654297, -0.046642303466796875, -0.04443073272705078, -0.04221916198730469, -0.040007591247558594, -0.0377960205078125, -0.035584449768066406, -0.03337287902832031, -0.03116130828857422, -0.028949737548828125, -0.02673816680908203, -0.024526596069335938, -0.022315025329589844, -0.02010345458984375, -0.017891883850097656, -0.015680313110351562, -0.013468742370605469, -0.011257171630859375, -0.009045600891113281, -0.0068340301513671875, -0.004622459411621094, -0.002410888671875, -0.00019931793212890625, 0.0020122528076171875, 0.004223823547363281, 0.006435394287109375, 0.008646965026855469, 0.010858535766601562, 0.013070106506347656, 0.01528167724609375, 0.017493247985839844, 0.019704818725585938, 0.02191638946533203, 0.024127960205078125, 0.02633953094482422, 0.028551101684570312, 0.030762672424316406, 0.0329742431640625, 0.035185813903808594, 0.03739738464355469, 0.03960895538330078, 0.041820526123046875, 0.04403209686279297, 0.04624366760253906, 0.048455238342285156, 0.05066680908203125, 0.052878379821777344, 0.05508995056152344, 0.05730152130126953, 0.059513092041015625, 0.06172466278076172, 0.06393623352050781, 0.0661478042602539, 0.068359375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 11.0, 640.0, 358.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02134220488369465, -0.020367683842778206, -0.019393162801861763, -0.01841864176094532, -0.017444120720028877, -0.016469599679112434, -0.015495077706873417, -0.014520556665956974, -0.013546035625040531, -0.012571514584124088, -0.011596993543207645, -0.010622471570968628, -0.009647950530052185, -0.008673429489135742, -0.007698908448219299, -0.0067243874073028564, -0.005749866366386414, -0.004775345325469971, -0.003800824051722884, -0.0028263027779757977, -0.0018517817370593548, -0.0008772606961429119, 9.726081043481827e-05, 0.0010717818513512611, 0.002046302892267704, 0.003020823933184147, 0.00399534497410059, 0.00496986648067832, 0.005944387521594763, 0.006918908562511206, 0.007893430069088936, 0.008867951110005379, 0.00984247401356697, 0.010816995054483414, 0.011791516095399857, 0.0127660371363163, 0.013740558177232742, 0.014715079218149185, 0.015689600259065628, 0.01666412129998207, 0.017638642340898514, 0.018613163381814957, 0.0195876844227314, 0.020562205463647842, 0.021536726504564285, 0.022511247545480728, 0.02348576858639717, 0.024460289627313614, 0.025434812530875206, 0.02640933357179165, 0.027383854612708092, 0.028358375653624535, 0.029332896694540977, 0.03030741773545742, 0.03128194063901901, 0.032256461679935455, 0.0332309827208519, 0.03420550376176834, 0.035180024802684784, 0.03615454584360123, 0.03712906688451767, 0.03810358792543411, 0.039078108966350555, 0.040052630007267, 0.04102715104818344]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 13.0, 13.0, 16.0, 18.0, 22.0, 26.0, 45.0, 39.0, 44.0, 54.0, 61.0, 58.0, 50.0, 63.0, 60.0, 64.0, 43.0, 55.0, 47.0, 36.0, 42.0, 26.0, 23.0, 20.0, 11.0, 18.0, 10.0, 4.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025127530097961426, -0.0024291574954986572, -0.002345561981201172, -0.0022619664669036865, -0.002178370952606201, -0.002094775438308716, -0.0020111799240112305, -0.0019275844097137451, -0.0018439888954162598, -0.0017603933811187744, -0.001676797866821289, -0.0015932023525238037, -0.0015096068382263184, -0.001426011323928833, -0.0013424158096313477, -0.0012588202953338623, -0.001175224781036377, -0.0010916292667388916, -0.0010080337524414062, -0.0009244382381439209, -0.0008408427238464355, -0.0007572472095489502, -0.0006736516952514648, -0.0005900561809539795, -0.0005064606666564941, -0.0004228651523590088, -0.00033926963806152344, -0.0002556741237640381, -0.00017207860946655273, -8.848309516906738e-05, -4.887580871582031e-06, 7.870793342590332e-05, 0.00016230344772338867, 0.000245898962020874, 0.0003294944763183594, 0.0004130899906158447, 0.0004966855049133301, 0.0005802810192108154, 0.0006638765335083008, 0.0007474720478057861, 0.0008310675621032715, 0.0009146630764007568, 0.0009982585906982422, 0.0010818541049957275, 0.0011654496192932129, 0.0012490451335906982, 0.0013326406478881836, 0.001416236162185669, 0.0014998316764831543, 0.0015834271907806396, 0.001667022705078125, 0.0017506182193756104, 0.0018342137336730957, 0.001917809247970581, 0.0020014047622680664, 0.0020850002765655518, 0.002168595790863037, 0.0022521913051605225, 0.002335786819458008, 0.002419382333755493, 0.0025029778480529785, 0.002586573362350464, 0.0026701688766479492, 0.0027537643909454346, 0.00283735990524292]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 11.0, 1.0, 10.0, 9.0, 7.0, 8.0, 11.0, 14.0, 16.0, 23.0, 18.0, 23.0, 22.0, 23.0, 33.0, 33.0, 34.0, 34.0, 50.0, 41.0, 27.0, 44.0, 45.0, 40.0, 25.0, 32.0, 28.0, 36.0, 37.0, 19.0, 26.0, 25.0, 23.0, 24.0, 18.0, 20.0, 14.0, 17.0, 7.0, 15.0, 9.0, 9.0, 5.0, 9.0, 7.0, 5.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.509765625, -1.463134765625, -1.41650390625, -1.369873046875, -1.3232421875, -1.276611328125, -1.22998046875, -1.183349609375, -1.13671875, -1.090087890625, -1.04345703125, -0.996826171875, -0.9501953125, -0.903564453125, -0.85693359375, -0.810302734375, -0.763671875, -0.717041015625, -0.67041015625, -0.623779296875, -0.5771484375, -0.530517578125, -0.48388671875, -0.437255859375, -0.390625, -0.343994140625, -0.29736328125, -0.250732421875, -0.2041015625, -0.157470703125, -0.11083984375, -0.064208984375, -0.017578125, 0.029052734375, 0.07568359375, 0.122314453125, 0.1689453125, 0.215576171875, 0.26220703125, 0.308837890625, 0.35546875, 0.402099609375, 0.44873046875, 0.495361328125, 0.5419921875, 0.588623046875, 0.63525390625, 0.681884765625, 0.728515625, 0.775146484375, 0.82177734375, 0.868408203125, 0.9150390625, 0.961669921875, 1.00830078125, 1.054931640625, 1.1015625, 1.148193359375, 1.19482421875, 1.241455078125, 1.2880859375, 1.334716796875, 1.38134765625, 1.427978515625, 1.474609375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 6.0, 12.0, 8.0, 10.0, 12.0, 21.0, 34.0, 48.0, 50.0, 72.0, 100.0, 127.0, 226.0, 340.0, 607.0, 1019.0, 1950.0, 3767.0, 8012.0, 17865.0, 43735.0, 133217.0, 383114.0, 299616.0, 94176.0, 33214.0, 13806.0, 6462.0, 3018.0, 1587.0, 818.0, 539.0, 308.0, 182.0, 119.0, 86.0, 69.0, 53.0, 32.0, 34.0, 15.0, 14.0, 16.0, 10.0, 9.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8935546875, -1.8279266357421875, -1.762298583984375, -1.6966705322265625, -1.63104248046875, -1.5654144287109375, -1.499786376953125, -1.4341583251953125, -1.3685302734375, -1.3029022216796875, -1.237274169921875, -1.1716461181640625, -1.10601806640625, -1.0403900146484375, -0.974761962890625, -0.9091339111328125, -0.843505859375, -0.7778778076171875, -0.712249755859375, -0.6466217041015625, -0.58099365234375, -0.5153656005859375, -0.449737548828125, -0.3841094970703125, -0.3184814453125, -0.2528533935546875, -0.187225341796875, -0.1215972900390625, -0.05596923828125, 0.0096588134765625, 0.075286865234375, 0.1409149169921875, 0.20654296875, 0.2721710205078125, 0.337799072265625, 0.4034271240234375, 0.46905517578125, 0.5346832275390625, 0.600311279296875, 0.6659393310546875, 0.7315673828125, 0.7971954345703125, 0.862823486328125, 0.9284515380859375, 0.99407958984375, 1.0597076416015625, 1.125335693359375, 1.1909637451171875, 1.256591796875, 1.3222198486328125, 1.387847900390625, 1.4534759521484375, 1.51910400390625, 1.5847320556640625, 1.650360107421875, 1.7159881591796875, 1.7816162109375, 1.8472442626953125, 1.912872314453125, 1.9785003662109375, 2.04412841796875, 2.1097564697265625, 2.175384521484375, 2.2410125732421875, 2.306640625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 6.0, 11.0, 14.0, 13.0, 18.0, 24.0, 30.0, 23.0, 40.0, 43.0, 44.0, 49.0, 61.0, 99.0, 222.0, 1541.0, 219.0, 100.0, 65.0, 57.0, 60.0, 36.0, 38.0, 39.0, 24.0, 16.0, 20.0, 21.0, 13.0, 14.0, 13.0, 14.0, 5.0, 11.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.42578125, -6.2342529296875, -6.042724609375, -5.8511962890625, -5.65966796875, -5.4681396484375, -5.276611328125, -5.0850830078125, -4.8935546875, -4.7020263671875, -4.510498046875, -4.3189697265625, -4.12744140625, -3.9359130859375, -3.744384765625, -3.5528564453125, -3.361328125, -3.1697998046875, -2.978271484375, -2.7867431640625, -2.59521484375, -2.4036865234375, -2.212158203125, -2.0206298828125, -1.8291015625, -1.6375732421875, -1.446044921875, -1.2545166015625, -1.06298828125, -0.8714599609375, -0.679931640625, -0.4884033203125, -0.296875, -0.1053466796875, 0.086181640625, 0.2777099609375, 0.46923828125, 0.6607666015625, 0.852294921875, 1.0438232421875, 1.2353515625, 1.4268798828125, 1.618408203125, 1.8099365234375, 2.00146484375, 2.1929931640625, 2.384521484375, 2.5760498046875, 2.767578125, 2.9591064453125, 3.150634765625, 3.3421630859375, 3.53369140625, 3.7252197265625, 3.916748046875, 4.1082763671875, 4.2998046875, 4.4913330078125, 4.682861328125, 4.8743896484375, 5.06591796875, 5.2574462890625, 5.448974609375, 5.6405029296875, 5.83203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 10.0, 13.0, 16.0, 23.0, 23.0, 29.0, 28.0, 43.0, 62.0, 65.0, 90.0, 137.0, 238.0, 532.0, 1522.0, 8599.0, 126543.0, 2885167.0, 111647.0, 8127.0, 1449.0, 515.0, 244.0, 142.0, 101.0, 73.0, 45.0, 40.0, 24.0, 25.0, 19.0, 18.0, 14.0, 6.0, 7.0, 7.0, 7.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-8.796875, -8.5174560546875, -8.238037109375, -7.9586181640625, -7.67919921875, -7.3997802734375, -7.120361328125, -6.8409423828125, -6.5615234375, -6.2821044921875, -6.002685546875, -5.7232666015625, -5.44384765625, -5.1644287109375, -4.885009765625, -4.6055908203125, -4.326171875, -4.0467529296875, -3.767333984375, -3.4879150390625, -3.20849609375, -2.9290771484375, -2.649658203125, -2.3702392578125, -2.0908203125, -1.8114013671875, -1.531982421875, -1.2525634765625, -0.97314453125, -0.6937255859375, -0.414306640625, -0.1348876953125, 0.14453125, 0.4239501953125, 0.703369140625, 0.9827880859375, 1.26220703125, 1.5416259765625, 1.821044921875, 2.1004638671875, 2.3798828125, 2.6593017578125, 2.938720703125, 3.2181396484375, 3.49755859375, 3.7769775390625, 4.056396484375, 4.3358154296875, 4.615234375, 4.8946533203125, 5.174072265625, 5.4534912109375, 5.73291015625, 6.0123291015625, 6.291748046875, 6.5711669921875, 6.8505859375, 7.1300048828125, 7.409423828125, 7.6888427734375, 7.96826171875, 8.2476806640625, 8.527099609375, 8.8065185546875, 9.0859375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [6.0, 885.0, 125.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.826216220855713, -3.380767822265625, 1.064680576324463, 5.510129451751709, 9.955577850341797, 14.401025772094727, 18.84647560119629, 23.29192352294922, 27.73737144470215, 32.18281936645508, 36.62826919555664, 41.07371520996094, 45.5191650390625, 49.96461486816406, 54.410064697265625, 58.85551071166992, 63.30095672607422, 67.74640655517578, 72.19185638427734, 76.63729858398438, 81.08274841308594, 85.5281982421875, 89.97364807128906, 94.41909790039062, 98.86454772949219, 103.30999755859375, 107.75544738769531, 112.20089721679688, 116.6463394165039, 121.09178924560547, 125.53723907470703, 129.98268127441406, 134.4281463623047, 138.87359619140625, 143.3190460205078, 147.76449584960938, 152.20994567871094, 156.6553955078125, 161.100830078125, 165.54627990722656, 169.99172973632812, 174.4371795654297, 178.88262939453125, 183.3280792236328, 187.77352905273438, 192.21896362304688, 196.6644287109375, 201.10986328125, 205.55532836914062, 210.0007781982422, 214.44622802734375, 218.8916778564453, 223.33712768554688, 227.78256225585938, 232.22802734375, 236.6734619140625, 241.11891174316406, 245.56436157226562, 250.0098114013672, 254.45526123046875, 258.90069580078125, 263.3461608886719, 267.7915954589844, 272.237060546875, 276.6824951171875]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 1.0, 7.0, 13.0, 12.0, 12.0, 15.0, 15.0, 28.0, 23.0, 26.0, 18.0, 27.0, 25.0, 29.0, 32.0, 44.0, 32.0, 41.0, 36.0, 33.0, 29.0, 38.0, 43.0, 46.0, 41.0, 42.0, 34.0, 40.0, 21.0, 30.0, 24.0, 18.0, 15.0, 16.0, 16.0, 14.0, 13.0, 9.0, 6.0, 12.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.103717803955078, -18.5260066986084, -17.94829750061035, -17.370586395263672, -16.792877197265625, -16.215166091918945, -15.637455940246582, -15.059745788574219, -14.482034683227539, -13.904324531555176, -13.326614379882812, -12.748903274536133, -12.17119312286377, -11.593482971191406, -11.015772819519043, -10.43806266784668, -9.860352516174316, -9.282642364501953, -8.70493221282959, -8.127222061157227, -7.549510955810547, -6.971800804138184, -6.39409065246582, -5.816380023956299, -5.2386698722839355, -4.660959720611572, -4.083249092102051, -3.5055389404296875, -2.927828550338745, -2.3501181602478027, -1.7724080085754395, -1.194697380065918, -0.6169872283935547, -0.03927689790725708, 0.5384334325790405, 1.1161437034606934, 1.6938540935516357, 2.271564483642578, 2.8492746353149414, 3.426985263824463, 4.004695415496826, 4.5824055671691895, 5.160116195678711, 5.737826347351074, 6.3155364990234375, 6.893247127532959, 7.470957279205322, 8.048667907714844, 8.626378059387207, 9.20408821105957, 9.781798362731934, 10.359508514404297, 10.937219619750977, 11.51492977142334, 12.092639923095703, 12.670351028442383, 13.24806022644043, 13.825770378112793, 14.403480529785156, 14.981191635131836, 15.5589017868042, 16.136611938476562, 16.71432113647461, 17.29203224182129, 17.86974334716797]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 4.0, 11.0, 11.0, 9.0, 9.0, 10.0, 22.0, 18.0, 19.0, 20.0, 31.0, 38.0, 39.0, 35.0, 27.0, 39.0, 53.0, 37.0, 43.0, 53.0, 43.0, 29.0, 34.0, 37.0, 32.0, 32.0, 24.0, 28.0, 26.0, 29.0, 21.0, 18.0, 15.0, 14.0, 20.0, 10.0, 4.0, 7.0, 8.0, 12.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6748046875, -1.62152099609375, -1.5682373046875, -1.51495361328125, -1.461669921875, -1.40838623046875, -1.3551025390625, -1.30181884765625, -1.24853515625, -1.19525146484375, -1.1419677734375, -1.08868408203125, -1.035400390625, -0.98211669921875, -0.9288330078125, -0.87554931640625, -0.822265625, -0.76898193359375, -0.7156982421875, -0.66241455078125, -0.609130859375, -0.55584716796875, -0.5025634765625, -0.44927978515625, -0.39599609375, -0.34271240234375, -0.2894287109375, -0.23614501953125, -0.182861328125, -0.12957763671875, -0.0762939453125, -0.02301025390625, 0.0302734375, 0.08355712890625, 0.1368408203125, 0.19012451171875, 0.243408203125, 0.29669189453125, 0.3499755859375, 0.40325927734375, 0.45654296875, 0.50982666015625, 0.5631103515625, 0.61639404296875, 0.669677734375, 0.72296142578125, 0.7762451171875, 0.82952880859375, 0.8828125, 0.93609619140625, 0.9893798828125, 1.04266357421875, 1.095947265625, 1.14923095703125, 1.2025146484375, 1.25579833984375, 1.30908203125, 1.36236572265625, 1.4156494140625, 1.46893310546875, 1.522216796875, 1.57550048828125, 1.6287841796875, 1.68206787109375, 1.7353515625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 11.0, 9.0, 11.0, 22.0, 18.0, 35.0, 31.0, 49.0, 59.0, 96.0, 167.0, 240.0, 499.0, 1134.0, 2633.0, 7033.0, 19853.0, 63388.0, 247680.0, 1133952.0, 1944931.0, 585013.0, 130007.0, 37168.0, 12076.0, 4572.0, 1820.0, 802.0, 339.0, 186.0, 132.0, 76.0, 64.0, 35.0, 23.0, 23.0, 17.0, 11.0, 16.0, 16.0, 9.0, 5.0, 7.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.423828125, -3.314361572265625, -3.20489501953125, -3.095428466796875, -2.9859619140625, -2.876495361328125, -2.76702880859375, -2.657562255859375, -2.548095703125, -2.438629150390625, -2.32916259765625, -2.219696044921875, -2.1102294921875, -2.000762939453125, -1.89129638671875, -1.781829833984375, -1.67236328125, -1.562896728515625, -1.45343017578125, -1.343963623046875, -1.2344970703125, -1.125030517578125, -1.01556396484375, -0.906097412109375, -0.796630859375, -0.687164306640625, -0.57769775390625, -0.468231201171875, -0.3587646484375, -0.249298095703125, -0.13983154296875, -0.030364990234375, 0.0791015625, 0.188568115234375, 0.29803466796875, 0.407501220703125, 0.5169677734375, 0.626434326171875, 0.73590087890625, 0.845367431640625, 0.954833984375, 1.064300537109375, 1.17376708984375, 1.283233642578125, 1.3927001953125, 1.502166748046875, 1.61163330078125, 1.721099853515625, 1.83056640625, 1.940032958984375, 2.04949951171875, 2.158966064453125, 2.2684326171875, 2.377899169921875, 2.48736572265625, 2.596832275390625, 2.706298828125, 2.815765380859375, 2.92523193359375, 3.034698486328125, 3.1441650390625, 3.253631591796875, 3.36309814453125, 3.472564697265625, 3.58203125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 12.0, 18.0, 29.0, 38.0, 45.0, 65.0, 77.0, 141.0, 181.0, 253.0, 324.0, 416.0, 511.0, 470.0, 429.0, 256.0, 200.0, 162.0, 122.0, 79.0, 60.0, 40.0, 36.0, 24.0, 17.0, 11.0, 14.0, 9.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-6.65234375, -6.48492431640625, -6.3175048828125, -6.15008544921875, -5.982666015625, -5.81524658203125, -5.6478271484375, -5.48040771484375, -5.31298828125, -5.14556884765625, -4.9781494140625, -4.81072998046875, -4.643310546875, -4.47589111328125, -4.3084716796875, -4.14105224609375, -3.9736328125, -3.80621337890625, -3.6387939453125, -3.47137451171875, -3.303955078125, -3.13653564453125, -2.9691162109375, -2.80169677734375, -2.63427734375, -2.46685791015625, -2.2994384765625, -2.13201904296875, -1.964599609375, -1.79718017578125, -1.6297607421875, -1.46234130859375, -1.294921875, -1.12750244140625, -0.9600830078125, -0.79266357421875, -0.625244140625, -0.45782470703125, -0.2904052734375, -0.12298583984375, 0.04443359375, 0.21185302734375, 0.3792724609375, 0.54669189453125, 0.714111328125, 0.88153076171875, 1.0489501953125, 1.21636962890625, 1.3837890625, 1.55120849609375, 1.7186279296875, 1.88604736328125, 2.053466796875, 2.22088623046875, 2.3883056640625, 2.55572509765625, 2.72314453125, 2.89056396484375, 3.0579833984375, 3.22540283203125, 3.392822265625, 3.56024169921875, 3.7276611328125, 3.89508056640625, 4.0625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 10.0, 4.0, 8.0, 8.0, 7.0, 25.0, 23.0, 49.0, 64.0, 115.0, 207.0, 395.0, 839.0, 2137.0, 7411.0, 42477.0, 380073.0, 2781556.0, 872970.0, 88034.0, 12460.0, 3186.0, 1033.0, 535.0, 275.0, 146.0, 65.0, 58.0, 37.0, 21.0, 15.0, 12.0, 10.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.6624755859375, -7.364013671875, -7.0655517578125, -6.76708984375, -6.4686279296875, -6.170166015625, -5.8717041015625, -5.5732421875, -5.2747802734375, -4.976318359375, -4.6778564453125, -4.37939453125, -4.0809326171875, -3.782470703125, -3.4840087890625, -3.185546875, -2.8870849609375, -2.588623046875, -2.2901611328125, -1.99169921875, -1.6932373046875, -1.394775390625, -1.0963134765625, -0.7978515625, -0.4993896484375, -0.200927734375, 0.0975341796875, 0.39599609375, 0.6944580078125, 0.992919921875, 1.2913818359375, 1.58984375, 1.8883056640625, 2.186767578125, 2.4852294921875, 2.78369140625, 3.0821533203125, 3.380615234375, 3.6790771484375, 3.9775390625, 4.2760009765625, 4.574462890625, 4.8729248046875, 5.17138671875, 5.4698486328125, 5.768310546875, 6.0667724609375, 6.365234375, 6.6636962890625, 6.962158203125, 7.2606201171875, 7.55908203125, 7.8575439453125, 8.156005859375, 8.4544677734375, 8.7529296875, 9.0513916015625, 9.349853515625, 9.6483154296875, 9.94677734375, 10.2452392578125, 10.543701171875, 10.8421630859375, 11.140625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 15.0, 71.0, 164.0, 242.0, 253.0, 170.0, 58.0, 23.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.94883728027344, -73.07416534423828, -71.19949340820312, -69.3248291015625, -67.45015716552734, -65.57548522949219, -63.70081329345703, -61.82614517211914, -59.95147705078125, -58.076805114746094, -56.2021369934082, -54.32746505737305, -52.452796936035156, -50.578125, -48.703453063964844, -46.82878494262695, -44.9541130065918, -43.07944107055664, -41.20477294921875, -39.330101013183594, -37.4554328918457, -35.58076095581055, -33.706092834472656, -31.8314208984375, -29.956750869750977, -28.082080841064453, -26.20741081237793, -24.332740783691406, -22.45806884765625, -20.58340072631836, -18.708728790283203, -16.83405876159668, -14.959388732910156, -13.084718704223633, -11.21004867553711, -9.33537769317627, -7.460707664489746, -5.586037635803223, -3.711366653442383, -1.8366966247558594, 0.03797340393066406, 1.9126436710357666, 3.787313938140869, 5.661984443664551, 7.536654472351074, 9.411324501037598, 11.285995483398438, 13.160665512084961, 15.035335540771484, 16.910005569458008, 18.78467559814453, 20.659347534179688, 22.534015655517578, 24.408687591552734, 26.283357620239258, 28.15802764892578, 30.032697677612305, 31.907367706298828, 33.782039642333984, 35.656707763671875, 37.53137969970703, 39.40604782104492, 41.28071975708008, 43.15538787841797, 45.030059814453125]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 6.0, 10.0, 11.0, 13.0, 12.0, 17.0, 21.0, 20.0, 22.0, 17.0, 24.0, 26.0, 23.0, 30.0, 32.0, 38.0, 34.0, 35.0, 43.0, 33.0, 39.0, 26.0, 38.0, 48.0, 39.0, 34.0, 34.0, 18.0, 29.0, 20.0, 25.0, 23.0, 20.0, 18.0, 17.0, 16.0, 11.0, 9.0, 7.0, 9.0, 6.0, 9.0, 5.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-15.537351608276367, -15.064696311950684, -14.592041015625, -14.119385719299316, -13.646730422973633, -13.17407512664795, -12.701419830322266, -12.228764533996582, -11.756109237670898, -11.283453941345215, -10.810798645019531, -10.338143348693848, -9.865488052368164, -9.39283275604248, -8.920177459716797, -8.447522163391113, -7.9748663902282715, -7.502211093902588, -7.029555797576904, -6.556900501251221, -6.084245204925537, -5.611589431762695, -5.138934135437012, -4.666278839111328, -4.1936235427856445, -3.720968246459961, -3.2483129501342773, -2.7756576538085938, -2.30300235748291, -1.8303468227386475, -1.3576915264129639, -0.8850362300872803, -0.4123811721801758, 0.0602741539478302, 0.5329294800758362, 1.0055848360061646, 1.4782401323318481, 1.9508955478668213, 2.423550844192505, 2.8962061405181885, 3.368861436843872, 3.8415167331695557, 4.314172267913818, 4.786827564239502, 5.2594828605651855, 5.732138156890869, 6.204793453216553, 6.677448749542236, 7.15010404586792, 7.6227593421936035, 8.095415115356445, 8.568070411682129, 9.040725708007812, 9.513381004333496, 9.98603630065918, 10.458691596984863, 10.931346893310547, 11.40400218963623, 11.876657485961914, 12.349312782287598, 12.821968078613281, 13.294623374938965, 13.767278671264648, 14.239933967590332, 14.712589263916016]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 4.0, 11.0, 11.0, 14.0, 11.0, 13.0, 34.0, 21.0, 30.0, 26.0, 41.0, 42.0, 43.0, 28.0, 43.0, 37.0, 38.0, 36.0, 51.0, 36.0, 39.0, 41.0, 35.0, 33.0, 45.0, 30.0, 17.0, 23.0, 33.0, 17.0, 13.0, 17.0, 18.0, 12.0, 11.0, 6.0, 9.0, 6.0, 2.0, 8.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.755859375, -1.6979217529296875, -1.639984130859375, -1.5820465087890625, -1.52410888671875, -1.4661712646484375, -1.408233642578125, -1.3502960205078125, -1.2923583984375, -1.2344207763671875, -1.176483154296875, -1.1185455322265625, -1.06060791015625, -1.0026702880859375, -0.944732666015625, -0.8867950439453125, -0.828857421875, -0.7709197998046875, -0.712982177734375, -0.6550445556640625, -0.59710693359375, -0.5391693115234375, -0.481231689453125, -0.4232940673828125, -0.3653564453125, -0.3074188232421875, -0.249481201171875, -0.1915435791015625, -0.13360595703125, -0.0756683349609375, -0.017730712890625, 0.0402069091796875, 0.09814453125, 0.1560821533203125, 0.214019775390625, 0.2719573974609375, 0.32989501953125, 0.3878326416015625, 0.445770263671875, 0.5037078857421875, 0.5616455078125, 0.6195831298828125, 0.677520751953125, 0.7354583740234375, 0.79339599609375, 0.8513336181640625, 0.909271240234375, 0.9672088623046875, 1.025146484375, 1.0830841064453125, 1.141021728515625, 1.1989593505859375, 1.25689697265625, 1.3148345947265625, 1.372772216796875, 1.4307098388671875, 1.4886474609375, 1.5465850830078125, 1.604522705078125, 1.6624603271484375, 1.72039794921875, 1.7783355712890625, 1.836273193359375, 1.8942108154296875, 1.9521484375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 16.0, 23.0, 35.0, 58.0, 86.0, 102.0, 164.0, 268.0, 366.0, 553.0, 882.0, 1249.0, 2089.0, 3179.0, 4917.0, 7525.0, 12432.0, 19607.0, 32348.0, 54282.0, 89995.0, 148683.0, 210646.0, 176947.0, 110856.0, 66407.0, 39858.0, 24087.0, 14707.0, 9323.0, 5882.0, 3774.0, 2435.0, 1603.0, 1022.0, 702.0, 449.0, 296.0, 235.0, 159.0, 108.0, 61.0, 43.0, 21.0, 17.0, 13.0, 5.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.2025146484375, -0.19612693786621094, -0.18973922729492188, -0.1833515167236328, -0.17696380615234375, -0.1705760955810547, -0.16418838500976562, -0.15780067443847656, -0.1514129638671875, -0.14502525329589844, -0.13863754272460938, -0.1322498321533203, -0.12586212158203125, -0.11947441101074219, -0.11308670043945312, -0.10669898986816406, -0.100311279296875, -0.09392356872558594, -0.08753585815429688, -0.08114814758300781, -0.07476043701171875, -0.06837272644042969, -0.061985015869140625, -0.05559730529785156, -0.0492095947265625, -0.04282188415527344, -0.036434173583984375, -0.030046463012695312, -0.02365875244140625, -0.017271041870117188, -0.010883331298828125, -0.0044956207275390625, 0.00189208984375, 0.008279800415039062, 0.014667510986328125, 0.021055221557617188, 0.02744293212890625, 0.03383064270019531, 0.040218353271484375, 0.04660606384277344, 0.0529937744140625, 0.05938148498535156, 0.06576919555664062, 0.07215690612792969, 0.07854461669921875, 0.08493232727050781, 0.09132003784179688, 0.09770774841308594, 0.104095458984375, 0.11048316955566406, 0.11687088012695312, 0.12325859069824219, 0.12964630126953125, 0.1360340118408203, 0.14242172241210938, 0.14880943298339844, 0.1551971435546875, 0.16158485412597656, 0.16797256469726562, 0.1743602752685547, 0.18074798583984375, 0.1871356964111328, 0.19352340698242188, 0.19991111755371094, 0.206298828125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 8.0, 14.0, 16.0, 12.0, 11.0, 14.0, 13.0, 20.0, 27.0, 42.0, 30.0, 31.0, 33.0, 31.0, 42.0, 44.0, 53.0, 40.0, 1069.0, 47.0, 36.0, 40.0, 35.0, 38.0, 33.0, 38.0, 27.0, 31.0, 24.0, 15.0, 15.0, 13.0, 17.0, 10.0, 6.0, 12.0, 11.0, 2.0, 6.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.1416168212890625, -1.102569580078125, -1.0635223388671875, -1.02447509765625, -0.9854278564453125, -0.946380615234375, -0.9073333740234375, -0.8682861328125, -0.8292388916015625, -0.790191650390625, -0.7511444091796875, -0.71209716796875, -0.6730499267578125, -0.634002685546875, -0.5949554443359375, -0.555908203125, -0.5168609619140625, -0.477813720703125, -0.4387664794921875, -0.39971923828125, -0.3606719970703125, -0.321624755859375, -0.2825775146484375, -0.2435302734375, -0.2044830322265625, -0.165435791015625, -0.1263885498046875, -0.08734130859375, -0.0482940673828125, -0.009246826171875, 0.0298004150390625, 0.06884765625, 0.1078948974609375, 0.146942138671875, 0.1859893798828125, 0.22503662109375, 0.2640838623046875, 0.303131103515625, 0.3421783447265625, 0.3812255859375, 0.4202728271484375, 0.459320068359375, 0.4983673095703125, 0.53741455078125, 0.5764617919921875, 0.615509033203125, 0.6545562744140625, 0.693603515625, 0.7326507568359375, 0.771697998046875, 0.8107452392578125, 0.84979248046875, 0.8888397216796875, 0.927886962890625, 0.9669342041015625, 1.0059814453125, 1.0450286865234375, 1.084075927734375, 1.1231231689453125, 1.16217041015625, 1.2012176513671875, 1.240264892578125, 1.2793121337890625, 1.318359375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 11.0, 17.0, 28.0, 43.0, 57.0, 83.0, 119.0, 184.0, 272.0, 398.0, 607.0, 920.0, 1265.0, 1869.0, 2821.0, 4241.0, 6363.0, 9747.0, 15049.0, 22926.0, 35009.0, 52963.0, 79526.0, 116782.0, 254557.0, 1109481.0, 125632.0, 86726.0, 58078.0, 38105.0, 25320.0, 16298.0, 10636.0, 6959.0, 4691.0, 3010.0, 2050.0, 1349.0, 924.0, 617.0, 426.0, 312.0, 242.0, 136.0, 95.0, 63.0, 40.0, 24.0, 22.0, 10.0, 5.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.1190185546875, -0.11519241333007812, -0.11136627197265625, -0.10754013061523438, -0.1037139892578125, -0.09988784790039062, -0.09606170654296875, -0.09223556518554688, -0.088409423828125, -0.08458328247070312, -0.08075714111328125, -0.07693099975585938, -0.0731048583984375, -0.06927871704101562, -0.06545257568359375, -0.061626434326171875, -0.05780029296875, -0.053974151611328125, -0.05014801025390625, -0.046321868896484375, -0.0424957275390625, -0.038669586181640625, -0.03484344482421875, -0.031017303466796875, -0.027191162109375, -0.023365020751953125, -0.01953887939453125, -0.015712738037109375, -0.0118865966796875, -0.008060455322265625, -0.00423431396484375, -0.000408172607421875, 0.00341796875, 0.007244110107421875, 0.01107025146484375, 0.014896392822265625, 0.0187225341796875, 0.022548675537109375, 0.02637481689453125, 0.030200958251953125, 0.034027099609375, 0.037853240966796875, 0.04167938232421875, 0.045505523681640625, 0.0493316650390625, 0.053157806396484375, 0.05698394775390625, 0.060810089111328125, 0.06463623046875, 0.06846237182617188, 0.07228851318359375, 0.07611465454101562, 0.0799407958984375, 0.08376693725585938, 0.08759307861328125, 0.09141921997070312, 0.095245361328125, 0.09907150268554688, 0.10289764404296875, 0.10672378540039062, 0.1105499267578125, 0.11437606811523438, 0.11820220947265625, 0.12202835083007812, 0.1258544921875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 3.0, 7.0, 9.0, 6.0, 7.0, 20.0, 14.0, 21.0, 30.0, 30.0, 64.0, 114.0, 184.0, 163.0, 109.0, 48.0, 36.0, 34.0, 25.0, 20.0, 12.0, 12.0, 8.0, 11.0, 3.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0039215087890625, -0.0037575960159301758, -0.0035936832427978516, -0.0034297704696655273, -0.003265857696533203, -0.003101944923400879, -0.0029380321502685547, -0.0027741193771362305, -0.0026102066040039062, -0.002446293830871582, -0.002282381057739258, -0.0021184682846069336, -0.0019545555114746094, -0.0017906427383422852, -0.001626729965209961, -0.0014628171920776367, -0.0012989044189453125, -0.0011349916458129883, -0.0009710788726806641, -0.0008071660995483398, -0.0006432533264160156, -0.0004793405532836914, -0.0003154277801513672, -0.00015151500701904297, 1.239776611328125e-05, 0.00017631053924560547, 0.0003402233123779297, 0.0005041360855102539, 0.0006680488586425781, 0.0008319616317749023, 0.0009958744049072266, 0.0011597871780395508, 0.001323699951171875, 0.0014876127243041992, 0.0016515254974365234, 0.0018154382705688477, 0.001979351043701172, 0.002143263816833496, 0.0023071765899658203, 0.0024710893630981445, 0.0026350021362304688, 0.002798914909362793, 0.002962827682495117, 0.0031267404556274414, 0.0032906532287597656, 0.00345456600189209, 0.003618478775024414, 0.0037823915481567383, 0.0039463043212890625, 0.004110217094421387, 0.004274129867553711, 0.004438042640686035, 0.004601955413818359, 0.004765868186950684, 0.004929780960083008, 0.005093693733215332, 0.005257606506347656, 0.0054215192794799805, 0.005585432052612305, 0.005749344825744629, 0.005913257598876953, 0.006077170372009277, 0.0062410831451416016, 0.006404995918273926, 0.00656890869140625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 7.0, 7.0, 14.0, 17.0, 30.0, 33.0, 53.0, 63.0, 107.0, 128.0, 375.0, 2933.0, 889838.0, 152725.0, 1542.0, 260.0, 133.0, 83.0, 50.0, 36.0, 38.0, 21.0, 15.0, 13.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.1016845703125, -0.0989999771118164, -0.09631538391113281, -0.09363079071044922, -0.09094619750976562, -0.08826160430908203, -0.08557701110839844, -0.08289241790771484, -0.08020782470703125, -0.07752323150634766, -0.07483863830566406, -0.07215404510498047, -0.06946945190429688, -0.06678485870361328, -0.06410026550292969, -0.061415672302246094, -0.0587310791015625, -0.056046485900878906, -0.05336189270019531, -0.05067729949951172, -0.047992706298828125, -0.04530811309814453, -0.04262351989746094, -0.039938926696777344, -0.03725433349609375, -0.034569740295410156, -0.03188514709472656, -0.02920055389404297, -0.026515960693359375, -0.02383136749267578, -0.021146774291992188, -0.018462181091308594, -0.015777587890625, -0.013092994689941406, -0.010408401489257812, -0.007723808288574219, -0.005039215087890625, -0.0023546218872070312, 0.0003299713134765625, 0.0030145645141601562, 0.00569915771484375, 0.008383750915527344, 0.011068344116210938, 0.013752937316894531, 0.016437530517578125, 0.01912212371826172, 0.021806716918945312, 0.024491310119628906, 0.0271759033203125, 0.029860496520996094, 0.03254508972167969, 0.03522968292236328, 0.037914276123046875, 0.04059886932373047, 0.04328346252441406, 0.045968055725097656, 0.04865264892578125, 0.051337242126464844, 0.05402183532714844, 0.05670642852783203, 0.059391021728515625, 0.06207561492919922, 0.06476020812988281, 0.0674448013305664, 0.07012939453125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 16.0, 107.0, 571.0, 253.0, 54.0, 18.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004443892743438482, -0.0038606177549809217, -0.003277342766523361, -0.0026940680108964443, -0.0021107930224388838, -0.0015275180339813232, -0.0009442432783544064, -0.00036096805706620216, 0.00022230669856071472, 0.0008055816288106143, 0.001388856559060514, 0.0019721314311027527, 0.0025554064195603132, 0.0031386814080178738, 0.0037219561636447906, 0.004305231384932995, 0.004888506140559912, 0.005471780896186829, 0.006055056117475033, 0.00663833087310195, 0.007221605628728867, 0.007804880850017071, 0.008388156071305275, 0.008971430361270905, 0.009554705582559109, 0.010137980803847313, 0.010721255093812943, 0.011304530315101147, 0.011887805536389351, 0.01247107982635498, 0.013054355047643185, 0.013637630268931389, 0.014220906421542168, 0.014804181642830372, 0.015387455932796001, 0.015970731154084206, 0.016554005444049835, 0.017137281596660614, 0.017720555886626244, 0.018303830176591873, 0.018887106329202652, 0.01947038061916828, 0.02005365677177906, 0.02063693106174469, 0.02122020535171032, 0.0218034815043211, 0.022386755794286728, 0.022970031946897507, 0.023553304374217987, 0.024136578664183617, 0.024719854816794395, 0.025303129106760025, 0.025886403396725655, 0.026469679549336433, 0.027052953839302063, 0.027636229991912842, 0.02821950428187847, 0.0288027785718441, 0.02938605472445488, 0.02996932901442051, 0.03055260330438614, 0.031135879456996918, 0.0317191556096077, 0.03230242803692818, 0.032885704189538956]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 3.0, 6.0, 8.0, 6.0, 12.0, 13.0, 13.0, 18.0, 20.0, 24.0, 25.0, 37.0, 50.0, 39.0, 32.0, 32.0, 40.0, 36.0, 41.0, 41.0, 32.0, 49.0, 35.0, 43.0, 32.0, 38.0, 32.0, 34.0, 25.0, 26.0, 20.0, 21.0, 20.0, 11.0, 9.0, 11.0, 9.0, 9.0, 3.0, 8.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0018526911735534668, -0.0017955005168914795, -0.0017383098602294922, -0.0016811192035675049, -0.0016239285469055176, -0.0015667378902435303, -0.001509547233581543, -0.0014523565769195557, -0.0013951659202575684, -0.001337975263595581, -0.0012807846069335938, -0.0012235939502716064, -0.0011664032936096191, -0.0011092126369476318, -0.0010520219802856445, -0.0009948313236236572, -0.0009376406669616699, -0.0008804500102996826, -0.0008232593536376953, -0.000766068696975708, -0.0007088780403137207, -0.0006516873836517334, -0.0005944967269897461, -0.0005373060703277588, -0.0004801154136657715, -0.0004229247570037842, -0.0003657341003417969, -0.00030854344367980957, -0.00025135278701782227, -0.00019416213035583496, -0.00013697147369384766, -7.978081703186035e-05, -2.2590160369873047e-05, 3.460049629211426e-05, 9.179115295410156e-05, 0.00014898180961608887, 0.00020617246627807617, 0.0002633631229400635, 0.0003205537796020508, 0.0003777444362640381, 0.0004349350929260254, 0.0004921257495880127, 0.00054931640625, 0.0006065070629119873, 0.0006636977195739746, 0.0007208883762359619, 0.0007780790328979492, 0.0008352696895599365, 0.0008924603462219238, 0.0009496510028839111, 0.0010068416595458984, 0.0010640323162078857, 0.001121222972869873, 0.0011784136295318604, 0.0012356042861938477, 0.001292794942855835, 0.0013499855995178223, 0.0014071762561798096, 0.0014643669128417969, 0.0015215575695037842, 0.0015787482261657715, 0.0016359388828277588, 0.001693129539489746, 0.0017503201961517334, 0.0018075108528137207]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 4.0, 11.0, 11.0, 14.0, 11.0, 13.0, 34.0, 21.0, 30.0, 27.0, 40.0, 42.0, 43.0, 28.0, 43.0, 37.0, 38.0, 36.0, 51.0, 36.0, 39.0, 41.0, 35.0, 33.0, 45.0, 30.0, 17.0, 23.0, 33.0, 17.0, 13.0, 17.0, 18.0, 12.0, 11.0, 6.0, 9.0, 6.0, 2.0, 8.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.755859375, -1.6979217529296875, -1.639984130859375, -1.5820465087890625, -1.52410888671875, -1.4661712646484375, -1.408233642578125, -1.3502960205078125, -1.2923583984375, -1.2344207763671875, -1.176483154296875, -1.1185455322265625, -1.06060791015625, -1.0026702880859375, -0.944732666015625, -0.8867950439453125, -0.828857421875, -0.7709197998046875, -0.712982177734375, -0.6550445556640625, -0.59710693359375, -0.5391693115234375, -0.481231689453125, -0.4232940673828125, -0.3653564453125, -0.3074188232421875, -0.249481201171875, -0.1915435791015625, -0.13360595703125, -0.0756683349609375, -0.017730712890625, 0.0402069091796875, 0.09814453125, 0.1560821533203125, 0.214019775390625, 0.2719573974609375, 0.32989501953125, 0.3878326416015625, 0.445770263671875, 0.5037078857421875, 0.5616455078125, 0.6195831298828125, 0.677520751953125, 0.7354583740234375, 0.79339599609375, 0.8513336181640625, 0.909271240234375, 0.9672088623046875, 1.025146484375, 1.0830841064453125, 1.141021728515625, 1.1989593505859375, 1.25689697265625, 1.3148345947265625, 1.372772216796875, 1.4307098388671875, 1.4886474609375, 1.5465850830078125, 1.604522705078125, 1.6624603271484375, 1.72039794921875, 1.7783355712890625, 1.836273193359375, 1.8942108154296875, 1.9521484375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 10.0, 10.0, 11.0, 24.0, 38.0, 41.0, 65.0, 112.0, 173.0, 313.0, 546.0, 896.0, 1563.0, 2795.0, 5105.0, 9623.0, 18285.0, 35355.0, 67475.0, 126055.0, 207198.0, 233113.0, 156432.0, 86900.0, 45411.0, 23828.0, 12432.0, 6618.0, 3505.0, 1958.0, 1120.0, 591.0, 339.0, 226.0, 136.0, 78.0, 56.0, 26.0, 20.0, 19.0, 18.0, 9.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3154296875, -1.2718658447265625, -1.228302001953125, -1.1847381591796875, -1.14117431640625, -1.0976104736328125, -1.054046630859375, -1.0104827880859375, -0.9669189453125, -0.9233551025390625, -0.879791259765625, -0.8362274169921875, -0.79266357421875, -0.7490997314453125, -0.705535888671875, -0.6619720458984375, -0.618408203125, -0.5748443603515625, -0.531280517578125, -0.4877166748046875, -0.44415283203125, -0.4005889892578125, -0.357025146484375, -0.3134613037109375, -0.2698974609375, -0.2263336181640625, -0.182769775390625, -0.1392059326171875, -0.09564208984375, -0.0520782470703125, -0.008514404296875, 0.0350494384765625, 0.07861328125, 0.1221771240234375, 0.165740966796875, 0.2093048095703125, 0.25286865234375, 0.2964324951171875, 0.339996337890625, 0.3835601806640625, 0.4271240234375, 0.4706878662109375, 0.514251708984375, 0.5578155517578125, 0.60137939453125, 0.6449432373046875, 0.688507080078125, 0.7320709228515625, 0.775634765625, 0.8191986083984375, 0.862762451171875, 0.9063262939453125, 0.94989013671875, 0.9934539794921875, 1.037017822265625, 1.0805816650390625, 1.1241455078125, 1.1677093505859375, 1.211273193359375, 1.2548370361328125, 1.29840087890625, 1.3419647216796875, 1.385528564453125, 1.4290924072265625, 1.47265625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 3.0, 6.0, 10.0, 8.0, 19.0, 16.0, 26.0, 27.0, 27.0, 30.0, 39.0, 49.0, 44.0, 50.0, 92.0, 128.0, 299.0, 1399.0, 223.0, 108.0, 74.0, 55.0, 37.0, 42.0, 24.0, 29.0, 21.0, 29.0, 26.0, 22.0, 7.0, 11.0, 20.0, 15.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.93359375, -6.71893310546875, -6.5042724609375, -6.28961181640625, -6.074951171875, -5.86029052734375, -5.6456298828125, -5.43096923828125, -5.21630859375, -5.00164794921875, -4.7869873046875, -4.57232666015625, -4.357666015625, -4.14300537109375, -3.9283447265625, -3.71368408203125, -3.4990234375, -3.28436279296875, -3.0697021484375, -2.85504150390625, -2.640380859375, -2.42572021484375, -2.2110595703125, -1.99639892578125, -1.78173828125, -1.56707763671875, -1.3524169921875, -1.13775634765625, -0.923095703125, -0.70843505859375, -0.4937744140625, -0.27911376953125, -0.064453125, 0.15020751953125, 0.3648681640625, 0.57952880859375, 0.794189453125, 1.00885009765625, 1.2235107421875, 1.43817138671875, 1.65283203125, 1.86749267578125, 2.0821533203125, 2.29681396484375, 2.511474609375, 2.72613525390625, 2.9407958984375, 3.15545654296875, 3.3701171875, 3.58477783203125, 3.7994384765625, 4.01409912109375, 4.228759765625, 4.44342041015625, 4.6580810546875, 4.87274169921875, 5.08740234375, 5.30206298828125, 5.5167236328125, 5.73138427734375, 5.946044921875, 6.16070556640625, 6.3753662109375, 6.59002685546875, 6.8046875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 4.0, 17.0, 18.0, 32.0, 36.0, 44.0, 95.0, 150.0, 261.0, 696.0, 4027.0, 588031.0, 2543439.0, 7167.0, 898.0, 338.0, 155.0, 87.0, 65.0, 54.0, 21.0, 21.0, 14.0, 9.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.567626953125, -19.01025390625, -18.452880859375, -17.8955078125, -17.338134765625, -16.78076171875, -16.223388671875, -15.666015625, -15.108642578125, -14.55126953125, -13.993896484375, -13.4365234375, -12.879150390625, -12.32177734375, -11.764404296875, -11.20703125, -10.649658203125, -10.09228515625, -9.534912109375, -8.9775390625, -8.420166015625, -7.86279296875, -7.305419921875, -6.748046875, -6.190673828125, -5.63330078125, -5.075927734375, -4.5185546875, -3.961181640625, -3.40380859375, -2.846435546875, -2.2890625, -1.731689453125, -1.17431640625, -0.616943359375, -0.0595703125, 0.497802734375, 1.05517578125, 1.612548828125, 2.169921875, 2.727294921875, 3.28466796875, 3.842041015625, 4.3994140625, 4.956787109375, 5.51416015625, 6.071533203125, 6.62890625, 7.186279296875, 7.74365234375, 8.301025390625, 8.8583984375, 9.415771484375, 9.97314453125, 10.530517578125, 11.087890625, 11.645263671875, 12.20263671875, 12.760009765625, 13.3173828125, 13.874755859375, 14.43212890625, 14.989501953125, 15.546875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 25.0, 99.0, 228.0, 332.0, 221.0, 84.0, 15.0, 4.0], "bins": [-56.3259162902832, -55.37737274169922, -54.42882537841797, -53.48027801513672, -52.531734466552734, -51.58319091796875, -50.6346435546875, -49.68609619140625, -48.737552642822266, -47.78900909423828, -46.84046173095703, -45.89191436767578, -44.9433708190918, -43.99482727050781, -43.04627990722656, -42.09773254394531, -41.14918899536133, -40.200645446777344, -39.252098083496094, -38.303550720214844, -37.35500717163086, -36.406463623046875, -35.457916259765625, -34.509368896484375, -33.56082534790039, -32.612281799316406, -31.663734436035156, -30.71518898010254, -29.766643524169922, -28.818098068237305, -27.869552612304688, -26.92100715637207, -25.972461700439453, -25.023916244506836, -24.07537078857422, -23.1268253326416, -22.178279876708984, -21.229734420776367, -20.28118896484375, -19.332643508911133, -18.384098052978516, -17.4355525970459, -16.48700714111328, -15.538461685180664, -14.589916229248047, -13.64137077331543, -12.692825317382812, -11.744279861450195, -10.795734405517578, -9.847188949584961, -8.898643493652344, -7.950098037719727, -7.001552581787109, -6.053007125854492, -5.104461669921875, -4.155916213989258, -3.2073707580566406, -2.2588253021240234, -1.3102798461914062, -0.36173439025878906, 0.5868110656738281, 1.5353565216064453, 2.4839019775390625, 3.4324474334716797, 4.380992889404297]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 6.0, 15.0, 13.0, 9.0, 9.0, 15.0, 21.0, 16.0, 19.0, 22.0, 27.0, 30.0, 37.0, 40.0, 35.0, 38.0, 43.0, 53.0, 37.0, 36.0, 32.0, 44.0, 33.0, 41.0, 30.0, 21.0, 30.0, 34.0, 34.0, 27.0, 16.0, 19.0, 17.0, 15.0, 13.0, 9.0, 14.0, 4.0, 5.0, 8.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-21.65929412841797, -21.034812927246094, -20.41033363342285, -19.785852432250977, -19.161373138427734, -18.53689193725586, -17.912410736083984, -17.28792953491211, -16.663450241088867, -16.038969039916992, -15.41448974609375, -14.790008544921875, -14.165528297424316, -13.541048049926758, -12.916566848754883, -12.292086601257324, -11.667606353759766, -11.043126106262207, -10.418645858764648, -9.794164657592773, -9.169684410095215, -8.545204162597656, -7.9207234382629395, -7.296242713928223, -6.671762466430664, -6.0472822189331055, -5.422801494598389, -4.798320770263672, -4.173840522766113, -3.5493600368499756, -2.924879550933838, -2.300398826599121, -1.6759204864501953, -1.0514400005340576, -0.4269595146179199, 0.19752097129821777, 0.8220014572143555, 1.4464819431304932, 2.070962429046631, 2.6954431533813477, 3.3199234008789062, 3.944403886795044, 4.568884372711182, 5.193365097045898, 5.817845344543457, 6.442325592041016, 7.066806316375732, 7.691287040710449, 8.315767288208008, 8.940247535705566, 9.564727783203125, 10.189208984375, 10.813689231872559, 11.438169479370117, 12.062650680541992, 12.68713092803955, 13.31161117553711, 13.936091423034668, 14.560571670532227, 15.185052871704102, 15.80953311920166, 16.43401336669922, 17.058494567871094, 17.68297576904297, 18.30745506286621]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 5.0, 7.0, 17.0, 18.0, 14.0, 26.0, 30.0, 23.0, 42.0, 33.0, 36.0, 53.0, 43.0, 29.0, 45.0, 40.0, 41.0, 34.0, 51.0, 46.0, 27.0, 47.0, 36.0, 38.0, 26.0, 21.0, 19.0, 24.0, 26.0, 16.0, 19.0, 9.0, 10.0, 4.0, 11.0, 7.0, 3.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.865234375, -1.800689697265625, -1.73614501953125, -1.671600341796875, -1.6070556640625, -1.542510986328125, -1.47796630859375, -1.413421630859375, -1.348876953125, -1.284332275390625, -1.21978759765625, -1.155242919921875, -1.0906982421875, -1.026153564453125, -0.96160888671875, -0.897064208984375, -0.83251953125, -0.767974853515625, -0.70343017578125, -0.638885498046875, -0.5743408203125, -0.509796142578125, -0.44525146484375, -0.380706787109375, -0.316162109375, -0.251617431640625, -0.18707275390625, -0.122528076171875, -0.0579833984375, 0.006561279296875, 0.07110595703125, 0.135650634765625, 0.2001953125, 0.264739990234375, 0.32928466796875, 0.393829345703125, 0.4583740234375, 0.522918701171875, 0.58746337890625, 0.652008056640625, 0.716552734375, 0.781097412109375, 0.84564208984375, 0.910186767578125, 0.9747314453125, 1.039276123046875, 1.10382080078125, 1.168365478515625, 1.23291015625, 1.297454833984375, 1.36199951171875, 1.426544189453125, 1.4910888671875, 1.555633544921875, 1.62017822265625, 1.684722900390625, 1.749267578125, 1.813812255859375, 1.87835693359375, 1.942901611328125, 2.0074462890625, 2.071990966796875, 2.13653564453125, 2.201080322265625, 2.265625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 5.0, 7.0, 12.0, 7.0, 16.0, 14.0, 20.0, 32.0, 43.0, 61.0, 100.0, 174.0, 271.0, 616.0, 1485.0, 4632.0, 15957.0, 66123.0, 337695.0, 1714791.0, 1660259.0, 308070.0, 61061.0, 15323.0, 4550.0, 1506.0, 609.0, 325.0, 185.0, 89.0, 50.0, 48.0, 30.0, 27.0, 18.0, 18.0, 11.0, 9.0, 8.0, 9.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.20703125, -4.07122802734375, -3.9354248046875, -3.79962158203125, -3.663818359375, -3.52801513671875, -3.3922119140625, -3.25640869140625, -3.12060546875, -2.98480224609375, -2.8489990234375, -2.71319580078125, -2.577392578125, -2.44158935546875, -2.3057861328125, -2.16998291015625, -2.0341796875, -1.89837646484375, -1.7625732421875, -1.62677001953125, -1.490966796875, -1.35516357421875, -1.2193603515625, -1.08355712890625, -0.94775390625, -0.81195068359375, -0.6761474609375, -0.54034423828125, -0.404541015625, -0.26873779296875, -0.1329345703125, 0.00286865234375, 0.138671875, 0.27447509765625, 0.4102783203125, 0.54608154296875, 0.681884765625, 0.81768798828125, 0.9534912109375, 1.08929443359375, 1.22509765625, 1.36090087890625, 1.4967041015625, 1.63250732421875, 1.768310546875, 1.90411376953125, 2.0399169921875, 2.17572021484375, 2.3115234375, 2.44732666015625, 2.5831298828125, 2.71893310546875, 2.854736328125, 2.99053955078125, 3.1263427734375, 3.26214599609375, 3.39794921875, 3.53375244140625, 3.6695556640625, 3.80535888671875, 3.941162109375, 4.07696533203125, 4.2127685546875, 4.34857177734375, 4.484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 8.0, 24.0, 27.0, 59.0, 82.0, 111.0, 164.0, 286.0, 444.0, 616.0, 730.0, 556.0, 368.0, 220.0, 128.0, 96.0, 58.0, 34.0, 23.0, 9.0, 5.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1796875, -9.92034912109375, -9.6610107421875, -9.40167236328125, -9.142333984375, -8.88299560546875, -8.6236572265625, -8.36431884765625, -8.10498046875, -7.84564208984375, -7.5863037109375, -7.32696533203125, -7.067626953125, -6.80828857421875, -6.5489501953125, -6.28961181640625, -6.0302734375, -5.77093505859375, -5.5115966796875, -5.25225830078125, -4.992919921875, -4.73358154296875, -4.4742431640625, -4.21490478515625, -3.95556640625, -3.69622802734375, -3.4368896484375, -3.17755126953125, -2.918212890625, -2.65887451171875, -2.3995361328125, -2.14019775390625, -1.880859375, -1.62152099609375, -1.3621826171875, -1.10284423828125, -0.843505859375, -0.58416748046875, -0.3248291015625, -0.06549072265625, 0.19384765625, 0.45318603515625, 0.7125244140625, 0.97186279296875, 1.231201171875, 1.49053955078125, 1.7498779296875, 2.00921630859375, 2.2685546875, 2.52789306640625, 2.7872314453125, 3.04656982421875, 3.305908203125, 3.56524658203125, 3.8245849609375, 4.08392333984375, 4.34326171875, 4.60260009765625, 4.8619384765625, 5.12127685546875, 5.380615234375, 5.63995361328125, 5.8992919921875, 6.15863037109375, 6.41796875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 12.0, 18.0, 33.0, 33.0, 71.0, 120.0, 237.0, 427.0, 835.0, 1914.0, 6828.0, 48712.0, 653972.0, 3051337.0, 390375.0, 31113.0, 5022.0, 1581.0, 716.0, 391.0, 218.0, 120.0, 73.0, 35.0, 24.0, 19.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.6607666015625, -8.305908203125, -7.9510498046875, -7.59619140625, -7.2413330078125, -6.886474609375, -6.5316162109375, -6.1767578125, -5.8218994140625, -5.467041015625, -5.1121826171875, -4.75732421875, -4.4024658203125, -4.047607421875, -3.6927490234375, -3.337890625, -2.9830322265625, -2.628173828125, -2.2733154296875, -1.91845703125, -1.5635986328125, -1.208740234375, -0.8538818359375, -0.4990234375, -0.1441650390625, 0.210693359375, 0.5655517578125, 0.92041015625, 1.2752685546875, 1.630126953125, 1.9849853515625, 2.33984375, 2.6947021484375, 3.049560546875, 3.4044189453125, 3.75927734375, 4.1141357421875, 4.468994140625, 4.8238525390625, 5.1787109375, 5.5335693359375, 5.888427734375, 6.2432861328125, 6.59814453125, 6.9530029296875, 7.307861328125, 7.6627197265625, 8.017578125, 8.3724365234375, 8.727294921875, 9.0821533203125, 9.43701171875, 9.7918701171875, 10.146728515625, 10.5015869140625, 10.8564453125, 11.2113037109375, 11.566162109375, 11.9210205078125, 12.27587890625, 12.6307373046875, 12.985595703125, 13.3404541015625, 13.6953125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 19.0, 66.0, 135.0, 253.0, 242.0, 161.0, 90.0, 29.0, 9.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.59773254394531, -42.5008659362793, -40.40399932861328, -38.30712890625, -36.210262298583984, -34.11339569091797, -32.01652526855469, -29.919658660888672, -27.822792053222656, -25.72592544555664, -23.629056930541992, -21.532188415527344, -19.435321807861328, -17.338455200195312, -15.241586685180664, -13.144719123840332, -11.0478515625, -8.950984001159668, -6.854116439819336, -4.757248878479004, -2.660381317138672, -0.5635137557983398, 1.5333538055419922, 3.630221366882324, 5.727088928222656, 7.823956489562988, 9.92082405090332, 12.017691612243652, 14.114559173583984, 16.21142578125, 18.30829429626465, 20.405162811279297, 22.502029418945312, 24.598896026611328, 26.695764541625977, 28.792633056640625, 30.88949966430664, 32.986366271972656, 35.08323669433594, 37.18010330200195, 39.27696990966797, 41.373836517333984, 43.470703125, 45.56757354736328, 47.6644401550293, 49.76130676269531, 51.858177185058594, 53.95504379272461, 56.051910400390625, 58.14877700805664, 60.245643615722656, 62.34251403808594, 64.43937683105469, 66.53624725341797, 68.63311767578125, 70.72998046875, 72.82685089111328, 74.92372131347656, 77.02058410644531, 79.1174545288086, 81.21432495117188, 83.31118774414062, 85.4080581665039, 87.50492095947266, 89.60179138183594]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 10.0, 7.0, 11.0, 11.0, 15.0, 12.0, 13.0, 12.0, 17.0, 24.0, 25.0, 32.0, 26.0, 33.0, 34.0, 43.0, 49.0, 46.0, 37.0, 46.0, 36.0, 36.0, 36.0, 36.0, 39.0, 40.0, 34.0, 29.0, 37.0, 26.0, 26.0, 24.0, 18.0, 16.0, 11.0, 9.0, 10.0, 9.0, 5.0, 9.0, 1.0, 0.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.118377685546875, -19.504465103149414, -18.890554428100586, -18.276641845703125, -17.662731170654297, -17.048818588256836, -16.434906005859375, -15.82099437713623, -15.207082748413086, -14.593171119689941, -13.979259490966797, -13.365346908569336, -12.751435279846191, -12.137523651123047, -11.523611068725586, -10.909699440002441, -10.295787811279297, -9.681876182556152, -9.067964553833008, -8.454051971435547, -7.840140342712402, -7.226228713989258, -6.612316608428955, -5.998404502868652, -5.384492874145508, -4.770581245422363, -4.1566691398620605, -3.542757272720337, -2.9288454055786133, -2.3149335384368896, -1.701021671295166, -1.0871095657348633, -0.47319793701171875, 0.14071393013000488, 0.7546257972717285, 1.3685376644134521, 1.9824495315551758, 2.5963613986968994, 3.210273265838623, 3.824185371398926, 4.43809700012207, 5.052008628845215, 5.665920734405518, 6.27983283996582, 6.893744468688965, 7.507656097412109, 8.12156867980957, 8.735480308532715, 9.34939193725586, 9.963303565979004, 10.577215194702148, 11.19112777709961, 11.805039405822754, 12.418951034545898, 13.03286361694336, 13.646775245666504, 14.260686874389648, 14.874598503112793, 15.488510131835938, 16.1024227142334, 16.71633529663086, 17.330245971679688, 17.94415855407715, 18.55807113647461, 19.171981811523438]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 3.0, 9.0, 5.0, 7.0, 8.0, 8.0, 18.0, 13.0, 22.0, 25.0, 28.0, 29.0, 25.0, 36.0, 28.0, 29.0, 37.0, 39.0, 27.0, 34.0, 46.0, 36.0, 36.0, 38.0, 37.0, 36.0, 36.0, 30.0, 27.0, 31.0, 35.0, 26.0, 24.0, 12.0, 19.0, 17.0, 16.0, 12.0, 12.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.6920318603515625, -1.633087158203125, -1.5741424560546875, -1.51519775390625, -1.4562530517578125, -1.397308349609375, -1.3383636474609375, -1.2794189453125, -1.2204742431640625, -1.161529541015625, -1.1025848388671875, -1.04364013671875, -0.9846954345703125, -0.925750732421875, -0.8668060302734375, -0.807861328125, -0.7489166259765625, -0.689971923828125, -0.6310272216796875, -0.57208251953125, -0.5131378173828125, -0.454193115234375, -0.3952484130859375, -0.3363037109375, -0.2773590087890625, -0.218414306640625, -0.1594696044921875, -0.10052490234375, -0.0415802001953125, 0.017364501953125, 0.0763092041015625, 0.13525390625, 0.1941986083984375, 0.253143310546875, 0.3120880126953125, 0.37103271484375, 0.4299774169921875, 0.488922119140625, 0.5478668212890625, 0.6068115234375, 0.6657562255859375, 0.724700927734375, 0.7836456298828125, 0.84259033203125, 0.9015350341796875, 0.960479736328125, 1.0194244384765625, 1.078369140625, 1.1373138427734375, 1.196258544921875, 1.2552032470703125, 1.31414794921875, 1.3730926513671875, 1.432037353515625, 1.4909820556640625, 1.5499267578125, 1.6088714599609375, 1.667816162109375, 1.7267608642578125, 1.78570556640625, 1.8446502685546875, 1.903594970703125, 1.9625396728515625, 2.021484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 25.0, 26.0, 48.0, 72.0, 80.0, 146.0, 197.0, 341.0, 553.0, 828.0, 1247.0, 1908.0, 2873.0, 4402.0, 7093.0, 10736.0, 17465.0, 28265.0, 46717.0, 77269.0, 127927.0, 195102.0, 195737.0, 127887.0, 77386.0, 47114.0, 28679.0, 17401.0, 10984.0, 7062.0, 4461.0, 2968.0, 1954.0, 1243.0, 823.0, 533.0, 325.0, 235.0, 168.0, 95.0, 66.0, 29.0, 18.0, 22.0, 13.0, 3.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.2462158203125, -0.2387561798095703, -0.23129653930664062, -0.22383689880371094, -0.21637725830078125, -0.20891761779785156, -0.20145797729492188, -0.1939983367919922, -0.1865386962890625, -0.1790790557861328, -0.17161941528320312, -0.16415977478027344, -0.15670013427734375, -0.14924049377441406, -0.14178085327148438, -0.1343212127685547, -0.126861572265625, -0.11940193176269531, -0.11194229125976562, -0.10448265075683594, -0.09702301025390625, -0.08956336975097656, -0.08210372924804688, -0.07464408874511719, -0.0671844482421875, -0.05972480773925781, -0.052265167236328125, -0.04480552673339844, -0.03734588623046875, -0.029886245727539062, -0.022426605224609375, -0.014966964721679688, -0.00750732421875, -4.76837158203125e-05, 0.007411956787109375, 0.014871597290039062, 0.02233123779296875, 0.029790878295898438, 0.037250518798828125, 0.04471015930175781, 0.0521697998046875, 0.05962944030761719, 0.06708908081054688, 0.07454872131347656, 0.08200836181640625, 0.08946800231933594, 0.09692764282226562, 0.10438728332519531, 0.111846923828125, 0.11930656433105469, 0.12676620483398438, 0.13422584533691406, 0.14168548583984375, 0.14914512634277344, 0.15660476684570312, 0.1640644073486328, 0.1715240478515625, 0.1789836883544922, 0.18644332885742188, 0.19390296936035156, 0.20136260986328125, 0.20882225036621094, 0.21628189086914062, 0.2237415313720703, 0.231201171875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 9.0, 10.0, 7.0, 12.0, 8.0, 17.0, 13.0, 17.0, 18.0, 17.0, 31.0, 22.0, 31.0, 36.0, 51.0, 43.0, 34.0, 40.0, 47.0, 1070.0, 44.0, 35.0, 45.0, 35.0, 42.0, 30.0, 27.0, 25.0, 31.0, 24.0, 17.0, 20.0, 17.0, 10.0, 11.0, 12.0, 13.0, 11.0, 10.0, 9.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3076171875, -1.2667236328125, -1.225830078125, -1.1849365234375, -1.14404296875, -1.1031494140625, -1.062255859375, -1.0213623046875, -0.98046875, -0.9395751953125, -0.898681640625, -0.8577880859375, -0.81689453125, -0.7760009765625, -0.735107421875, -0.6942138671875, -0.6533203125, -0.6124267578125, -0.571533203125, -0.5306396484375, -0.48974609375, -0.4488525390625, -0.407958984375, -0.3670654296875, -0.326171875, -0.2852783203125, -0.244384765625, -0.2034912109375, -0.16259765625, -0.1217041015625, -0.080810546875, -0.0399169921875, 0.0009765625, 0.0418701171875, 0.082763671875, 0.1236572265625, 0.16455078125, 0.2054443359375, 0.246337890625, 0.2872314453125, 0.328125, 0.3690185546875, 0.409912109375, 0.4508056640625, 0.49169921875, 0.5325927734375, 0.573486328125, 0.6143798828125, 0.6552734375, 0.6961669921875, 0.737060546875, 0.7779541015625, 0.81884765625, 0.8597412109375, 0.900634765625, 0.9415283203125, 0.982421875, 1.0233154296875, 1.064208984375, 1.1051025390625, 1.14599609375, 1.1868896484375, 1.227783203125, 1.2686767578125, 1.3095703125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 5.0, 10.0, 9.0, 17.0, 48.0, 40.0, 64.0, 78.0, 102.0, 132.0, 233.0, 305.0, 403.0, 538.0, 714.0, 1031.0, 1442.0, 1894.0, 2772.0, 3745.0, 5234.0, 7243.0, 10576.0, 14633.0, 20615.0, 28856.0, 40900.0, 57034.0, 78854.0, 107173.0, 332835.0, 977157.0, 111686.0, 83208.0, 59843.0, 42498.0, 30241.0, 21602.0, 15357.0, 10830.0, 7740.0, 5467.0, 3868.0, 2807.0, 1990.0, 1450.0, 1080.0, 763.0, 586.0, 387.0, 307.0, 205.0, 163.0, 104.0, 79.0, 60.0, 43.0, 27.0, 21.0, 24.0, 7.0, 8.0, 4.0], "bins": [-0.11614990234375, -0.11252880096435547, -0.10890769958496094, -0.1052865982055664, -0.10166549682617188, -0.09804439544677734, -0.09442329406738281, -0.09080219268798828, -0.08718109130859375, -0.08355998992919922, -0.07993888854980469, -0.07631778717041016, -0.07269668579101562, -0.0690755844116211, -0.06545448303222656, -0.06183338165283203, -0.0582122802734375, -0.05459117889404297, -0.05097007751464844, -0.047348976135253906, -0.043727874755859375, -0.040106773376464844, -0.03648567199707031, -0.03286457061767578, -0.02924346923828125, -0.02562236785888672, -0.022001266479492188, -0.018380165100097656, -0.014759063720703125, -0.011137962341308594, -0.0075168609619140625, -0.0038957595825195312, -0.000274658203125, 0.0033464431762695312, 0.0069675445556640625, 0.010588645935058594, 0.014209747314453125, 0.017830848693847656, 0.021451950073242188, 0.02507305145263672, 0.02869415283203125, 0.03231525421142578, 0.03593635559082031, 0.039557456970214844, 0.043178558349609375, 0.046799659729003906, 0.05042076110839844, 0.05404186248779297, 0.0576629638671875, 0.06128406524658203, 0.06490516662597656, 0.0685262680053711, 0.07214736938476562, 0.07576847076416016, 0.07938957214355469, 0.08301067352294922, 0.08663177490234375, 0.09025287628173828, 0.09387397766113281, 0.09749507904052734, 0.10111618041992188, 0.1047372817993164, 0.10835838317871094, 0.11197948455810547, 0.1156005859375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 7.0, 11.0, 13.0, 17.0, 26.0, 25.0, 33.0, 45.0, 63.0, 96.0, 110.0, 133.0, 106.0, 75.0, 56.0, 34.0, 28.0, 22.0, 16.0, 16.0, 9.0, 6.0, 5.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0060272216796875, -0.00585561990737915, -0.005684018135070801, -0.005512416362762451, -0.0053408145904541016, -0.005169212818145752, -0.004997611045837402, -0.004826009273529053, -0.004654407501220703, -0.0044828057289123535, -0.004311203956604004, -0.004139602184295654, -0.003968000411987305, -0.003796398639678955, -0.0036247968673706055, -0.003453195095062256, -0.0032815933227539062, -0.0031099915504455566, -0.002938389778137207, -0.0027667880058288574, -0.002595186233520508, -0.002423584461212158, -0.0022519826889038086, -0.002080380916595459, -0.0019087791442871094, -0.0017371773719787598, -0.0015655755996704102, -0.0013939738273620605, -0.001222372055053711, -0.0010507702827453613, -0.0008791685104370117, -0.0007075667381286621, -0.0005359649658203125, -0.0003643631935119629, -0.00019276142120361328, -2.1159648895263672e-05, 0.00015044212341308594, 0.00032204389572143555, 0.0004936456680297852, 0.0006652474403381348, 0.0008368492126464844, 0.001008450984954834, 0.0011800527572631836, 0.0013516545295715332, 0.0015232563018798828, 0.0016948580741882324, 0.001866459846496582, 0.0020380616188049316, 0.0022096633911132812, 0.002381265163421631, 0.0025528669357299805, 0.00272446870803833, 0.0028960704803466797, 0.0030676722526550293, 0.003239274024963379, 0.0034108757972717285, 0.003582477569580078, 0.0037540793418884277, 0.003925681114196777, 0.004097282886505127, 0.0042688846588134766, 0.004440486431121826, 0.004612088203430176, 0.004783689975738525, 0.004955291748046875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 9.0, 4.0, 7.0, 12.0, 19.0, 31.0, 32.0, 52.0, 76.0, 122.0, 182.0, 326.0, 737.0, 39118.0, 999760.0, 6832.0, 496.0, 279.0, 144.0, 95.0, 65.0, 38.0, 29.0, 21.0, 14.0, 14.0, 12.0, 3.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0849609375, -0.08196353912353516, -0.07896614074707031, -0.07596874237060547, -0.07297134399414062, -0.06997394561767578, -0.06697654724121094, -0.0639791488647461, -0.06098175048828125, -0.057984352111816406, -0.05498695373535156, -0.05198955535888672, -0.048992156982421875, -0.04599475860595703, -0.04299736022949219, -0.039999961853027344, -0.0370025634765625, -0.034005165100097656, -0.031007766723632812, -0.02801036834716797, -0.025012969970703125, -0.02201557159423828, -0.019018173217773438, -0.016020774841308594, -0.01302337646484375, -0.010025978088378906, -0.0070285797119140625, -0.004031181335449219, -0.001033782958984375, 0.0019636154174804688, 0.0049610137939453125, 0.007958412170410156, 0.010955810546875, 0.013953208923339844, 0.016950607299804688, 0.01994800567626953, 0.022945404052734375, 0.02594280242919922, 0.028940200805664062, 0.031937599182128906, 0.03493499755859375, 0.037932395935058594, 0.04092979431152344, 0.04392719268798828, 0.046924591064453125, 0.04992198944091797, 0.05291938781738281, 0.055916786193847656, 0.0589141845703125, 0.061911582946777344, 0.06490898132324219, 0.06790637969970703, 0.07090377807617188, 0.07390117645263672, 0.07689857482910156, 0.0798959732055664, 0.08289337158203125, 0.0858907699584961, 0.08888816833496094, 0.09188556671142578, 0.09488296508789062, 0.09788036346435547, 0.10087776184082031, 0.10387516021728516, 0.10687255859375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 62.0, 756.0, 171.0, 23.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03756740316748619, -0.03647802025079727, -0.03538864105939865, -0.03429925814270973, -0.03320987522602081, -0.03212049603462219, -0.031031113117933273, -0.029941730201244354, -0.028852349147200584, -0.027762968093156815, -0.026673585176467896, -0.025584204122424126, -0.024494823068380356, -0.023405440151691437, -0.022316059097647667, -0.021226678043603897, -0.020137295126914978, -0.019047914072871208, -0.01795853115618229, -0.01686915010213852, -0.0157797671854496, -0.01469038613140583, -0.01360100507736206, -0.012511623091995716, -0.011422241106629372, -0.010332859121263027, -0.009243477135896683, -0.008154096081852913, -0.0070647140964865685, -0.005975332111120224, -0.004885950591415167, -0.0037965690717101097, -0.0027071870863437653, -0.0016178053338080645, -0.0005284235812723637, 0.0005609581712633371, 0.001650339923799038, 0.0027397219091653824, 0.0038291034288704395, 0.004918484948575497, 0.006007866933941841, 0.007097248919308186, 0.00818663090467453, 0.0092760119587183, 0.010365393944084644, 0.011454775929450989, 0.012544156983494759, 0.013633538968861103, 0.014722920954227448, 0.015812302008271217, 0.016901684924960136, 0.017991065979003906, 0.019080448895692825, 0.020169829949736595, 0.021259211003780365, 0.022348593920469284, 0.023437974974513054, 0.024527356028556824, 0.025616738945245743, 0.026706119999289513, 0.027795501053333282, 0.0288848839700222, 0.02997426502406597, 0.03106364607810974, 0.03215302899479866]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 8.0, 13.0, 12.0, 19.0, 18.0, 28.0, 14.0, 30.0, 27.0, 30.0, 36.0, 50.0, 53.0, 49.0, 48.0, 44.0, 49.0, 56.0, 49.0, 53.0, 30.0, 47.0, 37.0, 30.0, 36.0, 20.0, 24.0, 21.0, 14.0, 11.0, 10.0, 9.0, 6.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034987926483154297, -0.0033738669008016586, -0.0032489411532878876, -0.0031240154057741165, -0.0029990896582603455, -0.0028741639107465744, -0.0027492381632328033, -0.0026243124157190323, -0.0024993866682052612, -0.00237446092069149, -0.002249535173177719, -0.002124609425663948, -0.001999683678150177, -0.001874757930636406, -0.0017498321831226349, -0.0016249064356088638, -0.0014999806880950928, -0.0013750549405813217, -0.0012501291930675507, -0.0011252034455537796, -0.0010002776980400085, -0.0008753519505262375, -0.0007504262030124664, -0.0006255004554986954, -0.0005005747079849243, -0.00037564896047115326, -0.0002507232129573822, -0.00012579746544361115, -8.717179298400879e-07, 0.00012405402958393097, 0.000248979777097702, 0.0003739055246114731, 0.0004988312721252441, 0.0006237570196390152, 0.0007486827671527863, 0.0008736085146665573, 0.0009985342621803284, 0.0011234600096940994, 0.0012483857572078705, 0.0013733115047216415, 0.0014982372522354126, 0.0016231629997491837, 0.0017480887472629547, 0.0018730144947767258, 0.001997940242290497, 0.002122865989804268, 0.002247791737318039, 0.00237271748483181, 0.002497643232345581, 0.002622568979859352, 0.002747494727373123, 0.0028724204748868942, 0.0029973462224006653, 0.0031222719699144363, 0.0032471977174282074, 0.0033721234649419785, 0.0034970492124557495, 0.0036219749599695206, 0.0037469007074832916, 0.0038718264549970627, 0.003996752202510834, 0.004121677950024605, 0.004246603697538376, 0.004371529445052147, 0.004496455192565918]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 3.0, 9.0, 5.0, 7.0, 8.0, 8.0, 18.0, 13.0, 22.0, 25.0, 28.0, 29.0, 25.0, 36.0, 28.0, 29.0, 37.0, 39.0, 27.0, 34.0, 46.0, 36.0, 36.0, 38.0, 37.0, 36.0, 36.0, 30.0, 27.0, 31.0, 35.0, 26.0, 24.0, 12.0, 19.0, 17.0, 16.0, 12.0, 12.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.6920318603515625, -1.633087158203125, -1.5741424560546875, -1.51519775390625, -1.4562530517578125, -1.397308349609375, -1.3383636474609375, -1.2794189453125, -1.2204742431640625, -1.161529541015625, -1.1025848388671875, -1.04364013671875, -0.9846954345703125, -0.925750732421875, -0.8668060302734375, -0.807861328125, -0.7489166259765625, -0.689971923828125, -0.6310272216796875, -0.57208251953125, -0.5131378173828125, -0.454193115234375, -0.3952484130859375, -0.3363037109375, -0.2773590087890625, -0.218414306640625, -0.1594696044921875, -0.10052490234375, -0.0415802001953125, 0.017364501953125, 0.0763092041015625, 0.13525390625, 0.1941986083984375, 0.253143310546875, 0.3120880126953125, 0.37103271484375, 0.4299774169921875, 0.488922119140625, 0.5478668212890625, 0.6068115234375, 0.6657562255859375, 0.724700927734375, 0.7836456298828125, 0.84259033203125, 0.9015350341796875, 0.960479736328125, 1.0194244384765625, 1.078369140625, 1.1373138427734375, 1.196258544921875, 1.2552032470703125, 1.31414794921875, 1.3730926513671875, 1.432037353515625, 1.4909820556640625, 1.5499267578125, 1.6088714599609375, 1.667816162109375, 1.7267608642578125, 1.78570556640625, 1.8446502685546875, 1.903594970703125, 1.9625396728515625, 2.021484375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 5.0, 3.0, 8.0, 9.0, 22.0, 32.0, 45.0, 56.0, 89.0, 94.0, 175.0, 220.0, 357.0, 559.0, 924.0, 1485.0, 2574.0, 4520.0, 8045.0, 15140.0, 30920.0, 69231.0, 171740.0, 394650.0, 197573.0, 77829.0, 34641.0, 16786.0, 8588.0, 4985.0, 2703.0, 1595.0, 1048.0, 632.0, 435.0, 269.0, 189.0, 109.0, 92.0, 55.0, 31.0, 39.0, 12.0, 8.0, 7.0, 7.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.843048095703125, -2.75836181640625, -2.673675537109375, -2.5889892578125, -2.504302978515625, -2.41961669921875, -2.334930419921875, -2.250244140625, -2.165557861328125, -2.08087158203125, -1.996185302734375, -1.9114990234375, -1.826812744140625, -1.74212646484375, -1.657440185546875, -1.57275390625, -1.488067626953125, -1.40338134765625, -1.318695068359375, -1.2340087890625, -1.149322509765625, -1.06463623046875, -0.979949951171875, -0.895263671875, -0.810577392578125, -0.72589111328125, -0.641204833984375, -0.5565185546875, -0.471832275390625, -0.38714599609375, -0.302459716796875, -0.2177734375, -0.133087158203125, -0.04840087890625, 0.036285400390625, 0.1209716796875, 0.205657958984375, 0.29034423828125, 0.375030517578125, 0.459716796875, 0.544403076171875, 0.62908935546875, 0.713775634765625, 0.7984619140625, 0.883148193359375, 0.96783447265625, 1.052520751953125, 1.13720703125, 1.221893310546875, 1.30657958984375, 1.391265869140625, 1.4759521484375, 1.560638427734375, 1.64532470703125, 1.730010986328125, 1.814697265625, 1.899383544921875, 1.98406982421875, 2.068756103515625, 2.1534423828125, 2.238128662109375, 2.32281494140625, 2.407501220703125, 2.4921875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 2.0, 2.0, 9.0, 12.0, 16.0, 15.0, 18.0, 25.0, 23.0, 39.0, 23.0, 26.0, 37.0, 42.0, 46.0, 45.0, 89.0, 146.0, 305.0, 1411.0, 209.0, 92.0, 58.0, 52.0, 49.0, 37.0, 28.0, 29.0, 27.0, 23.0, 15.0, 17.0, 9.0, 23.0, 9.0, 8.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.56640625, -7.33868408203125, -7.1109619140625, -6.88323974609375, -6.655517578125, -6.42779541015625, -6.2000732421875, -5.97235107421875, -5.74462890625, -5.51690673828125, -5.2891845703125, -5.06146240234375, -4.833740234375, -4.60601806640625, -4.3782958984375, -4.15057373046875, -3.9228515625, -3.69512939453125, -3.4674072265625, -3.23968505859375, -3.011962890625, -2.78424072265625, -2.5565185546875, -2.32879638671875, -2.10107421875, -1.87335205078125, -1.6456298828125, -1.41790771484375, -1.190185546875, -0.96246337890625, -0.7347412109375, -0.50701904296875, -0.279296875, -0.05157470703125, 0.1761474609375, 0.40386962890625, 0.631591796875, 0.85931396484375, 1.0870361328125, 1.31475830078125, 1.54248046875, 1.77020263671875, 1.9979248046875, 2.22564697265625, 2.453369140625, 2.68109130859375, 2.9088134765625, 3.13653564453125, 3.3642578125, 3.59197998046875, 3.8197021484375, 4.04742431640625, 4.275146484375, 4.50286865234375, 4.7305908203125, 4.95831298828125, 5.18603515625, 5.41375732421875, 5.6414794921875, 5.86920166015625, 6.096923828125, 6.32464599609375, 6.5523681640625, 6.78009033203125, 7.0078125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 2.0, 7.0, 9.0, 8.0, 15.0, 18.0, 22.0, 44.0, 54.0, 72.0, 109.0, 195.0, 297.0, 804.0, 4921.0, 173933.0, 2926097.0, 35534.0, 2224.0, 550.0, 259.0, 172.0, 90.0, 55.0, 47.0, 39.0, 20.0, 27.0, 14.0, 16.0, 9.0, 3.0, 12.0, 5.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.918212890625, -16.32080078125, -15.723388671875, -15.1259765625, -14.528564453125, -13.93115234375, -13.333740234375, -12.736328125, -12.138916015625, -11.54150390625, -10.944091796875, -10.3466796875, -9.749267578125, -9.15185546875, -8.554443359375, -7.95703125, -7.359619140625, -6.76220703125, -6.164794921875, -5.5673828125, -4.969970703125, -4.37255859375, -3.775146484375, -3.177734375, -2.580322265625, -1.98291015625, -1.385498046875, -0.7880859375, -0.190673828125, 0.40673828125, 1.004150390625, 1.6015625, 2.198974609375, 2.79638671875, 3.393798828125, 3.9912109375, 4.588623046875, 5.18603515625, 5.783447265625, 6.380859375, 6.978271484375, 7.57568359375, 8.173095703125, 8.7705078125, 9.367919921875, 9.96533203125, 10.562744140625, 11.16015625, 11.757568359375, 12.35498046875, 12.952392578125, 13.5498046875, 14.147216796875, 14.74462890625, 15.342041015625, 15.939453125, 16.536865234375, 17.13427734375, 17.731689453125, 18.3291015625, 18.926513671875, 19.52392578125, 20.121337890625, 20.71875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 247.0, 647.0, 107.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.783203125, -164.63406372070312, -161.48492431640625, -158.33578491210938, -155.18666076660156, -152.0375213623047, -148.8883819580078, -145.73924255371094, -142.59010314941406, -139.4409637451172, -136.2918243408203, -133.1427001953125, -129.99356079101562, -126.84442138671875, -123.69528198242188, -120.546142578125, -117.39701080322266, -114.24787139892578, -111.09873962402344, -107.94960021972656, -104.80046081542969, -101.65132141113281, -98.50218963623047, -95.3530502319336, -92.20391845703125, -89.05477905273438, -85.90564727783203, -82.75650787353516, -79.60736846923828, -76.45823669433594, -73.30909729003906, -70.15995788574219, -67.01081848144531, -63.8616828918457, -60.71254348754883, -57.56340789794922, -54.414268493652344, -51.265132904052734, -48.115997314453125, -44.96685791015625, -41.817718505859375, -38.668582916259766, -35.51944351196289, -32.37030792236328, -29.22117042541504, -26.072032928466797, -22.922897338867188, -19.773759841918945, -16.624622344970703, -13.475484848022461, -10.326348304748535, -7.177211761474609, -4.028074264526367, -0.878936767578125, 2.2701988220214844, 5.419336318969727, 8.568473815917969, 11.717611312866211, 14.866747856140137, 18.015884399414062, 21.165021896362305, 24.314159393310547, 27.463294982910156, 30.6124324798584, 33.76156997680664]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 7.0, 8.0, 6.0, 15.0, 13.0, 16.0, 12.0, 25.0, 22.0, 26.0, 29.0, 24.0, 34.0, 33.0, 41.0, 37.0, 40.0, 27.0, 55.0, 49.0, 47.0, 49.0, 34.0, 50.0, 43.0, 33.0, 31.0, 26.0, 27.0, 16.0, 21.0, 17.0, 16.0, 10.0, 9.0, 4.0, 16.0, 7.0, 7.0, 7.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.582107543945312, -20.904064178466797, -20.22602081298828, -19.547977447509766, -18.86993408203125, -18.191890716552734, -17.51384735107422, -16.835803985595703, -16.157760620117188, -15.479717254638672, -14.801673889160156, -14.12363052368164, -13.445587158203125, -12.76754379272461, -12.089499473571777, -11.411456108093262, -10.73341178894043, -10.055368423461914, -9.377325057983398, -8.699281692504883, -8.021238327026367, -7.343194484710693, -6.6651506423950195, -5.987107276916504, -5.309063911437988, -4.631020545959473, -3.952976942062378, -3.274933338165283, -2.5968899726867676, -1.918846607208252, -1.2408027648925781, -0.5627593994140625, 0.11528396606445312, 0.7933274507522583, 1.4713709354400635, 2.149414539337158, 2.827457904815674, 3.5055012702941895, 4.183545112609863, 4.861588478088379, 5.5396318435668945, 6.21767520904541, 6.895718574523926, 7.5737624168396, 8.251806259155273, 8.929849624633789, 9.607892990112305, 10.28593635559082, 10.963979721069336, 11.642023086547852, 12.320066452026367, 12.998109817504883, 13.676153182983398, 14.354196548461914, 15.032240867614746, 15.710284233093262, 16.388328552246094, 17.06637191772461, 17.744415283203125, 18.42245864868164, 19.100502014160156, 19.778545379638672, 20.456588745117188, 21.134632110595703, 21.81267547607422]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 5.0, 1.0, 10.0, 9.0, 8.0, 12.0, 24.0, 22.0, 26.0, 21.0, 19.0, 21.0, 38.0, 26.0, 40.0, 38.0, 37.0, 34.0, 40.0, 42.0, 45.0, 40.0, 36.0, 39.0, 34.0, 37.0, 32.0, 34.0, 24.0, 24.0, 25.0, 22.0, 19.0, 25.0, 16.0, 14.0, 8.0, 8.0, 11.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.853515625, -1.788909912109375, -1.72430419921875, -1.659698486328125, -1.5950927734375, -1.530487060546875, -1.46588134765625, -1.401275634765625, -1.336669921875, -1.272064208984375, -1.20745849609375, -1.142852783203125, -1.0782470703125, -1.013641357421875, -0.94903564453125, -0.884429931640625, -0.81982421875, -0.755218505859375, -0.69061279296875, -0.626007080078125, -0.5614013671875, -0.496795654296875, -0.43218994140625, -0.367584228515625, -0.302978515625, -0.238372802734375, -0.17376708984375, -0.109161376953125, -0.0445556640625, 0.020050048828125, 0.08465576171875, 0.149261474609375, 0.2138671875, 0.278472900390625, 0.34307861328125, 0.407684326171875, 0.4722900390625, 0.536895751953125, 0.60150146484375, 0.666107177734375, 0.730712890625, 0.795318603515625, 0.85992431640625, 0.924530029296875, 0.9891357421875, 1.053741455078125, 1.11834716796875, 1.182952880859375, 1.24755859375, 1.312164306640625, 1.37677001953125, 1.441375732421875, 1.5059814453125, 1.570587158203125, 1.63519287109375, 1.699798583984375, 1.764404296875, 1.829010009765625, 1.89361572265625, 1.958221435546875, 2.0228271484375, 2.087432861328125, 2.15203857421875, 2.216644287109375, 2.28125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 11.0, 14.0, 28.0, 29.0, 42.0, 71.0, 97.0, 141.0, 224.0, 362.0, 658.0, 1260.0, 2434.0, 5220.0, 11840.0, 28439.0, 72953.0, 204736.0, 588378.0, 1303727.0, 1206256.0, 493497.0, 169017.0, 60951.0, 24044.0, 10178.0, 4545.0, 2203.0, 1200.0, 658.0, 362.0, 247.0, 137.0, 89.0, 66.0, 50.0, 23.0, 23.0, 17.0, 19.0, 3.0, 12.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-3.076171875, -2.988067626953125, -2.89996337890625, -2.811859130859375, -2.7237548828125, -2.635650634765625, -2.54754638671875, -2.459442138671875, -2.371337890625, -2.283233642578125, -2.19512939453125, -2.107025146484375, -2.0189208984375, -1.930816650390625, -1.84271240234375, -1.754608154296875, -1.66650390625, -1.578399658203125, -1.49029541015625, -1.402191162109375, -1.3140869140625, -1.225982666015625, -1.13787841796875, -1.049774169921875, -0.961669921875, -0.873565673828125, -0.78546142578125, -0.697357177734375, -0.6092529296875, -0.521148681640625, -0.43304443359375, -0.344940185546875, -0.2568359375, -0.168731689453125, -0.08062744140625, 0.007476806640625, 0.0955810546875, 0.183685302734375, 0.27178955078125, 0.359893798828125, 0.447998046875, 0.536102294921875, 0.62420654296875, 0.712310791015625, 0.8004150390625, 0.888519287109375, 0.97662353515625, 1.064727783203125, 1.15283203125, 1.240936279296875, 1.32904052734375, 1.417144775390625, 1.5052490234375, 1.593353271484375, 1.68145751953125, 1.769561767578125, 1.857666015625, 1.945770263671875, 2.03387451171875, 2.121978759765625, 2.2100830078125, 2.298187255859375, 2.38629150390625, 2.474395751953125, 2.5625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 8.0, 8.0, 11.0, 19.0, 24.0, 30.0, 51.0, 77.0, 102.0, 135.0, 252.0, 322.0, 436.0, 549.0, 527.0, 477.0, 303.0, 221.0, 176.0, 112.0, 93.0, 38.0, 31.0, 28.0, 17.0, 9.0, 5.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.30792236328125, -8.0767822265625, -7.84564208984375, -7.614501953125, -7.38336181640625, -7.1522216796875, -6.92108154296875, -6.68994140625, -6.45880126953125, -6.2276611328125, -5.99652099609375, -5.765380859375, -5.53424072265625, -5.3031005859375, -5.07196044921875, -4.8408203125, -4.60968017578125, -4.3785400390625, -4.14739990234375, -3.916259765625, -3.68511962890625, -3.4539794921875, -3.22283935546875, -2.99169921875, -2.76055908203125, -2.5294189453125, -2.29827880859375, -2.067138671875, -1.83599853515625, -1.6048583984375, -1.37371826171875, -1.142578125, -0.91143798828125, -0.6802978515625, -0.44915771484375, -0.218017578125, 0.01312255859375, 0.2442626953125, 0.47540283203125, 0.70654296875, 0.93768310546875, 1.1688232421875, 1.39996337890625, 1.631103515625, 1.86224365234375, 2.0933837890625, 2.32452392578125, 2.5556640625, 2.78680419921875, 3.0179443359375, 3.24908447265625, 3.480224609375, 3.71136474609375, 3.9425048828125, 4.17364501953125, 4.40478515625, 4.63592529296875, 4.8670654296875, 5.09820556640625, 5.329345703125, 5.56048583984375, 5.7916259765625, 6.02276611328125, 6.25390625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 4.0, 12.0, 21.0, 19.0, 48.0, 50.0, 78.0, 136.0, 201.0, 373.0, 859.0, 2341.0, 10909.0, 82518.0, 839611.0, 2772324.0, 430522.0, 44655.0, 6477.0, 1669.0, 640.0, 313.0, 173.0, 115.0, 75.0, 34.0, 33.0, 22.0, 16.0, 12.0, 8.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.5234375, -8.2000732421875, -7.876708984375, -7.5533447265625, -7.22998046875, -6.9066162109375, -6.583251953125, -6.2598876953125, -5.9365234375, -5.6131591796875, -5.289794921875, -4.9664306640625, -4.64306640625, -4.3197021484375, -3.996337890625, -3.6729736328125, -3.349609375, -3.0262451171875, -2.702880859375, -2.3795166015625, -2.05615234375, -1.7327880859375, -1.409423828125, -1.0860595703125, -0.7626953125, -0.4393310546875, -0.115966796875, 0.2073974609375, 0.53076171875, 0.8541259765625, 1.177490234375, 1.5008544921875, 1.82421875, 2.1475830078125, 2.470947265625, 2.7943115234375, 3.11767578125, 3.4410400390625, 3.764404296875, 4.0877685546875, 4.4111328125, 4.7344970703125, 5.057861328125, 5.3812255859375, 5.70458984375, 6.0279541015625, 6.351318359375, 6.6746826171875, 6.998046875, 7.3214111328125, 7.644775390625, 7.9681396484375, 8.29150390625, 8.6148681640625, 8.938232421875, 9.2615966796875, 9.5849609375, 9.9083251953125, 10.231689453125, 10.5550537109375, 10.87841796875, 11.2017822265625, 11.525146484375, 11.8485107421875, 12.171875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 10.0, 26.0, 58.0, 139.0, 153.0, 198.0, 187.0, 131.0, 66.0, 25.0, 9.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.074621200561523, -23.458099365234375, -21.84157943725586, -20.22505760192871, -18.608535766601562, -16.992015838623047, -15.375494003295898, -13.758973121643066, -12.142452239990234, -10.525931358337402, -8.90941047668457, -7.292888641357422, -5.67636775970459, -4.059846878051758, -2.4433250427246094, -0.8268041610717773, 0.7897167205810547, 2.406237840652466, 4.022758960723877, 5.639280319213867, 7.255801200866699, 8.872322082519531, 10.48884391784668, 12.105364799499512, 13.721885681152344, 15.338406562805176, 16.954927444458008, 18.571449279785156, 20.187969207763672, 21.80449104309082, 23.42101287841797, 25.037532806396484, 26.654052734375, 28.27057456970215, 29.887094497680664, 31.503616333007812, 33.12013626098633, 34.736656188964844, 36.353179931640625, 37.96969985961914, 39.586219787597656, 41.20273971557617, 42.81926345825195, 44.43578338623047, 46.052303314208984, 47.6688232421875, 49.28534698486328, 50.9018669128418, 52.51839065551758, 54.134910583496094, 55.751434326171875, 57.36795425415039, 58.984474182128906, 60.60099792480469, 62.2175178527832, 63.83403778076172, 65.4505615234375, 67.06708526611328, 68.68360137939453, 70.30012512207031, 71.9166488647461, 73.53316497802734, 75.14968872070312, 76.7662124633789, 78.38272857666016]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 11.0, 14.0, 11.0, 21.0, 13.0, 20.0, 16.0, 17.0, 14.0, 22.0, 27.0, 31.0, 37.0, 44.0, 43.0, 45.0, 37.0, 37.0, 41.0, 45.0, 44.0, 45.0, 39.0, 36.0, 34.0, 30.0, 29.0, 20.0, 19.0, 27.0, 20.0, 14.0, 18.0, 6.0, 10.0, 7.0, 10.0, 7.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-20.340396881103516, -19.748149871826172, -19.155900955200195, -18.56365394592285, -17.971406936645508, -17.37915802001953, -16.786911010742188, -16.194664001464844, -15.602415084838867, -15.010167121887207, -14.417920112609863, -13.825672149658203, -13.233424186706543, -12.641176223754883, -12.048929214477539, -11.456681251525879, -10.864434242248535, -10.272186279296875, -9.679939270019531, -9.087691307067871, -8.495443344116211, -7.903195858001709, -7.310948371887207, -6.718700408935547, -6.126452922821045, -5.534205436706543, -4.941957473754883, -4.349709987640381, -3.7574622631073, -3.1652145385742188, -2.572967052459717, -1.9807190895080566, -1.3884716033935547, -0.7962239384651184, -0.20397627353668213, 0.3882713317871094, 0.9805190563201904, 1.5727667808532715, 2.1650142669677734, 2.7572622299194336, 3.3495097160339355, 3.9417574405670166, 4.534005165100098, 5.1262526512146, 5.718500137329102, 6.310748100280762, 6.902995586395264, 7.495243549346924, 8.087491035461426, 8.679738998413086, 9.27198600769043, 9.86423397064209, 10.45648193359375, 11.048728942871094, 11.640976905822754, 12.233224868774414, 12.825471878051758, 13.417719841003418, 14.009966850280762, 14.602214813232422, 15.194462776184082, 15.786710739135742, 16.378957748413086, 16.971206665039062, 17.563453674316406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 1.0, 9.0, 13.0, 9.0, 4.0, 12.0, 17.0, 17.0, 18.0, 25.0, 27.0, 23.0, 28.0, 28.0, 25.0, 26.0, 37.0, 36.0, 52.0, 37.0, 44.0, 41.0, 35.0, 43.0, 32.0, 39.0, 26.0, 27.0, 31.0, 33.0, 26.0, 19.0, 17.0, 27.0, 16.0, 21.0, 8.0, 16.0, 7.0, 7.0, 8.0, 6.0, 6.0, 4.0, 4.0, 1.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.025390625, -1.960723876953125, -1.89605712890625, -1.831390380859375, -1.7667236328125, -1.702056884765625, -1.63739013671875, -1.572723388671875, -1.508056640625, -1.443389892578125, -1.37872314453125, -1.314056396484375, -1.2493896484375, -1.184722900390625, -1.12005615234375, -1.055389404296875, -0.99072265625, -0.926055908203125, -0.86138916015625, -0.796722412109375, -0.7320556640625, -0.667388916015625, -0.60272216796875, -0.538055419921875, -0.473388671875, -0.408721923828125, -0.34405517578125, -0.279388427734375, -0.2147216796875, -0.150054931640625, -0.08538818359375, -0.020721435546875, 0.0439453125, 0.108612060546875, 0.17327880859375, 0.237945556640625, 0.3026123046875, 0.367279052734375, 0.43194580078125, 0.496612548828125, 0.561279296875, 0.625946044921875, 0.69061279296875, 0.755279541015625, 0.8199462890625, 0.884613037109375, 0.94927978515625, 1.013946533203125, 1.07861328125, 1.143280029296875, 1.20794677734375, 1.272613525390625, 1.3372802734375, 1.401947021484375, 1.46661376953125, 1.531280517578125, 1.595947265625, 1.660614013671875, 1.72528076171875, 1.789947509765625, 1.8546142578125, 1.919281005859375, 1.98394775390625, 2.048614501953125, 2.11328125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 8.0, 13.0, 11.0, 26.0, 42.0, 59.0, 80.0, 127.0, 206.0, 274.0, 421.0, 600.0, 787.0, 1224.0, 1778.0, 2673.0, 3691.0, 5720.0, 8443.0, 12780.0, 19459.0, 30433.0, 47517.0, 76065.0, 119999.0, 181455.0, 186968.0, 125237.0, 79555.0, 50062.0, 31669.0, 20576.0, 13514.0, 8809.0, 5863.0, 3875.0, 2695.0, 1780.0, 1269.0, 885.0, 614.0, 397.0, 298.0, 194.0, 136.0, 112.0, 68.0, 38.0, 22.0, 9.0, 10.0, 5.0, 5.0, 3.0, 4.0, 1.0], "bins": [-0.25341796875, -0.24597549438476562, -0.23853302001953125, -0.23109054565429688, -0.2236480712890625, -0.21620559692382812, -0.20876312255859375, -0.20132064819335938, -0.193878173828125, -0.18643569946289062, -0.17899322509765625, -0.17155075073242188, -0.1641082763671875, -0.15666580200195312, -0.14922332763671875, -0.14178085327148438, -0.13433837890625, -0.12689590454101562, -0.11945343017578125, -0.11201095581054688, -0.1045684814453125, -0.09712600708007812, -0.08968353271484375, -0.08224105834960938, -0.074798583984375, -0.06735610961914062, -0.05991363525390625, -0.052471160888671875, -0.0450286865234375, -0.037586212158203125, -0.03014373779296875, -0.022701263427734375, -0.0152587890625, -0.007816314697265625, -0.00037384033203125, 0.007068634033203125, 0.0145111083984375, 0.021953582763671875, 0.02939605712890625, 0.036838531494140625, 0.044281005859375, 0.051723480224609375, 0.05916595458984375, 0.06660842895507812, 0.0740509033203125, 0.08149337768554688, 0.08893585205078125, 0.09637832641601562, 0.10382080078125, 0.11126327514648438, 0.11870574951171875, 0.12614822387695312, 0.1335906982421875, 0.14103317260742188, 0.14847564697265625, 0.15591812133789062, 0.163360595703125, 0.17080307006835938, 0.17824554443359375, 0.18568801879882812, 0.1931304931640625, 0.20057296752929688, 0.20801544189453125, 0.21545791625976562, 0.222900390625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 12.0, 10.0, 13.0, 14.0, 19.0, 25.0, 19.0, 32.0, 26.0, 25.0, 30.0, 43.0, 42.0, 42.0, 43.0, 46.0, 44.0, 1052.0, 35.0, 42.0, 37.0, 42.0, 41.0, 40.0, 34.0, 28.0, 29.0, 15.0, 22.0, 18.0, 15.0, 14.0, 14.0, 10.0, 9.0, 3.0, 7.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.228515625, -1.1830291748046875, -1.137542724609375, -1.0920562744140625, -1.04656982421875, -1.0010833740234375, -0.955596923828125, -0.9101104736328125, -0.8646240234375, -0.8191375732421875, -0.773651123046875, -0.7281646728515625, -0.68267822265625, -0.6371917724609375, -0.591705322265625, -0.5462188720703125, -0.500732421875, -0.4552459716796875, -0.409759521484375, -0.3642730712890625, -0.31878662109375, -0.2733001708984375, -0.227813720703125, -0.1823272705078125, -0.1368408203125, -0.0913543701171875, -0.045867919921875, -0.0003814697265625, 0.04510498046875, 0.0905914306640625, 0.136077880859375, 0.1815643310546875, 0.22705078125, 0.2725372314453125, 0.318023681640625, 0.3635101318359375, 0.40899658203125, 0.4544830322265625, 0.499969482421875, 0.5454559326171875, 0.5909423828125, 0.6364288330078125, 0.681915283203125, 0.7274017333984375, 0.77288818359375, 0.8183746337890625, 0.863861083984375, 0.9093475341796875, 0.954833984375, 1.0003204345703125, 1.045806884765625, 1.0912933349609375, 1.13677978515625, 1.1822662353515625, 1.227752685546875, 1.2732391357421875, 1.3187255859375, 1.3642120361328125, 1.409698486328125, 1.4551849365234375, 1.50067138671875, 1.5461578369140625, 1.591644287109375, 1.6371307373046875, 1.6826171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 14.0, 6.0, 13.0, 30.0, 40.0, 59.0, 56.0, 113.0, 119.0, 244.0, 325.0, 447.0, 653.0, 943.0, 1396.0, 2031.0, 3062.0, 4546.0, 6931.0, 10534.0, 16378.0, 24891.0, 37873.0, 58389.0, 89631.0, 133324.0, 1168709.0, 205998.0, 113353.0, 75243.0, 48781.0, 31953.0, 20843.0, 13520.0, 8792.0, 5814.0, 3831.0, 2686.0, 1738.0, 1235.0, 768.0, 545.0, 411.0, 277.0, 198.0, 115.0, 91.0, 67.0, 36.0, 31.0, 27.0, 7.0, 10.0, 9.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.156494140625, -0.15157127380371094, -0.14664840698242188, -0.1417255401611328, -0.13680267333984375, -0.1318798065185547, -0.12695693969726562, -0.12203407287597656, -0.1171112060546875, -0.11218833923339844, -0.10726547241210938, -0.10234260559082031, -0.09741973876953125, -0.09249687194824219, -0.08757400512695312, -0.08265113830566406, -0.077728271484375, -0.07280540466308594, -0.06788253784179688, -0.06295967102050781, -0.05803680419921875, -0.05311393737792969, -0.048191070556640625, -0.04326820373535156, -0.0383453369140625, -0.03342247009277344, -0.028499603271484375, -0.023576736450195312, -0.01865386962890625, -0.013731002807617188, -0.008808135986328125, -0.0038852691650390625, 0.00103759765625, 0.0059604644775390625, 0.010883331298828125, 0.015806198120117188, 0.02072906494140625, 0.025651931762695312, 0.030574798583984375, 0.03549766540527344, 0.0404205322265625, 0.04534339904785156, 0.050266265869140625, 0.05518913269042969, 0.06011199951171875, 0.06503486633300781, 0.06995773315429688, 0.07488059997558594, 0.079803466796875, 0.08472633361816406, 0.08964920043945312, 0.09457206726074219, 0.09949493408203125, 0.10441780090332031, 0.10934066772460938, 0.11426353454589844, 0.1191864013671875, 0.12410926818847656, 0.12903213500976562, 0.1339550018310547, 0.13887786865234375, 0.1438007354736328, 0.14872360229492188, 0.15364646911621094, 0.1585693359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 8.0, 12.0, 8.0, 18.0, 18.0, 14.0, 15.0, 26.0, 24.0, 18.0, 31.0, 48.0, 36.0, 50.0, 84.0, 103.0, 107.0, 73.0, 41.0, 33.0, 32.0, 29.0, 20.0, 23.0, 23.0, 15.0, 17.0, 7.0, 10.0, 5.0, 5.0, 7.0, 8.0, 6.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044097900390625, -0.004250943660736084, -0.004092097282409668, -0.003933250904083252, -0.003774404525756836, -0.00361555814743042, -0.003456711769104004, -0.003297865390777588, -0.003139019012451172, -0.002980172634124756, -0.00282132625579834, -0.002662479877471924, -0.002503633499145508, -0.002344787120819092, -0.0021859407424926758, -0.0020270943641662598, -0.0018682479858398438, -0.0017094016075134277, -0.0015505552291870117, -0.0013917088508605957, -0.0012328624725341797, -0.0010740160942077637, -0.0009151697158813477, -0.0007563233375549316, -0.0005974769592285156, -0.0004386305809020996, -0.0002797842025756836, -0.00012093782424926758, 3.790855407714844e-05, 0.00019675493240356445, 0.00035560131072998047, 0.0005144476890563965, 0.0006732940673828125, 0.0008321404457092285, 0.0009909868240356445, 0.0011498332023620605, 0.0013086795806884766, 0.0014675259590148926, 0.0016263723373413086, 0.0017852187156677246, 0.0019440650939941406, 0.0021029114723205566, 0.0022617578506469727, 0.0024206042289733887, 0.0025794506072998047, 0.0027382969856262207, 0.0028971433639526367, 0.0030559897422790527, 0.0032148361206054688, 0.0033736824989318848, 0.0035325288772583008, 0.003691375255584717, 0.003850221633911133, 0.004009068012237549, 0.004167914390563965, 0.004326760768890381, 0.004485607147216797, 0.004644453525543213, 0.004803299903869629, 0.004962146282196045, 0.005120992660522461, 0.005279839038848877, 0.005438685417175293, 0.005597531795501709, 0.005756378173828125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 5.0, 9.0, 8.0, 9.0, 16.0, 25.0, 34.0, 46.0, 58.0, 78.0, 118.0, 136.0, 191.0, 287.0, 455.0, 1917.0, 91047.0, 938670.0, 13356.0, 842.0, 358.0, 214.0, 153.0, 122.0, 98.0, 56.0, 51.0, 51.0, 28.0, 28.0, 28.0, 11.0, 9.0, 10.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0859375, -0.08335590362548828, -0.08077430725097656, -0.07819271087646484, -0.07561111450195312, -0.0730295181274414, -0.07044792175292969, -0.06786632537841797, -0.06528472900390625, -0.06270313262939453, -0.06012153625488281, -0.057539939880371094, -0.054958343505859375, -0.052376747131347656, -0.04979515075683594, -0.04721355438232422, -0.0446319580078125, -0.04205036163330078, -0.03946876525878906, -0.036887168884277344, -0.034305572509765625, -0.031723976135253906, -0.029142379760742188, -0.02656078338623047, -0.02397918701171875, -0.02139759063720703, -0.018815994262695312, -0.016234397888183594, -0.013652801513671875, -0.011071205139160156, -0.008489608764648438, -0.005908012390136719, -0.003326416015625, -0.0007448196411132812, 0.0018367767333984375, 0.004418373107910156, 0.006999969482421875, 0.009581565856933594, 0.012163162231445312, 0.014744758605957031, 0.01732635498046875, 0.01990795135498047, 0.022489547729492188, 0.025071144104003906, 0.027652740478515625, 0.030234336853027344, 0.03281593322753906, 0.03539752960205078, 0.0379791259765625, 0.04056072235107422, 0.04314231872558594, 0.045723915100097656, 0.048305511474609375, 0.050887107849121094, 0.05346870422363281, 0.05605030059814453, 0.05863189697265625, 0.06121349334716797, 0.06379508972167969, 0.0663766860961914, 0.06895828247070312, 0.07153987884521484, 0.07412147521972656, 0.07670307159423828, 0.07928466796875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 24.0, 662.0, 287.0, 36.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020383179187774658, -0.019163617864251137, -0.017944056540727615, -0.016724495217204094, -0.015504933893680573, -0.014285372570157051, -0.013065812177956104, -0.011846250854432583, -0.010626689530909061, -0.00940712820738554, -0.008187566883862019, -0.0069680060259997845, -0.005748444702476263, -0.004528883378952742, -0.0033093225210905075, -0.002089761197566986, -0.0008701998740434647, 0.00034936133306473494, 0.0015689225401729345, 0.0027884836308658123, 0.004008044954389334, 0.005227606277912855, 0.006447167135775089, 0.007666728459298611, 0.008886289782822132, 0.010105851106345654, 0.011325412429869175, 0.012544972822070122, 0.013764534145593643, 0.014984095469117165, 0.016203656792640686, 0.017423218116164207, 0.01864277943968773, 0.01986234076321125, 0.02108190208673477, 0.022301463410258293, 0.023521024733781815, 0.024740586057305336, 0.025960147380828857, 0.02717970684170723, 0.0283992700278759, 0.02961883135139942, 0.030838392674922943, 0.032057952135801315, 0.033277515321969986, 0.03449707478284836, 0.03571663796901703, 0.0369361974298954, 0.03815575689077377, 0.039375316351652145, 0.040594879537820816, 0.04181443899869919, 0.04303400218486786, 0.04425356164574623, 0.0454731248319149, 0.046692684292793274, 0.047912247478961945, 0.04913180693984032, 0.05035137012600899, 0.05157092958688736, 0.05279049277305603, 0.0540100522339344, 0.05522961542010307, 0.056449174880981445, 0.057668738067150116]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 6.0, 4.0, 10.0, 8.0, 16.0, 13.0, 25.0, 17.0, 25.0, 37.0, 34.0, 39.0, 39.0, 34.0, 43.0, 45.0, 49.0, 52.0, 56.0, 50.0, 41.0, 45.0, 39.0, 41.0, 44.0, 29.0, 32.0, 28.0, 22.0, 16.0, 18.0, 8.0, 10.0, 7.0, 4.0, 7.0, 4.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005774140357971191, -0.005610007792711258, -0.0054458752274513245, -0.005281742662191391, -0.0051176100969314575, -0.004953477531671524, -0.004789344966411591, -0.004625212401151657, -0.004461079835891724, -0.00429694727063179, -0.004132814705371857, -0.003968682140111923, -0.0038045495748519897, -0.0036404170095920563, -0.003476284444332123, -0.0033121518790721893, -0.003148019313812256, -0.0029838867485523224, -0.002819754183292389, -0.0026556216180324554, -0.002491489052772522, -0.0023273564875125885, -0.002163223922252655, -0.0019990913569927216, -0.001834958791732788, -0.0016708262264728546, -0.0015066936612129211, -0.0013425610959529877, -0.0011784285306930542, -0.0010142959654331207, -0.0008501634001731873, -0.0006860308349132538, -0.0005218982696533203, -0.00035776570439338684, -0.00019363313913345337, -2.9500573873519897e-05, 0.00013463199138641357, 0.00029876455664634705, 0.0004628971219062805, 0.000627029687166214, 0.0007911622524261475, 0.0009552948176860809, 0.0011194273829460144, 0.0012835599482059479, 0.0014476925134658813, 0.0016118250787258148, 0.0017759576439857483, 0.0019400902092456818, 0.0021042227745056152, 0.0022683553397655487, 0.002432487905025482, 0.0025966204702854156, 0.002760753035545349, 0.0029248856008052826, 0.003089018166065216, 0.0032531507313251495, 0.003417283296585083, 0.0035814158618450165, 0.00374554842710495, 0.003909680992364883, 0.004073813557624817, 0.00423794612288475, 0.004402078688144684, 0.004566211253404617, 0.004730343818664551]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 2.0, 5.0, 1.0, 9.0, 13.0, 9.0, 4.0, 12.0, 17.0, 17.0, 18.0, 25.0, 27.0, 23.0, 28.0, 28.0, 25.0, 26.0, 37.0, 36.0, 52.0, 37.0, 44.0, 41.0, 34.0, 44.0, 32.0, 39.0, 26.0, 27.0, 31.0, 33.0, 26.0, 19.0, 17.0, 27.0, 16.0, 21.0, 8.0, 16.0, 7.0, 7.0, 8.0, 6.0, 6.0, 4.0, 4.0, 1.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.025390625, -1.960723876953125, -1.89605712890625, -1.831390380859375, -1.7667236328125, -1.702056884765625, -1.63739013671875, -1.572723388671875, -1.508056640625, -1.443389892578125, -1.37872314453125, -1.314056396484375, -1.2493896484375, -1.184722900390625, -1.12005615234375, -1.055389404296875, -0.99072265625, -0.926055908203125, -0.86138916015625, -0.796722412109375, -0.7320556640625, -0.667388916015625, -0.60272216796875, -0.538055419921875, -0.473388671875, -0.408721923828125, -0.34405517578125, -0.279388427734375, -0.2147216796875, -0.150054931640625, -0.08538818359375, -0.020721435546875, 0.0439453125, 0.108612060546875, 0.17327880859375, 0.237945556640625, 0.3026123046875, 0.367279052734375, 0.43194580078125, 0.496612548828125, 0.561279296875, 0.625946044921875, 0.69061279296875, 0.755279541015625, 0.8199462890625, 0.884613037109375, 0.94927978515625, 1.013946533203125, 1.07861328125, 1.143280029296875, 1.20794677734375, 1.272613525390625, 1.3372802734375, 1.401947021484375, 1.46661376953125, 1.531280517578125, 1.595947265625, 1.660614013671875, 1.72528076171875, 1.789947509765625, 1.8546142578125, 1.919281005859375, 1.98394775390625, 2.048614501953125, 2.11328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 13.0, 11.0, 17.0, 24.0, 28.0, 55.0, 39.0, 100.0, 106.0, 139.0, 267.0, 337.0, 526.0, 836.0, 1148.0, 1843.0, 2712.0, 4386.0, 7064.0, 11898.0, 20890.0, 41017.0, 92905.0, 217514.0, 321987.0, 171622.0, 72752.0, 33163.0, 17601.0, 10160.0, 6164.0, 3878.0, 2446.0, 1601.0, 1063.0, 681.0, 477.0, 314.0, 237.0, 154.0, 114.0, 83.0, 48.0, 44.0, 28.0, 19.0, 13.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.1640625, -2.0927734375, -2.021484375, -1.9501953125, -1.87890625, -1.8076171875, -1.736328125, -1.6650390625, -1.59375, -1.5224609375, -1.451171875, -1.3798828125, -1.30859375, -1.2373046875, -1.166015625, -1.0947265625, -1.0234375, -0.9521484375, -0.880859375, -0.8095703125, -0.73828125, -0.6669921875, -0.595703125, -0.5244140625, -0.453125, -0.3818359375, -0.310546875, -0.2392578125, -0.16796875, -0.0966796875, -0.025390625, 0.0458984375, 0.1171875, 0.1884765625, 0.259765625, 0.3310546875, 0.40234375, 0.4736328125, 0.544921875, 0.6162109375, 0.6875, 0.7587890625, 0.830078125, 0.9013671875, 0.97265625, 1.0439453125, 1.115234375, 1.1865234375, 1.2578125, 1.3291015625, 1.400390625, 1.4716796875, 1.54296875, 1.6142578125, 1.685546875, 1.7568359375, 1.828125, 1.8994140625, 1.970703125, 2.0419921875, 2.11328125, 2.1845703125, 2.255859375, 2.3271484375, 2.3984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 5.0, 2.0, 7.0, 13.0, 12.0, 16.0, 17.0, 14.0, 25.0, 25.0, 26.0, 40.0, 43.0, 50.0, 67.0, 113.0, 135.0, 1392.0, 364.0, 165.0, 108.0, 64.0, 51.0, 53.0, 41.0, 34.0, 35.0, 19.0, 28.0, 16.0, 23.0, 8.0, 8.0, 6.0, 5.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3675537109375, -8.078857421875, -7.7901611328125, -7.50146484375, -7.2127685546875, -6.924072265625, -6.6353759765625, -6.3466796875, -6.0579833984375, -5.769287109375, -5.4805908203125, -5.19189453125, -4.9031982421875, -4.614501953125, -4.3258056640625, -4.037109375, -3.7484130859375, -3.459716796875, -3.1710205078125, -2.88232421875, -2.5936279296875, -2.304931640625, -2.0162353515625, -1.7275390625, -1.4388427734375, -1.150146484375, -0.8614501953125, -0.57275390625, -0.2840576171875, 0.004638671875, 0.2933349609375, 0.58203125, 0.8707275390625, 1.159423828125, 1.4481201171875, 1.73681640625, 2.0255126953125, 2.314208984375, 2.6029052734375, 2.8916015625, 3.1802978515625, 3.468994140625, 3.7576904296875, 4.04638671875, 4.3350830078125, 4.623779296875, 4.9124755859375, 5.201171875, 5.4898681640625, 5.778564453125, 6.0672607421875, 6.35595703125, 6.6446533203125, 6.933349609375, 7.2220458984375, 7.5107421875, 7.7994384765625, 8.088134765625, 8.3768310546875, 8.66552734375, 8.9542236328125, 9.242919921875, 9.5316162109375, 9.8203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 7.0, 14.0, 18.0, 27.0, 41.0, 68.0, 91.0, 181.0, 331.0, 843.0, 10002.0, 3077145.0, 54640.0, 1393.0, 378.0, 213.0, 114.0, 56.0, 42.0, 27.0, 16.0, 12.0, 12.0, 9.0, 10.0, 2.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.25, -32.232177734375, -31.21435546875, -30.196533203125, -29.1787109375, -28.160888671875, -27.14306640625, -26.125244140625, -25.107421875, -24.089599609375, -23.07177734375, -22.053955078125, -21.0361328125, -20.018310546875, -19.00048828125, -17.982666015625, -16.96484375, -15.947021484375, -14.92919921875, -13.911376953125, -12.8935546875, -11.875732421875, -10.85791015625, -9.840087890625, -8.822265625, -7.804443359375, -6.78662109375, -5.768798828125, -4.7509765625, -3.733154296875, -2.71533203125, -1.697509765625, -0.6796875, 0.338134765625, 1.35595703125, 2.373779296875, 3.3916015625, 4.409423828125, 5.42724609375, 6.445068359375, 7.462890625, 8.480712890625, 9.49853515625, 10.516357421875, 11.5341796875, 12.552001953125, 13.56982421875, 14.587646484375, 15.60546875, 16.623291015625, 17.64111328125, 18.658935546875, 19.6767578125, 20.694580078125, 21.71240234375, 22.730224609375, 23.748046875, 24.765869140625, 25.78369140625, 26.801513671875, 27.8193359375, 28.837158203125, 29.85498046875, 30.872802734375, 31.890625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 335.0, 659.0, 20.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.099002838134766, -49.07429122924805, -45.049583435058594, -41.024871826171875, -37.000160217285156, -32.9754524230957, -28.950740814208984, -24.9260311126709, -20.901321411132812, -16.876611709594727, -12.851901054382324, -8.827190399169922, -4.802480697631836, -0.77777099609375, 3.2469406127929688, 7.271650314331055, 11.29636001586914, 15.321069717407227, 19.345779418945312, 23.37049102783203, 27.395200729370117, 31.419910430908203, 35.44462203979492, 39.469329833984375, 43.494041442871094, 47.51875305175781, 51.543460845947266, 55.568172454833984, 59.59288024902344, 63.617591857910156, 67.64230346679688, 71.6670150756836, 75.69171142578125, 79.71642303466797, 83.74113464355469, 87.76583862304688, 91.7905502319336, 95.81526184082031, 99.83997344970703, 103.86468505859375, 107.88938903808594, 111.91410064697266, 115.93881225585938, 119.96351623535156, 123.98822784423828, 128.012939453125, 132.03765869140625, 136.06236267089844, 140.08706665039062, 144.1117706298828, 148.13648986816406, 152.16119384765625, 156.1859130859375, 160.2106170654297, 164.23532104492188, 168.26004028320312, 172.28475952148438, 176.30946350097656, 180.3341827392578, 184.35888671875, 188.38360595703125, 192.40830993652344, 196.43301391601562, 200.45773315429688, 204.48243713378906]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 9.0, 13.0, 18.0, 14.0, 15.0, 29.0, 18.0, 27.0, 29.0, 37.0, 40.0, 53.0, 27.0, 38.0, 44.0, 51.0, 36.0, 40.0, 47.0, 37.0, 53.0, 40.0, 50.0, 33.0, 33.0, 18.0, 23.0, 24.0, 15.0, 19.0, 11.0, 7.0, 5.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.452285766601562, -18.810428619384766, -18.16857147216797, -17.526714324951172, -16.884857177734375, -16.24300193786621, -15.601144790649414, -14.959287643432617, -14.31743049621582, -13.675573348999023, -13.033716201782227, -12.391860008239746, -11.75000286102295, -11.108145713806152, -10.466289520263672, -9.824432373046875, -9.182575225830078, -8.540718078613281, -7.898861408233643, -7.257004737854004, -6.615147590637207, -5.97329044342041, -5.3314337730407715, -4.689577102661133, -4.047719955444336, -3.405863046646118, -2.7640061378479004, -2.1221492290496826, -1.4802923202514648, -0.8384354114532471, -0.1965785026550293, 0.4452781677246094, 1.0871353149414062, 1.728992223739624, 2.370849132537842, 3.0127060413360596, 3.6545629501342773, 4.296420097351074, 4.938276767730713, 5.580133438110352, 6.221990585327148, 6.863847732543945, 7.505704402923584, 8.147561073303223, 8.78941822052002, 9.431275367736816, 10.073131561279297, 10.714988708496094, 11.35684585571289, 11.998703002929688, 12.640560150146484, 13.282416343688965, 13.924273490905762, 14.566130638122559, 15.207986831665039, 15.849843978881836, 16.491701126098633, 17.13355827331543, 17.775415420532227, 18.417272567749023, 19.059127807617188, 19.700984954833984, 20.34284210205078, 20.984699249267578, 21.626556396484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 3.0, 3.0, 0.0, 5.0, 5.0, 8.0, 11.0, 7.0, 12.0, 13.0, 9.0, 15.0, 19.0, 17.0, 17.0, 24.0, 27.0, 27.0, 32.0, 22.0, 42.0, 34.0, 32.0, 32.0, 39.0, 39.0, 34.0, 38.0, 46.0, 39.0, 32.0, 20.0, 31.0, 32.0, 30.0, 22.0, 20.0, 26.0, 11.0, 22.0, 14.0, 14.0, 9.0, 14.0, 15.0, 7.0, 9.0, 5.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.927734375, -1.86212158203125, -1.7965087890625, -1.73089599609375, -1.665283203125, -1.59967041015625, -1.5340576171875, -1.46844482421875, -1.40283203125, -1.33721923828125, -1.2716064453125, -1.20599365234375, -1.140380859375, -1.07476806640625, -1.0091552734375, -0.94354248046875, -0.8779296875, -0.81231689453125, -0.7467041015625, -0.68109130859375, -0.615478515625, -0.54986572265625, -0.4842529296875, -0.41864013671875, -0.35302734375, -0.28741455078125, -0.2218017578125, -0.15618896484375, -0.090576171875, -0.02496337890625, 0.0406494140625, 0.10626220703125, 0.171875, 0.23748779296875, 0.3031005859375, 0.36871337890625, 0.434326171875, 0.49993896484375, 0.5655517578125, 0.63116455078125, 0.69677734375, 0.76239013671875, 0.8280029296875, 0.89361572265625, 0.959228515625, 1.02484130859375, 1.0904541015625, 1.15606689453125, 1.2216796875, 1.28729248046875, 1.3529052734375, 1.41851806640625, 1.484130859375, 1.54974365234375, 1.6153564453125, 1.68096923828125, 1.74658203125, 1.81219482421875, 1.8778076171875, 1.94342041015625, 2.009033203125, 2.07464599609375, 2.1402587890625, 2.20587158203125, 2.271484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 5.0, 9.0, 9.0, 8.0, 14.0, 22.0, 18.0, 26.0, 23.0, 40.0, 44.0, 37.0, 48.0, 44.0, 60.0, 95.0, 115.0, 197.0, 438.0, 1568.0, 10289.0, 126272.0, 2137958.0, 1807124.0, 98354.0, 8725.0, 1500.0, 455.0, 206.0, 107.0, 83.0, 51.0, 46.0, 48.0, 31.0, 40.0, 34.0, 24.0, 19.0, 19.0, 15.0, 15.0, 13.0, 11.0, 4.0, 6.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.7265625, -8.4534912109375, -8.180419921875, -7.9073486328125, -7.63427734375, -7.3612060546875, -7.088134765625, -6.8150634765625, -6.5419921875, -6.2689208984375, -5.995849609375, -5.7227783203125, -5.44970703125, -5.1766357421875, -4.903564453125, -4.6304931640625, -4.357421875, -4.0843505859375, -3.811279296875, -3.5382080078125, -3.26513671875, -2.9920654296875, -2.718994140625, -2.4459228515625, -2.1728515625, -1.8997802734375, -1.626708984375, -1.3536376953125, -1.08056640625, -0.8074951171875, -0.534423828125, -0.2613525390625, 0.01171875, 0.2847900390625, 0.557861328125, 0.8309326171875, 1.10400390625, 1.3770751953125, 1.650146484375, 1.9232177734375, 2.1962890625, 2.4693603515625, 2.742431640625, 3.0155029296875, 3.28857421875, 3.5616455078125, 3.834716796875, 4.1077880859375, 4.380859375, 4.6539306640625, 4.927001953125, 5.2000732421875, 5.47314453125, 5.7462158203125, 6.019287109375, 6.2923583984375, 6.5654296875, 6.8385009765625, 7.111572265625, 7.3846435546875, 7.65771484375, 7.9307861328125, 8.203857421875, 8.4769287109375, 8.75]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 6.0, 5.0, 8.0, 16.0, 14.0, 19.0, 31.0, 47.0, 75.0, 132.0, 213.0, 344.0, 461.0, 665.0, 630.0, 505.0, 311.0, 201.0, 151.0, 77.0, 55.0, 40.0, 24.0, 10.0, 18.0, 9.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9375, -11.65325927734375, -11.3690185546875, -11.08477783203125, -10.800537109375, -10.51629638671875, -10.2320556640625, -9.94781494140625, -9.66357421875, -9.37933349609375, -9.0950927734375, -8.81085205078125, -8.526611328125, -8.24237060546875, -7.9581298828125, -7.67388916015625, -7.3896484375, -7.10540771484375, -6.8211669921875, -6.53692626953125, -6.252685546875, -5.96844482421875, -5.6842041015625, -5.39996337890625, -5.11572265625, -4.83148193359375, -4.5472412109375, -4.26300048828125, -3.978759765625, -3.69451904296875, -3.4102783203125, -3.12603759765625, -2.841796875, -2.55755615234375, -2.2733154296875, -1.98907470703125, -1.704833984375, -1.42059326171875, -1.1363525390625, -0.85211181640625, -0.56787109375, -0.28363037109375, 0.0006103515625, 0.28485107421875, 0.569091796875, 0.85333251953125, 1.1375732421875, 1.42181396484375, 1.7060546875, 1.99029541015625, 2.2745361328125, 2.55877685546875, 2.843017578125, 3.12725830078125, 3.4114990234375, 3.69573974609375, 3.97998046875, 4.26422119140625, 4.5484619140625, 4.83270263671875, 5.116943359375, 5.40118408203125, 5.6854248046875, 5.96966552734375, 6.25390625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 11.0, 6.0, 17.0, 28.0, 46.0, 75.0, 121.0, 223.0, 427.0, 1187.0, 13949.0, 2252129.0, 1911957.0, 12090.0, 1156.0, 381.0, 207.0, 105.0, 65.0, 30.0, 23.0, 15.0, 10.0, 8.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.214111328125, -14.41259765625, -13.611083984375, -12.8095703125, -12.008056640625, -11.20654296875, -10.405029296875, -9.603515625, -8.802001953125, -8.00048828125, -7.198974609375, -6.3974609375, -5.595947265625, -4.79443359375, -3.992919921875, -3.19140625, -2.389892578125, -1.58837890625, -0.786865234375, 0.0146484375, 0.816162109375, 1.61767578125, 2.419189453125, 3.220703125, 4.022216796875, 4.82373046875, 5.625244140625, 6.4267578125, 7.228271484375, 8.02978515625, 8.831298828125, 9.6328125, 10.434326171875, 11.23583984375, 12.037353515625, 12.8388671875, 13.640380859375, 14.44189453125, 15.243408203125, 16.044921875, 16.846435546875, 17.64794921875, 18.449462890625, 19.2509765625, 20.052490234375, 20.85400390625, 21.655517578125, 22.45703125, 23.258544921875, 24.06005859375, 24.861572265625, 25.6630859375, 26.464599609375, 27.26611328125, 28.067626953125, 28.869140625, 29.670654296875, 30.47216796875, 31.273681640625, 32.0751953125, 32.876708984375, 33.67822265625, 34.479736328125, 35.28125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 12.0, 13.0, 37.0, 29.0, 62.0, 79.0, 76.0, 111.0, 112.0, 117.0, 97.0, 88.0, 61.0, 38.0, 29.0, 21.0, 12.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.321203231811523, -12.275741577148438, -11.230279922485352, -10.184818267822266, -9.13935661315918, -8.093894958496094, -7.048433303833008, -6.002971649169922, -4.957509994506836, -3.91204833984375, -2.866586685180664, -1.8211250305175781, -0.7756633758544922, 0.26979827880859375, 1.3152599334716797, 2.3607215881347656, 3.4061832427978516, 4.4516448974609375, 5.497106552124023, 6.542568206787109, 7.588029861450195, 8.633491516113281, 9.678953170776367, 10.724414825439453, 11.769876480102539, 12.815338134765625, 13.860799789428711, 14.906261444091797, 15.951723098754883, 16.99718475341797, 18.042646408081055, 19.08810806274414, 20.133567810058594, 21.17902946472168, 22.224491119384766, 23.26995277404785, 24.315414428710938, 25.360876083374023, 26.40633773803711, 27.451799392700195, 28.49726104736328, 29.542722702026367, 30.588184356689453, 31.63364601135254, 32.679107666015625, 33.724571228027344, 34.7700309753418, 35.81549072265625, 36.86095428466797, 37.90641784667969, 38.95187759399414, 39.997337341308594, 41.04280090332031, 42.08826446533203, 43.133724212646484, 44.17918395996094, 45.224647521972656, 46.270111083984375, 47.31557083129883, 48.36103057861328, 49.406494140625, 50.45195770263672, 51.49741744995117, 52.542877197265625, 53.588340759277344]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 4.0, 7.0, 10.0, 20.0, 16.0, 21.0, 14.0, 24.0, 24.0, 23.0, 36.0, 27.0, 35.0, 33.0, 45.0, 40.0, 41.0, 46.0, 44.0, 37.0, 47.0, 38.0, 40.0, 44.0, 40.0, 16.0, 27.0, 24.0, 28.0, 28.0, 18.0, 12.0, 12.0, 20.0, 8.0, 12.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.31110382080078, -20.648548126220703, -19.985992431640625, -19.32343864440918, -18.6608829498291, -17.998327255249023, -17.335773468017578, -16.6732177734375, -16.010662078857422, -15.348106384277344, -14.685551643371582, -14.02299690246582, -13.360441207885742, -12.697885513305664, -12.035330772399902, -11.37277603149414, -10.710220336914062, -10.047664642333984, -9.385109901428223, -8.722555160522461, -8.059999465942383, -7.397444248199463, -6.734889030456543, -6.072333812713623, -5.409778594970703, -4.747223377227783, -4.084668159484863, -3.4221129417419434, -2.7595577239990234, -2.0970025062561035, -1.4344472885131836, -0.7718920707702637, -0.10933685302734375, 0.5532183647155762, 1.215773582458496, 1.878328800201416, 2.540884017944336, 3.203439235687256, 3.865994453430176, 4.528549671173096, 5.191104888916016, 5.8536601066589355, 6.5162153244018555, 7.178770542144775, 7.841325759887695, 8.503881454467773, 9.166436195373535, 9.828990936279297, 10.491546630859375, 11.154102325439453, 11.816657066345215, 12.479211807250977, 13.141767501831055, 13.804323196411133, 14.466877937316895, 15.129432678222656, 15.791988372802734, 16.454544067382812, 17.11709976196289, 17.779653549194336, 18.442209243774414, 19.104764938354492, 19.767318725585938, 20.429874420166016, 21.092430114746094]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 6.0, 6.0, 10.0, 14.0, 12.0, 19.0, 15.0, 23.0, 21.0, 32.0, 29.0, 32.0, 33.0, 33.0, 30.0, 31.0, 47.0, 43.0, 38.0, 34.0, 43.0, 37.0, 41.0, 39.0, 29.0, 23.0, 27.0, 25.0, 24.0, 24.0, 21.0, 22.0, 15.0, 21.0, 12.0, 12.0, 13.0, 13.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.197265625, -2.126922607421875, -2.05657958984375, -1.986236572265625, -1.9158935546875, -1.845550537109375, -1.77520751953125, -1.704864501953125, -1.634521484375, -1.564178466796875, -1.49383544921875, -1.423492431640625, -1.3531494140625, -1.282806396484375, -1.21246337890625, -1.142120361328125, -1.07177734375, -1.001434326171875, -0.93109130859375, -0.860748291015625, -0.7904052734375, -0.720062255859375, -0.64971923828125, -0.579376220703125, -0.509033203125, -0.438690185546875, -0.36834716796875, -0.298004150390625, -0.2276611328125, -0.157318115234375, -0.08697509765625, -0.016632080078125, 0.0537109375, 0.124053955078125, 0.19439697265625, 0.264739990234375, 0.3350830078125, 0.405426025390625, 0.47576904296875, 0.546112060546875, 0.616455078125, 0.686798095703125, 0.75714111328125, 0.827484130859375, 0.8978271484375, 0.968170166015625, 1.03851318359375, 1.108856201171875, 1.17919921875, 1.249542236328125, 1.31988525390625, 1.390228271484375, 1.4605712890625, 1.530914306640625, 1.60125732421875, 1.671600341796875, 1.741943359375, 1.812286376953125, 1.88262939453125, 1.952972412109375, 2.0233154296875, 2.093658447265625, 2.16400146484375, 2.234344482421875, 2.3046875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 16.0, 24.0, 28.0, 54.0, 71.0, 110.0, 169.0, 248.0, 310.0, 506.0, 692.0, 1014.0, 1495.0, 2223.0, 3160.0, 4867.0, 7194.0, 11167.0, 16923.0, 27231.0, 44250.0, 73761.0, 120876.0, 183323.0, 193965.0, 136114.0, 83033.0, 49944.0, 30338.0, 18868.0, 12091.0, 8055.0, 5237.0, 3537.0, 2396.0, 1678.0, 1124.0, 750.0, 531.0, 388.0, 242.0, 182.0, 122.0, 83.0, 50.0, 31.0, 25.0, 13.0, 13.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.2822265625, -0.27370452880859375, -0.2651824951171875, -0.25666046142578125, -0.248138427734375, -0.23961639404296875, -0.2310943603515625, -0.22257232666015625, -0.21405029296875, -0.20552825927734375, -0.1970062255859375, -0.18848419189453125, -0.179962158203125, -0.17144012451171875, -0.1629180908203125, -0.15439605712890625, -0.1458740234375, -0.13735198974609375, -0.1288299560546875, -0.12030792236328125, -0.111785888671875, -0.10326385498046875, -0.0947418212890625, -0.08621978759765625, -0.07769775390625, -0.06917572021484375, -0.0606536865234375, -0.05213165283203125, -0.043609619140625, -0.03508758544921875, -0.0265655517578125, -0.01804351806640625, -0.009521484375, -0.00099945068359375, 0.0075225830078125, 0.01604461669921875, 0.024566650390625, 0.03308868408203125, 0.0416107177734375, 0.05013275146484375, 0.05865478515625, 0.06717681884765625, 0.0756988525390625, 0.08422088623046875, 0.092742919921875, 0.10126495361328125, 0.1097869873046875, 0.11830902099609375, 0.1268310546875, 0.13535308837890625, 0.1438751220703125, 0.15239715576171875, 0.160919189453125, 0.16944122314453125, 0.1779632568359375, 0.18648529052734375, 0.19500732421875, 0.20352935791015625, 0.2120513916015625, 0.22057342529296875, 0.229095458984375, 0.23761749267578125, 0.2461395263671875, 0.25466156005859375, 0.26318359375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 1.0, 4.0, 9.0, 12.0, 3.0, 10.0, 16.0, 11.0, 18.0, 24.0, 21.0, 29.0, 38.0, 27.0, 34.0, 32.0, 38.0, 37.0, 40.0, 48.0, 37.0, 1063.0, 33.0, 51.0, 44.0, 33.0, 36.0, 33.0, 35.0, 27.0, 26.0, 23.0, 25.0, 14.0, 11.0, 16.0, 14.0, 10.0, 9.0, 4.0, 6.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.318359375, -1.2699127197265625, -1.221466064453125, -1.1730194091796875, -1.12457275390625, -1.0761260986328125, -1.027679443359375, -0.9792327880859375, -0.9307861328125, -0.8823394775390625, -0.833892822265625, -0.7854461669921875, -0.73699951171875, -0.6885528564453125, -0.640106201171875, -0.5916595458984375, -0.543212890625, -0.4947662353515625, -0.446319580078125, -0.3978729248046875, -0.34942626953125, -0.3009796142578125, -0.252532958984375, -0.2040863037109375, -0.1556396484375, -0.1071929931640625, -0.058746337890625, -0.0102996826171875, 0.03814697265625, 0.0865936279296875, 0.135040283203125, 0.1834869384765625, 0.23193359375, 0.2803802490234375, 0.328826904296875, 0.3772735595703125, 0.42572021484375, 0.4741668701171875, 0.522613525390625, 0.5710601806640625, 0.6195068359375, 0.6679534912109375, 0.716400146484375, 0.7648468017578125, 0.81329345703125, 0.8617401123046875, 0.910186767578125, 0.9586334228515625, 1.007080078125, 1.0555267333984375, 1.103973388671875, 1.1524200439453125, 1.20086669921875, 1.2493133544921875, 1.297760009765625, 1.3462066650390625, 1.3946533203125, 1.4430999755859375, 1.491546630859375, 1.5399932861328125, 1.58843994140625, 1.6368865966796875, 1.685333251953125, 1.7337799072265625, 1.7822265625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 18.0, 15.0, 35.0, 58.0, 85.0, 138.0, 164.0, 254.0, 332.0, 504.0, 725.0, 1078.0, 1559.0, 2252.0, 3336.0, 4684.0, 6898.0, 10238.0, 14954.0, 22031.0, 32684.0, 47537.0, 69414.0, 98790.0, 137154.0, 1191221.0, 135467.0, 98529.0, 68417.0, 47248.0, 32562.0, 21946.0, 14912.0, 10047.0, 6903.0, 4642.0, 3160.0, 2187.0, 1570.0, 1068.0, 717.0, 475.0, 348.0, 210.0, 189.0, 128.0, 86.0, 54.0, 45.0, 28.0, 20.0, 9.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.1546630859375, -0.14990234375, -0.1451416015625, -0.140380859375, -0.1356201171875, -0.130859375, -0.1260986328125, -0.121337890625, -0.1165771484375, -0.11181640625, -0.1070556640625, -0.102294921875, -0.0975341796875, -0.0927734375, -0.0880126953125, -0.083251953125, -0.0784912109375, -0.07373046875, -0.0689697265625, -0.064208984375, -0.0594482421875, -0.0546875, -0.0499267578125, -0.045166015625, -0.0404052734375, -0.03564453125, -0.0308837890625, -0.026123046875, -0.0213623046875, -0.0166015625, -0.0118408203125, -0.007080078125, -0.0023193359375, 0.00244140625, 0.0072021484375, 0.011962890625, 0.0167236328125, 0.021484375, 0.0262451171875, 0.031005859375, 0.0357666015625, 0.04052734375, 0.0452880859375, 0.050048828125, 0.0548095703125, 0.0595703125, 0.0643310546875, 0.069091796875, 0.0738525390625, 0.07861328125, 0.0833740234375, 0.088134765625, 0.0928955078125, 0.09765625, 0.1024169921875, 0.107177734375, 0.1119384765625, 0.11669921875, 0.1214599609375, 0.126220703125, 0.1309814453125, 0.1357421875, 0.1405029296875, 0.145263671875, 0.1500244140625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 4.0, 14.0, 11.0, 13.0, 11.0, 16.0, 20.0, 23.0, 23.0, 23.0, 33.0, 50.0, 48.0, 68.0, 83.0, 80.0, 77.0, 61.0, 41.0, 43.0, 45.0, 31.0, 27.0, 26.0, 20.0, 20.0, 13.0, 16.0, 8.0, 5.0, 10.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0036468505859375, -0.0035148262977600098, -0.0033828020095825195, -0.0032507777214050293, -0.003118753433227539, -0.002986729145050049, -0.0028547048568725586, -0.0027226805686950684, -0.002590656280517578, -0.002458631992340088, -0.0023266077041625977, -0.0021945834159851074, -0.002062559127807617, -0.001930534839630127, -0.0017985105514526367, -0.0016664862632751465, -0.0015344619750976562, -0.001402437686920166, -0.0012704133987426758, -0.0011383891105651855, -0.0010063648223876953, -0.0008743405342102051, -0.0007423162460327148, -0.0006102919578552246, -0.0004782676696777344, -0.00034624338150024414, -0.0002142190933227539, -8.219480514526367e-05, 4.982948303222656e-05, 0.0001818537712097168, 0.00031387805938720703, 0.00044590234756469727, 0.0005779266357421875, 0.0007099509239196777, 0.000841975212097168, 0.0009739995002746582, 0.0011060237884521484, 0.0012380480766296387, 0.001370072364807129, 0.0015020966529846191, 0.0016341209411621094, 0.0017661452293395996, 0.0018981695175170898, 0.00203019380569458, 0.0021622180938720703, 0.0022942423820495605, 0.0024262666702270508, 0.002558290958404541, 0.0026903152465820312, 0.0028223395347595215, 0.0029543638229370117, 0.003086388111114502, 0.003218412399291992, 0.0033504366874694824, 0.0034824609756469727, 0.003614485263824463, 0.003746509552001953, 0.0038785338401794434, 0.004010558128356934, 0.004142582416534424, 0.004274606704711914, 0.004406630992889404, 0.0045386552810668945, 0.004670679569244385, 0.004802703857421875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 7.0, 8.0, 13.0, 16.0, 30.0, 27.0, 41.0, 58.0, 87.0, 98.0, 141.0, 186.0, 320.0, 742.0, 6044.0, 265180.0, 760900.0, 12483.0, 999.0, 345.0, 219.0, 157.0, 102.0, 69.0, 55.0, 46.0, 29.0, 32.0, 19.0, 20.0, 17.0, 8.0, 13.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0784912109375, -0.07631778717041016, -0.07414436340332031, -0.07197093963623047, -0.06979751586914062, -0.06762409210205078, -0.06545066833496094, -0.0632772445678711, -0.06110382080078125, -0.058930397033691406, -0.05675697326660156, -0.05458354949951172, -0.052410125732421875, -0.05023670196533203, -0.04806327819824219, -0.045889854431152344, -0.0437164306640625, -0.041543006896972656, -0.03936958312988281, -0.03719615936279297, -0.035022735595703125, -0.03284931182861328, -0.030675888061523438, -0.028502464294433594, -0.02632904052734375, -0.024155616760253906, -0.021982192993164062, -0.01980876922607422, -0.017635345458984375, -0.015461921691894531, -0.013288497924804688, -0.011115074157714844, -0.008941650390625, -0.006768226623535156, -0.0045948028564453125, -0.0024213790893554688, -0.000247955322265625, 0.0019254684448242188, 0.0040988922119140625, 0.006272315979003906, 0.00844573974609375, 0.010619163513183594, 0.012792587280273438, 0.014966011047363281, 0.017139434814453125, 0.01931285858154297, 0.021486282348632812, 0.023659706115722656, 0.0258331298828125, 0.028006553649902344, 0.030179977416992188, 0.03235340118408203, 0.034526824951171875, 0.03670024871826172, 0.03887367248535156, 0.041047096252441406, 0.04322052001953125, 0.045393943786621094, 0.04756736755371094, 0.04974079132080078, 0.051914215087890625, 0.05408763885498047, 0.05626106262207031, 0.058434486389160156, 0.06060791015625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 5.0, 88.0, 610.0, 253.0, 47.0, 13.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032626560423523188, -0.002360634272918105, -0.0014586125034838915, -0.0005565907340496778, 0.0003454310353845358, 0.0012474528048187494, 0.002149474574252963, 0.0030514963436871767, 0.003953518345952034, 0.004855540115386248, 0.005757561884820461, 0.006659583654254675, 0.0075616054236888885, 0.008463626727461815, 0.009365648962557316, 0.010267671197652817, 0.011169692501425743, 0.01207171380519867, 0.01297373604029417, 0.013875758275389671, 0.014777779579162598, 0.015679800882935524, 0.01658182218670845, 0.017483845353126526, 0.018385866656899452, 0.01928788796067238, 0.020189911127090454, 0.02109193243086338, 0.021993953734636307, 0.022895975038409233, 0.02379799634218216, 0.024700019508600235, 0.025602038949728012, 0.02650406025350094, 0.027406081557273865, 0.02830810472369194, 0.029210126027464867, 0.030112147331237793, 0.03101417049765587, 0.031916189938783646, 0.03281821310520172, 0.0337202362716198, 0.034622255712747574, 0.03552427887916565, 0.036426298320293427, 0.0373283214867115, 0.03823034465312958, 0.039132364094257355, 0.04003438726067543, 0.040936410427093506, 0.04183842986822128, 0.04274045303463936, 0.043642476201057434, 0.04454449564218521, 0.04544651880860329, 0.046348538249731064, 0.04725056141614914, 0.048152584582567215, 0.04905460402369499, 0.04995662719011307, 0.050858646631240845, 0.05176066979765892, 0.052662692964076996, 0.05356471240520477, 0.05446673557162285]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 11.0, 17.0, 24.0, 15.0, 32.0, 39.0, 54.0, 45.0, 45.0, 71.0, 65.0, 51.0, 68.0, 55.0, 50.0, 56.0, 42.0, 58.0, 34.0, 35.0, 29.0, 21.0, 26.0, 15.0, 10.0, 10.0, 6.0, 5.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.005779087543487549, -0.005636661313474178, -0.005494235083460808, -0.005351808853447437, -0.005209382623434067, -0.005066956393420696, -0.004924530163407326, -0.004782103933393955, -0.004639677703380585, -0.004497251473367214, -0.004354825243353844, -0.004212399013340473, -0.004069972783327103, -0.003927546553313732, -0.0037851203233003616, -0.003642694093286991, -0.0035002678632736206, -0.00335784163326025, -0.0032154154032468796, -0.003072989173233509, -0.0029305629432201385, -0.002788136713206768, -0.0026457104831933975, -0.002503284253180027, -0.0023608580231666565, -0.002218431793153286, -0.0020760055631399155, -0.001933579333126545, -0.0017911531031131744, -0.001648726873099804, -0.0015063006430864334, -0.001363874413073063, -0.0012214481830596924, -0.0010790219530463219, -0.0009365957230329514, -0.0007941694930195808, -0.0006517432630062103, -0.0005093170329928398, -0.0003668908029794693, -0.00022446457296609879, -8.203834295272827e-05, 6.038788706064224e-05, 0.00020281411707401276, 0.00034524034708738327, 0.0004876665771007538, 0.0006300928071141243, 0.0007725190371274948, 0.0009149452671408653, 0.0010573714971542358, 0.0011997977271676064, 0.0013422239571809769, 0.0014846501871943474, 0.001627076417207718, 0.0017695026472210884, 0.001911928877234459, 0.0020543551072478294, 0.0021967813372612, 0.0023392075672745705, 0.002481633797287941, 0.0026240600273013115, 0.002766486257314682, 0.0029089124873280525, 0.003051338717341423, 0.0031937649473547935, 0.003336191177368164]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 6.0, 6.0, 10.0, 14.0, 12.0, 20.0, 14.0, 23.0, 22.0, 31.0, 29.0, 32.0, 33.0, 33.0, 30.0, 31.0, 47.0, 43.0, 38.0, 34.0, 43.0, 37.0, 41.0, 38.0, 31.0, 22.0, 27.0, 24.0, 25.0, 24.0, 21.0, 22.0, 15.0, 21.0, 12.0, 12.0, 13.0, 13.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.197265625, -2.126922607421875, -2.05657958984375, -1.986236572265625, -1.9158935546875, -1.845550537109375, -1.77520751953125, -1.704864501953125, -1.634521484375, -1.564178466796875, -1.49383544921875, -1.423492431640625, -1.3531494140625, -1.282806396484375, -1.21246337890625, -1.142120361328125, -1.07177734375, -1.001434326171875, -0.93109130859375, -0.860748291015625, -0.7904052734375, -0.720062255859375, -0.64971923828125, -0.579376220703125, -0.509033203125, -0.438690185546875, -0.36834716796875, -0.298004150390625, -0.2276611328125, -0.157318115234375, -0.08697509765625, -0.016632080078125, 0.0537109375, 0.124053955078125, 0.19439697265625, 0.264739990234375, 0.3350830078125, 0.405426025390625, 0.47576904296875, 0.546112060546875, 0.616455078125, 0.686798095703125, 0.75714111328125, 0.827484130859375, 0.8978271484375, 0.968170166015625, 1.03851318359375, 1.108856201171875, 1.17919921875, 1.249542236328125, 1.31988525390625, 1.390228271484375, 1.4605712890625, 1.530914306640625, 1.60125732421875, 1.671600341796875, 1.741943359375, 1.812286376953125, 1.88262939453125, 1.952972412109375, 2.0233154296875, 2.093658447265625, 2.16400146484375, 2.234344482421875, 2.3046875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 12.0, 21.0, 21.0, 18.0, 31.0, 56.0, 57.0, 122.0, 236.0, 453.0, 742.0, 1565.0, 2864.0, 5440.0, 10077.0, 18774.0, 34026.0, 67364.0, 161113.0, 337975.0, 224289.0, 89689.0, 42938.0, 23477.0, 12706.0, 6708.0, 3608.0, 1887.0, 1056.0, 533.0, 290.0, 165.0, 81.0, 55.0, 33.0, 20.0, 24.0, 11.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.01885986328125, -1.9459228515625, -1.87298583984375, -1.800048828125, -1.72711181640625, -1.6541748046875, -1.58123779296875, -1.50830078125, -1.43536376953125, -1.3624267578125, -1.28948974609375, -1.216552734375, -1.14361572265625, -1.0706787109375, -0.99774169921875, -0.9248046875, -0.85186767578125, -0.7789306640625, -0.70599365234375, -0.633056640625, -0.56011962890625, -0.4871826171875, -0.41424560546875, -0.34130859375, -0.26837158203125, -0.1954345703125, -0.12249755859375, -0.049560546875, 0.02337646484375, 0.0963134765625, 0.16925048828125, 0.2421875, 0.31512451171875, 0.3880615234375, 0.46099853515625, 0.533935546875, 0.60687255859375, 0.6798095703125, 0.75274658203125, 0.82568359375, 0.89862060546875, 0.9715576171875, 1.04449462890625, 1.117431640625, 1.19036865234375, 1.2633056640625, 1.33624267578125, 1.4091796875, 1.48211669921875, 1.5550537109375, 1.62799072265625, 1.700927734375, 1.77386474609375, 1.8468017578125, 1.91973876953125, 1.99267578125, 2.06561279296875, 2.1385498046875, 2.21148681640625, 2.284423828125, 2.35736083984375, 2.4302978515625, 2.50323486328125, 2.576171875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 8.0, 10.0, 5.0, 7.0, 11.0, 8.0, 17.0, 22.0, 19.0, 23.0, 25.0, 34.0, 23.0, 41.0, 57.0, 43.0, 51.0, 88.0, 175.0, 1495.0, 292.0, 132.0, 77.0, 65.0, 39.0, 47.0, 37.0, 36.0, 31.0, 21.0, 19.0, 18.0, 17.0, 19.0, 7.0, 9.0, 4.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.296875, -9.9920654296875, -9.687255859375, -9.3824462890625, -9.07763671875, -8.7728271484375, -8.468017578125, -8.1632080078125, -7.8583984375, -7.5535888671875, -7.248779296875, -6.9439697265625, -6.63916015625, -6.3343505859375, -6.029541015625, -5.7247314453125, -5.419921875, -5.1151123046875, -4.810302734375, -4.5054931640625, -4.20068359375, -3.8958740234375, -3.591064453125, -3.2862548828125, -2.9814453125, -2.6766357421875, -2.371826171875, -2.0670166015625, -1.76220703125, -1.4573974609375, -1.152587890625, -0.8477783203125, -0.54296875, -0.2381591796875, 0.066650390625, 0.3714599609375, 0.67626953125, 0.9810791015625, 1.285888671875, 1.5906982421875, 1.8955078125, 2.2003173828125, 2.505126953125, 2.8099365234375, 3.11474609375, 3.4195556640625, 3.724365234375, 4.0291748046875, 4.333984375, 4.6387939453125, 4.943603515625, 5.2484130859375, 5.55322265625, 5.8580322265625, 6.162841796875, 6.4676513671875, 6.7724609375, 7.0772705078125, 7.382080078125, 7.6868896484375, 7.99169921875, 8.2965087890625, 8.601318359375, 8.9061279296875, 9.2109375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 6.0, 11.0, 6.0, 19.0, 20.0, 29.0, 52.0, 77.0, 151.0, 234.0, 508.0, 3001.0, 2982710.0, 156628.0, 1291.0, 410.0, 188.0, 122.0, 78.0, 36.0, 34.0, 25.0, 19.0, 10.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.71875, -43.43505859375, -42.1513671875, -40.86767578125, -39.583984375, -38.30029296875, -37.0166015625, -35.73291015625, -34.44921875, -33.16552734375, -31.8818359375, -30.59814453125, -29.314453125, -28.03076171875, -26.7470703125, -25.46337890625, -24.1796875, -22.89599609375, -21.6123046875, -20.32861328125, -19.044921875, -17.76123046875, -16.4775390625, -15.19384765625, -13.91015625, -12.62646484375, -11.3427734375, -10.05908203125, -8.775390625, -7.49169921875, -6.2080078125, -4.92431640625, -3.640625, -2.35693359375, -1.0732421875, 0.21044921875, 1.494140625, 2.77783203125, 4.0615234375, 5.34521484375, 6.62890625, 7.91259765625, 9.1962890625, 10.47998046875, 11.763671875, 13.04736328125, 14.3310546875, 15.61474609375, 16.8984375, 18.18212890625, 19.4658203125, 20.74951171875, 22.033203125, 23.31689453125, 24.6005859375, 25.88427734375, 27.16796875, 28.45166015625, 29.7353515625, 31.01904296875, 32.302734375, 33.58642578125, 34.8701171875, 36.15380859375, 37.4375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 16.0, 95.0, 286.0, 352.0, 191.0, 57.0, 15.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.50761604309082, -21.030540466308594, -19.553464889526367, -18.07638931274414, -16.599313735961914, -15.122238159179688, -13.645163536071777, -12.16808795928955, -10.691012382507324, -9.213936805725098, -7.736861228942871, -6.259786128997803, -4.782710552215576, -3.3056349754333496, -1.8285598754882812, -0.3514842987060547, 1.1255912780761719, 2.6026668548583984, 4.079742431640625, 5.556817531585693, 7.03389310836792, 8.510969161987305, 9.988043785095215, 11.465119361877441, 12.942194938659668, 14.419270515441895, 15.896346092224121, 17.37342071533203, 18.850496292114258, 20.327571868896484, 21.80464744567871, 23.281723022460938, 24.758800506591797, 26.235876083374023, 27.71295166015625, 29.190027236938477, 30.667102813720703, 32.1441764831543, 33.621253967285156, 35.09832763671875, 36.57540512084961, 38.0524787902832, 39.52955627441406, 41.006629943847656, 42.483707427978516, 43.96078109741211, 45.43785858154297, 46.91493225097656, 48.392005920410156, 49.86907958984375, 51.34615707397461, 52.8232307434082, 54.30030822753906, 55.777381896972656, 57.254459381103516, 58.73153305053711, 60.20861053466797, 61.68568420410156, 63.16276168823242, 64.63983917236328, 66.11691284179688, 67.59398651123047, 69.07106018066406, 70.54814147949219, 72.02521514892578]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 7.0, 8.0, 11.0, 13.0, 23.0, 14.0, 23.0, 31.0, 30.0, 30.0, 24.0, 46.0, 41.0, 48.0, 51.0, 43.0, 44.0, 36.0, 29.0, 49.0, 46.0, 43.0, 51.0, 39.0, 41.0, 37.0, 29.0, 26.0, 19.0, 8.0, 11.0, 13.0, 10.0, 4.0, 9.0, 4.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.62518310546875, -30.683149337768555, -29.74111557006836, -28.799081802368164, -27.85704803466797, -26.91501235961914, -25.972978591918945, -25.03094482421875, -24.088911056518555, -23.14687728881836, -22.204843521118164, -21.26280975341797, -20.32077407836914, -19.378742218017578, -18.43670654296875, -17.494672775268555, -16.55263900756836, -15.610605239868164, -14.668571472167969, -13.726536750793457, -12.784502983093262, -11.842469215393066, -10.900434494018555, -9.95840072631836, -9.016366958618164, -8.074333190917969, -7.132298946380615, -6.190264701843262, -5.248230934143066, -4.306197166442871, -3.3641629219055176, -2.422128677368164, -1.480093002319336, -0.5380589962005615, 0.4039750099182129, 1.3460090160369873, 2.2880430221557617, 3.230076789855957, 4.1721110343933105, 5.114145278930664, 6.056179046630859, 6.998212814331055, 7.940247058868408, 8.882281303405762, 9.824315071105957, 10.766348838806152, 11.708383560180664, 12.65041732788086, 13.592451095581055, 14.53448486328125, 15.476518630981445, 16.41855239868164, 17.36058807373047, 18.30261993408203, 19.24465560913086, 20.186689376831055, 21.12872314453125, 22.070756912231445, 23.01279067993164, 23.954824447631836, 24.89685821533203, 25.83889389038086, 26.780927658081055, 27.72296142578125, 28.664995193481445]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 8.0, 9.0, 7.0, 6.0, 8.0, 9.0, 15.0, 18.0, 12.0, 24.0, 25.0, 32.0, 31.0, 30.0, 30.0, 37.0, 38.0, 32.0, 29.0, 35.0, 31.0, 46.0, 47.0, 37.0, 34.0, 38.0, 30.0, 27.0, 29.0, 29.0, 17.0, 32.0, 24.0, 25.0, 15.0, 16.0, 21.0, 10.0, 16.0, 9.0, 8.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.5078125, -2.430694580078125, -2.35357666015625, -2.276458740234375, -2.1993408203125, -2.122222900390625, -2.04510498046875, -1.967987060546875, -1.890869140625, -1.813751220703125, -1.73663330078125, -1.659515380859375, -1.5823974609375, -1.505279541015625, -1.42816162109375, -1.351043701171875, -1.27392578125, -1.196807861328125, -1.11968994140625, -1.042572021484375, -0.9654541015625, -0.888336181640625, -0.81121826171875, -0.734100341796875, -0.656982421875, -0.579864501953125, -0.50274658203125, -0.425628662109375, -0.3485107421875, -0.271392822265625, -0.19427490234375, -0.117156982421875, -0.0400390625, 0.037078857421875, 0.11419677734375, 0.191314697265625, 0.2684326171875, 0.345550537109375, 0.42266845703125, 0.499786376953125, 0.576904296875, 0.654022216796875, 0.73114013671875, 0.808258056640625, 0.8853759765625, 0.962493896484375, 1.03961181640625, 1.116729736328125, 1.19384765625, 1.270965576171875, 1.34808349609375, 1.425201416015625, 1.5023193359375, 1.579437255859375, 1.65655517578125, 1.733673095703125, 1.810791015625, 1.887908935546875, 1.96502685546875, 2.042144775390625, 2.1192626953125, 2.196380615234375, 2.27349853515625, 2.350616455078125, 2.427734375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 6.0, 8.0, 8.0, 11.0, 9.0, 15.0, 19.0, 23.0, 35.0, 30.0, 50.0, 87.0, 142.0, 237.0, 440.0, 1112.0, 3222.0, 10817.0, 44745.0, 215470.0, 1028154.0, 1925689.0, 763955.0, 154192.0, 32731.0, 8509.0, 2518.0, 925.0, 421.0, 210.0, 156.0, 89.0, 42.0, 39.0, 26.0, 28.0, 23.0, 20.0, 9.0, 9.0, 9.0, 4.0, 3.0, 10.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.1328125, -4.98358154296875, -4.8343505859375, -4.68511962890625, -4.535888671875, -4.38665771484375, -4.2374267578125, -4.08819580078125, -3.93896484375, -3.78973388671875, -3.6405029296875, -3.49127197265625, -3.342041015625, -3.19281005859375, -3.0435791015625, -2.89434814453125, -2.7451171875, -2.59588623046875, -2.4466552734375, -2.29742431640625, -2.148193359375, -1.99896240234375, -1.8497314453125, -1.70050048828125, -1.55126953125, -1.40203857421875, -1.2528076171875, -1.10357666015625, -0.954345703125, -0.80511474609375, -0.6558837890625, -0.50665283203125, -0.357421875, -0.20819091796875, -0.0589599609375, 0.09027099609375, 0.239501953125, 0.38873291015625, 0.5379638671875, 0.68719482421875, 0.83642578125, 0.98565673828125, 1.1348876953125, 1.28411865234375, 1.433349609375, 1.58258056640625, 1.7318115234375, 1.88104248046875, 2.0302734375, 2.17950439453125, 2.3287353515625, 2.47796630859375, 2.627197265625, 2.77642822265625, 2.9256591796875, 3.07489013671875, 3.22412109375, 3.37335205078125, 3.5225830078125, 3.67181396484375, 3.821044921875, 3.97027587890625, 4.1195068359375, 4.26873779296875, 4.41796875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 3.0, 6.0, 14.0, 19.0, 21.0, 28.0, 50.0, 76.0, 97.0, 151.0, 212.0, 278.0, 380.0, 495.0, 507.0, 448.0, 332.0, 288.0, 191.0, 159.0, 98.0, 69.0, 47.0, 29.0, 17.0, 20.0, 13.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.90386962890625, -7.6671142578125, -7.43035888671875, -7.193603515625, -6.95684814453125, -6.7200927734375, -6.48333740234375, -6.24658203125, -6.00982666015625, -5.7730712890625, -5.53631591796875, -5.299560546875, -5.06280517578125, -4.8260498046875, -4.58929443359375, -4.3525390625, -4.11578369140625, -3.8790283203125, -3.64227294921875, -3.405517578125, -3.16876220703125, -2.9320068359375, -2.69525146484375, -2.45849609375, -2.22174072265625, -1.9849853515625, -1.74822998046875, -1.511474609375, -1.27471923828125, -1.0379638671875, -0.80120849609375, -0.564453125, -0.32769775390625, -0.0909423828125, 0.14581298828125, 0.382568359375, 0.61932373046875, 0.8560791015625, 1.09283447265625, 1.32958984375, 1.56634521484375, 1.8031005859375, 2.03985595703125, 2.276611328125, 2.51336669921875, 2.7501220703125, 2.98687744140625, 3.2236328125, 3.46038818359375, 3.6971435546875, 3.93389892578125, 4.170654296875, 4.40740966796875, 4.6441650390625, 4.88092041015625, 5.11767578125, 5.35443115234375, 5.5911865234375, 5.82794189453125, 6.064697265625, 6.30145263671875, 6.5382080078125, 6.77496337890625, 7.01171875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 6.0, 10.0, 9.0, 15.0, 23.0, 36.0, 40.0, 50.0, 80.0, 130.0, 158.0, 305.0, 568.0, 1427.0, 8737.0, 118822.0, 2065523.0, 1881897.0, 105896.0, 7906.0, 1331.0, 524.0, 283.0, 157.0, 95.0, 88.0, 50.0, 40.0, 25.0, 11.0, 12.0, 12.0, 7.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.953125, -11.5406494140625, -11.128173828125, -10.7156982421875, -10.30322265625, -9.8907470703125, -9.478271484375, -9.0657958984375, -8.6533203125, -8.2408447265625, -7.828369140625, -7.4158935546875, -7.00341796875, -6.5909423828125, -6.178466796875, -5.7659912109375, -5.353515625, -4.9410400390625, -4.528564453125, -4.1160888671875, -3.70361328125, -3.2911376953125, -2.878662109375, -2.4661865234375, -2.0537109375, -1.6412353515625, -1.228759765625, -0.8162841796875, -0.40380859375, 0.0086669921875, 0.421142578125, 0.8336181640625, 1.24609375, 1.6585693359375, 2.071044921875, 2.4835205078125, 2.89599609375, 3.3084716796875, 3.720947265625, 4.1334228515625, 4.5458984375, 4.9583740234375, 5.370849609375, 5.7833251953125, 6.19580078125, 6.6082763671875, 7.020751953125, 7.4332275390625, 7.845703125, 8.2581787109375, 8.670654296875, 9.0831298828125, 9.49560546875, 9.9080810546875, 10.320556640625, 10.7330322265625, 11.1455078125, 11.5579833984375, 11.970458984375, 12.3829345703125, 12.79541015625, 13.2078857421875, 13.620361328125, 14.0328369140625, 14.4453125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 13.0, 36.0, 73.0, 177.0, 204.0, 211.0, 153.0, 102.0, 22.0, 14.0, 8.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.28544616699219, -80.37281799316406, -78.4601821899414, -76.54755401611328, -74.63492584228516, -72.7222900390625, -70.80966186523438, -68.89703369140625, -66.9843978881836, -65.07176971435547, -63.15913772583008, -61.24650573730469, -59.3338737487793, -57.421241760253906, -55.50861358642578, -53.59598159790039, -51.683353424072266, -49.770721435546875, -47.85809326171875, -45.94546127319336, -44.03282928466797, -42.120201110839844, -40.20756912231445, -38.29493713378906, -36.38230895996094, -34.46967697143555, -32.55704879760742, -30.64441680908203, -28.73178482055664, -26.819154739379883, -24.906524658203125, -22.993892669677734, -21.08126449584961, -19.16863441467285, -17.25600242614746, -15.343372344970703, -13.430741310119629, -11.518110275268555, -9.605480194091797, -7.692849159240723, -5.780218124389648, -3.8675873279571533, -1.9549565315246582, -0.04232597351074219, 1.870305061340332, 3.7829360961914062, 5.695566177368164, 7.608197212219238, 9.520828247070312, 11.433459281921387, 13.346090316772461, 15.258720397949219, 17.17135238647461, 19.083982467651367, 20.996612548828125, 22.909244537353516, 24.821874618530273, 26.73450469970703, 28.647136688232422, 30.55976676940918, 32.47239685058594, 34.38502883911133, 36.29766082763672, 38.210289001464844, 40.122920989990234]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 7.0, 12.0, 10.0, 10.0, 11.0, 17.0, 13.0, 23.0, 21.0, 30.0, 20.0, 38.0, 30.0, 34.0, 34.0, 31.0, 39.0, 43.0, 36.0, 52.0, 32.0, 44.0, 36.0, 33.0, 54.0, 34.0, 34.0, 31.0, 19.0, 13.0, 20.0, 17.0, 17.0, 20.0, 13.0, 8.0, 11.0, 9.0, 11.0, 5.0, 6.0, 2.0, 1.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.209890365600586, -18.562021255493164, -17.914152145385742, -17.26628303527832, -16.618412017822266, -15.97054386138916, -15.322673797607422, -14.6748046875, -14.026935577392578, -13.379066467285156, -12.731197357177734, -12.083327293395996, -11.435458183288574, -10.787589073181152, -10.139719009399414, -9.491849899291992, -8.84398078918457, -8.196111679077148, -7.548242092132568, -6.900372505187988, -6.252503395080566, -5.6046342849731445, -4.9567646980285645, -4.308895111083984, -3.6610260009765625, -3.0131566524505615, -2.3652873039245605, -1.7174179553985596, -1.0695486068725586, -0.4216792583465576, 0.22619009017944336, 0.8740596771240234, 1.5219306945800781, 2.169800043106079, 2.81766939163208, 3.465538740158081, 4.113408088684082, 4.761277198791504, 5.409146785736084, 6.057016372680664, 6.704885482788086, 7.352754592895508, 8.00062370300293, 8.648493766784668, 9.29636287689209, 9.944231986999512, 10.59210205078125, 11.239971160888672, 11.887840270996094, 12.535709381103516, 13.183578491210938, 13.831448554992676, 14.479317665100098, 15.12718677520752, 15.775056838989258, 16.42292594909668, 17.0707950592041, 17.718664169311523, 18.366533279418945, 19.014402389526367, 19.662273406982422, 20.310142517089844, 20.958011627197266, 21.605880737304688, 22.25374984741211]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 5.0, 7.0, 10.0, 8.0, 12.0, 11.0, 19.0, 13.0, 20.0, 30.0, 29.0, 21.0, 22.0, 44.0, 32.0, 33.0, 29.0, 41.0, 37.0, 45.0, 50.0, 33.0, 35.0, 40.0, 30.0, 41.0, 31.0, 28.0, 29.0, 31.0, 29.0, 29.0, 14.0, 15.0, 19.0, 17.0, 11.0, 11.0, 4.0, 6.0, 8.0, 9.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.592071533203125, -2.51226806640625, -2.432464599609375, -2.3526611328125, -2.272857666015625, -2.19305419921875, -2.113250732421875, -2.033447265625, -1.953643798828125, -1.87384033203125, -1.794036865234375, -1.7142333984375, -1.634429931640625, -1.55462646484375, -1.474822998046875, -1.39501953125, -1.315216064453125, -1.23541259765625, -1.155609130859375, -1.0758056640625, -0.996002197265625, -0.91619873046875, -0.836395263671875, -0.756591796875, -0.676788330078125, -0.59698486328125, -0.517181396484375, -0.4373779296875, -0.357574462890625, -0.27777099609375, -0.197967529296875, -0.1181640625, -0.038360595703125, 0.04144287109375, 0.121246337890625, 0.2010498046875, 0.280853271484375, 0.36065673828125, 0.440460205078125, 0.520263671875, 0.600067138671875, 0.67987060546875, 0.759674072265625, 0.8394775390625, 0.919281005859375, 0.99908447265625, 1.078887939453125, 1.15869140625, 1.238494873046875, 1.31829833984375, 1.398101806640625, 1.4779052734375, 1.557708740234375, 1.63751220703125, 1.717315673828125, 1.797119140625, 1.876922607421875, 1.95672607421875, 2.036529541015625, 2.1163330078125, 2.196136474609375, 2.27593994140625, 2.355743408203125, 2.435546875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 15.0, 16.0, 35.0, 35.0, 58.0, 88.0, 138.0, 209.0, 292.0, 480.0, 818.0, 1249.0, 1973.0, 3336.0, 5575.0, 9784.0, 17540.0, 31180.0, 58303.0, 108518.0, 189180.0, 244181.0, 167693.0, 93672.0, 50629.0, 27148.0, 15038.0, 8691.0, 4922.0, 2916.0, 1790.0, 1114.0, 696.0, 386.0, 291.0, 175.0, 132.0, 83.0, 60.0, 37.0, 24.0, 11.0, 14.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.380615234375, -0.3692131042480469, -0.35781097412109375, -0.3464088439941406, -0.3350067138671875, -0.3236045837402344, -0.31220245361328125, -0.3008003234863281, -0.289398193359375, -0.2779960632324219, -0.26659393310546875, -0.2551918029785156, -0.2437896728515625, -0.23238754272460938, -0.22098541259765625, -0.20958328247070312, -0.19818115234375, -0.18677902221679688, -0.17537689208984375, -0.16397476196289062, -0.1525726318359375, -0.14117050170898438, -0.12976837158203125, -0.11836624145507812, -0.106964111328125, -0.09556198120117188, -0.08415985107421875, -0.07275772094726562, -0.0613555908203125, -0.049953460693359375, -0.03855133056640625, -0.027149200439453125, -0.0157470703125, -0.004344940185546875, 0.00705718994140625, 0.018459320068359375, 0.0298614501953125, 0.041263580322265625, 0.05266571044921875, 0.06406784057617188, 0.075469970703125, 0.08687210083007812, 0.09827423095703125, 0.10967636108398438, 0.1210784912109375, 0.13248062133789062, 0.14388275146484375, 0.15528488159179688, 0.16668701171875, 0.17808914184570312, 0.18949127197265625, 0.20089340209960938, 0.2122955322265625, 0.22369766235351562, 0.23509979248046875, 0.24650192260742188, 0.257904052734375, 0.2693061828613281, 0.28070831298828125, 0.2921104431152344, 0.3035125732421875, 0.3149147033691406, 0.32631683349609375, 0.3377189636230469, 0.34912109375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 4.0, 5.0, 12.0, 9.0, 12.0, 12.0, 27.0, 18.0, 24.0, 23.0, 23.0, 27.0, 31.0, 42.0, 30.0, 48.0, 34.0, 32.0, 46.0, 1069.0, 32.0, 50.0, 36.0, 45.0, 32.0, 29.0, 38.0, 34.0, 23.0, 18.0, 23.0, 22.0, 22.0, 14.0, 8.0, 19.0, 13.0, 5.0, 7.0, 7.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.828125, -1.773681640625, -1.71923828125, -1.664794921875, -1.6103515625, -1.555908203125, -1.50146484375, -1.447021484375, -1.392578125, -1.338134765625, -1.28369140625, -1.229248046875, -1.1748046875, -1.120361328125, -1.06591796875, -1.011474609375, -0.95703125, -0.902587890625, -0.84814453125, -0.793701171875, -0.7392578125, -0.684814453125, -0.63037109375, -0.575927734375, -0.521484375, -0.467041015625, -0.41259765625, -0.358154296875, -0.3037109375, -0.249267578125, -0.19482421875, -0.140380859375, -0.0859375, -0.031494140625, 0.02294921875, 0.077392578125, 0.1318359375, 0.186279296875, 0.24072265625, 0.295166015625, 0.349609375, 0.404052734375, 0.45849609375, 0.512939453125, 0.5673828125, 0.621826171875, 0.67626953125, 0.730712890625, 0.78515625, 0.839599609375, 0.89404296875, 0.948486328125, 1.0029296875, 1.057373046875, 1.11181640625, 1.166259765625, 1.220703125, 1.275146484375, 1.32958984375, 1.384033203125, 1.4384765625, 1.492919921875, 1.54736328125, 1.601806640625, 1.65625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 4.0, 12.0, 16.0, 17.0, 13.0, 34.0, 56.0, 62.0, 90.0, 151.0, 223.0, 333.0, 492.0, 746.0, 987.0, 1568.0, 2357.0, 3608.0, 5365.0, 8073.0, 12544.0, 18564.0, 28871.0, 43530.0, 66464.0, 97503.0, 136442.0, 1195092.0, 152944.0, 106886.0, 72621.0, 48193.0, 31735.0, 20954.0, 13701.0, 9051.0, 5970.0, 3916.0, 2602.0, 1730.0, 1148.0, 791.0, 521.0, 355.0, 244.0, 183.0, 116.0, 80.0, 53.0, 42.0, 25.0, 26.0, 8.0, 7.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0], "bins": [-0.1751708984375, -0.1696319580078125, -0.164093017578125, -0.1585540771484375, -0.15301513671875, -0.1474761962890625, -0.141937255859375, -0.1363983154296875, -0.130859375, -0.1253204345703125, -0.119781494140625, -0.1142425537109375, -0.10870361328125, -0.1031646728515625, -0.097625732421875, -0.0920867919921875, -0.0865478515625, -0.0810089111328125, -0.075469970703125, -0.0699310302734375, -0.06439208984375, -0.0588531494140625, -0.053314208984375, -0.0477752685546875, -0.042236328125, -0.0366973876953125, -0.031158447265625, -0.0256195068359375, -0.02008056640625, -0.0145416259765625, -0.009002685546875, -0.0034637451171875, 0.0020751953125, 0.0076141357421875, 0.013153076171875, 0.0186920166015625, 0.02423095703125, 0.0297698974609375, 0.035308837890625, 0.0408477783203125, 0.04638671875, 0.0519256591796875, 0.057464599609375, 0.0630035400390625, 0.06854248046875, 0.0740814208984375, 0.079620361328125, 0.0851593017578125, 0.0906982421875, 0.0962371826171875, 0.101776123046875, 0.1073150634765625, 0.11285400390625, 0.1183929443359375, 0.123931884765625, 0.1294708251953125, 0.135009765625, 0.1405487060546875, 0.146087646484375, 0.1516265869140625, 0.15716552734375, 0.1627044677734375, 0.168243408203125, 0.1737823486328125, 0.1793212890625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 7.0, 6.0, 3.0, 2.0, 5.0, 12.0, 11.0, 20.0, 17.0, 11.0, 21.0, 27.0, 20.0, 35.0, 49.0, 92.0, 104.0, 98.0, 92.0, 67.0, 54.0, 45.0, 29.0, 32.0, 29.0, 17.0, 15.0, 7.0, 16.0, 10.0, 7.0, 5.0, 7.0, 11.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00662994384765625, -0.006454288959503174, -0.006278634071350098, -0.0061029791831970215, -0.005927324295043945, -0.005751669406890869, -0.005576014518737793, -0.005400359630584717, -0.005224704742431641, -0.0050490498542785645, -0.004873394966125488, -0.004697740077972412, -0.004522085189819336, -0.00434643030166626, -0.004170775413513184, -0.003995120525360107, -0.0038194656372070312, -0.003643810749053955, -0.003468155860900879, -0.0032925009727478027, -0.0031168460845947266, -0.0029411911964416504, -0.0027655363082885742, -0.002589881420135498, -0.002414226531982422, -0.0022385716438293457, -0.0020629167556762695, -0.0018872618675231934, -0.0017116069793701172, -0.001535952091217041, -0.0013602972030639648, -0.0011846423149108887, -0.0010089874267578125, -0.0008333325386047363, -0.0006576776504516602, -0.000482022762298584, -0.0003063678741455078, -0.00013071298599243164, 4.494190216064453e-05, 0.0002205967903137207, 0.0003962516784667969, 0.000571906566619873, 0.0007475614547729492, 0.0009232163429260254, 0.0010988712310791016, 0.0012745261192321777, 0.001450181007385254, 0.00162583589553833, 0.0018014907836914062, 0.0019771456718444824, 0.0021528005599975586, 0.0023284554481506348, 0.002504110336303711, 0.002679765224456787, 0.0028554201126098633, 0.0030310750007629395, 0.0032067298889160156, 0.003382384777069092, 0.003558039665222168, 0.003733694553375244, 0.00390934944152832, 0.0040850043296813965, 0.004260659217834473, 0.004436314105987549, 0.004611968994140625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 7.0, 9.0, 11.0, 2.0, 13.0, 10.0, 17.0, 20.0, 40.0, 39.0, 59.0, 81.0, 153.0, 177.0, 396.0, 1138.0, 93082.0, 947383.0, 4511.0, 603.0, 256.0, 159.0, 107.0, 83.0, 36.0, 23.0, 39.0, 21.0, 22.0, 9.0, 6.0, 6.0, 3.0, 7.0, 8.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0853271484375, -0.08207416534423828, -0.07882118225097656, -0.07556819915771484, -0.07231521606445312, -0.0690622329711914, -0.06580924987792969, -0.06255626678466797, -0.05930328369140625, -0.05605030059814453, -0.05279731750488281, -0.049544334411621094, -0.046291351318359375, -0.043038368225097656, -0.03978538513183594, -0.03653240203857422, -0.0332794189453125, -0.03002643585205078, -0.026773452758789062, -0.023520469665527344, -0.020267486572265625, -0.017014503479003906, -0.013761520385742188, -0.010508537292480469, -0.00725555419921875, -0.004002571105957031, -0.0007495880126953125, 0.0025033950805664062, 0.005756378173828125, 0.009009361267089844, 0.012262344360351562, 0.015515327453613281, 0.018768310546875, 0.02202129364013672, 0.025274276733398438, 0.028527259826660156, 0.031780242919921875, 0.035033226013183594, 0.03828620910644531, 0.04153919219970703, 0.04479217529296875, 0.04804515838623047, 0.05129814147949219, 0.054551124572753906, 0.057804107666015625, 0.061057090759277344, 0.06431007385253906, 0.06756305694580078, 0.0708160400390625, 0.07406902313232422, 0.07732200622558594, 0.08057498931884766, 0.08382797241210938, 0.0870809555053711, 0.09033393859863281, 0.09358692169189453, 0.09683990478515625, 0.10009288787841797, 0.10334587097167969, 0.1065988540649414, 0.10985183715820312, 0.11310482025146484, 0.11635780334472656, 0.11961078643798828, 0.12286376953125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [35.0, 736.0, 215.0, 25.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021249116398394108, -0.0008498249808326364, 0.00042526167817413807, 0.0017003482207655907, 0.002975434996187687, 0.004250521771609783, 0.005525608081370592, 0.006800694856792688, 0.008075781166553497, 0.009350867941975594, 0.01062595471739769, 0.011901041492819786, 0.013176128268241882, 0.014451215043663979, 0.015726301819086075, 0.017001386731863022, 0.018276475369930267, 0.019551562145352364, 0.02082664892077446, 0.022101735696196556, 0.023376822471618652, 0.02465190924704075, 0.025926996022462845, 0.027202080935239792, 0.028477167710661888, 0.029752254486083984, 0.03102734126150608, 0.03230242803692818, 0.033577512949705124, 0.03485260158777237, 0.036127686500549316, 0.03740277513861656, 0.03867786005139351, 0.039952944964170456, 0.0412280336022377, 0.04250311851501465, 0.043778207153081894, 0.04505329206585884, 0.046328380703926086, 0.04760346561670303, 0.04887855425477028, 0.050153639167547226, 0.05142872780561447, 0.05270381271839142, 0.053978901356458664, 0.05525398626923561, 0.056529074907302856, 0.0578041598200798, 0.05907924473285675, 0.0603543296456337, 0.06162941828370094, 0.06290450692176819, 0.06417959183454514, 0.06545467674732208, 0.06672976166009903, 0.06800485402345657, 0.06927993893623352, 0.07055502384901047, 0.07183010876178741, 0.07310520112514496, 0.0743802860379219, 0.07565537095069885, 0.0769304558634758, 0.07820554822683334, 0.07948063313961029]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 8.0, 12.0, 10.0, 23.0, 27.0, 39.0, 32.0, 35.0, 42.0, 66.0, 70.0, 64.0, 62.0, 72.0, 58.0, 75.0, 61.0, 52.0, 59.0, 33.0, 34.0, 22.0, 22.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007820487022399902, -0.007613399066030979, -0.007406311109662056, -0.007199223153293133, -0.00699213519692421, -0.006785047240555286, -0.006577959284186363, -0.00637087132781744, -0.006163783371448517, -0.005956695415079594, -0.0057496074587106705, -0.005542519502341747, -0.005335431545972824, -0.005128343589603901, -0.004921255633234978, -0.0047141676768660545, -0.004507079720497131, -0.004299991764128208, -0.004092903807759285, -0.003885815851390362, -0.0036787278950214386, -0.0034716399386525154, -0.0032645519822835922, -0.003057464025914669, -0.002850376069545746, -0.0026432881131768227, -0.0024362001568078995, -0.0022291122004389763, -0.002022024244070053, -0.00181493628770113, -0.0016078483313322067, -0.0014007603749632835, -0.0011936724185943604, -0.0009865844622254372, -0.000779496505856514, -0.0005724085494875908, -0.0003653205931186676, -0.00015823263674974442, 4.885531961917877e-05, 0.00025594327598810196, 0.00046303123235702515, 0.0006701191887259483, 0.0008772071450948715, 0.0010842951014637947, 0.001291383057832718, 0.001498471014201641, 0.0017055589705705643, 0.0019126469269394875, 0.0021197348833084106, 0.002326822839677334, 0.002533910796046257, 0.00274099875241518, 0.0029480867087841034, 0.0031551746651530266, 0.0033622626215219498, 0.003569350577890873, 0.003776438534259796, 0.003983526490628719, 0.0041906144469976425, 0.004397702403366566, 0.004604790359735489, 0.004811878316104412, 0.005018966272473335, 0.0052260542288422585, 0.005433142185211182]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 5.0, 7.0, 10.0, 8.0, 12.0, 11.0, 19.0, 13.0, 20.0, 30.0, 29.0, 21.0, 22.0, 44.0, 32.0, 33.0, 29.0, 41.0, 37.0, 45.0, 50.0, 32.0, 36.0, 40.0, 30.0, 41.0, 31.0, 28.0, 29.0, 31.0, 29.0, 29.0, 14.0, 15.0, 19.0, 17.0, 11.0, 11.0, 4.0, 6.0, 8.0, 9.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.592071533203125, -2.51226806640625, -2.432464599609375, -2.3526611328125, -2.272857666015625, -2.19305419921875, -2.113250732421875, -2.033447265625, -1.953643798828125, -1.87384033203125, -1.794036865234375, -1.7142333984375, -1.634429931640625, -1.55462646484375, -1.474822998046875, -1.39501953125, -1.315216064453125, -1.23541259765625, -1.155609130859375, -1.0758056640625, -0.996002197265625, -0.91619873046875, -0.836395263671875, -0.756591796875, -0.676788330078125, -0.59698486328125, -0.517181396484375, -0.4373779296875, -0.357574462890625, -0.27777099609375, -0.197967529296875, -0.1181640625, -0.038360595703125, 0.04144287109375, 0.121246337890625, 0.2010498046875, 0.280853271484375, 0.36065673828125, 0.440460205078125, 0.520263671875, 0.600067138671875, 0.67987060546875, 0.759674072265625, 0.8394775390625, 0.919281005859375, 0.99908447265625, 1.078887939453125, 1.15869140625, 1.238494873046875, 1.31829833984375, 1.398101806640625, 1.4779052734375, 1.557708740234375, 1.63751220703125, 1.717315673828125, 1.797119140625, 1.876922607421875, 1.95672607421875, 2.036529541015625, 2.1163330078125, 2.196136474609375, 2.27593994140625, 2.355743408203125, 2.435546875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 19.0, 25.0, 45.0, 77.0, 102.0, 186.0, 263.0, 486.0, 803.0, 1455.0, 2650.0, 5086.0, 9451.0, 18584.0, 36980.0, 75035.0, 155089.0, 270027.0, 233572.0, 119859.0, 58083.0, 29240.0, 14820.0, 7576.0, 4034.0, 2076.0, 1138.0, 678.0, 415.0, 226.0, 157.0, 115.0, 53.0, 45.0, 23.0, 22.0, 11.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.716796875, -2.636474609375, -2.55615234375, -2.475830078125, -2.3955078125, -2.315185546875, -2.23486328125, -2.154541015625, -2.07421875, -1.993896484375, -1.91357421875, -1.833251953125, -1.7529296875, -1.672607421875, -1.59228515625, -1.511962890625, -1.431640625, -1.351318359375, -1.27099609375, -1.190673828125, -1.1103515625, -1.030029296875, -0.94970703125, -0.869384765625, -0.7890625, -0.708740234375, -0.62841796875, -0.548095703125, -0.4677734375, -0.387451171875, -0.30712890625, -0.226806640625, -0.146484375, -0.066162109375, 0.01416015625, 0.094482421875, 0.1748046875, 0.255126953125, 0.33544921875, 0.415771484375, 0.49609375, 0.576416015625, 0.65673828125, 0.737060546875, 0.8173828125, 0.897705078125, 0.97802734375, 1.058349609375, 1.138671875, 1.218994140625, 1.29931640625, 1.379638671875, 1.4599609375, 1.540283203125, 1.62060546875, 1.700927734375, 1.78125, 1.861572265625, 1.94189453125, 2.022216796875, 2.1025390625, 2.182861328125, 2.26318359375, 2.343505859375, 2.423828125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 4.0, 7.0, 9.0, 7.0, 11.0, 10.0, 15.0, 18.0, 26.0, 24.0, 33.0, 30.0, 21.0, 40.0, 44.0, 62.0, 67.0, 117.0, 223.0, 1401.0, 294.0, 121.0, 82.0, 53.0, 52.0, 34.0, 31.0, 25.0, 36.0, 25.0, 28.0, 17.0, 16.0, 15.0, 15.0, 8.0, 8.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.890625, -10.5667724609375, -10.242919921875, -9.9190673828125, -9.59521484375, -9.2713623046875, -8.947509765625, -8.6236572265625, -8.2998046875, -7.9759521484375, -7.652099609375, -7.3282470703125, -7.00439453125, -6.6805419921875, -6.356689453125, -6.0328369140625, -5.708984375, -5.3851318359375, -5.061279296875, -4.7374267578125, -4.41357421875, -4.0897216796875, -3.765869140625, -3.4420166015625, -3.1181640625, -2.7943115234375, -2.470458984375, -2.1466064453125, -1.82275390625, -1.4989013671875, -1.175048828125, -0.8511962890625, -0.52734375, -0.2034912109375, 0.120361328125, 0.4442138671875, 0.76806640625, 1.0919189453125, 1.415771484375, 1.7396240234375, 2.0634765625, 2.3873291015625, 2.711181640625, 3.0350341796875, 3.35888671875, 3.6827392578125, 4.006591796875, 4.3304443359375, 4.654296875, 4.9781494140625, 5.302001953125, 5.6258544921875, 5.94970703125, 6.2735595703125, 6.597412109375, 6.9212646484375, 7.2451171875, 7.5689697265625, 7.892822265625, 8.2166748046875, 8.54052734375, 8.8643798828125, 9.188232421875, 9.5120849609375, 9.8359375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 3.0, 11.0, 19.0, 34.0, 35.0, 46.0, 55.0, 84.0, 99.0, 192.0, 269.0, 445.0, 1552.0, 27904.0, 3073162.0, 38738.0, 1668.0, 490.0, 272.0, 171.0, 108.0, 109.0, 62.0, 46.0, 34.0, 25.0, 16.0, 15.0, 8.0, 13.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.625, -26.65673828125, -25.6884765625, -24.72021484375, -23.751953125, -22.78369140625, -21.8154296875, -20.84716796875, -19.87890625, -18.91064453125, -17.9423828125, -16.97412109375, -16.005859375, -15.03759765625, -14.0693359375, -13.10107421875, -12.1328125, -11.16455078125, -10.1962890625, -9.22802734375, -8.259765625, -7.29150390625, -6.3232421875, -5.35498046875, -4.38671875, -3.41845703125, -2.4501953125, -1.48193359375, -0.513671875, 0.45458984375, 1.4228515625, 2.39111328125, 3.359375, 4.32763671875, 5.2958984375, 6.26416015625, 7.232421875, 8.20068359375, 9.1689453125, 10.13720703125, 11.10546875, 12.07373046875, 13.0419921875, 14.01025390625, 14.978515625, 15.94677734375, 16.9150390625, 17.88330078125, 18.8515625, 19.81982421875, 20.7880859375, 21.75634765625, 22.724609375, 23.69287109375, 24.6611328125, 25.62939453125, 26.59765625, 27.56591796875, 28.5341796875, 29.50244140625, 30.470703125, 31.43896484375, 32.4072265625, 33.37548828125, 34.34375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 22.0, 738.0, 258.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.9682502746582, -34.8353157043457, -29.702383041381836, -24.56945037841797, -19.43651580810547, -14.303581237792969, -9.170648574829102, -4.037715911865234, 1.0952186584472656, 6.228152275085449, 11.361085891723633, 16.4940185546875, 21.626953125, 26.7598876953125, 31.892820358276367, 37.025753021240234, 42.158687591552734, 47.291622161865234, 52.42455291748047, 57.55748748779297, 62.69042205810547, 67.82335662841797, 72.95629119873047, 78.08921813964844, 83.22215270996094, 88.35508728027344, 93.48802185058594, 98.62095642089844, 103.75389099121094, 108.88682556152344, 114.0197525024414, 119.1526870727539, 124.28561401367188, 129.41854858398438, 134.55148315429688, 139.68441772460938, 144.81735229492188, 149.95028686523438, 155.08322143554688, 160.21615600585938, 165.34909057617188, 170.48202514648438, 175.61495971679688, 180.74789428710938, 185.88082885742188, 191.01376342773438, 196.14669799804688, 201.27963256835938, 206.4125518798828, 211.5454864501953, 216.6784210205078, 221.8113555908203, 226.9442901611328, 232.0772247314453, 237.2101593017578, 242.34307861328125, 247.47601318359375, 252.60894775390625, 257.74188232421875, 262.87481689453125, 268.00775146484375, 273.14068603515625, 278.27362060546875, 283.40655517578125, 288.53948974609375]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 4.0, 1.0, 5.0, 7.0, 10.0, 6.0, 11.0, 16.0, 15.0, 5.0, 24.0, 16.0, 22.0, 31.0, 32.0, 28.0, 24.0, 27.0, 38.0, 39.0, 35.0, 35.0, 43.0, 35.0, 34.0, 34.0, 37.0, 40.0, 40.0, 38.0, 24.0, 27.0, 24.0, 23.0, 24.0, 21.0, 20.0, 15.0, 14.0, 14.0, 11.0, 9.0, 13.0, 6.0, 6.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.11534881591797, -21.422685623168945, -20.73002052307129, -20.037357330322266, -19.34469223022461, -18.652029037475586, -17.959365844726562, -17.266700744628906, -16.574037551879883, -15.881373405456543, -15.188709259033203, -14.49604606628418, -13.80338191986084, -13.1107177734375, -12.418054580688477, -11.725390434265137, -11.032726287841797, -10.340062141418457, -9.647397994995117, -8.954734802246094, -8.262070655822754, -7.569406509399414, -6.876742839813232, -6.184079170227051, -5.491415023803711, -4.798750877380371, -4.1060872077941895, -3.4134232997894287, -2.720759391784668, -2.0280954837799072, -1.3354315757751465, -0.6427679061889648, 0.049896240234375, 0.7425601482391357, 1.4352240562438965, 2.1278879642486572, 2.820551872253418, 3.5132157802581787, 4.2058796882629395, 4.898543357849121, 5.591207504272461, 6.283871650695801, 6.976535320281982, 7.669198989868164, 8.361863136291504, 9.054527282714844, 9.747190475463867, 10.439854621887207, 11.132518768310547, 11.825182914733887, 12.517847061157227, 13.21051025390625, 13.90317440032959, 14.59583854675293, 15.288501739501953, 15.981165885925293, 16.673830032348633, 17.366493225097656, 18.059158325195312, 18.751821517944336, 19.44448471069336, 20.137149810791016, 20.82981300354004, 21.522476196289062, 22.21514129638672]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 4.0, 9.0, 4.0, 14.0, 13.0, 15.0, 15.0, 18.0, 16.0, 21.0, 20.0, 24.0, 35.0, 26.0, 29.0, 38.0, 43.0, 29.0, 34.0, 49.0, 36.0, 36.0, 40.0, 34.0, 38.0, 29.0, 31.0, 34.0, 20.0, 32.0, 28.0, 28.0, 19.0, 18.0, 12.0, 9.0, 12.0, 19.0, 11.0, 7.0, 10.0, 15.0, 4.0, 5.0, 6.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.71484375, -2.632354736328125, -2.54986572265625, -2.467376708984375, -2.3848876953125, -2.302398681640625, -2.21990966796875, -2.137420654296875, -2.054931640625, -1.972442626953125, -1.88995361328125, -1.807464599609375, -1.7249755859375, -1.642486572265625, -1.55999755859375, -1.477508544921875, -1.39501953125, -1.312530517578125, -1.23004150390625, -1.147552490234375, -1.0650634765625, -0.982574462890625, -0.90008544921875, -0.817596435546875, -0.735107421875, -0.652618408203125, -0.57012939453125, -0.487640380859375, -0.4051513671875, -0.322662353515625, -0.24017333984375, -0.157684326171875, -0.0751953125, 0.007293701171875, 0.08978271484375, 0.172271728515625, 0.2547607421875, 0.337249755859375, 0.41973876953125, 0.502227783203125, 0.584716796875, 0.667205810546875, 0.74969482421875, 0.832183837890625, 0.9146728515625, 0.997161865234375, 1.07965087890625, 1.162139892578125, 1.24462890625, 1.327117919921875, 1.40960693359375, 1.492095947265625, 1.5745849609375, 1.657073974609375, 1.73956298828125, 1.822052001953125, 1.904541015625, 1.987030029296875, 2.06951904296875, 2.152008056640625, 2.2344970703125, 2.316986083984375, 2.39947509765625, 2.481964111328125, 2.564453125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 7.0, 3.0, 7.0, 7.0, 10.0, 8.0, 8.0, 16.0, 14.0, 19.0, 13.0, 23.0, 27.0, 35.0, 24.0, 51.0, 81.0, 154.0, 430.0, 1417.0, 9509.0, 132522.0, 1885645.0, 2002805.0, 148217.0, 10554.0, 1633.0, 447.0, 195.0, 93.0, 60.0, 48.0, 26.0, 21.0, 16.0, 25.0, 13.0, 17.0, 17.0, 18.0, 13.0, 12.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.2662353515625, -8.985595703125, -8.7049560546875, -8.42431640625, -8.1436767578125, -7.863037109375, -7.5823974609375, -7.3017578125, -7.0211181640625, -6.740478515625, -6.4598388671875, -6.17919921875, -5.8985595703125, -5.617919921875, -5.3372802734375, -5.056640625, -4.7760009765625, -4.495361328125, -4.2147216796875, -3.93408203125, -3.6534423828125, -3.372802734375, -3.0921630859375, -2.8115234375, -2.5308837890625, -2.250244140625, -1.9696044921875, -1.68896484375, -1.4083251953125, -1.127685546875, -0.8470458984375, -0.56640625, -0.2857666015625, -0.005126953125, 0.2755126953125, 0.55615234375, 0.8367919921875, 1.117431640625, 1.3980712890625, 1.6787109375, 1.9593505859375, 2.239990234375, 2.5206298828125, 2.80126953125, 3.0819091796875, 3.362548828125, 3.6431884765625, 3.923828125, 4.2044677734375, 4.485107421875, 4.7657470703125, 5.04638671875, 5.3270263671875, 5.607666015625, 5.8883056640625, 6.1689453125, 6.4495849609375, 6.730224609375, 7.0108642578125, 7.29150390625, 7.5721435546875, 7.852783203125, 8.1334228515625, 8.4140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 19.0, 23.0, 24.0, 37.0, 53.0, 50.0, 89.0, 106.0, 166.0, 193.0, 267.0, 330.0, 348.0, 394.0, 417.0, 307.0, 297.0, 210.0, 165.0, 142.0, 87.0, 89.0, 61.0, 40.0, 32.0, 24.0, 13.0, 20.0, 9.0, 8.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.06640625, -5.87451171875, -5.6826171875, -5.49072265625, -5.298828125, -5.10693359375, -4.9150390625, -4.72314453125, -4.53125, -4.33935546875, -4.1474609375, -3.95556640625, -3.763671875, -3.57177734375, -3.3798828125, -3.18798828125, -2.99609375, -2.80419921875, -2.6123046875, -2.42041015625, -2.228515625, -2.03662109375, -1.8447265625, -1.65283203125, -1.4609375, -1.26904296875, -1.0771484375, -0.88525390625, -0.693359375, -0.50146484375, -0.3095703125, -0.11767578125, 0.07421875, 0.26611328125, 0.4580078125, 0.64990234375, 0.841796875, 1.03369140625, 1.2255859375, 1.41748046875, 1.609375, 1.80126953125, 1.9931640625, 2.18505859375, 2.376953125, 2.56884765625, 2.7607421875, 2.95263671875, 3.14453125, 3.33642578125, 3.5283203125, 3.72021484375, 3.912109375, 4.10400390625, 4.2958984375, 4.48779296875, 4.6796875, 4.87158203125, 5.0634765625, 5.25537109375, 5.447265625, 5.63916015625, 5.8310546875, 6.02294921875, 6.21484375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 12.0, 10.0, 12.0, 21.0, 24.0, 39.0, 54.0, 86.0, 81.0, 149.0, 198.0, 306.0, 610.0, 2062.0, 18517.0, 413205.0, 3306067.0, 430402.0, 18781.0, 2107.0, 577.0, 296.0, 202.0, 116.0, 92.0, 65.0, 50.0, 31.0, 30.0, 19.0, 17.0, 11.0, 10.0, 7.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.4375, -13.979248046875, -13.52099609375, -13.062744140625, -12.6044921875, -12.146240234375, -11.68798828125, -11.229736328125, -10.771484375, -10.313232421875, -9.85498046875, -9.396728515625, -8.9384765625, -8.480224609375, -8.02197265625, -7.563720703125, -7.10546875, -6.647216796875, -6.18896484375, -5.730712890625, -5.2724609375, -4.814208984375, -4.35595703125, -3.897705078125, -3.439453125, -2.981201171875, -2.52294921875, -2.064697265625, -1.6064453125, -1.148193359375, -0.68994140625, -0.231689453125, 0.2265625, 0.684814453125, 1.14306640625, 1.601318359375, 2.0595703125, 2.517822265625, 2.97607421875, 3.434326171875, 3.892578125, 4.350830078125, 4.80908203125, 5.267333984375, 5.7255859375, 6.183837890625, 6.64208984375, 7.100341796875, 7.55859375, 8.016845703125, 8.47509765625, 8.933349609375, 9.3916015625, 9.849853515625, 10.30810546875, 10.766357421875, 11.224609375, 11.682861328125, 12.14111328125, 12.599365234375, 13.0576171875, 13.515869140625, 13.97412109375, 14.432373046875, 14.890625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 21.0, 66.0, 127.0, 275.0, 237.0, 174.0, 87.0, 16.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.227203369140625, -31.95541000366211, -29.683616638183594, -27.41182518005371, -25.140031814575195, -22.86823844909668, -20.596446990966797, -18.32465362548828, -16.052860260009766, -13.78106689453125, -11.50927448272705, -9.237482070922852, -6.965688705444336, -4.69389533996582, -2.422102928161621, -0.15031051635742188, 2.1214828491210938, 4.393275737762451, 6.665068626403809, 8.936861038208008, 11.208654403686523, 13.480447769165039, 15.752240180969238, 18.024032592773438, 20.295825958251953, 22.56761932373047, 24.839412689208984, 27.111204147338867, 29.382997512817383, 31.6547908782959, 33.92658233642578, 36.1983757019043, 38.47016143798828, 40.7419548034668, 43.01374816894531, 45.28554153442383, 47.557334899902344, 49.829124450683594, 52.10091781616211, 54.372711181640625, 56.64450454711914, 58.916297912597656, 61.18809127807617, 63.45988464355469, 65.73167419433594, 68.00347137451172, 70.27526092529297, 72.54705810546875, 74.81884765625, 77.09063720703125, 79.36243438720703, 81.63422393798828, 83.90602111816406, 86.17781066894531, 88.4496078491211, 90.72139739990234, 92.99319458007812, 95.26498413085938, 97.53678131103516, 99.8085708618164, 102.08036804199219, 104.35215759277344, 106.62395477294922, 108.89574432373047, 111.16753387451172]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 1.0, 8.0, 9.0, 13.0, 18.0, 17.0, 13.0, 21.0, 25.0, 28.0, 25.0, 31.0, 27.0, 30.0, 44.0, 33.0, 42.0, 42.0, 42.0, 39.0, 33.0, 37.0, 33.0, 34.0, 46.0, 40.0, 25.0, 24.0, 35.0, 25.0, 22.0, 23.0, 20.0, 25.0, 21.0, 14.0, 9.0, 4.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.351171493530273, -21.68994903564453, -21.028724670410156, -20.36750030517578, -19.70627784729004, -19.045055389404297, -18.383831024169922, -17.722606658935547, -17.061384201049805, -16.400161743164062, -15.738937377929688, -15.077713966369629, -14.41649055480957, -13.755267143249512, -13.094043731689453, -12.432820320129395, -11.771596908569336, -11.110373497009277, -10.449150085449219, -9.78792667388916, -9.126703262329102, -8.465479850769043, -7.804256439208984, -7.143033027648926, -6.481809616088867, -5.820586204528809, -5.15936279296875, -4.498139381408691, -3.836915969848633, -3.175692558288574, -2.5144691467285156, -1.853245735168457, -1.1920242309570312, -0.5308008193969727, 0.13042259216308594, 0.7916460037231445, 1.4528694152832031, 2.1140928268432617, 2.7753162384033203, 3.436539649963379, 4.0977630615234375, 4.758986473083496, 5.420209884643555, 6.081433296203613, 6.742656707763672, 7.4038801193237305, 8.065103530883789, 8.726326942443848, 9.387550354003906, 10.048773765563965, 10.709997177124023, 11.371220588684082, 12.03244400024414, 12.6936674118042, 13.354890823364258, 14.016114234924316, 14.677337646484375, 15.338561058044434, 15.999784469604492, 16.661006927490234, 17.32223129272461, 17.983455657958984, 18.644678115844727, 19.30590057373047, 19.967124938964844]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 6.0, 9.0, 8.0, 7.0, 9.0, 5.0, 17.0, 14.0, 15.0, 14.0, 19.0, 32.0, 13.0, 21.0, 27.0, 31.0, 34.0, 32.0, 47.0, 40.0, 38.0, 37.0, 35.0, 46.0, 47.0, 45.0, 30.0, 36.0, 32.0, 29.0, 29.0, 22.0, 20.0, 16.0, 13.0, 19.0, 14.0, 13.0, 10.0, 13.0, 10.0, 10.0, 12.0, 7.0, 2.0, 6.0, 0.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.666015625, -2.583404541015625, -2.50079345703125, -2.418182373046875, -2.3355712890625, -2.252960205078125, -2.17034912109375, -2.087738037109375, -2.005126953125, -1.922515869140625, -1.83990478515625, -1.757293701171875, -1.6746826171875, -1.592071533203125, -1.50946044921875, -1.426849365234375, -1.34423828125, -1.261627197265625, -1.17901611328125, -1.096405029296875, -1.0137939453125, -0.931182861328125, -0.84857177734375, -0.765960693359375, -0.683349609375, -0.600738525390625, -0.51812744140625, -0.435516357421875, -0.3529052734375, -0.270294189453125, -0.18768310546875, -0.105072021484375, -0.0224609375, 0.060150146484375, 0.14276123046875, 0.225372314453125, 0.3079833984375, 0.390594482421875, 0.47320556640625, 0.555816650390625, 0.638427734375, 0.721038818359375, 0.80364990234375, 0.886260986328125, 0.9688720703125, 1.051483154296875, 1.13409423828125, 1.216705322265625, 1.29931640625, 1.381927490234375, 1.46453857421875, 1.547149658203125, 1.6297607421875, 1.712371826171875, 1.79498291015625, 1.877593994140625, 1.960205078125, 2.042816162109375, 2.12542724609375, 2.208038330078125, 2.2906494140625, 2.373260498046875, 2.45587158203125, 2.538482666015625, 2.62109375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 14.0, 9.0, 20.0, 19.0, 26.0, 45.0, 64.0, 111.0, 140.0, 198.0, 320.0, 476.0, 718.0, 1097.0, 1826.0, 2826.0, 4750.0, 8121.0, 14401.0, 25679.0, 48199.0, 92402.0, 175744.0, 258334.0, 191587.0, 102303.0, 52681.0, 28212.0, 15625.0, 8897.0, 5187.0, 3108.0, 1913.0, 1190.0, 780.0, 485.0, 320.0, 253.0, 158.0, 104.0, 65.0, 44.0, 26.0, 22.0, 20.0, 7.0, 10.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.4169921875, -0.40378570556640625, -0.3905792236328125, -0.37737274169921875, -0.364166259765625, -0.35095977783203125, -0.3377532958984375, -0.32454681396484375, -0.31134033203125, -0.29813385009765625, -0.2849273681640625, -0.27172088623046875, -0.258514404296875, -0.24530792236328125, -0.2321014404296875, -0.21889495849609375, -0.2056884765625, -0.19248199462890625, -0.1792755126953125, -0.16606903076171875, -0.152862548828125, -0.13965606689453125, -0.1264495849609375, -0.11324310302734375, -0.10003662109375, -0.08683013916015625, -0.0736236572265625, -0.06041717529296875, -0.047210693359375, -0.03400421142578125, -0.0207977294921875, -0.00759124755859375, 0.005615234375, 0.01882171630859375, 0.0320281982421875, 0.04523468017578125, 0.058441162109375, 0.07164764404296875, 0.0848541259765625, 0.09806060791015625, 0.11126708984375, 0.12447357177734375, 0.1376800537109375, 0.15088653564453125, 0.164093017578125, 0.17729949951171875, 0.1905059814453125, 0.20371246337890625, 0.2169189453125, 0.23012542724609375, 0.2433319091796875, 0.25653839111328125, 0.269744873046875, 0.28295135498046875, 0.2961578369140625, 0.30936431884765625, 0.32257080078125, 0.33577728271484375, 0.3489837646484375, 0.36219024658203125, 0.375396728515625, 0.38860321044921875, 0.4018096923828125, 0.41501617431640625, 0.42822265625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 14.0, 7.0, 9.0, 7.0, 9.0, 16.0, 12.0, 10.0, 28.0, 22.0, 16.0, 23.0, 30.0, 21.0, 26.0, 39.0, 33.0, 38.0, 39.0, 32.0, 31.0, 1054.0, 36.0, 36.0, 37.0, 26.0, 24.0, 40.0, 34.0, 32.0, 28.0, 28.0, 24.0, 28.0, 20.0, 15.0, 13.0, 17.0, 9.0, 13.0, 11.0, 7.0, 4.0, 8.0, 3.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.547943115234375, -1.49432373046875, -1.440704345703125, -1.3870849609375, -1.333465576171875, -1.27984619140625, -1.226226806640625, -1.172607421875, -1.118988037109375, -1.06536865234375, -1.011749267578125, -0.9581298828125, -0.904510498046875, -0.85089111328125, -0.797271728515625, -0.74365234375, -0.690032958984375, -0.63641357421875, -0.582794189453125, -0.5291748046875, -0.475555419921875, -0.42193603515625, -0.368316650390625, -0.314697265625, -0.261077880859375, -0.20745849609375, -0.153839111328125, -0.1002197265625, -0.046600341796875, 0.00701904296875, 0.060638427734375, 0.1142578125, 0.167877197265625, 0.22149658203125, 0.275115966796875, 0.3287353515625, 0.382354736328125, 0.43597412109375, 0.489593505859375, 0.543212890625, 0.596832275390625, 0.65045166015625, 0.704071044921875, 0.7576904296875, 0.811309814453125, 0.86492919921875, 0.918548583984375, 0.97216796875, 1.025787353515625, 1.07940673828125, 1.133026123046875, 1.1866455078125, 1.240264892578125, 1.29388427734375, 1.347503662109375, 1.401123046875, 1.454742431640625, 1.50836181640625, 1.561981201171875, 1.6156005859375, 1.669219970703125, 1.72283935546875, 1.776458740234375, 1.830078125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 16.0, 37.0, 48.0, 77.0, 116.0, 147.0, 222.0, 331.0, 463.0, 640.0, 910.0, 1237.0, 1864.0, 2701.0, 3963.0, 5808.0, 8469.0, 12163.0, 17714.0, 25996.0, 37456.0, 53869.0, 76833.0, 106223.0, 162769.0, 1162507.0, 119990.0, 89164.0, 63390.0, 44172.0, 30643.0, 20816.0, 14404.0, 9961.0, 6913.0, 4657.0, 3115.0, 2275.0, 1501.0, 1123.0, 759.0, 490.0, 365.0, 256.0, 181.0, 133.0, 85.0, 48.0, 40.0, 24.0, 14.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.1680908203125, -0.1628742218017578, -0.15765762329101562, -0.15244102478027344, -0.14722442626953125, -0.14200782775878906, -0.13679122924804688, -0.1315746307373047, -0.1263580322265625, -0.12114143371582031, -0.11592483520507812, -0.11070823669433594, -0.10549163818359375, -0.10027503967285156, -0.09505844116210938, -0.08984184265136719, -0.084625244140625, -0.07940864562988281, -0.07419204711914062, -0.06897544860839844, -0.06375885009765625, -0.05854225158691406, -0.053325653076171875, -0.04810905456542969, -0.0428924560546875, -0.03767585754394531, -0.032459259033203125, -0.027242660522460938, -0.02202606201171875, -0.016809463500976562, -0.011592864990234375, -0.0063762664794921875, -0.00115966796875, 0.0040569305419921875, 0.009273529052734375, 0.014490127563476562, 0.01970672607421875, 0.024923324584960938, 0.030139923095703125, 0.03535652160644531, 0.0405731201171875, 0.04578971862792969, 0.051006317138671875, 0.05622291564941406, 0.06143951416015625, 0.06665611267089844, 0.07187271118164062, 0.07708930969238281, 0.082305908203125, 0.08752250671386719, 0.09273910522460938, 0.09795570373535156, 0.10317230224609375, 0.10838890075683594, 0.11360549926757812, 0.11882209777832031, 0.1240386962890625, 0.1292552947998047, 0.13447189331054688, 0.13968849182128906, 0.14490509033203125, 0.15012168884277344, 0.15533828735351562, 0.1605548858642578, 0.165771484375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 16.0, 11.0, 6.0, 17.0, 28.0, 32.0, 35.0, 34.0, 43.0, 69.0, 84.0, 112.0, 109.0, 87.0, 63.0, 40.0, 30.0, 35.0, 21.0, 20.0, 17.0, 8.0, 3.0, 10.0, 10.0, 4.0, 8.0, 10.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004810333251953125, -0.004660069942474365, -0.0045098066329956055, -0.004359543323516846, -0.004209280014038086, -0.004059016704559326, -0.003908753395080566, -0.0037584900856018066, -0.003608226776123047, -0.003457963466644287, -0.0033077001571655273, -0.0031574368476867676, -0.003007173538208008, -0.002856910228729248, -0.0027066469192504883, -0.0025563836097717285, -0.0024061203002929688, -0.002255856990814209, -0.0021055936813354492, -0.0019553303718566895, -0.0018050670623779297, -0.00165480375289917, -0.0015045404434204102, -0.0013542771339416504, -0.0012040138244628906, -0.0010537505149841309, -0.0009034872055053711, -0.0007532238960266113, -0.0006029605865478516, -0.0004526972770690918, -0.00030243396759033203, -0.00015217065811157227, -1.9073486328125e-06, 0.00014835596084594727, 0.00029861927032470703, 0.0004488825798034668, 0.0005991458892822266, 0.0007494091987609863, 0.0008996725082397461, 0.0010499358177185059, 0.0012001991271972656, 0.0013504624366760254, 0.0015007257461547852, 0.001650989055633545, 0.0018012523651123047, 0.0019515156745910645, 0.0021017789840698242, 0.002252042293548584, 0.0024023056030273438, 0.0025525689125061035, 0.0027028322219848633, 0.002853095531463623, 0.003003358840942383, 0.0031536221504211426, 0.0033038854598999023, 0.003454148769378662, 0.003604412078857422, 0.0037546753883361816, 0.0039049386978149414, 0.004055202007293701, 0.004205465316772461, 0.004355728626251221, 0.0045059919357299805, 0.00465625524520874, 0.0048065185546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 9.0, 9.0, 10.0, 9.0, 9.0, 16.0, 14.0, 33.0, 43.0, 55.0, 65.0, 114.0, 191.0, 392.0, 2268.0, 401548.0, 639928.0, 2806.0, 386.0, 205.0, 127.0, 84.0, 62.0, 42.0, 31.0, 18.0, 18.0, 17.0, 15.0, 3.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09478759765625, -0.0918283462524414, -0.08886909484863281, -0.08590984344482422, -0.08295059204101562, -0.07999134063720703, -0.07703208923339844, -0.07407283782958984, -0.07111358642578125, -0.06815433502197266, -0.06519508361816406, -0.06223583221435547, -0.059276580810546875, -0.05631732940673828, -0.05335807800292969, -0.050398826599121094, -0.0474395751953125, -0.044480323791503906, -0.04152107238769531, -0.03856182098388672, -0.035602569580078125, -0.03264331817626953, -0.029684066772460938, -0.026724815368652344, -0.02376556396484375, -0.020806312561035156, -0.017847061157226562, -0.014887809753417969, -0.011928558349609375, -0.008969306945800781, -0.0060100555419921875, -0.0030508041381835938, -9.1552734375e-05, 0.0028676986694335938, 0.0058269500732421875, 0.008786201477050781, 0.011745452880859375, 0.014704704284667969, 0.017663955688476562, 0.020623207092285156, 0.02358245849609375, 0.026541709899902344, 0.029500961303710938, 0.03246021270751953, 0.035419464111328125, 0.03837871551513672, 0.04133796691894531, 0.044297218322753906, 0.0472564697265625, 0.050215721130371094, 0.05317497253417969, 0.05613422393798828, 0.059093475341796875, 0.06205272674560547, 0.06501197814941406, 0.06797122955322266, 0.07093048095703125, 0.07388973236083984, 0.07684898376464844, 0.07980823516845703, 0.08276748657226562, 0.08572673797607422, 0.08868598937988281, 0.0916452407836914, 0.0946044921875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 12.0, 503.0, 454.0, 39.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036411816254258156, -0.002398015931248665, -0.0011548504699021578, 8.831499144434929e-05, 0.0013314806856215, 0.0025746463797986507, 0.003817811608314514, 0.005060977302491665, 0.006304142996668816, 0.007547308690845966, 0.008790474385023117, 0.010033639147877693, 0.011276805773377419, 0.012519970536231995, 0.013763136230409145, 0.015006301924586296, 0.016249466687440872, 0.01749263145029545, 0.018735798075795174, 0.01997896283864975, 0.021222129464149475, 0.02246529422700405, 0.023708458989858627, 0.024951625615358353, 0.026194792240858078, 0.027437957003712654, 0.02868112362921238, 0.029924288392066956, 0.03116745501756668, 0.032410621643066406, 0.03365378454327583, 0.03489695116877556, 0.036140117794275284, 0.03738328441977501, 0.038626447319984436, 0.03986961394548416, 0.04111278057098389, 0.04235594719648361, 0.04359911009669304, 0.044842276722192764, 0.04608544334769249, 0.047328609973192215, 0.04857177287340164, 0.04981493949890137, 0.05105810612440109, 0.05230127274990082, 0.053544435650110245, 0.05478760227560997, 0.0560307651758194, 0.05727393180131912, 0.05851709470152855, 0.059760261327028275, 0.061003427952528, 0.062246594578027725, 0.06348975747823715, 0.06473292410373688, 0.0659760907292366, 0.06721925735473633, 0.06846242398023605, 0.06970559060573578, 0.07094874978065491, 0.07219191640615463, 0.07343508303165436, 0.07467824965715408, 0.07592141628265381]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 12.0, 15.0, 18.0, 22.0, 33.0, 36.0, 38.0, 45.0, 61.0, 59.0, 73.0, 65.0, 89.0, 79.0, 64.0, 50.0, 53.0, 51.0, 40.0, 27.0, 28.0, 14.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0064484477043151855, -0.006268625147640705, -0.006088802590966225, -0.005908980034291744, -0.005729157477617264, -0.005549334920942783, -0.005369512364268303, -0.0051896898075938225, -0.005009867250919342, -0.004830044694244862, -0.004650222137570381, -0.004470399580895901, -0.00429057702422142, -0.00411075446754694, -0.003930931910872459, -0.003751109354197979, -0.0035712867975234985, -0.003391464240849018, -0.0032116416841745377, -0.0030318191275000572, -0.0028519965708255768, -0.0026721740141510963, -0.002492351457476616, -0.0023125289008021355, -0.002132706344127655, -0.0019528837874531746, -0.0017730612307786942, -0.0015932386741042137, -0.0014134161174297333, -0.0012335935607552528, -0.0010537710040807724, -0.000873948447406292, -0.0006941258907318115, -0.0005143033340573311, -0.00033448077738285065, -0.0001546582207083702, 2.516433596611023e-05, 0.00020498689264059067, 0.0003848094493150711, 0.0005646320059895515, 0.000744454562664032, 0.0009242771193385124, 0.0011040996760129929, 0.0012839222326874733, 0.0014637447893619537, 0.0016435673460364342, 0.0018233899027109146, 0.002003212459385395, 0.0021830350160598755, 0.002362857572734356, 0.0025426801294088364, 0.002722502686083317, 0.0029023252427577972, 0.0030821477994322777, 0.003261970356106758, 0.0034417929127812386, 0.003621615469455719, 0.0038014380261301994, 0.00398126058280468, 0.00416108313947916, 0.004340905696153641, 0.004520728252828121, 0.004700550809502602, 0.004880373366177082, 0.0050601959228515625]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 6.0, 9.0, 8.0, 7.0, 9.0, 5.0, 17.0, 14.0, 15.0, 13.0, 20.0, 32.0, 13.0, 21.0, 27.0, 31.0, 34.0, 32.0, 47.0, 40.0, 38.0, 37.0, 35.0, 46.0, 47.0, 45.0, 30.0, 36.0, 32.0, 29.0, 29.0, 22.0, 20.0, 16.0, 12.0, 20.0, 14.0, 13.0, 10.0, 13.0, 10.0, 10.0, 12.0, 7.0, 2.0, 6.0, 0.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.666015625, -2.583404541015625, -2.50079345703125, -2.418182373046875, -2.3355712890625, -2.252960205078125, -2.17034912109375, -2.087738037109375, -2.005126953125, -1.922515869140625, -1.83990478515625, -1.757293701171875, -1.6746826171875, -1.592071533203125, -1.50946044921875, -1.426849365234375, -1.34423828125, -1.261627197265625, -1.17901611328125, -1.096405029296875, -1.0137939453125, -0.931182861328125, -0.84857177734375, -0.765960693359375, -0.683349609375, -0.600738525390625, -0.51812744140625, -0.435516357421875, -0.3529052734375, -0.270294189453125, -0.18768310546875, -0.105072021484375, -0.0224609375, 0.060150146484375, 0.14276123046875, 0.225372314453125, 0.3079833984375, 0.390594482421875, 0.47320556640625, 0.555816650390625, 0.638427734375, 0.721038818359375, 0.80364990234375, 0.886260986328125, 0.9688720703125, 1.051483154296875, 1.13409423828125, 1.216705322265625, 1.29931640625, 1.381927490234375, 1.46453857421875, 1.547149658203125, 1.6297607421875, 1.712371826171875, 1.79498291015625, 1.877593994140625, 1.960205078125, 2.042816162109375, 2.12542724609375, 2.208038330078125, 2.2906494140625, 2.373260498046875, 2.45587158203125, 2.538482666015625, 2.62109375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 12.0, 23.0, 32.0, 42.0, 78.0, 125.0, 284.0, 630.0, 1422.0, 3471.0, 8061.0, 19612.0, 46201.0, 109440.0, 267014.0, 339665.0, 145378.0, 61932.0, 26130.0, 10958.0, 4473.0, 1853.0, 872.0, 405.0, 185.0, 101.0, 54.0, 32.0, 20.0, 14.0, 9.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.39453125, -4.279388427734375, -4.16424560546875, -4.049102783203125, -3.9339599609375, -3.818817138671875, -3.70367431640625, -3.588531494140625, -3.473388671875, -3.358245849609375, -3.24310302734375, -3.127960205078125, -3.0128173828125, -2.897674560546875, -2.78253173828125, -2.667388916015625, -2.55224609375, -2.437103271484375, -2.32196044921875, -2.206817626953125, -2.0916748046875, -1.976531982421875, -1.86138916015625, -1.746246337890625, -1.631103515625, -1.515960693359375, -1.40081787109375, -1.285675048828125, -1.1705322265625, -1.055389404296875, -0.94024658203125, -0.825103759765625, -0.7099609375, -0.594818115234375, -0.47967529296875, -0.364532470703125, -0.2493896484375, -0.134246826171875, -0.01910400390625, 0.096038818359375, 0.211181640625, 0.326324462890625, 0.44146728515625, 0.556610107421875, 0.6717529296875, 0.786895751953125, 0.90203857421875, 1.017181396484375, 1.13232421875, 1.247467041015625, 1.36260986328125, 1.477752685546875, 1.5928955078125, 1.708038330078125, 1.82318115234375, 1.938323974609375, 2.053466796875, 2.168609619140625, 2.28375244140625, 2.398895263671875, 2.5140380859375, 2.629180908203125, 2.74432373046875, 2.859466552734375, 2.974609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 10.0, 12.0, 6.0, 11.0, 13.0, 19.0, 22.0, 23.0, 33.0, 33.0, 29.0, 48.0, 68.0, 73.0, 110.0, 216.0, 1461.0, 252.0, 138.0, 95.0, 52.0, 56.0, 42.0, 32.0, 29.0, 33.0, 28.0, 18.0, 9.0, 12.0, 14.0, 12.0, 4.0, 7.0, 5.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.921875, -9.5855712890625, -9.249267578125, -8.9129638671875, -8.57666015625, -8.2403564453125, -7.904052734375, -7.5677490234375, -7.2314453125, -6.8951416015625, -6.558837890625, -6.2225341796875, -5.88623046875, -5.5499267578125, -5.213623046875, -4.8773193359375, -4.541015625, -4.2047119140625, -3.868408203125, -3.5321044921875, -3.19580078125, -2.8594970703125, -2.523193359375, -2.1868896484375, -1.8505859375, -1.5142822265625, -1.177978515625, -0.8416748046875, -0.50537109375, -0.1690673828125, 0.167236328125, 0.5035400390625, 0.83984375, 1.1761474609375, 1.512451171875, 1.8487548828125, 2.18505859375, 2.5213623046875, 2.857666015625, 3.1939697265625, 3.5302734375, 3.8665771484375, 4.202880859375, 4.5391845703125, 4.87548828125, 5.2117919921875, 5.548095703125, 5.8843994140625, 6.220703125, 6.5570068359375, 6.893310546875, 7.2296142578125, 7.56591796875, 7.9022216796875, 8.238525390625, 8.5748291015625, 8.9111328125, 9.2474365234375, 9.583740234375, 9.9200439453125, 10.25634765625, 10.5926513671875, 10.928955078125, 11.2652587890625, 11.6015625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 8.0, 5.0, 9.0, 12.0, 17.0, 25.0, 34.0, 41.0, 49.0, 66.0, 90.0, 111.0, 212.0, 266.0, 513.0, 1599.0, 68830.0, 3052449.0, 18954.0, 1147.0, 418.0, 232.0, 145.0, 104.0, 93.0, 63.0, 46.0, 39.0, 27.0, 27.0, 8.0, 18.0, 12.0, 5.0, 4.0, 6.0, 1.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.109375, -22.161865234375, -21.21435546875, -20.266845703125, -19.3193359375, -18.371826171875, -17.42431640625, -16.476806640625, -15.529296875, -14.581787109375, -13.63427734375, -12.686767578125, -11.7392578125, -10.791748046875, -9.84423828125, -8.896728515625, -7.94921875, -7.001708984375, -6.05419921875, -5.106689453125, -4.1591796875, -3.211669921875, -2.26416015625, -1.316650390625, -0.369140625, 0.578369140625, 1.52587890625, 2.473388671875, 3.4208984375, 4.368408203125, 5.31591796875, 6.263427734375, 7.2109375, 8.158447265625, 9.10595703125, 10.053466796875, 11.0009765625, 11.948486328125, 12.89599609375, 13.843505859375, 14.791015625, 15.738525390625, 16.68603515625, 17.633544921875, 18.5810546875, 19.528564453125, 20.47607421875, 21.423583984375, 22.37109375, 23.318603515625, 24.26611328125, 25.213623046875, 26.1611328125, 27.108642578125, 28.05615234375, 29.003662109375, 29.951171875, 30.898681640625, 31.84619140625, 32.793701171875, 33.7412109375, 34.688720703125, 35.63623046875, 36.583740234375, 37.53125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 19.0, 99.0, 366.0, 396.0, 121.0, 11.0, 4.0], "bins": [-123.5738296508789, -121.51334381103516, -119.4528579711914, -117.39237213134766, -115.3318862915039, -113.27140045166016, -111.2109146118164, -109.15042877197266, -107.0899429321289, -105.02945709228516, -102.9689712524414, -100.90848541259766, -98.8479995727539, -96.78751373291016, -94.7270278930664, -92.66654205322266, -90.60604858398438, -88.54556274414062, -86.48507690429688, -84.42459106445312, -82.36410522460938, -80.30361938476562, -78.24313354492188, -76.18264770507812, -74.12216186523438, -72.06167602539062, -70.00119018554688, -67.94070434570312, -65.88021850585938, -63.819732666015625, -61.759246826171875, -59.698760986328125, -57.638267517089844, -55.577781677246094, -53.517295837402344, -51.456809997558594, -49.396324157714844, -47.335838317871094, -45.275352478027344, -43.214866638183594, -41.154380798339844, -39.093894958496094, -37.033409118652344, -34.972923278808594, -32.912437438964844, -30.851951599121094, -28.79146385192871, -26.73097801208496, -24.67049217224121, -22.61000633239746, -20.54952049255371, -18.489032745361328, -16.428546905517578, -14.368062019348145, -12.307575225830078, -10.247089385986328, -8.186603546142578, -6.126117706298828, -4.06563138961792, -2.0051450729370117, 0.05534076690673828, 2.1158266067504883, 4.176313400268555, 6.236799240112305, 8.297285079956055]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 4.0, 8.0, 13.0, 15.0, 20.0, 22.0, 16.0, 26.0, 33.0, 38.0, 30.0, 36.0, 30.0, 32.0, 41.0, 40.0, 45.0, 50.0, 39.0, 42.0, 37.0, 34.0, 41.0, 30.0, 32.0, 36.0, 30.0, 23.0, 21.0, 16.0, 15.0, 22.0, 17.0, 12.0, 10.0, 16.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.9287166595459, -27.018306732177734, -26.10789680480957, -25.197486877441406, -24.28707504272461, -23.376665115356445, -22.46625518798828, -21.555845260620117, -20.645435333251953, -19.73502540588379, -18.824615478515625, -17.914203643798828, -17.003793716430664, -16.0933837890625, -15.182973861694336, -14.272563934326172, -13.362153053283691, -12.451743125915527, -11.541332244873047, -10.630922317504883, -9.720512390136719, -8.810102462768555, -7.899691581726074, -6.98928165435791, -6.078871250152588, -5.168460845947266, -4.258050918579102, -3.3476405143737793, -2.437230348587036, -1.526820182800293, -0.6164097785949707, 0.29400014877319336, 1.2044105529785156, 2.114820718765259, 3.025230884552002, 3.935641288757324, 4.846051216125488, 5.7564616203308105, 6.666872024536133, 7.577281951904297, 8.487691879272461, 9.398101806640625, 10.308512687683105, 11.21892261505127, 12.129332542419434, 13.039743423461914, 13.950153350830078, 14.860563278198242, 15.770974159240723, 16.681385040283203, 17.591794967651367, 18.50220489501953, 19.412614822387695, 20.32302474975586, 21.233436584472656, 22.143844604492188, 23.054256439208984, 23.96466636657715, 24.875076293945312, 25.78548812866211, 26.695898056030273, 27.606307983398438, 28.5167179107666, 29.427127838134766, 30.33753776550293]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 2.0, 5.0, 9.0, 5.0, 13.0, 10.0, 13.0, 15.0, 18.0, 11.0, 17.0, 24.0, 24.0, 28.0, 27.0, 26.0, 33.0, 36.0, 37.0, 44.0, 37.0, 44.0, 53.0, 38.0, 51.0, 39.0, 32.0, 35.0, 33.0, 29.0, 25.0, 23.0, 23.0, 16.0, 15.0, 11.0, 17.0, 12.0, 9.0, 16.0, 11.0, 7.0, 8.0, 3.0, 6.0, 5.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.951171875, -2.853363037109375, -2.75555419921875, -2.657745361328125, -2.5599365234375, -2.462127685546875, -2.36431884765625, -2.266510009765625, -2.168701171875, -2.070892333984375, -1.97308349609375, -1.875274658203125, -1.7774658203125, -1.679656982421875, -1.58184814453125, -1.484039306640625, -1.38623046875, -1.288421630859375, -1.19061279296875, -1.092803955078125, -0.9949951171875, -0.897186279296875, -0.79937744140625, -0.701568603515625, -0.603759765625, -0.505950927734375, -0.40814208984375, -0.310333251953125, -0.2125244140625, -0.114715576171875, -0.01690673828125, 0.080902099609375, 0.1787109375, 0.276519775390625, 0.37432861328125, 0.472137451171875, 0.5699462890625, 0.667755126953125, 0.76556396484375, 0.863372802734375, 0.961181640625, 1.058990478515625, 1.15679931640625, 1.254608154296875, 1.3524169921875, 1.450225830078125, 1.54803466796875, 1.645843505859375, 1.74365234375, 1.841461181640625, 1.93927001953125, 2.037078857421875, 2.1348876953125, 2.232696533203125, 2.33050537109375, 2.428314208984375, 2.526123046875, 2.623931884765625, 2.72174072265625, 2.819549560546875, 2.9173583984375, 3.015167236328125, 3.11297607421875, 3.210784912109375, 3.30859375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 6.0, 5.0, 8.0, 11.0, 20.0, 15.0, 16.0, 15.0, 30.0, 31.0, 30.0, 48.0, 78.0, 126.0, 348.0, 938.0, 3916.0, 37362.0, 613608.0, 2816951.0, 673208.0, 41274.0, 4441.0, 959.0, 319.0, 136.0, 82.0, 53.0, 35.0, 37.0, 31.0, 22.0, 12.0, 16.0, 14.0, 14.0, 7.0, 15.0, 6.0, 9.0, 5.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.2760009765625, -8.981689453125, -8.6873779296875, -8.39306640625, -8.0987548828125, -7.804443359375, -7.5101318359375, -7.2158203125, -6.9215087890625, -6.627197265625, -6.3328857421875, -6.03857421875, -5.7442626953125, -5.449951171875, -5.1556396484375, -4.861328125, -4.5670166015625, -4.272705078125, -3.9783935546875, -3.68408203125, -3.3897705078125, -3.095458984375, -2.8011474609375, -2.5068359375, -2.2125244140625, -1.918212890625, -1.6239013671875, -1.32958984375, -1.0352783203125, -0.740966796875, -0.4466552734375, -0.15234375, 0.1419677734375, 0.436279296875, 0.7305908203125, 1.02490234375, 1.3192138671875, 1.613525390625, 1.9078369140625, 2.2021484375, 2.4964599609375, 2.790771484375, 3.0850830078125, 3.37939453125, 3.6737060546875, 3.968017578125, 4.2623291015625, 4.556640625, 4.8509521484375, 5.145263671875, 5.4395751953125, 5.73388671875, 6.0281982421875, 6.322509765625, 6.6168212890625, 6.9111328125, 7.2054443359375, 7.499755859375, 7.7940673828125, 8.08837890625, 8.3826904296875, 8.677001953125, 8.9713134765625, 9.265625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 4.0, 9.0, 14.0, 19.0, 17.0, 28.0, 38.0, 63.0, 84.0, 93.0, 128.0, 170.0, 233.0, 338.0, 362.0, 466.0, 437.0, 351.0, 304.0, 241.0, 177.0, 129.0, 103.0, 73.0, 42.0, 44.0, 25.0, 27.0, 14.0, 9.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40625, -7.18115234375, -6.9560546875, -6.73095703125, -6.505859375, -6.28076171875, -6.0556640625, -5.83056640625, -5.60546875, -5.38037109375, -5.1552734375, -4.93017578125, -4.705078125, -4.47998046875, -4.2548828125, -4.02978515625, -3.8046875, -3.57958984375, -3.3544921875, -3.12939453125, -2.904296875, -2.67919921875, -2.4541015625, -2.22900390625, -2.00390625, -1.77880859375, -1.5537109375, -1.32861328125, -1.103515625, -0.87841796875, -0.6533203125, -0.42822265625, -0.203125, 0.02197265625, 0.2470703125, 0.47216796875, 0.697265625, 0.92236328125, 1.1474609375, 1.37255859375, 1.59765625, 1.82275390625, 2.0478515625, 2.27294921875, 2.498046875, 2.72314453125, 2.9482421875, 3.17333984375, 3.3984375, 3.62353515625, 3.8486328125, 4.07373046875, 4.298828125, 4.52392578125, 4.7490234375, 4.97412109375, 5.19921875, 5.42431640625, 5.6494140625, 5.87451171875, 6.099609375, 6.32470703125, 6.5498046875, 6.77490234375, 7.0]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 2.0, 2.0, 4.0, 18.0, 12.0, 18.0, 33.0, 35.0, 46.0, 67.0, 115.0, 160.0, 200.0, 297.0, 560.0, 2308.0, 86070.0, 3709588.0, 387901.0, 4951.0, 730.0, 352.0, 231.0, 161.0, 120.0, 78.0, 64.0, 45.0, 27.0, 21.0, 15.0, 13.0, 9.0, 7.0, 5.0, 1.0, 8.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.546875, -21.811279296875, -21.07568359375, -20.340087890625, -19.6044921875, -18.868896484375, -18.13330078125, -17.397705078125, -16.662109375, -15.926513671875, -15.19091796875, -14.455322265625, -13.7197265625, -12.984130859375, -12.24853515625, -11.512939453125, -10.77734375, -10.041748046875, -9.30615234375, -8.570556640625, -7.8349609375, -7.099365234375, -6.36376953125, -5.628173828125, -4.892578125, -4.156982421875, -3.42138671875, -2.685791015625, -1.9501953125, -1.214599609375, -0.47900390625, 0.256591796875, 0.9921875, 1.727783203125, 2.46337890625, 3.198974609375, 3.9345703125, 4.670166015625, 5.40576171875, 6.141357421875, 6.876953125, 7.612548828125, 8.34814453125, 9.083740234375, 9.8193359375, 10.554931640625, 11.29052734375, 12.026123046875, 12.76171875, 13.497314453125, 14.23291015625, 14.968505859375, 15.7041015625, 16.439697265625, 17.17529296875, 17.910888671875, 18.646484375, 19.382080078125, 20.11767578125, 20.853271484375, 21.5888671875, 22.324462890625, 23.06005859375, 23.795654296875, 24.53125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 27.0, 68.0, 157.0, 208.0, 246.0, 180.0, 83.0, 22.0, 11.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.91522216796875, -97.7030029296875, -95.49077606201172, -93.27855682373047, -91.06633758544922, -88.85411071777344, -86.64189147949219, -84.42967224121094, -82.21745300292969, -80.00523376464844, -77.79300689697266, -75.5807876586914, -73.36856842041016, -71.15634155273438, -68.94412231445312, -66.73190307617188, -64.5196762084961, -62.30745315551758, -60.09523391723633, -57.88301086425781, -55.67079162597656, -53.45856857299805, -51.24634552001953, -49.03412628173828, -46.821903228759766, -44.60968017578125, -42.3974609375, -40.185237884521484, -37.97301483154297, -35.76079559326172, -33.5485725402832, -31.33635139465332, -29.124134063720703, -26.91191291809082, -24.699691772460938, -22.487468719482422, -20.27524757385254, -18.063026428222656, -15.850804328918457, -13.638582229614258, -11.426361083984375, -9.214139938354492, -7.001917839050293, -4.789696216583252, -2.577474594116211, -0.3652534484863281, 1.846968650817871, 4.05919075012207, 6.271411895751953, 8.483633041381836, 10.695855140686035, 12.908077239990234, 15.120298385620117, 17.33251953125, 19.544742584228516, 21.7569637298584, 23.96918487548828, 26.181406021118164, 28.393627166748047, 30.605850219726562, 32.81806945800781, 35.03029251098633, 37.242515563964844, 39.454734802246094, 41.66695785522461]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 4.0, 4.0, 7.0, 3.0, 11.0, 9.0, 11.0, 16.0, 13.0, 15.0, 24.0, 17.0, 27.0, 20.0, 29.0, 33.0, 28.0, 35.0, 29.0, 44.0, 34.0, 40.0, 35.0, 35.0, 43.0, 35.0, 54.0, 50.0, 34.0, 42.0, 37.0, 24.0, 22.0, 23.0, 13.0, 13.0, 18.0, 9.0, 9.0, 13.0, 11.0, 7.0, 3.0, 6.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.811996459960938, -21.090408325195312, -20.368820190429688, -19.647233963012695, -18.92564582824707, -18.204057693481445, -17.482471466064453, -16.760883331298828, -16.039295196533203, -15.317707061767578, -14.59611988067627, -13.874532699584961, -13.152944564819336, -12.431356430053711, -11.709769248962402, -10.988182067871094, -10.266593933105469, -9.545005798339844, -8.823418617248535, -8.101831436157227, -7.380243301391602, -6.658655643463135, -5.937067985534668, -5.215480327606201, -4.493892669677734, -3.7723050117492676, -3.050717353820801, -2.329129695892334, -1.6075420379638672, -0.8859543800354004, -0.1643667221069336, 0.5572209358215332, 1.27880859375, 2.000396251678467, 2.7219839096069336, 3.4435715675354004, 4.165159225463867, 4.886746883392334, 5.608334541320801, 6.329922199249268, 7.051509857177734, 7.773097515106201, 8.494685173034668, 9.216272354125977, 9.937860488891602, 10.659448623657227, 11.381035804748535, 12.102622985839844, 12.824211120605469, 13.545799255371094, 14.267386436462402, 14.988973617553711, 15.710561752319336, 16.43214988708496, 17.153736114501953, 17.875324249267578, 18.596912384033203, 19.318500518798828, 20.040088653564453, 20.761674880981445, 21.48326301574707, 22.204851150512695, 22.926437377929688, 23.648025512695312, 24.369613647460938]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 4.0, 3.0, 7.0, 5.0, 6.0, 6.0, 18.0, 13.0, 17.0, 19.0, 20.0, 22.0, 12.0, 35.0, 25.0, 36.0, 42.0, 30.0, 42.0, 27.0, 38.0, 40.0, 34.0, 43.0, 43.0, 36.0, 40.0, 41.0, 27.0, 19.0, 28.0, 23.0, 30.0, 19.0, 19.0, 18.0, 14.0, 18.0, 7.0, 13.0, 12.0, 7.0, 7.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.828125, -2.738739013671875, -2.64935302734375, -2.559967041015625, -2.4705810546875, -2.381195068359375, -2.29180908203125, -2.202423095703125, -2.113037109375, -2.023651123046875, -1.93426513671875, -1.844879150390625, -1.7554931640625, -1.666107177734375, -1.57672119140625, -1.487335205078125, -1.39794921875, -1.308563232421875, -1.21917724609375, -1.129791259765625, -1.0404052734375, -0.951019287109375, -0.86163330078125, -0.772247314453125, -0.682861328125, -0.593475341796875, -0.50408935546875, -0.414703369140625, -0.3253173828125, -0.235931396484375, -0.14654541015625, -0.057159423828125, 0.0322265625, 0.121612548828125, 0.21099853515625, 0.300384521484375, 0.3897705078125, 0.479156494140625, 0.56854248046875, 0.657928466796875, 0.747314453125, 0.836700439453125, 0.92608642578125, 1.015472412109375, 1.1048583984375, 1.194244384765625, 1.28363037109375, 1.373016357421875, 1.46240234375, 1.551788330078125, 1.64117431640625, 1.730560302734375, 1.8199462890625, 1.909332275390625, 1.99871826171875, 2.088104248046875, 2.177490234375, 2.266876220703125, 2.35626220703125, 2.445648193359375, 2.5350341796875, 2.624420166015625, 2.71380615234375, 2.803192138671875, 2.892578125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 14.0, 17.0, 22.0, 47.0, 60.0, 97.0, 158.0, 252.0, 354.0, 670.0, 1124.0, 2018.0, 3316.0, 6113.0, 11242.0, 20255.0, 38135.0, 73567.0, 146718.0, 260372.0, 230079.0, 121397.0, 61891.0, 31870.0, 17100.0, 9341.0, 5254.0, 2881.0, 1653.0, 993.0, 557.0, 340.0, 210.0, 129.0, 91.0, 64.0, 38.0, 31.0, 19.0, 16.0, 8.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.5060844421386719, -0.49068450927734375, -0.4752845764160156, -0.4598846435546875, -0.4444847106933594, -0.42908477783203125, -0.4136848449707031, -0.398284912109375, -0.3828849792480469, -0.36748504638671875, -0.3520851135253906, -0.3366851806640625, -0.3212852478027344, -0.30588531494140625, -0.2904853820800781, -0.27508544921875, -0.2596855163574219, -0.24428558349609375, -0.22888565063476562, -0.2134857177734375, -0.19808578491210938, -0.18268585205078125, -0.16728591918945312, -0.151885986328125, -0.13648605346679688, -0.12108612060546875, -0.10568618774414062, -0.0902862548828125, -0.07488632202148438, -0.05948638916015625, -0.044086456298828125, -0.0286865234375, -0.013286590576171875, 0.00211334228515625, 0.017513275146484375, 0.0329132080078125, 0.048313140869140625, 0.06371307373046875, 0.07911300659179688, 0.094512939453125, 0.10991287231445312, 0.12531280517578125, 0.14071273803710938, 0.1561126708984375, 0.17151260375976562, 0.18691253662109375, 0.20231246948242188, 0.21771240234375, 0.23311233520507812, 0.24851226806640625, 0.2639122009277344, 0.2793121337890625, 0.2947120666503906, 0.31011199951171875, 0.3255119323730469, 0.340911865234375, 0.3563117980957031, 0.37171173095703125, 0.3871116638183594, 0.4025115966796875, 0.4179115295410156, 0.43331146240234375, 0.4487113952636719, 0.464111328125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 2.0, 7.0, 9.0, 16.0, 7.0, 13.0, 13.0, 18.0, 21.0, 27.0, 27.0, 35.0, 43.0, 30.0, 17.0, 31.0, 40.0, 41.0, 35.0, 1075.0, 49.0, 46.0, 47.0, 43.0, 36.0, 29.0, 35.0, 26.0, 29.0, 25.0, 18.0, 13.0, 23.0, 20.0, 11.0, 11.0, 15.0, 12.0, 8.0, 7.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.232421875, -2.1665496826171875, -2.100677490234375, -2.0348052978515625, -1.96893310546875, -1.9030609130859375, -1.837188720703125, -1.7713165283203125, -1.7054443359375, -1.6395721435546875, -1.573699951171875, -1.5078277587890625, -1.44195556640625, -1.3760833740234375, -1.310211181640625, -1.2443389892578125, -1.178466796875, -1.1125946044921875, -1.046722412109375, -0.9808502197265625, -0.91497802734375, -0.8491058349609375, -0.783233642578125, -0.7173614501953125, -0.6514892578125, -0.5856170654296875, -0.519744873046875, -0.4538726806640625, -0.38800048828125, -0.3221282958984375, -0.256256103515625, -0.1903839111328125, -0.12451171875, -0.0586395263671875, 0.007232666015625, 0.0731048583984375, 0.13897705078125, 0.2048492431640625, 0.270721435546875, 0.3365936279296875, 0.4024658203125, 0.4683380126953125, 0.534210205078125, 0.6000823974609375, 0.66595458984375, 0.7318267822265625, 0.797698974609375, 0.8635711669921875, 0.929443359375, 0.9953155517578125, 1.061187744140625, 1.1270599365234375, 1.19293212890625, 1.2588043212890625, 1.324676513671875, 1.3905487060546875, 1.4564208984375, 1.5222930908203125, 1.588165283203125, 1.6540374755859375, 1.71990966796875, 1.7857818603515625, 1.851654052734375, 1.9175262451171875, 1.9833984375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 14.0, 21.0, 27.0, 30.0, 76.0, 92.0, 144.0, 189.0, 304.0, 457.0, 668.0, 979.0, 1519.0, 2191.0, 3372.0, 5039.0, 7644.0, 11424.0, 18002.0, 27520.0, 41680.0, 63408.0, 94791.0, 135625.0, 1205206.0, 155804.0, 108110.0, 72563.0, 47912.0, 31836.0, 20565.0, 13490.0, 8970.0, 5754.0, 3941.0, 2518.0, 1675.0, 1179.0, 769.0, 527.0, 337.0, 221.0, 180.0, 112.0, 72.0, 48.0, 34.0, 31.0, 22.0, 7.0, 8.0, 3.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.207275390625, -0.2005176544189453, -0.19375991821289062, -0.18700218200683594, -0.18024444580078125, -0.17348670959472656, -0.16672897338867188, -0.1599712371826172, -0.1532135009765625, -0.1464557647705078, -0.13969802856445312, -0.13294029235839844, -0.12618255615234375, -0.11942481994628906, -0.11266708374023438, -0.10590934753417969, -0.099151611328125, -0.09239387512207031, -0.08563613891601562, -0.07887840270996094, -0.07212066650390625, -0.06536293029785156, -0.058605194091796875, -0.05184745788574219, -0.0450897216796875, -0.03833198547363281, -0.031574249267578125, -0.024816513061523438, -0.01805877685546875, -0.011301040649414062, -0.004543304443359375, 0.0022144317626953125, 0.00897216796875, 0.015729904174804688, 0.022487640380859375, 0.029245376586914062, 0.03600311279296875, 0.04276084899902344, 0.049518585205078125, 0.05627632141113281, 0.0630340576171875, 0.06979179382324219, 0.07654953002929688, 0.08330726623535156, 0.09006500244140625, 0.09682273864746094, 0.10358047485351562, 0.11033821105957031, 0.117095947265625, 0.12385368347167969, 0.13061141967773438, 0.13736915588378906, 0.14412689208984375, 0.15088462829589844, 0.15764236450195312, 0.1644001007080078, 0.1711578369140625, 0.1779155731201172, 0.18467330932617188, 0.19143104553222656, 0.19818878173828125, 0.20494651794433594, 0.21170425415039062, 0.2184619903564453, 0.2252197265625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 7.0, 5.0, 9.0, 8.0, 13.0, 18.0, 18.0, 23.0, 25.0, 28.0, 53.0, 53.0, 72.0, 78.0, 101.0, 81.0, 91.0, 73.0, 60.0, 43.0, 29.0, 21.0, 10.0, 11.0, 13.0, 6.0, 7.0, 5.0, 11.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0049896240234375, -0.004822790622711182, -0.004655957221984863, -0.004489123821258545, -0.0043222904205322266, -0.004155457019805908, -0.00398862361907959, -0.0038217902183532715, -0.003654956817626953, -0.0034881234169006348, -0.0033212900161743164, -0.003154456615447998, -0.0029876232147216797, -0.0028207898139953613, -0.002653956413269043, -0.0024871230125427246, -0.0023202896118164062, -0.002153456211090088, -0.0019866228103637695, -0.0018197894096374512, -0.0016529560089111328, -0.0014861226081848145, -0.001319289207458496, -0.0011524558067321777, -0.0009856224060058594, -0.000818789005279541, -0.0006519556045532227, -0.0004851222038269043, -0.00031828880310058594, -0.00015145540237426758, 1.537799835205078e-05, 0.00018221139907836914, 0.0003490447998046875, 0.0005158782005310059, 0.0006827116012573242, 0.0008495450019836426, 0.001016378402709961, 0.0011832118034362793, 0.0013500452041625977, 0.001516878604888916, 0.0016837120056152344, 0.0018505454063415527, 0.002017378807067871, 0.0021842122077941895, 0.002351045608520508, 0.002517879009246826, 0.0026847124099731445, 0.002851545810699463, 0.0030183792114257812, 0.0031852126121520996, 0.003352046012878418, 0.0035188794136047363, 0.0036857128143310547, 0.003852546215057373, 0.004019379615783691, 0.00418621301651001, 0.004353046417236328, 0.0045198798179626465, 0.004686713218688965, 0.004853546619415283, 0.0050203800201416016, 0.00518721342086792, 0.005354046821594238, 0.005520880222320557, 0.005687713623046875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 5.0, 5.0, 6.0, 10.0, 11.0, 11.0, 12.0, 14.0, 28.0, 28.0, 35.0, 62.0, 90.0, 162.0, 316.0, 970.0, 58537.0, 980851.0, 6243.0, 478.0, 241.0, 119.0, 68.0, 60.0, 40.0, 33.0, 27.0, 29.0, 19.0, 8.0, 6.0, 10.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1064453125, -0.1031484603881836, -0.09985160827636719, -0.09655475616455078, -0.09325790405273438, -0.08996105194091797, -0.08666419982910156, -0.08336734771728516, -0.08007049560546875, -0.07677364349365234, -0.07347679138183594, -0.07017993927001953, -0.06688308715820312, -0.06358623504638672, -0.06028938293457031, -0.056992530822753906, -0.0536956787109375, -0.050398826599121094, -0.04710197448730469, -0.04380512237548828, -0.040508270263671875, -0.03721141815185547, -0.03391456604003906, -0.030617713928222656, -0.02732086181640625, -0.024024009704589844, -0.020727157592773438, -0.01743030548095703, -0.014133453369140625, -0.010836601257324219, -0.0075397491455078125, -0.004242897033691406, -0.000946044921875, 0.0023508071899414062, 0.0056476593017578125, 0.008944511413574219, 0.012241363525390625, 0.015538215637207031, 0.018835067749023438, 0.022131919860839844, 0.02542877197265625, 0.028725624084472656, 0.03202247619628906, 0.03531932830810547, 0.038616180419921875, 0.04191303253173828, 0.04520988464355469, 0.048506736755371094, 0.0518035888671875, 0.055100440979003906, 0.05839729309082031, 0.06169414520263672, 0.06499099731445312, 0.06828784942626953, 0.07158470153808594, 0.07488155364990234, 0.07817840576171875, 0.08147525787353516, 0.08477210998535156, 0.08806896209716797, 0.09136581420898438, 0.09466266632080078, 0.09795951843261719, 0.1012563705444336, 0.10455322265625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 11.0, 91.0, 518.0, 292.0, 72.0, 22.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00397814204916358, -0.003284793347120285, -0.0025914444122463465, -0.001898095477372408, -0.001204746775329113, -0.0005113980732858181, 0.00018195109441876411, 0.000875299796462059, 0.001568648498505354, 0.002261997200548649, 0.0029553461354225874, 0.003648695070296526, 0.004342043772339821, 0.005035392474383116, 0.005728741642087698, 0.006422090344130993, 0.007115439046174288, 0.007808787748217583, 0.008502136915922165, 0.009195486083626747, 0.009888834320008755, 0.010582182556390762, 0.011275531724095345, 0.011968880891799927, 0.012662230059504509, 0.013355579227209091, 0.014048927463591099, 0.014742276631295681, 0.015435624867677689, 0.01612897403538227, 0.016822323203086853, 0.017515672370791435, 0.018209021538496017, 0.0189023707062006, 0.019595719873905182, 0.020289067178964615, 0.020982416346669197, 0.02167576551437378, 0.02236911468207836, 0.023062463849782944, 0.023755811154842377, 0.02444916032254696, 0.02514250949025154, 0.025835856795310974, 0.026529205963015556, 0.02722255513072014, 0.02791590429842472, 0.028609253466129303, 0.029302602633833885, 0.029995951801538467, 0.03068930096924305, 0.03138265013694763, 0.032075997442007065, 0.0327693447470665, 0.03346269577741623, 0.03415604308247566, 0.034849394112825394, 0.03554274141788483, 0.03623609244823456, 0.03692943975329399, 0.03762279078364372, 0.038316138088703156, 0.03900948911905289, 0.03970283642411232, 0.04039618372917175]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 7.0, 10.0, 7.0, 13.0, 15.0, 6.0, 16.0, 22.0, 31.0, 29.0, 28.0, 29.0, 40.0, 39.0, 41.0, 43.0, 34.0, 39.0, 41.0, 46.0, 45.0, 38.0, 43.0, 29.0, 30.0, 31.0, 30.0, 27.0, 32.0, 21.0, 21.0, 27.0, 14.0, 16.0, 12.0, 6.0, 5.0, 5.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0029751062393188477, -0.0028793727979063988, -0.00278363935649395, -0.002687905915081501, -0.002592172473669052, -0.0024964390322566032, -0.0024007055908441544, -0.0023049721494317055, -0.0022092387080192566, -0.0021135052666068077, -0.002017771825194359, -0.00192203838378191, -0.001826304942369461, -0.0017305715009570122, -0.0016348380595445633, -0.0015391046181321144, -0.0014433711767196655, -0.0013476377353072166, -0.0012519042938947678, -0.0011561708524823189, -0.00106043741106987, -0.0009647039696574211, -0.0008689705282449722, -0.0007732370868325233, -0.0006775036454200745, -0.0005817702040076256, -0.0004860367625951767, -0.0003903033211827278, -0.00029456987977027893, -0.00019883643835783005, -0.00010310299694538116, -7.3695555329322815e-06, 8.83638858795166e-05, 0.00018409732729196548, 0.00027983076870441437, 0.00037556421011686325, 0.00047129765152931213, 0.000567031092941761, 0.0006627645343542099, 0.0007584979757666588, 0.0008542314171791077, 0.0009499648585915565, 0.0010456983000040054, 0.0011414317414164543, 0.0012371651828289032, 0.001332898624241352, 0.001428632065653801, 0.0015243655070662498, 0.0016200989484786987, 0.0017158323898911476, 0.0018115658313035965, 0.0019072992727160454, 0.0020030327141284943, 0.002098766155540943, 0.002194499596953392, 0.002290233038365841, 0.00238596647977829, 0.0024816999211907387, 0.0025774333626031876, 0.0026731668040156364, 0.0027689002454280853, 0.002864633686840534, 0.002960367128252983, 0.003056100569665432, 0.003151834011077881]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 4.0, 3.0, 7.0, 5.0, 6.0, 6.0, 18.0, 13.0, 17.0, 19.0, 20.0, 22.0, 12.0, 35.0, 25.0, 36.0, 42.0, 30.0, 42.0, 26.0, 39.0, 40.0, 34.0, 43.0, 43.0, 36.0, 40.0, 41.0, 27.0, 19.0, 28.0, 23.0, 30.0, 19.0, 19.0, 18.0, 14.0, 18.0, 7.0, 13.0, 12.0, 7.0, 7.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.828125, -2.738739013671875, -2.64935302734375, -2.559967041015625, -2.4705810546875, -2.381195068359375, -2.29180908203125, -2.202423095703125, -2.113037109375, -2.023651123046875, -1.93426513671875, -1.844879150390625, -1.7554931640625, -1.666107177734375, -1.57672119140625, -1.487335205078125, -1.39794921875, -1.308563232421875, -1.21917724609375, -1.129791259765625, -1.0404052734375, -0.951019287109375, -0.86163330078125, -0.772247314453125, -0.682861328125, -0.593475341796875, -0.50408935546875, -0.414703369140625, -0.3253173828125, -0.235931396484375, -0.14654541015625, -0.057159423828125, 0.0322265625, 0.121612548828125, 0.21099853515625, 0.300384521484375, 0.3897705078125, 0.479156494140625, 0.56854248046875, 0.657928466796875, 0.747314453125, 0.836700439453125, 0.92608642578125, 1.015472412109375, 1.1048583984375, 1.194244384765625, 1.28363037109375, 1.373016357421875, 1.46240234375, 1.551788330078125, 1.64117431640625, 1.730560302734375, 1.8199462890625, 1.909332275390625, 1.99871826171875, 2.088104248046875, 2.177490234375, 2.266876220703125, 2.35626220703125, 2.445648193359375, 2.5350341796875, 2.624420166015625, 2.71380615234375, 2.803192138671875, 2.892578125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 11.0, 14.0, 35.0, 31.0, 70.0, 92.0, 125.0, 209.0, 324.0, 532.0, 932.0, 1651.0, 3091.0, 6069.0, 12466.0, 26340.0, 56989.0, 122302.0, 272640.0, 295791.0, 131848.0, 61239.0, 28303.0, 13407.0, 6439.0, 3312.0, 1759.0, 969.0, 610.0, 375.0, 200.0, 127.0, 65.0, 67.0, 41.0, 19.0, 16.0, 14.0, 11.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.18359375, -3.0810546875, -2.978515625, -2.8759765625, -2.7734375, -2.6708984375, -2.568359375, -2.4658203125, -2.36328125, -2.2607421875, -2.158203125, -2.0556640625, -1.953125, -1.8505859375, -1.748046875, -1.6455078125, -1.54296875, -1.4404296875, -1.337890625, -1.2353515625, -1.1328125, -1.0302734375, -0.927734375, -0.8251953125, -0.72265625, -0.6201171875, -0.517578125, -0.4150390625, -0.3125, -0.2099609375, -0.107421875, -0.0048828125, 0.09765625, 0.2001953125, 0.302734375, 0.4052734375, 0.5078125, 0.6103515625, 0.712890625, 0.8154296875, 0.91796875, 1.0205078125, 1.123046875, 1.2255859375, 1.328125, 1.4306640625, 1.533203125, 1.6357421875, 1.73828125, 1.8408203125, 1.943359375, 2.0458984375, 2.1484375, 2.2509765625, 2.353515625, 2.4560546875, 2.55859375, 2.6611328125, 2.763671875, 2.8662109375, 2.96875, 3.0712890625, 3.173828125, 3.2763671875, 3.37890625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 6.0, 3.0, 9.0, 8.0, 6.0, 9.0, 16.0, 25.0, 19.0, 20.0, 34.0, 33.0, 40.0, 40.0, 48.0, 69.0, 98.0, 131.0, 252.0, 1402.0, 188.0, 105.0, 78.0, 60.0, 41.0, 39.0, 35.0, 35.0, 28.0, 29.0, 18.0, 19.0, 23.0, 18.0, 9.0, 10.0, 7.0, 4.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0], "bins": [-11.1015625, -10.7864990234375, -10.471435546875, -10.1563720703125, -9.84130859375, -9.5262451171875, -9.211181640625, -8.8961181640625, -8.5810546875, -8.2659912109375, -7.950927734375, -7.6358642578125, -7.32080078125, -7.0057373046875, -6.690673828125, -6.3756103515625, -6.060546875, -5.7454833984375, -5.430419921875, -5.1153564453125, -4.80029296875, -4.4852294921875, -4.170166015625, -3.8551025390625, -3.5400390625, -3.2249755859375, -2.909912109375, -2.5948486328125, -2.27978515625, -1.9647216796875, -1.649658203125, -1.3345947265625, -1.01953125, -0.7044677734375, -0.389404296875, -0.0743408203125, 0.24072265625, 0.5557861328125, 0.870849609375, 1.1859130859375, 1.5009765625, 1.8160400390625, 2.131103515625, 2.4461669921875, 2.76123046875, 3.0762939453125, 3.391357421875, 3.7064208984375, 4.021484375, 4.3365478515625, 4.651611328125, 4.9666748046875, 5.28173828125, 5.5968017578125, 5.911865234375, 6.2269287109375, 6.5419921875, 6.8570556640625, 7.172119140625, 7.4871826171875, 7.80224609375, 8.1173095703125, 8.432373046875, 8.7474365234375, 9.0625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 15.0, 8.0, 28.0, 44.0, 35.0, 67.0, 86.0, 185.0, 280.0, 565.0, 2137.0, 3003638.0, 136496.0, 986.0, 433.0, 247.0, 151.0, 82.0, 48.0, 43.0, 22.0, 25.0, 16.0, 19.0, 8.0, 2.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.59375, -53.90087890625, -52.2080078125, -50.51513671875, -48.822265625, -47.12939453125, -45.4365234375, -43.74365234375, -42.05078125, -40.35791015625, -38.6650390625, -36.97216796875, -35.279296875, -33.58642578125, -31.8935546875, -30.20068359375, -28.5078125, -26.81494140625, -25.1220703125, -23.42919921875, -21.736328125, -20.04345703125, -18.3505859375, -16.65771484375, -14.96484375, -13.27197265625, -11.5791015625, -9.88623046875, -8.193359375, -6.50048828125, -4.8076171875, -3.11474609375, -1.421875, 0.27099609375, 1.9638671875, 3.65673828125, 5.349609375, 7.04248046875, 8.7353515625, 10.42822265625, 12.12109375, 13.81396484375, 15.5068359375, 17.19970703125, 18.892578125, 20.58544921875, 22.2783203125, 23.97119140625, 25.6640625, 27.35693359375, 29.0498046875, 30.74267578125, 32.435546875, 34.12841796875, 35.8212890625, 37.51416015625, 39.20703125, 40.89990234375, 42.5927734375, 44.28564453125, 45.978515625, 47.67138671875, 49.3642578125, 51.05712890625, 52.75]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 50.0, 672.0, 286.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-232.76841735839844, -228.51593017578125, -224.263427734375, -220.0109405517578, -215.75845336914062, -211.50595092773438, -207.2534637451172, -203.00096130371094, -198.74847412109375, -194.49598693847656, -190.2434844970703, -185.99099731445312, -181.73849487304688, -177.4860076904297, -173.2335205078125, -168.98101806640625, -164.72853088378906, -160.47604370117188, -156.22354125976562, -151.97105407714844, -147.71856689453125, -143.466064453125, -139.2135772705078, -134.96107482910156, -130.70858764648438, -126.45609283447266, -122.20359802246094, -117.95111083984375, -113.69861602783203, -109.44612121582031, -105.19363403320312, -100.9411392211914, -96.68863677978516, -92.43614196777344, -88.18365478515625, -83.93115997314453, -79.67866516113281, -75.4261703491211, -71.17367553710938, -66.92118835449219, -62.66869354248047, -58.41619873046875, -54.1637077331543, -49.911216735839844, -45.658721923828125, -41.406227111816406, -37.15373611450195, -32.9012451171875, -28.64875030517578, -24.396257400512695, -20.14376449584961, -15.891271591186523, -11.638778686523438, -7.386285781860352, -3.1337928771972656, 1.1187000274658203, 5.371192932128906, 9.623685836791992, 13.876178741455078, 18.128671646118164, 22.38116455078125, 26.633657455444336, 30.886150360107422, 35.138641357421875, 39.391136169433594]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 5.0, 5.0, 4.0, 11.0, 19.0, 18.0, 18.0, 27.0, 32.0, 30.0, 36.0, 25.0, 49.0, 31.0, 32.0, 47.0, 45.0, 44.0, 39.0, 49.0, 50.0, 52.0, 43.0, 32.0, 41.0, 29.0, 31.0, 27.0, 36.0, 22.0, 22.0, 10.0, 13.0, 5.0, 6.0, 7.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-32.968597412109375, -32.02206039428711, -31.075519561767578, -30.128982543945312, -29.182443618774414, -28.235904693603516, -27.289365768432617, -26.34282684326172, -25.39628791809082, -24.449748992919922, -23.503210067749023, -22.556671142578125, -21.61013412475586, -20.66359519958496, -19.717056274414062, -18.770517349243164, -17.823978424072266, -16.877439498901367, -15.930901527404785, -14.984362602233887, -14.037823677062988, -13.091285705566406, -12.144746780395508, -11.19820785522461, -10.251670837402344, -9.305131912231445, -8.358593940734863, -7.412055015563965, -6.465516090393066, -5.518977642059326, -4.572439193725586, -3.6259002685546875, -2.679361343383789, -1.7328226566314697, -0.7862840890884399, 0.16025447845458984, 1.1067931652069092, 2.0533318519592285, 2.9998703002929688, 3.946409225463867, 4.892947673797607, 5.839486122131348, 6.786025047302246, 7.732563495635986, 8.679101943969727, 9.625640869140625, 10.572179794311523, 11.518718719482422, 12.465256690979004, 13.411795616149902, 14.358333587646484, 15.304872512817383, 16.25141143798828, 17.19795036315918, 18.144489288330078, 19.091026306152344, 20.037565231323242, 20.98410415649414, 21.93064308166504, 22.877182006835938, 23.823719024658203, 24.7702579498291, 25.716796875, 26.6633358001709, 27.609874725341797]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 4.0, 4.0, 6.0, 5.0, 11.0, 10.0, 11.0, 12.0, 26.0, 20.0, 19.0, 24.0, 24.0, 26.0, 33.0, 26.0, 38.0, 31.0, 30.0, 42.0, 42.0, 39.0, 41.0, 45.0, 40.0, 32.0, 21.0, 31.0, 25.0, 30.0, 31.0, 31.0, 16.0, 29.0, 24.0, 11.0, 12.0, 18.0, 11.0, 13.0, 7.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0], "bins": [-3.2421875, -3.141876220703125, -3.04156494140625, -2.941253662109375, -2.8409423828125, -2.740631103515625, -2.64031982421875, -2.540008544921875, -2.439697265625, -2.339385986328125, -2.23907470703125, -2.138763427734375, -2.0384521484375, -1.938140869140625, -1.83782958984375, -1.737518310546875, -1.63720703125, -1.536895751953125, -1.43658447265625, -1.336273193359375, -1.2359619140625, -1.135650634765625, -1.03533935546875, -0.935028076171875, -0.834716796875, -0.734405517578125, -0.63409423828125, -0.533782958984375, -0.4334716796875, -0.333160400390625, -0.23284912109375, -0.132537841796875, -0.0322265625, 0.068084716796875, 0.16839599609375, 0.268707275390625, 0.3690185546875, 0.469329833984375, 0.56964111328125, 0.669952392578125, 0.770263671875, 0.870574951171875, 0.97088623046875, 1.071197509765625, 1.1715087890625, 1.271820068359375, 1.37213134765625, 1.472442626953125, 1.57275390625, 1.673065185546875, 1.77337646484375, 1.873687744140625, 1.9739990234375, 2.074310302734375, 2.17462158203125, 2.274932861328125, 2.375244140625, 2.475555419921875, 2.57586669921875, 2.676177978515625, 2.7764892578125, 2.876800537109375, 2.97711181640625, 3.077423095703125, 3.177734375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 5.0, 8.0, 10.0, 25.0, 14.0, 17.0, 32.0, 32.0, 54.0, 66.0, 101.0, 130.0, 197.0, 392.0, 842.0, 2725.0, 11736.0, 77068.0, 556125.0, 1990638.0, 1290624.0, 223525.0, 31299.0, 5573.0, 1505.0, 583.0, 267.0, 181.0, 121.0, 102.0, 55.0, 48.0, 36.0, 35.0, 25.0, 19.0, 14.0, 6.0, 4.0, 4.0, 7.0, 2.0, 3.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.6328125, -6.42401123046875, -6.2152099609375, -6.00640869140625, -5.797607421875, -5.58880615234375, -5.3800048828125, -5.17120361328125, -4.96240234375, -4.75360107421875, -4.5447998046875, -4.33599853515625, -4.127197265625, -3.91839599609375, -3.7095947265625, -3.50079345703125, -3.2919921875, -3.08319091796875, -2.8743896484375, -2.66558837890625, -2.456787109375, -2.24798583984375, -2.0391845703125, -1.83038330078125, -1.62158203125, -1.41278076171875, -1.2039794921875, -0.99517822265625, -0.786376953125, -0.57757568359375, -0.3687744140625, -0.15997314453125, 0.048828125, 0.25762939453125, 0.4664306640625, 0.67523193359375, 0.884033203125, 1.09283447265625, 1.3016357421875, 1.51043701171875, 1.71923828125, 1.92803955078125, 2.1368408203125, 2.34564208984375, 2.554443359375, 2.76324462890625, 2.9720458984375, 3.18084716796875, 3.3896484375, 3.59844970703125, 3.8072509765625, 4.01605224609375, 4.224853515625, 4.43365478515625, 4.6424560546875, 4.85125732421875, 5.06005859375, 5.26885986328125, 5.4776611328125, 5.68646240234375, 5.895263671875, 6.10406494140625, 6.3128662109375, 6.52166748046875, 6.73046875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 16.0, 14.0, 14.0, 22.0, 19.0, 26.0, 35.0, 41.0, 65.0, 80.0, 102.0, 140.0, 175.0, 193.0, 245.0, 344.0, 381.0, 390.0, 321.0, 326.0, 268.0, 194.0, 161.0, 100.0, 103.0, 59.0, 52.0, 32.0, 40.0, 21.0, 24.0, 17.0, 10.0, 9.0, 7.0, 12.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.2578125, -7.063232421875, -6.86865234375, -6.674072265625, -6.4794921875, -6.284912109375, -6.09033203125, -5.895751953125, -5.701171875, -5.506591796875, -5.31201171875, -5.117431640625, -4.9228515625, -4.728271484375, -4.53369140625, -4.339111328125, -4.14453125, -3.949951171875, -3.75537109375, -3.560791015625, -3.3662109375, -3.171630859375, -2.97705078125, -2.782470703125, -2.587890625, -2.393310546875, -2.19873046875, -2.004150390625, -1.8095703125, -1.614990234375, -1.42041015625, -1.225830078125, -1.03125, -0.836669921875, -0.64208984375, -0.447509765625, -0.2529296875, -0.058349609375, 0.13623046875, 0.330810546875, 0.525390625, 0.719970703125, 0.91455078125, 1.109130859375, 1.3037109375, 1.498291015625, 1.69287109375, 1.887451171875, 2.08203125, 2.276611328125, 2.47119140625, 2.665771484375, 2.8603515625, 3.054931640625, 3.24951171875, 3.444091796875, 3.638671875, 3.833251953125, 4.02783203125, 4.222412109375, 4.4169921875, 4.611572265625, 4.80615234375, 5.000732421875, 5.1953125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 12.0, 7.0, 7.0, 17.0, 19.0, 30.0, 29.0, 50.0, 55.0, 64.0, 120.0, 151.0, 206.0, 306.0, 481.0, 1526.0, 53961.0, 3138324.0, 984773.0, 11956.0, 806.0, 394.0, 269.0, 174.0, 135.0, 107.0, 67.0, 59.0, 48.0, 32.0, 20.0, 17.0, 20.0, 12.0, 10.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.644775390625, -16.96142578125, -16.278076171875, -15.5947265625, -14.911376953125, -14.22802734375, -13.544677734375, -12.861328125, -12.177978515625, -11.49462890625, -10.811279296875, -10.1279296875, -9.444580078125, -8.76123046875, -8.077880859375, -7.39453125, -6.711181640625, -6.02783203125, -5.344482421875, -4.6611328125, -3.977783203125, -3.29443359375, -2.611083984375, -1.927734375, -1.244384765625, -0.56103515625, 0.122314453125, 0.8056640625, 1.489013671875, 2.17236328125, 2.855712890625, 3.5390625, 4.222412109375, 4.90576171875, 5.589111328125, 6.2724609375, 6.955810546875, 7.63916015625, 8.322509765625, 9.005859375, 9.689208984375, 10.37255859375, 11.055908203125, 11.7392578125, 12.422607421875, 13.10595703125, 13.789306640625, 14.47265625, 15.156005859375, 15.83935546875, 16.522705078125, 17.2060546875, 17.889404296875, 18.57275390625, 19.256103515625, 19.939453125, 20.622802734375, 21.30615234375, 21.989501953125, 22.6728515625, 23.356201171875, 24.03955078125, 24.722900390625, 25.40625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 39.0, 119.0, 212.0, 289.0, 212.0, 100.0, 30.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.07173156738281, -91.62750244140625, -89.18327331542969, -86.73904418945312, -84.29481506347656, -81.8505859375, -79.40635681152344, -76.96212768554688, -74.51789855957031, -72.07366943359375, -69.62944030761719, -67.18521118164062, -64.74098205566406, -62.2967529296875, -59.85251998901367, -57.40829086303711, -54.96405792236328, -52.51982879638672, -50.075599670410156, -47.631370544433594, -45.18714141845703, -42.74291229248047, -40.29867935180664, -37.85445022583008, -35.410221099853516, -32.96599197387695, -30.52176284790039, -28.077531814575195, -25.633302688598633, -23.18907356262207, -20.744842529296875, -18.300613403320312, -15.856391906738281, -13.412162780761719, -10.96793270111084, -8.523702621459961, -6.079473495483398, -3.635244369506836, -1.191014289855957, 1.2532157897949219, 3.6974449157714844, 6.141674518585205, 8.585904121398926, 11.030134201049805, 13.474363327026367, 15.91859245300293, 18.362823486328125, 20.807052612304688, 23.25128173828125, 25.695510864257812, 28.139739990234375, 30.58397102355957, 33.0281982421875, 35.47242736816406, 37.91666030883789, 40.36088943481445, 42.805118560791016, 45.24934768676758, 47.69357681274414, 50.1378059387207, 52.58203887939453, 55.026268005371094, 57.470497131347656, 59.91472625732422, 62.35895538330078]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 10.0, 3.0, 10.0, 17.0, 17.0, 23.0, 19.0, 24.0, 34.0, 25.0, 28.0, 34.0, 44.0, 30.0, 33.0, 39.0, 53.0, 50.0, 39.0, 48.0, 42.0, 35.0, 35.0, 40.0, 34.0, 24.0, 20.0, 25.0, 22.0, 31.0, 16.0, 21.0, 10.0, 18.0, 7.0, 7.0, 9.0, 8.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-29.03809356689453, -28.252334594726562, -27.466577529907227, -26.680818557739258, -25.895061492919922, -25.109302520751953, -24.323543548583984, -23.537784576416016, -22.75202751159668, -21.96626853942871, -21.180511474609375, -20.394752502441406, -19.608993530273438, -18.8232364654541, -18.037477493286133, -17.251720428466797, -16.465961456298828, -15.680203437805176, -14.894445419311523, -14.108686447143555, -13.322928428649902, -12.53717041015625, -11.751411437988281, -10.965653419494629, -10.179895401000977, -9.394137382507324, -8.608379364013672, -7.822620391845703, -7.036862373352051, -6.251104354858398, -5.465345859527588, -4.679587364196777, -3.893829345703125, -3.1080710887908936, -2.322312831878662, -1.5365545749664307, -0.7507963180541992, 0.03496193885803223, 0.8207201957702637, 1.6064786911010742, 2.3922367095947266, 3.177994966506958, 3.9637532234191895, 4.74951171875, 5.535269737243652, 6.321027755737305, 7.106786251068115, 7.892544746398926, 8.678302764892578, 9.46406078338623, 10.249818801879883, 11.035577774047852, 11.821335792541504, 12.607093811035156, 13.392852783203125, 14.178610801696777, 14.96436882019043, 15.750126838684082, 16.535884857177734, 17.321643829345703, 18.107402801513672, 18.893159866333008, 19.678918838500977, 20.464675903320312, 21.25043487548828]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 2.0, 6.0, 15.0, 11.0, 9.0, 14.0, 11.0, 15.0, 24.0, 26.0, 26.0, 25.0, 35.0, 29.0, 33.0, 44.0, 42.0, 40.0, 39.0, 40.0, 33.0, 40.0, 36.0, 48.0, 29.0, 35.0, 28.0, 42.0, 29.0, 34.0, 23.0, 14.0, 19.0, 15.0, 18.0, 3.0, 17.0, 7.0, 6.0, 5.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.48828125, -3.385406494140625, -3.28253173828125, -3.179656982421875, -3.0767822265625, -2.973907470703125, -2.87103271484375, -2.768157958984375, -2.665283203125, -2.562408447265625, -2.45953369140625, -2.356658935546875, -2.2537841796875, -2.150909423828125, -2.04803466796875, -1.945159912109375, -1.84228515625, -1.739410400390625, -1.63653564453125, -1.533660888671875, -1.4307861328125, -1.327911376953125, -1.22503662109375, -1.122161865234375, -1.019287109375, -0.916412353515625, -0.81353759765625, -0.710662841796875, -0.6077880859375, -0.504913330078125, -0.40203857421875, -0.299163818359375, -0.1962890625, -0.093414306640625, 0.00946044921875, 0.112335205078125, 0.2152099609375, 0.318084716796875, 0.42095947265625, 0.523834228515625, 0.626708984375, 0.729583740234375, 0.83245849609375, 0.935333251953125, 1.0382080078125, 1.141082763671875, 1.24395751953125, 1.346832275390625, 1.44970703125, 1.552581787109375, 1.65545654296875, 1.758331298828125, 1.8612060546875, 1.964080810546875, 2.06695556640625, 2.169830322265625, 2.272705078125, 2.375579833984375, 2.47845458984375, 2.581329345703125, 2.6842041015625, 2.787078857421875, 2.88995361328125, 2.992828369140625, 3.095703125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 3.0, 6.0, 2.0, 8.0, 14.0, 17.0, 23.0, 33.0, 51.0, 93.0, 139.0, 269.0, 453.0, 841.0, 1499.0, 2659.0, 4740.0, 9036.0, 17293.0, 35290.0, 76704.0, 170277.0, 304023.0, 225535.0, 103873.0, 47692.0, 22689.0, 11602.0, 6152.0, 3266.0, 1853.0, 1040.0, 585.0, 339.0, 156.0, 114.0, 57.0, 33.0, 30.0, 12.0, 13.0, 9.0, 5.0, 4.0, 5.0, 2.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5732421875, -0.5545654296875, -0.535888671875, -0.5172119140625, -0.49853515625, -0.4798583984375, -0.461181640625, -0.4425048828125, -0.423828125, -0.4051513671875, -0.386474609375, -0.3677978515625, -0.34912109375, -0.3304443359375, -0.311767578125, -0.2930908203125, -0.2744140625, -0.2557373046875, -0.237060546875, -0.2183837890625, -0.19970703125, -0.1810302734375, -0.162353515625, -0.1436767578125, -0.125, -0.1063232421875, -0.087646484375, -0.0689697265625, -0.05029296875, -0.0316162109375, -0.012939453125, 0.0057373046875, 0.0244140625, 0.0430908203125, 0.061767578125, 0.0804443359375, 0.09912109375, 0.1177978515625, 0.136474609375, 0.1551513671875, 0.173828125, 0.1925048828125, 0.211181640625, 0.2298583984375, 0.24853515625, 0.2672119140625, 0.285888671875, 0.3045654296875, 0.3232421875, 0.3419189453125, 0.360595703125, 0.3792724609375, 0.39794921875, 0.4166259765625, 0.435302734375, 0.4539794921875, 0.47265625, 0.4913330078125, 0.510009765625, 0.5286865234375, 0.54736328125, 0.5660400390625, 0.584716796875, 0.6033935546875, 0.6220703125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 2.0, 9.0, 9.0, 6.0, 13.0, 14.0, 12.0, 14.0, 18.0, 19.0, 20.0, 32.0, 28.0, 40.0, 38.0, 30.0, 47.0, 43.0, 42.0, 38.0, 1078.0, 46.0, 33.0, 46.0, 37.0, 38.0, 23.0, 38.0, 28.0, 20.0, 29.0, 24.0, 22.0, 14.0, 18.0, 6.0, 11.0, 5.0, 10.0, 6.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.455078125, -2.381866455078125, -2.30865478515625, -2.235443115234375, -2.1622314453125, -2.089019775390625, -2.01580810546875, -1.942596435546875, -1.869384765625, -1.796173095703125, -1.72296142578125, -1.649749755859375, -1.5765380859375, -1.503326416015625, -1.43011474609375, -1.356903076171875, -1.28369140625, -1.210479736328125, -1.13726806640625, -1.064056396484375, -0.9908447265625, -0.917633056640625, -0.84442138671875, -0.771209716796875, -0.697998046875, -0.624786376953125, -0.55157470703125, -0.478363037109375, -0.4051513671875, -0.331939697265625, -0.25872802734375, -0.185516357421875, -0.1123046875, -0.039093017578125, 0.03411865234375, 0.107330322265625, 0.1805419921875, 0.253753662109375, 0.32696533203125, 0.400177001953125, 0.473388671875, 0.546600341796875, 0.61981201171875, 0.693023681640625, 0.7662353515625, 0.839447021484375, 0.91265869140625, 0.985870361328125, 1.05908203125, 1.132293701171875, 1.20550537109375, 1.278717041015625, 1.3519287109375, 1.425140380859375, 1.49835205078125, 1.571563720703125, 1.644775390625, 1.717987060546875, 1.79119873046875, 1.864410400390625, 1.9376220703125, 2.010833740234375, 2.08404541015625, 2.157257080078125, 2.23046875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 13.0, 24.0, 29.0, 53.0, 77.0, 99.0, 151.0, 207.0, 338.0, 565.0, 872.0, 1329.0, 1963.0, 2963.0, 4579.0, 7015.0, 10805.0, 16451.0, 25667.0, 39487.0, 60665.0, 93531.0, 135746.0, 1205362.0, 166106.0, 112137.0, 74527.0, 47885.0, 30734.0, 20298.0, 13060.0, 8462.0, 5531.0, 3642.0, 2294.0, 1510.0, 1010.0, 690.0, 410.0, 274.0, 188.0, 123.0, 84.0, 55.0, 33.0, 29.0, 20.0, 12.0, 6.0, 1.0, 8.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.2359619140625, -0.22852516174316406, -0.22108840942382812, -0.2136516571044922, -0.20621490478515625, -0.1987781524658203, -0.19134140014648438, -0.18390464782714844, -0.1764678955078125, -0.16903114318847656, -0.16159439086914062, -0.1541576385498047, -0.14672088623046875, -0.1392841339111328, -0.13184738159179688, -0.12441062927246094, -0.116973876953125, -0.10953712463378906, -0.10210037231445312, -0.09466361999511719, -0.08722686767578125, -0.07979011535644531, -0.07235336303710938, -0.06491661071777344, -0.0574798583984375, -0.05004310607910156, -0.042606353759765625, -0.03516960144042969, -0.02773284912109375, -0.020296096801757812, -0.012859344482421875, -0.0054225921630859375, 0.00201416015625, 0.009450912475585938, 0.016887664794921875, 0.024324417114257812, 0.03176116943359375, 0.03919792175292969, 0.046634674072265625, 0.05407142639160156, 0.0615081787109375, 0.06894493103027344, 0.07638168334960938, 0.08381843566894531, 0.09125518798828125, 0.09869194030761719, 0.10612869262695312, 0.11356544494628906, 0.121002197265625, 0.12843894958496094, 0.13587570190429688, 0.1433124542236328, 0.15074920654296875, 0.1581859588623047, 0.16562271118164062, 0.17305946350097656, 0.1804962158203125, 0.18793296813964844, 0.19536972045898438, 0.2028064727783203, 0.21024322509765625, 0.2176799774169922, 0.22511672973632812, 0.23255348205566406, 0.239990234375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 10.0, 16.0, 15.0, 20.0, 19.0, 41.0, 48.0, 73.0, 106.0, 107.0, 123.0, 99.0, 55.0, 42.0, 39.0, 30.0, 20.0, 23.0, 14.0, 15.0, 7.0, 3.0, 10.0, 2.0, 10.0, 5.0, 6.0, 5.0, 2.0, 1.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00750732421875, -0.007273674011230469, -0.0070400238037109375, -0.006806373596191406, -0.006572723388671875, -0.006339073181152344, -0.0061054229736328125, -0.005871772766113281, -0.00563812255859375, -0.005404472351074219, -0.0051708221435546875, -0.004937171936035156, -0.004703521728515625, -0.004469871520996094, -0.0042362213134765625, -0.004002571105957031, -0.0037689208984375, -0.0035352706909179688, -0.0033016204833984375, -0.0030679702758789062, -0.002834320068359375, -0.0026006698608398438, -0.0023670196533203125, -0.0021333694458007812, -0.00189971923828125, -0.0016660690307617188, -0.0014324188232421875, -0.0011987686157226562, -0.000965118408203125, -0.0007314682006835938, -0.0004978179931640625, -0.00026416778564453125, -3.0517578125e-05, 0.00020313262939453125, 0.0004367828369140625, 0.0006704330444335938, 0.000904083251953125, 0.0011377334594726562, 0.0013713836669921875, 0.0016050338745117188, 0.00183868408203125, 0.0020723342895507812, 0.0023059844970703125, 0.0025396347045898438, 0.002773284912109375, 0.0030069351196289062, 0.0032405853271484375, 0.0034742355346679688, 0.0037078857421875, 0.003941535949707031, 0.0041751861572265625, 0.004408836364746094, 0.004642486572265625, 0.004876136779785156, 0.0051097869873046875, 0.005343437194824219, 0.00557708740234375, 0.005810737609863281, 0.0060443878173828125, 0.006278038024902344, 0.006511688232421875, 0.006745338439941406, 0.0069789886474609375, 0.007212638854980469, 0.0074462890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 8.0, 4.0, 7.0, 15.0, 9.0, 11.0, 9.0, 26.0, 31.0, 33.0, 42.0, 66.0, 96.0, 140.0, 324.0, 1235.0, 884121.0, 160801.0, 834.0, 304.0, 133.0, 91.0, 56.0, 38.0, 19.0, 31.0, 14.0, 8.0, 10.0, 6.0, 6.0, 1.0, 5.0, 4.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1441650390625, -0.13934326171875, -0.134521484375, -0.12969970703125, -0.1248779296875, -0.12005615234375, -0.115234375, -0.11041259765625, -0.1055908203125, -0.10076904296875, -0.095947265625, -0.09112548828125, -0.0863037109375, -0.08148193359375, -0.07666015625, -0.07183837890625, -0.0670166015625, -0.06219482421875, -0.057373046875, -0.05255126953125, -0.0477294921875, -0.04290771484375, -0.0380859375, -0.03326416015625, -0.0284423828125, -0.02362060546875, -0.018798828125, -0.01397705078125, -0.0091552734375, -0.00433349609375, 0.00048828125, 0.00531005859375, 0.0101318359375, 0.01495361328125, 0.019775390625, 0.02459716796875, 0.0294189453125, 0.03424072265625, 0.0390625, 0.04388427734375, 0.0487060546875, 0.05352783203125, 0.058349609375, 0.06317138671875, 0.0679931640625, 0.07281494140625, 0.07763671875, 0.08245849609375, 0.0872802734375, 0.09210205078125, 0.096923828125, 0.10174560546875, 0.1065673828125, 0.11138916015625, 0.1162109375, 0.12103271484375, 0.1258544921875, 0.13067626953125, 0.135498046875, 0.14031982421875, 0.1451416015625, 0.14996337890625, 0.15478515625, 0.15960693359375, 0.1644287109375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 20.0, 164.0, 557.0, 199.0, 49.0, 23.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011133488267660141, -0.010367042385041714, -0.009600597433745861, -0.008834151551127434, -0.008067706599831581, -0.007301260717213154, -0.006534815300256014, -0.005768369883298874, -0.005001924466341734, -0.004235479049384594, -0.003469033632427454, -0.0027025879826396704, -0.0019361425656825304, -0.0011696971487253904, -0.0004032514989376068, 0.00036319391801953316, 0.0011296393349766731, 0.001896084751933813, 0.002662530168890953, 0.0034289758186787367, 0.004195421002805233, 0.00496186688542366, 0.0057283123023808, 0.00649475771933794, 0.00726120313629508, 0.00802764855325222, 0.008794094435870647, 0.0095605393871665, 0.010326985269784927, 0.01109343022108078, 0.011859876103699207, 0.012626321986317635, 0.013392766937613487, 0.014159212820231915, 0.014925657771527767, 0.015692103654146194, 0.016458548605442047, 0.0172249935567379, 0.0179914403706789, 0.018757885321974754, 0.019524330273270607, 0.02029077522456646, 0.02105722203850746, 0.021823666989803314, 0.022590111941099167, 0.02335655689239502, 0.02412300370633602, 0.024889448657631874, 0.025655895471572876, 0.02642234042286873, 0.02718878723680973, 0.027955232188105583, 0.028721677139401436, 0.02948812209069729, 0.03025456890463829, 0.031021013855934143, 0.031787458807229996, 0.03255390375852585, 0.0333203487098217, 0.034086793661117554, 0.034853242337703705, 0.03561968728899956, 0.03638613224029541, 0.03715257719159126, 0.037919022142887115]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 2.0, 3.0, 6.0, 9.0, 7.0, 11.0, 10.0, 16.0, 16.0, 26.0, 19.0, 18.0, 28.0, 29.0, 28.0, 41.0, 35.0, 47.0, 44.0, 35.0, 43.0, 44.0, 33.0, 42.0, 50.0, 39.0, 31.0, 37.0, 41.0, 33.0, 28.0, 27.0, 23.0, 23.0, 15.0, 14.0, 9.0, 9.0, 13.0, 5.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004331350326538086, -0.0042100828140974045, -0.004088815301656723, -0.0039675477892160416, -0.00384628027677536, -0.0037250127643346786, -0.003603745251893997, -0.0034824777394533157, -0.0033612102270126343, -0.003239942714571953, -0.0031186752021312714, -0.00299740768969059, -0.0028761401772499084, -0.002754872664809227, -0.0026336051523685455, -0.002512337639927864, -0.0023910701274871826, -0.002269802615046501, -0.0021485351026058197, -0.0020272675901651382, -0.0019060000777244568, -0.0017847325652837753, -0.0016634650528430939, -0.0015421975404024124, -0.001420930027961731, -0.0012996625155210495, -0.001178395003080368, -0.0010571274906396866, -0.0009358599781990051, -0.0008145924657583237, -0.0006933249533176422, -0.0005720574408769608, -0.0004507899284362793, -0.00032952241599559784, -0.00020825490355491638, -8.698739111423492e-05, 3.428012132644653e-05, 0.000155547633767128, 0.00027681514620780945, 0.0003980826586484909, 0.0005193501710891724, 0.0006406176835298538, 0.0007618851959705353, 0.0008831527084112167, 0.0010044202208518982, 0.0011256877332925797, 0.001246955245733261, 0.0013682227581739426, 0.001489490270614624, 0.0016107577830553055, 0.001732025295495987, 0.0018532928079366684, 0.00197456032037735, 0.0020958278328180313, 0.0022170953452587128, 0.0023383628576993942, 0.0024596303701400757, 0.002580897882580757, 0.0027021653950214386, 0.00282343290746212, 0.0029447004199028015, 0.003065967932343483, 0.0031872354447841644, 0.003308502957224846, 0.0034297704696655273]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 2.0, 6.0, 15.0, 11.0, 9.0, 14.0, 11.0, 15.0, 24.0, 26.0, 26.0, 25.0, 35.0, 29.0, 33.0, 44.0, 42.0, 40.0, 39.0, 40.0, 33.0, 40.0, 36.0, 48.0, 29.0, 35.0, 28.0, 42.0, 29.0, 34.0, 23.0, 14.0, 18.0, 16.0, 18.0, 3.0, 17.0, 7.0, 6.0, 5.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.48828125, -3.385406494140625, -3.28253173828125, -3.179656982421875, -3.0767822265625, -2.973907470703125, -2.87103271484375, -2.768157958984375, -2.665283203125, -2.562408447265625, -2.45953369140625, -2.356658935546875, -2.2537841796875, -2.150909423828125, -2.04803466796875, -1.945159912109375, -1.84228515625, -1.739410400390625, -1.63653564453125, -1.533660888671875, -1.4307861328125, -1.327911376953125, -1.22503662109375, -1.122161865234375, -1.019287109375, -0.916412353515625, -0.81353759765625, -0.710662841796875, -0.6077880859375, -0.504913330078125, -0.40203857421875, -0.299163818359375, -0.1962890625, -0.093414306640625, 0.00946044921875, 0.112335205078125, 0.2152099609375, 0.318084716796875, 0.42095947265625, 0.523834228515625, 0.626708984375, 0.729583740234375, 0.83245849609375, 0.935333251953125, 1.0382080078125, 1.141082763671875, 1.24395751953125, 1.346832275390625, 1.44970703125, 1.552581787109375, 1.65545654296875, 1.758331298828125, 1.8612060546875, 1.964080810546875, 2.06695556640625, 2.169830322265625, 2.272705078125, 2.375579833984375, 2.47845458984375, 2.581329345703125, 2.6842041015625, 2.787078857421875, 2.88995361328125, 2.992828369140625, 3.095703125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 13.0, 12.0, 12.0, 14.0, 36.0, 49.0, 57.0, 81.0, 121.0, 187.0, 322.0, 506.0, 982.0, 1980.0, 4152.0, 9199.0, 21798.0, 52024.0, 125233.0, 309893.0, 307080.0, 124130.0, 51649.0, 21123.0, 9220.0, 4120.0, 2076.0, 1033.0, 535.0, 320.0, 177.0, 122.0, 70.0, 61.0, 44.0, 30.0, 18.0, 17.0, 9.0, 19.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.31640625, -3.205841064453125, -3.09527587890625, -2.984710693359375, -2.8741455078125, -2.763580322265625, -2.65301513671875, -2.542449951171875, -2.431884765625, -2.321319580078125, -2.21075439453125, -2.100189208984375, -1.9896240234375, -1.879058837890625, -1.76849365234375, -1.657928466796875, -1.54736328125, -1.436798095703125, -1.32623291015625, -1.215667724609375, -1.1051025390625, -0.994537353515625, -0.88397216796875, -0.773406982421875, -0.662841796875, -0.552276611328125, -0.44171142578125, -0.331146240234375, -0.2205810546875, -0.110015869140625, 0.00054931640625, 0.111114501953125, 0.2216796875, 0.332244873046875, 0.44281005859375, 0.553375244140625, 0.6639404296875, 0.774505615234375, 0.88507080078125, 0.995635986328125, 1.106201171875, 1.216766357421875, 1.32733154296875, 1.437896728515625, 1.5484619140625, 1.659027099609375, 1.76959228515625, 1.880157470703125, 1.99072265625, 2.101287841796875, 2.21185302734375, 2.322418212890625, 2.4329833984375, 2.543548583984375, 2.65411376953125, 2.764678955078125, 2.875244140625, 2.985809326171875, 3.09637451171875, 3.206939697265625, 3.3175048828125, 3.428070068359375, 3.53863525390625, 3.649200439453125, 3.759765625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 9.0, 10.0, 12.0, 16.0, 19.0, 29.0, 18.0, 23.0, 35.0, 36.0, 44.0, 53.0, 62.0, 73.0, 141.0, 347.0, 1391.0, 205.0, 86.0, 66.0, 36.0, 53.0, 38.0, 36.0, 32.0, 29.0, 24.0, 20.0, 19.0, 10.0, 14.0, 11.0, 8.0, 8.0, 6.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9453125, -11.535400390625, -11.12548828125, -10.715576171875, -10.3056640625, -9.895751953125, -9.48583984375, -9.075927734375, -8.666015625, -8.256103515625, -7.84619140625, -7.436279296875, -7.0263671875, -6.616455078125, -6.20654296875, -5.796630859375, -5.38671875, -4.976806640625, -4.56689453125, -4.156982421875, -3.7470703125, -3.337158203125, -2.92724609375, -2.517333984375, -2.107421875, -1.697509765625, -1.28759765625, -0.877685546875, -0.4677734375, -0.057861328125, 0.35205078125, 0.761962890625, 1.171875, 1.581787109375, 1.99169921875, 2.401611328125, 2.8115234375, 3.221435546875, 3.63134765625, 4.041259765625, 4.451171875, 4.861083984375, 5.27099609375, 5.680908203125, 6.0908203125, 6.500732421875, 6.91064453125, 7.320556640625, 7.73046875, 8.140380859375, 8.55029296875, 8.960205078125, 9.3701171875, 9.780029296875, 10.18994140625, 10.599853515625, 11.009765625, 11.419677734375, 11.82958984375, 12.239501953125, 12.6494140625, 13.059326171875, 13.46923828125, 13.879150390625, 14.2890625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 4.0, 14.0, 19.0, 21.0, 44.0, 69.0, 121.0, 197.0, 416.0, 1411.0, 47633.0, 3091575.0, 2987.0, 589.0, 230.0, 131.0, 91.0, 49.0, 27.0, 26.0, 14.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.23046875, -60.0234375, -57.81640625, -55.609375, -53.40234375, -51.1953125, -48.98828125, -46.78125, -44.57421875, -42.3671875, -40.16015625, -37.953125, -35.74609375, -33.5390625, -31.33203125, -29.125, -26.91796875, -24.7109375, -22.50390625, -20.296875, -18.08984375, -15.8828125, -13.67578125, -11.46875, -9.26171875, -7.0546875, -4.84765625, -2.640625, -0.43359375, 1.7734375, 3.98046875, 6.1875, 8.39453125, 10.6015625, 12.80859375, 15.015625, 17.22265625, 19.4296875, 21.63671875, 23.84375, 26.05078125, 28.2578125, 30.46484375, 32.671875, 34.87890625, 37.0859375, 39.29296875, 41.5, 43.70703125, 45.9140625, 48.12109375, 50.328125, 52.53515625, 54.7421875, 56.94921875, 59.15625, 61.36328125, 63.5703125, 65.77734375, 67.984375, 70.19140625, 72.3984375, 74.60546875, 76.8125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 97.0, 794.0, 120.0], "bins": [-266.9373474121094, -262.6640319824219, -258.3907165527344, -254.11740112304688, -249.84408569335938, -245.57077026367188, -241.29745483398438, -237.02415466308594, -232.75083923339844, -228.47752380371094, -224.20420837402344, -219.93089294433594, -215.65757751464844, -211.38427734375, -207.1109619140625, -202.837646484375, -198.5643310546875, -194.291015625, -190.0177001953125, -185.744384765625, -181.4710693359375, -177.19775390625, -172.9244384765625, -168.65113830566406, -164.3778076171875, -160.1044921875, -155.8311767578125, -151.557861328125, -147.2845458984375, -143.01123046875, -138.7379150390625, -134.46461486816406, -130.19131469726562, -125.91799926757812, -121.64468383789062, -117.37136840820312, -113.09806060791016, -108.82474517822266, -104.55142974853516, -100.27811431884766, -96.00479888916016, -91.73148345947266, -87.45816802978516, -83.18486022949219, -78.91154479980469, -74.63822937011719, -70.36491394042969, -66.09159851074219, -61.81828689575195, -57.54497146606445, -53.27165985107422, -48.99834442138672, -44.72502899169922, -40.451717376708984, -36.178401947021484, -31.905088424682617, -27.631776809692383, -23.358463287353516, -19.085147857666016, -14.811834335327148, -10.538520812988281, -6.265207290649414, -1.991891860961914, 2.281421661376953, 6.5547356605529785]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 6.0, 12.0, 10.0, 16.0, 14.0, 21.0, 21.0, 23.0, 30.0, 19.0, 30.0, 29.0, 34.0, 30.0, 29.0, 30.0, 33.0, 43.0, 38.0, 29.0, 51.0, 25.0, 53.0, 33.0, 43.0, 25.0, 29.0, 27.0, 28.0, 24.0, 16.0, 14.0, 30.0, 16.0, 12.0, 13.0, 14.0, 14.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-27.907957077026367, -27.000696182250977, -26.093433380126953, -25.186172485351562, -24.27890968322754, -23.37164878845215, -22.464385986328125, -21.557125091552734, -20.649864196777344, -19.742603302001953, -18.83534049987793, -17.92807960510254, -17.020816802978516, -16.113555908203125, -15.206294059753418, -14.299032211303711, -13.391769409179688, -12.48450756072998, -11.577245712280273, -10.669984817504883, -9.76272201538086, -8.855461120605469, -7.948199272155762, -7.040937423706055, -6.133675575256348, -5.226413726806641, -4.319151878356934, -3.4118905067443848, -2.5046286582946777, -1.5973668098449707, -0.6901054382324219, 0.21715641021728516, 1.1244182586669922, 2.031680107116699, 2.938941717147827, 3.846203327178955, 4.753465175628662, 5.660727024078369, 6.567988395690918, 7.475250244140625, 8.382512092590332, 9.289773941040039, 10.197035789489746, 11.104297637939453, 12.011558532714844, 12.918821334838867, 13.826082229614258, 14.733344078063965, 15.640605926513672, 16.547866821289062, 17.455129623413086, 18.362390518188477, 19.2696533203125, 20.17691421508789, 21.08417510986328, 21.991437911987305, 22.898700714111328, 23.80596160888672, 24.713224411010742, 25.620485305786133, 26.527748107910156, 27.435009002685547, 28.342269897460938, 29.24953269958496, 30.15679359436035]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 7.0, 3.0, 9.0, 9.0, 22.0, 7.0, 9.0, 14.0, 21.0, 15.0, 15.0, 27.0, 27.0, 36.0, 28.0, 38.0, 32.0, 40.0, 30.0, 49.0, 31.0, 37.0, 37.0, 39.0, 40.0, 37.0, 28.0, 26.0, 37.0, 31.0, 25.0, 31.0, 24.0, 22.0, 12.0, 22.0, 10.0, 13.0, 10.0, 8.0, 7.0, 6.0, 6.0, 5.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.35546875, -3.248748779296875, -3.14202880859375, -3.035308837890625, -2.9285888671875, -2.821868896484375, -2.71514892578125, -2.608428955078125, -2.501708984375, -2.394989013671875, -2.28826904296875, -2.181549072265625, -2.0748291015625, -1.968109130859375, -1.86138916015625, -1.754669189453125, -1.64794921875, -1.541229248046875, -1.43450927734375, -1.327789306640625, -1.2210693359375, -1.114349365234375, -1.00762939453125, -0.900909423828125, -0.794189453125, -0.687469482421875, -0.58074951171875, -0.474029541015625, -0.3673095703125, -0.260589599609375, -0.15386962890625, -0.047149658203125, 0.0595703125, 0.166290283203125, 0.27301025390625, 0.379730224609375, 0.4864501953125, 0.593170166015625, 0.69989013671875, 0.806610107421875, 0.913330078125, 1.020050048828125, 1.12677001953125, 1.233489990234375, 1.3402099609375, 1.446929931640625, 1.55364990234375, 1.660369873046875, 1.76708984375, 1.873809814453125, 1.98052978515625, 2.087249755859375, 2.1939697265625, 2.300689697265625, 2.40740966796875, 2.514129638671875, 2.620849609375, 2.727569580078125, 2.83428955078125, 2.941009521484375, 3.0477294921875, 3.154449462890625, 3.26116943359375, 3.367889404296875, 3.474609375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 6.0, 5.0, 9.0, 5.0, 8.0, 10.0, 12.0, 19.0, 19.0, 23.0, 30.0, 47.0, 41.0, 58.0, 63.0, 87.0, 109.0, 238.0, 402.0, 1140.0, 3927.0, 19149.0, 131364.0, 887368.0, 2145588.0, 852187.0, 127244.0, 18909.0, 3831.0, 1131.0, 428.0, 224.0, 164.0, 91.0, 75.0, 49.0, 50.0, 30.0, 30.0, 23.0, 25.0, 10.0, 9.0, 17.0, 8.0, 1.0, 13.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-7.44140625, -7.22564697265625, -7.0098876953125, -6.79412841796875, -6.578369140625, -6.36260986328125, -6.1468505859375, -5.93109130859375, -5.71533203125, -5.49957275390625, -5.2838134765625, -5.06805419921875, -4.852294921875, -4.63653564453125, -4.4207763671875, -4.20501708984375, -3.9892578125, -3.77349853515625, -3.5577392578125, -3.34197998046875, -3.126220703125, -2.91046142578125, -2.6947021484375, -2.47894287109375, -2.26318359375, -2.04742431640625, -1.8316650390625, -1.61590576171875, -1.400146484375, -1.18438720703125, -0.9686279296875, -0.75286865234375, -0.537109375, -0.32135009765625, -0.1055908203125, 0.11016845703125, 0.325927734375, 0.54168701171875, 0.7574462890625, 0.97320556640625, 1.18896484375, 1.40472412109375, 1.6204833984375, 1.83624267578125, 2.052001953125, 2.26776123046875, 2.4835205078125, 2.69927978515625, 2.9150390625, 3.13079833984375, 3.3465576171875, 3.56231689453125, 3.778076171875, 3.99383544921875, 4.2095947265625, 4.42535400390625, 4.64111328125, 4.85687255859375, 5.0726318359375, 5.28839111328125, 5.504150390625, 5.71990966796875, 5.9356689453125, 6.15142822265625, 6.3671875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 3.0, 7.0, 7.0, 17.0, 15.0, 26.0, 32.0, 51.0, 48.0, 69.0, 95.0, 104.0, 143.0, 207.0, 282.0, 355.0, 398.0, 430.0, 423.0, 342.0, 266.0, 187.0, 151.0, 108.0, 88.0, 63.0, 38.0, 33.0, 26.0, 12.0, 17.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.1015625, -8.87042236328125, -8.6392822265625, -8.40814208984375, -8.177001953125, -7.94586181640625, -7.7147216796875, -7.48358154296875, -7.25244140625, -7.02130126953125, -6.7901611328125, -6.55902099609375, -6.327880859375, -6.09674072265625, -5.8656005859375, -5.63446044921875, -5.4033203125, -5.17218017578125, -4.9410400390625, -4.70989990234375, -4.478759765625, -4.24761962890625, -4.0164794921875, -3.78533935546875, -3.55419921875, -3.32305908203125, -3.0919189453125, -2.86077880859375, -2.629638671875, -2.39849853515625, -2.1673583984375, -1.93621826171875, -1.705078125, -1.47393798828125, -1.2427978515625, -1.01165771484375, -0.780517578125, -0.54937744140625, -0.3182373046875, -0.08709716796875, 0.14404296875, 0.37518310546875, 0.6063232421875, 0.83746337890625, 1.068603515625, 1.29974365234375, 1.5308837890625, 1.76202392578125, 1.9931640625, 2.22430419921875, 2.4554443359375, 2.68658447265625, 2.917724609375, 3.14886474609375, 3.3800048828125, 3.61114501953125, 3.84228515625, 4.07342529296875, 4.3045654296875, 4.53570556640625, 4.766845703125, 4.99798583984375, 5.2291259765625, 5.46026611328125, 5.69140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 11.0, 17.0, 18.0, 28.0, 32.0, 50.0, 72.0, 116.0, 163.0, 198.0, 322.0, 552.0, 4958.0, 2214441.0, 1967222.0, 4431.0, 559.0, 316.0, 201.0, 134.0, 114.0, 83.0, 54.0, 49.0, 31.0, 27.0, 21.0, 15.0, 11.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.52685546875, -23.4599609375, -22.39306640625, -21.326171875, -20.25927734375, -19.1923828125, -18.12548828125, -17.05859375, -15.99169921875, -14.9248046875, -13.85791015625, -12.791015625, -11.72412109375, -10.6572265625, -9.59033203125, -8.5234375, -7.45654296875, -6.3896484375, -5.32275390625, -4.255859375, -3.18896484375, -2.1220703125, -1.05517578125, 0.01171875, 1.07861328125, 2.1455078125, 3.21240234375, 4.279296875, 5.34619140625, 6.4130859375, 7.47998046875, 8.546875, 9.61376953125, 10.6806640625, 11.74755859375, 12.814453125, 13.88134765625, 14.9482421875, 16.01513671875, 17.08203125, 18.14892578125, 19.2158203125, 20.28271484375, 21.349609375, 22.41650390625, 23.4833984375, 24.55029296875, 25.6171875, 26.68408203125, 27.7509765625, 28.81787109375, 29.884765625, 30.95166015625, 32.0185546875, 33.08544921875, 34.15234375, 35.21923828125, 36.2861328125, 37.35302734375, 38.419921875, 39.48681640625, 40.5537109375, 41.62060546875, 42.6875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 24.0, 174.0, 440.0, 323.0, 53.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.8077392578125, -206.39984130859375, -201.99192810058594, -197.58401489257812, -193.17611694335938, -188.76821899414062, -184.3603057861328, -179.952392578125, -175.54449462890625, -171.1365966796875, -166.7286834716797, -162.32077026367188, -157.91287231445312, -153.50497436523438, -149.09706115722656, -144.68914794921875, -140.28125, -135.87335205078125, -131.46543884277344, -127.05753326416016, -122.64962768554688, -118.2417221069336, -113.83381652832031, -109.42591094970703, -105.01800537109375, -100.61009979248047, -96.20219421386719, -91.7942886352539, -87.38638305664062, -82.97847747802734, -78.57057189941406, -74.16266632080078, -69.75475311279297, -65.34684753417969, -60.938941955566406, -56.531036376953125, -52.123130798339844, -47.71522521972656, -43.30731964111328, -38.8994140625, -34.49150848388672, -30.083602905273438, -25.675697326660156, -21.267791748046875, -16.859886169433594, -12.451980590820312, -8.044075012207031, -3.63616943359375, 0.7717361450195312, 5.1796417236328125, 9.587547302246094, 13.995452880859375, 18.403358459472656, 22.811264038085938, 27.21916961669922, 31.6270751953125, 36.03498077392578, 40.44288635253906, 44.850791931152344, 49.258697509765625, 53.666603088378906, 58.07450866699219, 62.48241424560547, 66.89031982421875, 71.29822540283203]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 8.0, 5.0, 5.0, 11.0, 10.0, 9.0, 16.0, 10.0, 20.0, 19.0, 17.0, 22.0, 21.0, 32.0, 34.0, 30.0, 39.0, 33.0, 35.0, 44.0, 38.0, 42.0, 38.0, 34.0, 38.0, 26.0, 48.0, 39.0, 34.0, 31.0, 30.0, 23.0, 27.0, 23.0, 21.0, 6.0, 16.0, 9.0, 13.0, 8.0, 8.0, 7.0, 5.0, 8.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-22.873281478881836, -22.197052001953125, -21.520822525024414, -20.844593048095703, -20.168363571166992, -19.49213409423828, -18.815906524658203, -18.13967514038086, -17.46344757080078, -16.78721809387207, -16.11098861694336, -15.434759140014648, -14.758529663085938, -14.082300186157227, -13.406071662902832, -12.729842185974121, -12.053611755371094, -11.377382278442383, -10.701152801513672, -10.024923324584961, -9.34869384765625, -8.672464370727539, -7.9962358474731445, -7.320006370544434, -6.643776893615723, -5.967547416687012, -5.291317939758301, -4.615088939666748, -3.938859462738037, -3.262629985809326, -2.5864009857177734, -1.9101715087890625, -1.2339439392089844, -0.557714581489563, 0.1185147762298584, 0.7947440147399902, 1.4709734916687012, 2.147202968597412, 2.823431968688965, 3.499661445617676, 4.175890922546387, 4.852120399475098, 5.528349876403809, 6.204578876495361, 6.880808353424072, 7.557037830352783, 8.233266830444336, 8.909496307373047, 9.585725784301758, 10.261955261230469, 10.93818473815918, 11.61441421508789, 12.290643692016602, 12.966873168945312, 13.643101692199707, 14.319331169128418, 14.995560646057129, 15.67179012298584, 16.348018646240234, 17.024248123168945, 17.700477600097656, 18.376707077026367, 19.052936553955078, 19.72916603088379, 20.4053955078125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 4.0, 8.0, 8.0, 3.0, 8.0, 9.0, 22.0, 20.0, 18.0, 23.0, 32.0, 22.0, 23.0, 22.0, 36.0, 28.0, 30.0, 38.0, 42.0, 42.0, 41.0, 31.0, 32.0, 30.0, 45.0, 34.0, 47.0, 23.0, 26.0, 23.0, 30.0, 24.0, 26.0, 17.0, 15.0, 19.0, 19.0, 13.0, 10.0, 10.0, 5.0, 5.0, 4.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.236328125, -3.13580322265625, -3.0352783203125, -2.93475341796875, -2.834228515625, -2.73370361328125, -2.6331787109375, -2.53265380859375, -2.43212890625, -2.33160400390625, -2.2310791015625, -2.13055419921875, -2.030029296875, -1.92950439453125, -1.8289794921875, -1.72845458984375, -1.6279296875, -1.52740478515625, -1.4268798828125, -1.32635498046875, -1.225830078125, -1.12530517578125, -1.0247802734375, -0.92425537109375, -0.82373046875, -0.72320556640625, -0.6226806640625, -0.52215576171875, -0.421630859375, -0.32110595703125, -0.2205810546875, -0.12005615234375, -0.01953125, 0.08099365234375, 0.1815185546875, 0.28204345703125, 0.382568359375, 0.48309326171875, 0.5836181640625, 0.68414306640625, 0.78466796875, 0.88519287109375, 0.9857177734375, 1.08624267578125, 1.186767578125, 1.28729248046875, 1.3878173828125, 1.48834228515625, 1.5888671875, 1.68939208984375, 1.7899169921875, 1.89044189453125, 1.990966796875, 2.09149169921875, 2.1920166015625, 2.29254150390625, 2.39306640625, 2.49359130859375, 2.5941162109375, 2.69464111328125, 2.795166015625, 2.89569091796875, 2.9962158203125, 3.09674072265625, 3.197265625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 14.0, 28.0, 23.0, 44.0, 58.0, 91.0, 190.0, 332.0, 570.0, 1113.0, 2076.0, 3885.0, 7462.0, 14883.0, 30672.0, 66063.0, 144194.0, 279195.0, 257144.0, 127780.0, 58250.0, 26768.0, 13261.0, 6741.0, 3609.0, 1863.0, 994.0, 495.0, 282.0, 158.0, 105.0, 68.0, 39.0, 24.0, 18.0, 9.0, 12.0, 10.0, 9.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4546546936035156, -0.43640899658203125, -0.4181632995605469, -0.3999176025390625, -0.3816719055175781, -0.36342620849609375, -0.3451805114746094, -0.326934814453125, -0.3086891174316406, -0.29044342041015625, -0.2721977233886719, -0.2539520263671875, -0.23570632934570312, -0.21746063232421875, -0.19921493530273438, -0.18096923828125, -0.16272354125976562, -0.14447784423828125, -0.12623214721679688, -0.1079864501953125, -0.08974075317382812, -0.07149505615234375, -0.053249359130859375, -0.035003662109375, -0.016757965087890625, 0.00148773193359375, 0.019733428955078125, 0.0379791259765625, 0.056224822998046875, 0.07447052001953125, 0.09271621704101562, 0.1109619140625, 0.12920761108398438, 0.14745330810546875, 0.16569900512695312, 0.1839447021484375, 0.20219039916992188, 0.22043609619140625, 0.23868179321289062, 0.256927490234375, 0.2751731872558594, 0.29341888427734375, 0.3116645812988281, 0.3299102783203125, 0.3481559753417969, 0.36640167236328125, 0.3846473693847656, 0.40289306640625, 0.4211387634277344, 0.43938446044921875, 0.4576301574707031, 0.4758758544921875, 0.4941215515136719, 0.5123672485351562, 0.5306129455566406, 0.548858642578125, 0.5671043395996094, 0.5853500366210938, 0.6035957336425781, 0.6218414306640625, 0.6400871276855469, 0.6583328247070312, 0.6765785217285156, 0.69482421875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 5.0, 1.0, 8.0, 5.0, 9.0, 7.0, 12.0, 5.0, 12.0, 12.0, 18.0, 23.0, 23.0, 24.0, 28.0, 39.0, 28.0, 20.0, 36.0, 44.0, 49.0, 41.0, 1063.0, 44.0, 33.0, 43.0, 31.0, 41.0, 33.0, 40.0, 42.0, 29.0, 20.0, 17.0, 19.0, 20.0, 13.0, 19.0, 15.0, 14.0, 13.0, 10.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.435546875, -2.363494873046875, -2.29144287109375, -2.219390869140625, -2.1473388671875, -2.075286865234375, -2.00323486328125, -1.931182861328125, -1.859130859375, -1.787078857421875, -1.71502685546875, -1.642974853515625, -1.5709228515625, -1.498870849609375, -1.42681884765625, -1.354766845703125, -1.28271484375, -1.210662841796875, -1.13861083984375, -1.066558837890625, -0.9945068359375, -0.922454833984375, -0.85040283203125, -0.778350830078125, -0.706298828125, -0.634246826171875, -0.56219482421875, -0.490142822265625, -0.4180908203125, -0.346038818359375, -0.27398681640625, -0.201934814453125, -0.1298828125, -0.057830810546875, 0.01422119140625, 0.086273193359375, 0.1583251953125, 0.230377197265625, 0.30242919921875, 0.374481201171875, 0.446533203125, 0.518585205078125, 0.59063720703125, 0.662689208984375, 0.7347412109375, 0.806793212890625, 0.87884521484375, 0.950897216796875, 1.02294921875, 1.095001220703125, 1.16705322265625, 1.239105224609375, 1.3111572265625, 1.383209228515625, 1.45526123046875, 1.527313232421875, 1.599365234375, 1.671417236328125, 1.74346923828125, 1.815521240234375, 1.8875732421875, 1.959625244140625, 2.03167724609375, 2.103729248046875, 2.17578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 4.0, 17.0, 18.0, 24.0, 56.0, 85.0, 119.0, 206.0, 259.0, 379.0, 584.0, 885.0, 1325.0, 2023.0, 3030.0, 4497.0, 6728.0, 10199.0, 15365.0, 23077.0, 34241.0, 51077.0, 74033.0, 105919.0, 143195.0, 1195516.0, 129256.0, 95233.0, 65333.0, 44028.0, 30114.0, 20037.0, 13574.0, 9019.0, 6004.0, 3867.0, 2518.0, 1788.0, 1156.0, 765.0, 551.0, 382.0, 213.0, 140.0, 104.0, 56.0, 55.0, 36.0, 18.0, 17.0, 8.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.22119140625, -0.21435165405273438, -0.20751190185546875, -0.20067214965820312, -0.1938323974609375, -0.18699264526367188, -0.18015289306640625, -0.17331314086914062, -0.166473388671875, -0.15963363647460938, -0.15279388427734375, -0.14595413208007812, -0.1391143798828125, -0.13227462768554688, -0.12543487548828125, -0.11859512329101562, -0.11175537109375, -0.10491561889648438, -0.09807586669921875, -0.09123611450195312, -0.0843963623046875, -0.07755661010742188, -0.07071685791015625, -0.06387710571289062, -0.057037353515625, -0.050197601318359375, -0.04335784912109375, -0.036518096923828125, -0.0296783447265625, -0.022838592529296875, -0.01599884033203125, -0.009159088134765625, -0.0023193359375, 0.004520416259765625, 0.01136016845703125, 0.018199920654296875, 0.0250396728515625, 0.031879425048828125, 0.03871917724609375, 0.045558929443359375, 0.052398681640625, 0.059238433837890625, 0.06607818603515625, 0.07291793823242188, 0.0797576904296875, 0.08659744262695312, 0.09343719482421875, 0.10027694702148438, 0.10711669921875, 0.11395645141601562, 0.12079620361328125, 0.12763595581054688, 0.1344757080078125, 0.14131546020507812, 0.14815521240234375, 0.15499496459960938, 0.161834716796875, 0.16867446899414062, 0.17551422119140625, 0.18235397338867188, 0.1891937255859375, 0.19603347778320312, 0.20287322998046875, 0.20971298217773438, 0.216552734375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 3.0, 4.0, 8.0, 7.0, 6.0, 10.0, 10.0, 12.0, 13.0, 15.0, 29.0, 19.0, 28.0, 27.0, 35.0, 42.0, 39.0, 45.0, 41.0, 53.0, 53.0, 58.0, 50.0, 33.0, 51.0, 40.0, 37.0, 34.0, 19.0, 24.0, 35.0, 19.0, 20.0, 11.0, 16.0, 10.0, 8.0, 5.0, 10.0, 8.0, 7.0, 3.0, 8.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003582000732421875, -0.0034675002098083496, -0.0033529996871948242, -0.003238499164581299, -0.0031239986419677734, -0.003009498119354248, -0.0028949975967407227, -0.0027804970741271973, -0.002665996551513672, -0.0025514960289001465, -0.002436995506286621, -0.0023224949836730957, -0.0022079944610595703, -0.002093493938446045, -0.0019789934158325195, -0.0018644928932189941, -0.0017499923706054688, -0.0016354918479919434, -0.001520991325378418, -0.0014064908027648926, -0.0012919902801513672, -0.0011774897575378418, -0.0010629892349243164, -0.000948488712310791, -0.0008339881896972656, -0.0007194876670837402, -0.0006049871444702148, -0.0004904866218566895, -0.00037598609924316406, -0.00026148557662963867, -0.00014698505401611328, -3.248453140258789e-05, 8.20159912109375e-05, 0.0001965165138244629, 0.0003110170364379883, 0.00042551755905151367, 0.0005400180816650391, 0.0006545186042785645, 0.0007690191268920898, 0.0008835196495056152, 0.0009980201721191406, 0.001112520694732666, 0.0012270212173461914, 0.0013415217399597168, 0.0014560222625732422, 0.0015705227851867676, 0.001685023307800293, 0.0017995238304138184, 0.0019140243530273438, 0.002028524875640869, 0.0021430253982543945, 0.00225752592086792, 0.0023720264434814453, 0.0024865269660949707, 0.002601027488708496, 0.0027155280113220215, 0.002830028533935547, 0.0029445290565490723, 0.0030590295791625977, 0.003173530101776123, 0.0032880306243896484, 0.003402531147003174, 0.0035170316696166992, 0.0036315321922302246, 0.00374603271484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 3.0, 5.0, 8.0, 10.0, 6.0, 13.0, 10.0, 19.0, 21.0, 26.0, 27.0, 45.0, 49.0, 52.0, 68.0, 103.0, 147.0, 283.0, 558.0, 4660.0, 803739.0, 235223.0, 2182.0, 470.0, 216.0, 135.0, 114.0, 71.0, 52.0, 59.0, 30.0, 31.0, 21.0, 18.0, 13.0, 14.0, 16.0, 7.0, 7.0, 11.0, 2.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07916259765625, -0.07675552368164062, -0.07434844970703125, -0.07194137573242188, -0.0695343017578125, -0.06712722778320312, -0.06472015380859375, -0.062313079833984375, -0.059906005859375, -0.057498931884765625, -0.05509185791015625, -0.052684783935546875, -0.0502777099609375, -0.047870635986328125, -0.04546356201171875, -0.043056488037109375, -0.0406494140625, -0.038242340087890625, -0.03583526611328125, -0.033428192138671875, -0.0310211181640625, -0.028614044189453125, -0.02620697021484375, -0.023799896240234375, -0.021392822265625, -0.018985748291015625, -0.01657867431640625, -0.014171600341796875, -0.0117645263671875, -0.009357452392578125, -0.00695037841796875, -0.004543304443359375, -0.00213623046875, 0.000270843505859375, 0.00267791748046875, 0.005084991455078125, 0.0074920654296875, 0.009899139404296875, 0.01230621337890625, 0.014713287353515625, 0.017120361328125, 0.019527435302734375, 0.02193450927734375, 0.024341583251953125, 0.0267486572265625, 0.029155731201171875, 0.03156280517578125, 0.033969879150390625, 0.036376953125, 0.038784027099609375, 0.04119110107421875, 0.043598175048828125, 0.0460052490234375, 0.048412322998046875, 0.05081939697265625, 0.053226470947265625, 0.055633544921875, 0.058040618896484375, 0.06044769287109375, 0.06285476684570312, 0.0652618408203125, 0.06766891479492188, 0.07007598876953125, 0.07248306274414062, 0.07489013671875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 20.0, 46.0, 76.0, 195.0, 232.0, 208.0, 101.0, 59.0, 39.0, 11.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003941108472645283, -0.003715698141604662, -0.0034902875777333975, -0.0032648772466927767, -0.003039466915652156, -0.0028140563517808914, -0.0025886460207402706, -0.00236323568969965, -0.002137825358659029, -0.0019124149112030864, -0.0016870045801624656, -0.001461594132706523, -0.0012361838016659021, -0.0010107733542099595, -0.0007853629067540169, -0.0005599525757133961, -0.0003345420118421316, -0.00010913160804193467, 0.00011627879575826228, 0.00034168921411037445, 0.0005670996033586562, 0.0007925099926069379, 0.0010179204400628805, 0.0012433307711035013, 0.001468741218559444, 0.0016941516660153866, 0.0019195619970560074, 0.002144972328096628, 0.0023703828919678926, 0.0025957932230085135, 0.002821203786879778, 0.0030466141179203987, 0.0032720244489610195, 0.0034974347800016403, 0.0037228453438729048, 0.003948255442082882, 0.00417366623878479, 0.004399076569825411, 0.004624486900866032, 0.0048498972319066525, 0.005075307562947273, 0.005300717893987894, 0.005526128225028515, 0.005751539021730423, 0.005976949352771044, 0.006202359683811665, 0.006427770014852285, 0.006653180345892906, 0.006878591142594814, 0.007104001473635435, 0.007329411804676056, 0.007554822601377964, 0.007780232932418585, 0.008005643263459206, 0.008231053128838539, 0.008456463925540447, 0.00868187379091978, 0.008907284587621689, 0.009132694453001022, 0.00935810524970293, 0.009583515115082264, 0.009808925911784172, 0.010034335777163506, 0.010259746573865414, 0.010485157370567322]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 6.0, 14.0, 9.0, 8.0, 13.0, 19.0, 25.0, 18.0, 34.0, 24.0, 27.0, 24.0, 36.0, 43.0, 26.0, 31.0, 24.0, 33.0, 34.0, 33.0, 54.0, 30.0, 34.0, 39.0, 33.0, 34.0, 20.0, 24.0, 23.0, 20.0, 24.0, 27.0, 25.0, 14.0, 14.0, 12.0, 17.0, 6.0, 7.0, 9.0, 7.0, 7.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0019467473030090332, -0.001883956603705883, -0.0018211659044027328, -0.0017583752050995827, -0.0016955845057964325, -0.0016327938064932823, -0.0015700031071901321, -0.001507212407886982, -0.0014444217085838318, -0.0013816310092806816, -0.0013188403099775314, -0.0012560496106743813, -0.001193258911371231, -0.001130468212068081, -0.0010676775127649307, -0.0010048868134617805, -0.0009420961141586304, -0.0008793054148554802, -0.00081651471555233, -0.0007537240162491798, -0.0006909333169460297, -0.0006281426176428795, -0.0005653519183397293, -0.0005025612190365791, -0.00043977051973342896, -0.0003769798204302788, -0.0003141891211271286, -0.0002513984218239784, -0.00018860772252082825, -0.00012581702321767807, -6.302632391452789e-05, -2.3562461137771606e-07, 6.255507469177246e-05, 0.00012534577399492264, 0.00018813647329807281, 0.000250927172601223, 0.00031371787190437317, 0.00037650857120752335, 0.0004392992705106735, 0.0005020899698138237, 0.0005648806691169739, 0.000627671368420124, 0.0006904620677232742, 0.0007532527670264244, 0.0008160434663295746, 0.0008788341656327248, 0.0009416248649358749, 0.0010044155642390251, 0.0010672062635421753, 0.0011299969628453255, 0.0011927876621484756, 0.0012555783614516258, 0.001318369060754776, 0.0013811597600579262, 0.0014439504593610764, 0.0015067411586642265, 0.0015695318579673767, 0.0016323225572705269, 0.001695113256573677, 0.0017579039558768272, 0.0018206946551799774, 0.0018834853544831276, 0.0019462760537862778, 0.002009066753089428, 0.002071857452392578]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 3.0, 4.0, 4.0, 8.0, 8.0, 3.0, 8.0, 9.0, 22.0, 20.0, 19.0, 22.0, 32.0, 22.0, 23.0, 22.0, 36.0, 28.0, 30.0, 39.0, 41.0, 42.0, 41.0, 31.0, 32.0, 30.0, 45.0, 34.0, 47.0, 23.0, 26.0, 23.0, 30.0, 24.0, 26.0, 17.0, 14.0, 20.0, 19.0, 13.0, 10.0, 10.0, 5.0, 5.0, 4.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.236328125, -3.13580322265625, -3.0352783203125, -2.93475341796875, -2.834228515625, -2.73370361328125, -2.6331787109375, -2.53265380859375, -2.43212890625, -2.33160400390625, -2.2310791015625, -2.13055419921875, -2.030029296875, -1.92950439453125, -1.8289794921875, -1.72845458984375, -1.6279296875, -1.52740478515625, -1.4268798828125, -1.32635498046875, -1.225830078125, -1.12530517578125, -1.0247802734375, -0.92425537109375, -0.82373046875, -0.72320556640625, -0.6226806640625, -0.52215576171875, -0.421630859375, -0.32110595703125, -0.2205810546875, -0.12005615234375, -0.01953125, 0.08099365234375, 0.1815185546875, 0.28204345703125, 0.382568359375, 0.48309326171875, 0.5836181640625, 0.68414306640625, 0.78466796875, 0.88519287109375, 0.9857177734375, 1.08624267578125, 1.186767578125, 1.28729248046875, 1.3878173828125, 1.48834228515625, 1.5888671875, 1.68939208984375, 1.7899169921875, 1.89044189453125, 1.990966796875, 2.09149169921875, 2.1920166015625, 2.29254150390625, 2.39306640625, 2.49359130859375, 2.5941162109375, 2.69464111328125, 2.795166015625, 2.89569091796875, 2.9962158203125, 3.09674072265625, 3.197265625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 9.0, 7.0, 12.0, 8.0, 11.0, 15.0, 31.0, 37.0, 59.0, 87.0, 146.0, 292.0, 562.0, 998.0, 1943.0, 3601.0, 7005.0, 13254.0, 26384.0, 59046.0, 154251.0, 365473.0, 244748.0, 93463.0, 38427.0, 18393.0, 9377.0, 5170.0, 2681.0, 1376.0, 683.0, 422.0, 210.0, 117.0, 52.0, 65.0, 32.0, 23.0, 17.0, 10.0, 12.0, 9.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.51171875, -3.401092529296875, -3.29046630859375, -3.179840087890625, -3.0692138671875, -2.958587646484375, -2.84796142578125, -2.737335205078125, -2.626708984375, -2.516082763671875, -2.40545654296875, -2.294830322265625, -2.1842041015625, -2.073577880859375, -1.96295166015625, -1.852325439453125, -1.74169921875, -1.631072998046875, -1.52044677734375, -1.409820556640625, -1.2991943359375, -1.188568115234375, -1.07794189453125, -0.967315673828125, -0.856689453125, -0.746063232421875, -0.63543701171875, -0.524810791015625, -0.4141845703125, -0.303558349609375, -0.19293212890625, -0.082305908203125, 0.0283203125, 0.138946533203125, 0.24957275390625, 0.360198974609375, 0.4708251953125, 0.581451416015625, 0.69207763671875, 0.802703857421875, 0.913330078125, 1.023956298828125, 1.13458251953125, 1.245208740234375, 1.3558349609375, 1.466461181640625, 1.57708740234375, 1.687713623046875, 1.79833984375, 1.908966064453125, 2.01959228515625, 2.130218505859375, 2.2408447265625, 2.351470947265625, 2.46209716796875, 2.572723388671875, 2.683349609375, 2.793975830078125, 2.90460205078125, 3.015228271484375, 3.1258544921875, 3.236480712890625, 3.34710693359375, 3.457733154296875, 3.568359375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 3.0, 7.0, 5.0, 3.0, 5.0, 10.0, 13.0, 16.0, 15.0, 21.0, 29.0, 19.0, 28.0, 34.0, 28.0, 44.0, 55.0, 74.0, 92.0, 206.0, 1572.0, 265.0, 98.0, 76.0, 46.0, 56.0, 28.0, 27.0, 30.0, 24.0, 23.0, 21.0, 18.0, 20.0, 5.0, 14.0, 2.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-16.359375, -15.912109375, -15.46484375, -15.017578125, -14.5703125, -14.123046875, -13.67578125, -13.228515625, -12.78125, -12.333984375, -11.88671875, -11.439453125, -10.9921875, -10.544921875, -10.09765625, -9.650390625, -9.203125, -8.755859375, -8.30859375, -7.861328125, -7.4140625, -6.966796875, -6.51953125, -6.072265625, -5.625, -5.177734375, -4.73046875, -4.283203125, -3.8359375, -3.388671875, -2.94140625, -2.494140625, -2.046875, -1.599609375, -1.15234375, -0.705078125, -0.2578125, 0.189453125, 0.63671875, 1.083984375, 1.53125, 1.978515625, 2.42578125, 2.873046875, 3.3203125, 3.767578125, 4.21484375, 4.662109375, 5.109375, 5.556640625, 6.00390625, 6.451171875, 6.8984375, 7.345703125, 7.79296875, 8.240234375, 8.6875, 9.134765625, 9.58203125, 10.029296875, 10.4765625, 10.923828125, 11.37109375, 11.818359375, 12.265625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 4.0, 9.0, 4.0, 10.0, 11.0, 17.0, 19.0, 22.0, 25.0, 42.0, 50.0, 75.0, 106.0, 158.0, 202.0, 361.0, 806.0, 8823.0, 3036978.0, 94970.0, 1615.0, 447.0, 256.0, 163.0, 133.0, 93.0, 83.0, 48.0, 40.0, 28.0, 27.0, 12.0, 14.0, 9.0, 12.0, 7.0, 2.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.0, -37.80810546875, -36.6162109375, -35.42431640625, -34.232421875, -33.04052734375, -31.8486328125, -30.65673828125, -29.46484375, -28.27294921875, -27.0810546875, -25.88916015625, -24.697265625, -23.50537109375, -22.3134765625, -21.12158203125, -19.9296875, -18.73779296875, -17.5458984375, -16.35400390625, -15.162109375, -13.97021484375, -12.7783203125, -11.58642578125, -10.39453125, -9.20263671875, -8.0107421875, -6.81884765625, -5.626953125, -4.43505859375, -3.2431640625, -2.05126953125, -0.859375, 0.33251953125, 1.5244140625, 2.71630859375, 3.908203125, 5.10009765625, 6.2919921875, 7.48388671875, 8.67578125, 9.86767578125, 11.0595703125, 12.25146484375, 13.443359375, 14.63525390625, 15.8271484375, 17.01904296875, 18.2109375, 19.40283203125, 20.5947265625, 21.78662109375, 22.978515625, 24.17041015625, 25.3623046875, 26.55419921875, 27.74609375, 28.93798828125, 30.1298828125, 31.32177734375, 32.513671875, 33.70556640625, 34.8974609375, 36.08935546875, 37.28125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 380.0, 631.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.77734375, -289.5188293457031, -284.26031494140625, -279.0018005371094, -273.7432556152344, -268.4847412109375, -263.2262268066406, -257.96771240234375, -252.70919799804688, -247.45068359375, -242.19215393066406, -236.9336395263672, -231.6751251220703, -226.41659545898438, -221.1580810546875, -215.89956665039062, -210.6410369873047, -205.3825225830078, -200.12399291992188, -194.865478515625, -189.60696411132812, -184.34844970703125, -179.0899200439453, -173.83140563964844, -168.5728759765625, -163.31436157226562, -158.0558319091797, -152.7973175048828, -147.53880310058594, -142.2802734375, -137.02175903320312, -131.76324462890625, -126.50473022460938, -121.24620819091797, -115.9876937866211, -110.72917175292969, -105.47065734863281, -100.2121353149414, -94.95361328125, -89.69509887695312, -84.43658447265625, -79.17806243896484, -73.91954803466797, -68.66102600097656, -63.40250778198242, -58.14398956298828, -52.885467529296875, -47.626949310302734, -42.36842727661133, -37.10990905761719, -31.851388931274414, -26.59286880493164, -21.3343505859375, -16.07583236694336, -10.817312240600586, -5.5587921142578125, -0.3002738952636719, 4.958245277404785, 10.216764450073242, 15.4752836227417, 20.733802795410156, 25.992321014404297, 31.25084114074707, 36.509361267089844, 41.767879486083984]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 7.0, 6.0, 8.0, 14.0, 23.0, 22.0, 19.0, 19.0, 22.0, 28.0, 24.0, 27.0, 29.0, 29.0, 36.0, 40.0, 29.0, 52.0, 28.0, 35.0, 47.0, 34.0, 44.0, 33.0, 25.0, 37.0, 32.0, 24.0, 23.0, 33.0, 28.0, 17.0, 14.0, 11.0, 18.0, 10.0, 16.0, 7.0, 5.0, 9.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-29.192794799804688, -28.256088256835938, -27.319379806518555, -26.382673263549805, -25.445964813232422, -24.509258270263672, -23.572551727294922, -22.63584327697754, -21.69913673400879, -20.76243019104004, -19.825721740722656, -18.889015197753906, -17.952306747436523, -17.015600204467773, -16.07889175415039, -15.14218521118164, -14.205477714538574, -13.268770217895508, -12.332062721252441, -11.395355224609375, -10.458648681640625, -9.521941184997559, -8.585233688354492, -7.648526668548584, -6.711819171905518, -5.775111675262451, -4.838404655456543, -3.9016971588134766, -2.9649899005889893, -2.028282642364502, -1.0915751457214355, -0.15486812591552734, 0.7818393707275391, 1.7185466289520264, 2.6552538871765137, 3.59196138381958, 4.528668403625488, 5.465375900268555, 6.402083396911621, 7.338790416717529, 8.275497436523438, 9.212204933166504, 10.14891242980957, 11.08561897277832, 12.022326469421387, 12.959033966064453, 13.89574146270752, 14.832448959350586, 15.769156455993652, 16.70586395263672, 17.64257049560547, 18.57927894592285, 19.5159854888916, 20.452693939208984, 21.389400482177734, 22.326107025146484, 23.262815475463867, 24.199522018432617, 25.13623046875, 26.07293701171875, 27.009645462036133, 27.946352005004883, 28.883060455322266, 29.819766998291016, 30.756473541259766]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 8.0, 7.0, 10.0, 8.0, 8.0, 16.0, 18.0, 17.0, 31.0, 33.0, 29.0, 24.0, 22.0, 36.0, 41.0, 44.0, 33.0, 50.0, 35.0, 45.0, 38.0, 49.0, 41.0, 44.0, 38.0, 25.0, 37.0, 18.0, 25.0, 24.0, 26.0, 19.0, 16.0, 18.0, 14.0, 7.0, 9.0, 6.0, 8.0, 8.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.947998046875, -3.82177734375, -3.695556640625, -3.5693359375, -3.443115234375, -3.31689453125, -3.190673828125, -3.064453125, -2.938232421875, -2.81201171875, -2.685791015625, -2.5595703125, -2.433349609375, -2.30712890625, -2.180908203125, -2.0546875, -1.928466796875, -1.80224609375, -1.676025390625, -1.5498046875, -1.423583984375, -1.29736328125, -1.171142578125, -1.044921875, -0.918701171875, -0.79248046875, -0.666259765625, -0.5400390625, -0.413818359375, -0.28759765625, -0.161376953125, -0.03515625, 0.091064453125, 0.21728515625, 0.343505859375, 0.4697265625, 0.595947265625, 0.72216796875, 0.848388671875, 0.974609375, 1.100830078125, 1.22705078125, 1.353271484375, 1.4794921875, 1.605712890625, 1.73193359375, 1.858154296875, 1.984375, 2.110595703125, 2.23681640625, 2.363037109375, 2.4892578125, 2.615478515625, 2.74169921875, 2.867919921875, 2.994140625, 3.120361328125, 3.24658203125, 3.372802734375, 3.4990234375, 3.625244140625, 3.75146484375, 3.877685546875, 4.00390625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 1.0, 8.0, 9.0, 7.0, 5.0, 9.0, 12.0, 14.0, 24.0, 40.0, 40.0, 39.0, 55.0, 86.0, 120.0, 218.0, 419.0, 1334.0, 7496.0, 81855.0, 1146537.0, 2561271.0, 364366.0, 25475.0, 3126.0, 779.0, 300.0, 167.0, 116.0, 80.0, 67.0, 52.0, 38.0, 26.0, 23.0, 14.0, 9.0, 10.0, 11.0, 5.0, 5.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.3125, -11.0006103515625, -10.688720703125, -10.3768310546875, -10.06494140625, -9.7530517578125, -9.441162109375, -9.1292724609375, -8.8173828125, -8.5054931640625, -8.193603515625, -7.8817138671875, -7.56982421875, -7.2579345703125, -6.946044921875, -6.6341552734375, -6.322265625, -6.0103759765625, -5.698486328125, -5.3865966796875, -5.07470703125, -4.7628173828125, -4.450927734375, -4.1390380859375, -3.8271484375, -3.5152587890625, -3.203369140625, -2.8914794921875, -2.57958984375, -2.2677001953125, -1.955810546875, -1.6439208984375, -1.33203125, -1.0201416015625, -0.708251953125, -0.3963623046875, -0.08447265625, 0.2274169921875, 0.539306640625, 0.8511962890625, 1.1630859375, 1.4749755859375, 1.786865234375, 2.0987548828125, 2.41064453125, 2.7225341796875, 3.034423828125, 3.3463134765625, 3.658203125, 3.9700927734375, 4.281982421875, 4.5938720703125, 4.90576171875, 5.2176513671875, 5.529541015625, 5.8414306640625, 6.1533203125, 6.4652099609375, 6.777099609375, 7.0889892578125, 7.40087890625, 7.7127685546875, 8.024658203125, 8.3365478515625, 8.6484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 15.0, 12.0, 15.0, 25.0, 33.0, 38.0, 52.0, 77.0, 84.0, 110.0, 151.0, 207.0, 246.0, 255.0, 401.0, 399.0, 409.0, 334.0, 265.0, 209.0, 182.0, 131.0, 105.0, 80.0, 48.0, 19.0, 33.0, 33.0, 23.0, 15.0, 15.0, 8.0, 8.0, 6.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.43994140625, -6.2236328125, -6.00732421875, -5.791015625, -5.57470703125, -5.3583984375, -5.14208984375, -4.92578125, -4.70947265625, -4.4931640625, -4.27685546875, -4.060546875, -3.84423828125, -3.6279296875, -3.41162109375, -3.1953125, -2.97900390625, -2.7626953125, -2.54638671875, -2.330078125, -2.11376953125, -1.8974609375, -1.68115234375, -1.46484375, -1.24853515625, -1.0322265625, -0.81591796875, -0.599609375, -0.38330078125, -0.1669921875, 0.04931640625, 0.265625, 0.48193359375, 0.6982421875, 0.91455078125, 1.130859375, 1.34716796875, 1.5634765625, 1.77978515625, 1.99609375, 2.21240234375, 2.4287109375, 2.64501953125, 2.861328125, 3.07763671875, 3.2939453125, 3.51025390625, 3.7265625, 3.94287109375, 4.1591796875, 4.37548828125, 4.591796875, 4.80810546875, 5.0244140625, 5.24072265625, 5.45703125, 5.67333984375, 5.8896484375, 6.10595703125, 6.322265625, 6.53857421875, 6.7548828125, 6.97119140625, 7.1875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 6.0, 6.0, 14.0, 9.0, 21.0, 37.0, 34.0, 25.0, 35.0, 61.0, 102.0, 144.0, 173.0, 236.0, 364.0, 856.0, 17857.0, 3280994.0, 886691.0, 4826.0, 574.0, 328.0, 217.0, 185.0, 104.0, 91.0, 67.0, 49.0, 42.0, 37.0, 17.0, 14.0, 14.0, 11.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.03125, -31.0849609375, -30.138671875, -29.1923828125, -28.24609375, -27.2998046875, -26.353515625, -25.4072265625, -24.4609375, -23.5146484375, -22.568359375, -21.6220703125, -20.67578125, -19.7294921875, -18.783203125, -17.8369140625, -16.890625, -15.9443359375, -14.998046875, -14.0517578125, -13.10546875, -12.1591796875, -11.212890625, -10.2666015625, -9.3203125, -8.3740234375, -7.427734375, -6.4814453125, -5.53515625, -4.5888671875, -3.642578125, -2.6962890625, -1.75, -0.8037109375, 0.142578125, 1.0888671875, 2.03515625, 2.9814453125, 3.927734375, 4.8740234375, 5.8203125, 6.7666015625, 7.712890625, 8.6591796875, 9.60546875, 10.5517578125, 11.498046875, 12.4443359375, 13.390625, 14.3369140625, 15.283203125, 16.2294921875, 17.17578125, 18.1220703125, 19.068359375, 20.0146484375, 20.9609375, 21.9072265625, 22.853515625, 23.7998046875, 24.74609375, 25.6923828125, 26.638671875, 27.5849609375, 28.53125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 21.0, 47.0, 87.0, 143.0, 200.0, 177.0, 147.0, 105.0, 46.0, 25.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.91415786743164, -52.18389129638672, -50.4536247253418, -48.723358154296875, -46.99308776855469, -45.262821197509766, -43.532554626464844, -41.80228805541992, -40.072021484375, -38.34175491333008, -36.611488342285156, -34.88121795654297, -33.15095138549805, -31.420684814453125, -29.690418243408203, -27.96015167236328, -26.229883193969727, -24.499616622924805, -22.76934814453125, -21.039081573486328, -19.308815002441406, -17.578548431396484, -15.84827995300293, -14.118013381958008, -12.38774585723877, -10.657478332519531, -8.92721176147461, -7.196944236755371, -5.466677188873291, -3.736410140991211, -2.0061426162719727, -0.2758760452270508, 1.4543914794921875, 3.1846585273742676, 4.914925575256348, 6.645193099975586, 8.375459671020508, 10.105727195739746, 11.835994720458984, 13.566261291503906, 15.296528816223145, 17.026796340942383, 18.757062911987305, 20.48733139038086, 22.21759796142578, 23.947864532470703, 25.678131103515625, 27.408397674560547, 29.1386661529541, 30.868932723999023, 32.59920120239258, 34.3294677734375, 36.05973434448242, 37.790000915527344, 39.52027130126953, 41.25053405761719, 42.980804443359375, 44.7110710144043, 46.44133758544922, 48.171607971191406, 49.90187454223633, 51.63214111328125, 53.36240768432617, 55.092674255371094, 56.822940826416016]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 2.0, 1.0, 7.0, 3.0, 10.0, 10.0, 12.0, 13.0, 14.0, 16.0, 19.0, 27.0, 25.0, 22.0, 27.0, 25.0, 30.0, 43.0, 40.0, 33.0, 40.0, 38.0, 50.0, 41.0, 29.0, 45.0, 30.0, 37.0, 42.0, 26.0, 25.0, 23.0, 25.0, 24.0, 22.0, 16.0, 14.0, 18.0, 12.0, 14.0, 6.0, 14.0, 10.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-24.63397216796875, -23.928255081176758, -23.222537994384766, -22.51681900024414, -21.81110191345215, -21.105384826660156, -20.39966583251953, -19.69394874572754, -18.988231658935547, -18.282514572143555, -17.576797485351562, -16.871078491210938, -16.165361404418945, -15.459644317626953, -14.753926277160645, -14.048208236694336, -13.342491149902344, -12.636774063110352, -11.931056022644043, -11.225337982177734, -10.519620895385742, -9.81390380859375, -9.108185768127441, -8.402467727661133, -7.696750640869141, -6.99103307723999, -6.28531551361084, -5.5795979499816895, -4.873880386352539, -4.168162822723389, -3.4624452590942383, -2.756727695465088, -2.0510101318359375, -1.345292568206787, -0.6395750045776367, 0.06614255905151367, 0.7718601226806641, 1.4775776863098145, 2.183295249938965, 2.8890128135681152, 3.5947303771972656, 4.300447940826416, 5.006165504455566, 5.711883068084717, 6.417600631713867, 7.123318195343018, 7.829035758972168, 8.534753799438477, 9.240470886230469, 9.946187973022461, 10.65190601348877, 11.357624053955078, 12.06334114074707, 12.769058227539062, 13.474776268005371, 14.18049430847168, 14.886211395263672, 15.591928482055664, 16.297645568847656, 17.00336456298828, 17.709081649780273, 18.414798736572266, 19.12051773071289, 19.826234817504883, 20.531951904296875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 13.0, 3.0, 6.0, 5.0, 6.0, 12.0, 16.0, 17.0, 16.0, 20.0, 30.0, 27.0, 24.0, 34.0, 35.0, 32.0, 31.0, 35.0, 45.0, 46.0, 44.0, 50.0, 38.0, 47.0, 30.0, 34.0, 49.0, 25.0, 26.0, 29.0, 15.0, 23.0, 12.0, 20.0, 23.0, 15.0, 17.0, 13.0, 15.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-4.19921875, -4.08270263671875, -3.9661865234375, -3.84967041015625, -3.733154296875, -3.61663818359375, -3.5001220703125, -3.38360595703125, -3.26708984375, -3.15057373046875, -3.0340576171875, -2.91754150390625, -2.801025390625, -2.68450927734375, -2.5679931640625, -2.45147705078125, -2.3349609375, -2.21844482421875, -2.1019287109375, -1.98541259765625, -1.868896484375, -1.75238037109375, -1.6358642578125, -1.51934814453125, -1.40283203125, -1.28631591796875, -1.1697998046875, -1.05328369140625, -0.936767578125, -0.82025146484375, -0.7037353515625, -0.58721923828125, -0.470703125, -0.35418701171875, -0.2376708984375, -0.12115478515625, -0.004638671875, 0.11187744140625, 0.2283935546875, 0.34490966796875, 0.46142578125, 0.57794189453125, 0.6944580078125, 0.81097412109375, 0.927490234375, 1.04400634765625, 1.1605224609375, 1.27703857421875, 1.3935546875, 1.51007080078125, 1.6265869140625, 1.74310302734375, 1.859619140625, 1.97613525390625, 2.0926513671875, 2.20916748046875, 2.32568359375, 2.44219970703125, 2.5587158203125, 2.67523193359375, 2.791748046875, 2.90826416015625, 3.0247802734375, 3.14129638671875, 3.2578125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 16.0, 18.0, 21.0, 53.0, 60.0, 105.0, 185.0, 281.0, 469.0, 927.0, 1618.0, 3056.0, 5380.0, 10297.0, 19490.0, 39358.0, 78845.0, 157149.0, 260675.0, 224806.0, 122159.0, 60671.0, 29628.0, 15381.0, 8041.0, 4499.0, 2365.0, 1325.0, 699.0, 370.0, 202.0, 136.0, 115.0, 57.0, 34.0, 19.0, 18.0, 12.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.483642578125, -0.4674186706542969, -0.45119476318359375, -0.4349708557128906, -0.4187469482421875, -0.4025230407714844, -0.38629913330078125, -0.3700752258300781, -0.353851318359375, -0.3376274108886719, -0.32140350341796875, -0.3051795959472656, -0.2889556884765625, -0.2727317810058594, -0.25650787353515625, -0.24028396606445312, -0.22406005859375, -0.20783615112304688, -0.19161224365234375, -0.17538833618164062, -0.1591644287109375, -0.14294052124023438, -0.12671661376953125, -0.11049270629882812, -0.094268798828125, -0.07804489135742188, -0.06182098388671875, -0.045597076416015625, -0.0293731689453125, -0.013149261474609375, 0.00307464599609375, 0.019298553466796875, 0.0355224609375, 0.051746368408203125, 0.06797027587890625, 0.08419418334960938, 0.1004180908203125, 0.11664199829101562, 0.13286590576171875, 0.14908981323242188, 0.165313720703125, 0.18153762817382812, 0.19776153564453125, 0.21398544311523438, 0.2302093505859375, 0.24643325805664062, 0.26265716552734375, 0.2788810729980469, 0.29510498046875, 0.3113288879394531, 0.32755279541015625, 0.3437767028808594, 0.3600006103515625, 0.3762245178222656, 0.39244842529296875, 0.4086723327636719, 0.424896240234375, 0.4411201477050781, 0.45734405517578125, 0.4735679626464844, 0.4897918701171875, 0.5060157775878906, 0.5222396850585938, 0.5384635925292969, 0.5546875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 5.0, 7.0, 14.0, 9.0, 21.0, 12.0, 14.0, 23.0, 15.0, 21.0, 18.0, 33.0, 29.0, 29.0, 33.0, 36.0, 36.0, 32.0, 30.0, 30.0, 1059.0, 31.0, 40.0, 36.0, 31.0, 35.0, 37.0, 30.0, 20.0, 34.0, 33.0, 31.0, 20.0, 20.0, 23.0, 12.0, 16.0, 8.0, 12.0, 16.0, 12.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.404296875, -2.335479736328125, -2.26666259765625, -2.197845458984375, -2.1290283203125, -2.060211181640625, -1.99139404296875, -1.922576904296875, -1.853759765625, -1.784942626953125, -1.71612548828125, -1.647308349609375, -1.5784912109375, -1.509674072265625, -1.44085693359375, -1.372039794921875, -1.30322265625, -1.234405517578125, -1.16558837890625, -1.096771240234375, -1.0279541015625, -0.959136962890625, -0.89031982421875, -0.821502685546875, -0.752685546875, -0.683868408203125, -0.61505126953125, -0.546234130859375, -0.4774169921875, -0.408599853515625, -0.33978271484375, -0.270965576171875, -0.2021484375, -0.133331298828125, -0.06451416015625, 0.004302978515625, 0.0731201171875, 0.141937255859375, 0.21075439453125, 0.279571533203125, 0.348388671875, 0.417205810546875, 0.48602294921875, 0.554840087890625, 0.6236572265625, 0.692474365234375, 0.76129150390625, 0.830108642578125, 0.89892578125, 0.967742919921875, 1.03656005859375, 1.105377197265625, 1.1741943359375, 1.243011474609375, 1.31182861328125, 1.380645751953125, 1.449462890625, 1.518280029296875, 1.58709716796875, 1.655914306640625, 1.7247314453125, 1.793548583984375, 1.86236572265625, 1.931182861328125, 2.0]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 17.0, 13.0, 21.0, 36.0, 58.0, 98.0, 105.0, 182.0, 228.0, 389.0, 513.0, 778.0, 1178.0, 1677.0, 2479.0, 3617.0, 5372.0, 8080.0, 12075.0, 18267.0, 27388.0, 40528.0, 59089.0, 85548.0, 116205.0, 823326.0, 509865.0, 115439.0, 84246.0, 58739.0, 39791.0, 27013.0, 18151.0, 11852.0, 7983.0, 5370.0, 3704.0, 2493.0, 1621.0, 1098.0, 760.0, 524.0, 378.0, 270.0, 195.0, 112.0, 77.0, 77.0, 41.0, 28.0, 19.0, 5.0, 7.0, 3.0, 4.0, 2.0, 2.0], "bins": [-0.227783203125, -0.22087669372558594, -0.21397018432617188, -0.2070636749267578, -0.20015716552734375, -0.1932506561279297, -0.18634414672851562, -0.17943763732910156, -0.1725311279296875, -0.16562461853027344, -0.15871810913085938, -0.1518115997314453, -0.14490509033203125, -0.1379985809326172, -0.13109207153320312, -0.12418556213378906, -0.117279052734375, -0.11037254333496094, -0.10346603393554688, -0.09655952453613281, -0.08965301513671875, -0.08274650573730469, -0.07583999633789062, -0.06893348693847656, -0.0620269775390625, -0.05512046813964844, -0.048213958740234375, -0.04130744934082031, -0.03440093994140625, -0.027494430541992188, -0.020587921142578125, -0.013681411743164062, -0.00677490234375, 0.0001316070556640625, 0.007038116455078125, 0.013944625854492188, 0.02085113525390625, 0.027757644653320312, 0.034664154052734375, 0.04157066345214844, 0.0484771728515625, 0.05538368225097656, 0.062290191650390625, 0.06919670104980469, 0.07610321044921875, 0.08300971984863281, 0.08991622924804688, 0.09682273864746094, 0.103729248046875, 0.11063575744628906, 0.11754226684570312, 0.12444877624511719, 0.13135528564453125, 0.1382617950439453, 0.14516830444335938, 0.15207481384277344, 0.1589813232421875, 0.16588783264160156, 0.17279434204101562, 0.1797008514404297, 0.18660736083984375, 0.1935138702392578, 0.20042037963867188, 0.20732688903808594, 0.2142333984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 5.0, 0.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 14.0, 20.0, 21.0, 24.0, 39.0, 41.0, 61.0, 69.0, 89.0, 106.0, 72.0, 80.0, 58.0, 58.0, 43.0, 42.0, 30.0, 15.0, 28.0, 12.0, 6.0, 4.0, 7.0, 4.0, 8.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.00628662109375, -0.006097197532653809, -0.005907773971557617, -0.005718350410461426, -0.005528926849365234, -0.005339503288269043, -0.0051500797271728516, -0.00496065616607666, -0.004771232604980469, -0.004581809043884277, -0.004392385482788086, -0.0042029619216918945, -0.004013538360595703, -0.0038241147994995117, -0.0036346912384033203, -0.003445267677307129, -0.0032558441162109375, -0.003066420555114746, -0.0028769969940185547, -0.0026875734329223633, -0.002498149871826172, -0.0023087263107299805, -0.002119302749633789, -0.0019298791885375977, -0.0017404556274414062, -0.0015510320663452148, -0.0013616085052490234, -0.001172184944152832, -0.0009827613830566406, -0.0007933378219604492, -0.0006039142608642578, -0.0004144906997680664, -0.000225067138671875, -3.5643577575683594e-05, 0.0001537799835205078, 0.0003432035446166992, 0.0005326271057128906, 0.000722050666809082, 0.0009114742279052734, 0.0011008977890014648, 0.0012903213500976562, 0.0014797449111938477, 0.001669168472290039, 0.0018585920333862305, 0.002048015594482422, 0.0022374391555786133, 0.0024268627166748047, 0.002616286277770996, 0.0028057098388671875, 0.002995133399963379, 0.0031845569610595703, 0.0033739805221557617, 0.003563404083251953, 0.0037528276443481445, 0.003942251205444336, 0.004131674766540527, 0.004321098327636719, 0.00451052188873291, 0.0046999454498291016, 0.004889369010925293, 0.005078792572021484, 0.005268216133117676, 0.005457639694213867, 0.005647063255310059, 0.00583648681640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 9.0, 7.0, 10.0, 6.0, 12.0, 14.0, 29.0, 44.0, 40.0, 85.0, 127.0, 153.0, 313.0, 725.0, 73341.0, 971016.0, 1513.0, 425.0, 218.0, 137.0, 82.0, 57.0, 42.0, 32.0, 25.0, 20.0, 10.0, 7.0, 7.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11846923828125, -0.1146707534790039, -0.11087226867675781, -0.10707378387451172, -0.10327529907226562, -0.09947681427001953, -0.09567832946777344, -0.09187984466552734, -0.08808135986328125, -0.08428287506103516, -0.08048439025878906, -0.07668590545654297, -0.07288742065429688, -0.06908893585205078, -0.06529045104980469, -0.061491966247558594, -0.0576934814453125, -0.053894996643066406, -0.05009651184082031, -0.04629802703857422, -0.042499542236328125, -0.03870105743408203, -0.03490257263183594, -0.031104087829589844, -0.02730560302734375, -0.023507118225097656, -0.019708633422851562, -0.01591014862060547, -0.012111663818359375, -0.008313179016113281, -0.0045146942138671875, -0.0007162094116210938, 0.003082275390625, 0.006880760192871094, 0.010679244995117188, 0.014477729797363281, 0.018276214599609375, 0.02207469940185547, 0.025873184204101562, 0.029671669006347656, 0.03347015380859375, 0.037268638610839844, 0.04106712341308594, 0.04486560821533203, 0.048664093017578125, 0.05246257781982422, 0.05626106262207031, 0.060059547424316406, 0.0638580322265625, 0.0676565170288086, 0.07145500183105469, 0.07525348663330078, 0.07905197143554688, 0.08285045623779297, 0.08664894104003906, 0.09044742584228516, 0.09424591064453125, 0.09804439544677734, 0.10184288024902344, 0.10564136505126953, 0.10943984985351562, 0.11323833465576172, 0.11703681945800781, 0.1208353042602539, 0.1246337890625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [40.0, 830.0, 139.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017441656673327088, -0.0006225272081792355, 0.0004991112509742379, 0.0016207498265430331, 0.0027423882856965065, 0.003864026628434658, 0.004985665436834097, 0.0061073037795722485, 0.0072289421223104, 0.008350580930709839, 0.00947221927344799, 0.010593857616186142, 0.011715495958924294, 0.012837134301662445, 0.013958772644400597, 0.015080410987138748, 0.0162020493298769, 0.01732368767261505, 0.018445326015353203, 0.019566964358091354, 0.020688602700829506, 0.021810241043567657, 0.022931881248950958, 0.02405351772904396, 0.02517515793442726, 0.026296796277165413, 0.027418434619903564, 0.028540072962641716, 0.029661711305379868, 0.03078334964811802, 0.03190498799085617, 0.03302662819623947, 0.034148264676332474, 0.035269904881715775, 0.03639154136180878, 0.03751318156719208, 0.03863481804728508, 0.03975645825266838, 0.04087809473276138, 0.041999734938144684, 0.043121371418237686, 0.04424301162362099, 0.04536464810371399, 0.04648628830909729, 0.04760792478919029, 0.04872956499457359, 0.049851201474666595, 0.050972841680049896, 0.0520944818854332, 0.0532161220908165, 0.0543377585709095, 0.0554593987762928, 0.0565810352563858, 0.057702675461769104, 0.058824311941862106, 0.05994595214724541, 0.06106758862733841, 0.06218922883272171, 0.06331086903810501, 0.06443250179290771, 0.06555414199829102, 0.06667578220367432, 0.06779742240905762, 0.06891905516386032, 0.07004069536924362]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 5.0, 9.0, 13.0, 19.0, 15.0, 27.0, 40.0, 34.0, 45.0, 45.0, 43.0, 60.0, 59.0, 69.0, 75.0, 71.0, 59.0, 51.0, 45.0, 29.0, 38.0, 27.0, 25.0, 26.0, 17.0, 6.0, 18.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004349350929260254, -0.004208815284073353, -0.004068279638886452, -0.003927743993699551, -0.0037872083485126495, -0.0036466727033257484, -0.0035061370581388474, -0.0033656014129519463, -0.003225065767765045, -0.003084530122578144, -0.002943994477391243, -0.002803458832204342, -0.002662923187017441, -0.0025223875418305397, -0.0023818518966436386, -0.0022413162514567375, -0.0021007806062698364, -0.0019602449610829353, -0.0018197093158960342, -0.0016791736707091331, -0.001538638025522232, -0.001398102380335331, -0.0012575667351484299, -0.0011170310899615288, -0.0009764954447746277, -0.0008359597995877266, -0.0006954241544008255, -0.0005548885092139244, -0.0004143528640270233, -0.0002738172188401222, -0.00013328157365322113, 7.254071533679962e-06, 0.00014778971672058105, 0.00028832536190748215, 0.00042886100709438324, 0.0005693966522812843, 0.0007099322974681854, 0.0008504679426550865, 0.0009910035878419876, 0.0011315392330288887, 0.0012720748782157898, 0.0014126105234026909, 0.001553146168589592, 0.001693681813776493, 0.0018342174589633942, 0.0019747531041502953, 0.0021152887493371964, 0.0022558243945240974, 0.0023963600397109985, 0.0025368956848978996, 0.0026774313300848007, 0.002817966975271702, 0.002958502620458603, 0.003099038265645504, 0.003239573910832405, 0.003380109556019306, 0.0035206452012062073, 0.0036611808463931084, 0.0038017164915800095, 0.0039422521367669106, 0.004082787781953812, 0.004223323427140713, 0.004363859072327614, 0.004504394717514515, 0.004644930362701416]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 13.0, 3.0, 6.0, 5.0, 6.0, 12.0, 16.0, 17.0, 16.0, 20.0, 30.0, 27.0, 24.0, 34.0, 35.0, 32.0, 31.0, 35.0, 45.0, 47.0, 43.0, 50.0, 38.0, 47.0, 30.0, 34.0, 49.0, 25.0, 26.0, 29.0, 15.0, 23.0, 12.0, 20.0, 23.0, 15.0, 17.0, 13.0, 15.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-4.19921875, -4.08270263671875, -3.9661865234375, -3.84967041015625, -3.733154296875, -3.61663818359375, -3.5001220703125, -3.38360595703125, -3.26708984375, -3.15057373046875, -3.0340576171875, -2.91754150390625, -2.801025390625, -2.68450927734375, -2.5679931640625, -2.45147705078125, -2.3349609375, -2.21844482421875, -2.1019287109375, -1.98541259765625, -1.868896484375, -1.75238037109375, -1.6358642578125, -1.51934814453125, -1.40283203125, -1.28631591796875, -1.1697998046875, -1.05328369140625, -0.936767578125, -0.82025146484375, -0.7037353515625, -0.58721923828125, -0.470703125, -0.35418701171875, -0.2376708984375, -0.12115478515625, -0.004638671875, 0.11187744140625, 0.2283935546875, 0.34490966796875, 0.46142578125, 0.57794189453125, 0.6944580078125, 0.81097412109375, 0.927490234375, 1.04400634765625, 1.1605224609375, 1.27703857421875, 1.3935546875, 1.51007080078125, 1.6265869140625, 1.74310302734375, 1.859619140625, 1.97613525390625, 2.0926513671875, 2.20916748046875, 2.32568359375, 2.44219970703125, 2.5587158203125, 2.67523193359375, 2.791748046875, 2.90826416015625, 3.0247802734375, 3.14129638671875, 3.2578125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 10.0, 13.0, 18.0, 15.0, 17.0, 19.0, 42.0, 53.0, 71.0, 92.0, 144.0, 215.0, 374.0, 710.0, 1536.0, 3245.0, 7278.0, 16452.0, 36881.0, 86182.0, 210144.0, 378496.0, 176682.0, 72445.0, 31497.0, 14025.0, 6158.0, 2894.0, 1230.0, 587.0, 309.0, 180.0, 131.0, 98.0, 61.0, 58.0, 50.0, 33.0, 30.0, 16.0, 14.0, 13.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-4.33984375, -4.217254638671875, -4.09466552734375, -3.972076416015625, -3.8494873046875, -3.726898193359375, -3.60430908203125, -3.481719970703125, -3.359130859375, -3.236541748046875, -3.11395263671875, -2.991363525390625, -2.8687744140625, -2.746185302734375, -2.62359619140625, -2.501007080078125, -2.37841796875, -2.255828857421875, -2.13323974609375, -2.010650634765625, -1.8880615234375, -1.765472412109375, -1.64288330078125, -1.520294189453125, -1.397705078125, -1.275115966796875, -1.15252685546875, -1.029937744140625, -0.9073486328125, -0.784759521484375, -0.66217041015625, -0.539581298828125, -0.4169921875, -0.294403076171875, -0.17181396484375, -0.049224853515625, 0.0733642578125, 0.195953369140625, 0.31854248046875, 0.441131591796875, 0.563720703125, 0.686309814453125, 0.80889892578125, 0.931488037109375, 1.0540771484375, 1.176666259765625, 1.29925537109375, 1.421844482421875, 1.54443359375, 1.667022705078125, 1.78961181640625, 1.912200927734375, 2.0347900390625, 2.157379150390625, 2.27996826171875, 2.402557373046875, 2.525146484375, 2.647735595703125, 2.77032470703125, 2.892913818359375, 3.0155029296875, 3.138092041015625, 3.26068115234375, 3.383270263671875, 3.505859375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 6.0, 8.0, 12.0, 10.0, 15.0, 17.0, 28.0, 25.0, 35.0, 30.0, 40.0, 58.0, 58.0, 96.0, 140.0, 1502.0, 408.0, 124.0, 69.0, 54.0, 49.0, 47.0, 49.0, 24.0, 24.0, 21.0, 29.0, 17.0, 18.0, 10.0, 12.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0234375, -11.5596923828125, -11.095947265625, -10.6322021484375, -10.16845703125, -9.7047119140625, -9.240966796875, -8.7772216796875, -8.3134765625, -7.8497314453125, -7.385986328125, -6.9222412109375, -6.45849609375, -5.9947509765625, -5.531005859375, -5.0672607421875, -4.603515625, -4.1397705078125, -3.676025390625, -3.2122802734375, -2.74853515625, -2.2847900390625, -1.821044921875, -1.3572998046875, -0.8935546875, -0.4298095703125, 0.033935546875, 0.4976806640625, 0.96142578125, 1.4251708984375, 1.888916015625, 2.3526611328125, 2.81640625, 3.2801513671875, 3.743896484375, 4.2076416015625, 4.67138671875, 5.1351318359375, 5.598876953125, 6.0626220703125, 6.5263671875, 6.9901123046875, 7.453857421875, 7.9176025390625, 8.38134765625, 8.8450927734375, 9.308837890625, 9.7725830078125, 10.236328125, 10.7000732421875, 11.163818359375, 11.6275634765625, 12.09130859375, 12.5550537109375, 13.018798828125, 13.4825439453125, 13.9462890625, 14.4100341796875, 14.873779296875, 15.3375244140625, 15.80126953125, 16.2650146484375, 16.728759765625, 17.1925048828125, 17.65625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 4.0, 6.0, 5.0, 12.0, 29.0, 39.0, 36.0, 68.0, 91.0, 114.0, 196.0, 448.0, 1010.0, 7384.0, 3115869.0, 18046.0, 1226.0, 450.0, 235.0, 137.0, 94.0, 47.0, 46.0, 24.0, 28.0, 13.0, 10.0, 6.0, 3.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.90625, -49.34375, -47.78125, -46.21875, -44.65625, -43.09375, -41.53125, -39.96875, -38.40625, -36.84375, -35.28125, -33.71875, -32.15625, -30.59375, -29.03125, -27.46875, -25.90625, -24.34375, -22.78125, -21.21875, -19.65625, -18.09375, -16.53125, -14.96875, -13.40625, -11.84375, -10.28125, -8.71875, -7.15625, -5.59375, -4.03125, -2.46875, -0.90625, 0.65625, 2.21875, 3.78125, 5.34375, 6.90625, 8.46875, 10.03125, 11.59375, 13.15625, 14.71875, 16.28125, 17.84375, 19.40625, 20.96875, 22.53125, 24.09375, 25.65625, 27.21875, 28.78125, 30.34375, 31.90625, 33.46875, 35.03125, 36.59375, 38.15625, 39.71875, 41.28125, 42.84375, 44.40625, 45.96875, 47.53125, 49.09375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 81.0, 499.0, 380.0, 53.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0781831741333, -9.587721824645996, -7.09726095199585, -4.606800079345703, -2.1163387298583984, 0.37412261962890625, 2.8645830154418945, 5.355044364929199, 7.845505714416504, 10.335967063903809, 12.826427459716797, 15.316888809204102, 17.807350158691406, 20.29781150817871, 22.788272857666016, 25.278732299804688, 27.769195556640625, 30.25965690612793, 32.750118255615234, 35.240577697753906, 37.731040954589844, 40.221500396728516, 42.71195983886719, 45.202423095703125, 47.6928825378418, 50.18334197998047, 52.673805236816406, 55.16426467895508, 57.654727935791016, 60.14518737792969, 62.635650634765625, 65.12611389160156, 67.61656951904297, 70.1070327758789, 72.59748840332031, 75.08795166015625, 77.57841491699219, 80.06887817382812, 82.55933380126953, 85.04979705810547, 87.5402603149414, 90.03072357177734, 92.52117919921875, 95.01164245605469, 97.50210571289062, 99.99256896972656, 102.48302459716797, 104.9734878540039, 107.46394348144531, 109.95440673828125, 112.44486236572266, 114.9353256225586, 117.42578887939453, 119.91625213623047, 122.40670776367188, 124.89717102050781, 127.38763427734375, 129.8780975341797, 132.36856079101562, 134.85902404785156, 137.34947204589844, 139.83993530273438, 142.3303985595703, 144.82086181640625, 147.3113250732422]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 8.0, 4.0, 13.0, 10.0, 8.0, 12.0, 15.0, 20.0, 12.0, 22.0, 34.0, 30.0, 32.0, 31.0, 29.0, 27.0, 44.0, 40.0, 41.0, 29.0, 39.0, 47.0, 35.0, 43.0, 48.0, 33.0, 42.0, 41.0, 33.0, 38.0, 25.0, 17.0, 25.0, 15.0, 12.0, 5.0, 4.0, 18.0, 9.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.48008918762207, -29.532920837402344, -28.585750579833984, -27.638582229614258, -26.69141387939453, -25.744243621826172, -24.797075271606445, -23.84990692138672, -22.90273666381836, -21.955568313598633, -21.008398056030273, -20.061229705810547, -19.11406135559082, -18.166893005371094, -17.219722747802734, -16.272554397583008, -15.325386047363281, -14.378216743469238, -13.431048393249512, -12.483879089355469, -11.536710739135742, -10.5895414352417, -9.642372131347656, -8.69520378112793, -7.748034477233887, -6.800865650177002, -5.853696823120117, -4.906527519226074, -3.9593586921691895, -3.0121898651123047, -2.0650205612182617, -1.117851734161377, -0.170684814453125, 0.7764841318130493, 1.7236530780792236, 2.6708221435546875, 3.6179909706115723, 4.565159797668457, 5.5123291015625, 6.459497928619385, 7.4066667556762695, 8.353836059570312, 9.301004409790039, 10.248173713684082, 11.195343017578125, 12.142511367797852, 13.089680671691895, 14.036849975585938, 14.984018325805664, 15.931187629699707, 16.87835693359375, 17.825525283813477, 18.772693634033203, 19.719863891601562, 20.66703224182129, 21.614200592041016, 22.561370849609375, 23.5085391998291, 24.45570945739746, 25.402877807617188, 26.350046157836914, 27.29721450805664, 28.244384765625, 29.191553115844727, 30.138721466064453]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 10.0, 7.0, 8.0, 8.0, 15.0, 17.0, 16.0, 14.0, 24.0, 24.0, 30.0, 39.0, 29.0, 29.0, 34.0, 34.0, 41.0, 43.0, 47.0, 45.0, 55.0, 42.0, 29.0, 28.0, 31.0, 29.0, 30.0, 23.0, 22.0, 27.0, 20.0, 18.0, 18.0, 19.0, 13.0, 19.0, 13.0, 14.0, 6.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.375, -4.248870849609375, -4.12274169921875, -3.996612548828125, -3.8704833984375, -3.744354248046875, -3.61822509765625, -3.492095947265625, -3.365966796875, -3.239837646484375, -3.11370849609375, -2.987579345703125, -2.8614501953125, -2.735321044921875, -2.60919189453125, -2.483062744140625, -2.35693359375, -2.230804443359375, -2.10467529296875, -1.978546142578125, -1.8524169921875, -1.726287841796875, -1.60015869140625, -1.474029541015625, -1.347900390625, -1.221771240234375, -1.09564208984375, -0.969512939453125, -0.8433837890625, -0.717254638671875, -0.59112548828125, -0.464996337890625, -0.3388671875, -0.212738037109375, -0.08660888671875, 0.039520263671875, 0.1656494140625, 0.291778564453125, 0.41790771484375, 0.544036865234375, 0.670166015625, 0.796295166015625, 0.92242431640625, 1.048553466796875, 1.1746826171875, 1.300811767578125, 1.42694091796875, 1.553070068359375, 1.67919921875, 1.805328369140625, 1.93145751953125, 2.057586669921875, 2.1837158203125, 2.309844970703125, 2.43597412109375, 2.562103271484375, 2.688232421875, 2.814361572265625, 2.94049072265625, 3.066619873046875, 3.1927490234375, 3.318878173828125, 3.44500732421875, 3.571136474609375, 3.697265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 9.0, 8.0, 5.0, 13.0, 14.0, 14.0, 22.0, 16.0, 39.0, 36.0, 45.0, 45.0, 69.0, 96.0, 141.0, 227.0, 565.0, 2535.0, 19977.0, 280666.0, 2480121.0, 1308128.0, 90879.0, 8166.0, 1360.0, 401.0, 176.0, 107.0, 68.0, 63.0, 48.0, 43.0, 32.0, 30.0, 23.0, 18.0, 17.0, 15.0, 11.0, 12.0, 9.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-11.671875, -11.3458251953125, -11.019775390625, -10.6937255859375, -10.36767578125, -10.0416259765625, -9.715576171875, -9.3895263671875, -9.0634765625, -8.7374267578125, -8.411376953125, -8.0853271484375, -7.75927734375, -7.4332275390625, -7.107177734375, -6.7811279296875, -6.455078125, -6.1290283203125, -5.802978515625, -5.4769287109375, -5.15087890625, -4.8248291015625, -4.498779296875, -4.1727294921875, -3.8466796875, -3.5206298828125, -3.194580078125, -2.8685302734375, -2.54248046875, -2.2164306640625, -1.890380859375, -1.5643310546875, -1.23828125, -0.9122314453125, -0.586181640625, -0.2601318359375, 0.06591796875, 0.3919677734375, 0.718017578125, 1.0440673828125, 1.3701171875, 1.6961669921875, 2.022216796875, 2.3482666015625, 2.67431640625, 3.0003662109375, 3.326416015625, 3.6524658203125, 3.978515625, 4.3045654296875, 4.630615234375, 4.9566650390625, 5.28271484375, 5.6087646484375, 5.934814453125, 6.2608642578125, 6.5869140625, 6.9129638671875, 7.239013671875, 7.5650634765625, 7.89111328125, 8.2171630859375, 8.543212890625, 8.8692626953125, 9.1953125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 10.0, 14.0, 15.0, 23.0, 21.0, 29.0, 37.0, 64.0, 78.0, 112.0, 167.0, 218.0, 309.0, 379.0, 492.0, 499.0, 398.0, 323.0, 227.0, 166.0, 125.0, 80.0, 76.0, 53.0, 40.0, 30.0, 19.0, 22.0, 14.0, 9.0, 6.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.4375, -9.18359375, -8.9296875, -8.67578125, -8.421875, -8.16796875, -7.9140625, -7.66015625, -7.40625, -7.15234375, -6.8984375, -6.64453125, -6.390625, -6.13671875, -5.8828125, -5.62890625, -5.375, -5.12109375, -4.8671875, -4.61328125, -4.359375, -4.10546875, -3.8515625, -3.59765625, -3.34375, -3.08984375, -2.8359375, -2.58203125, -2.328125, -2.07421875, -1.8203125, -1.56640625, -1.3125, -1.05859375, -0.8046875, -0.55078125, -0.296875, -0.04296875, 0.2109375, 0.46484375, 0.71875, 0.97265625, 1.2265625, 1.48046875, 1.734375, 1.98828125, 2.2421875, 2.49609375, 2.75, 3.00390625, 3.2578125, 3.51171875, 3.765625, 4.01953125, 4.2734375, 4.52734375, 4.78125, 5.03515625, 5.2890625, 5.54296875, 5.796875, 6.05078125, 6.3046875, 6.55859375, 6.8125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 18.0, 9.0, 22.0, 24.0, 40.0, 46.0, 60.0, 73.0, 115.0, 144.0, 263.0, 363.0, 949.0, 70194.0, 4084120.0, 35825.0, 810.0, 387.0, 244.0, 165.0, 102.0, 84.0, 55.0, 34.0, 29.0, 17.0, 26.0, 18.0, 10.0, 7.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.25, -32.955078125, -31.66015625, -30.365234375, -29.0703125, -27.775390625, -26.48046875, -25.185546875, -23.890625, -22.595703125, -21.30078125, -20.005859375, -18.7109375, -17.416015625, -16.12109375, -14.826171875, -13.53125, -12.236328125, -10.94140625, -9.646484375, -8.3515625, -7.056640625, -5.76171875, -4.466796875, -3.171875, -1.876953125, -0.58203125, 0.712890625, 2.0078125, 3.302734375, 4.59765625, 5.892578125, 7.1875, 8.482421875, 9.77734375, 11.072265625, 12.3671875, 13.662109375, 14.95703125, 16.251953125, 17.546875, 18.841796875, 20.13671875, 21.431640625, 22.7265625, 24.021484375, 25.31640625, 26.611328125, 27.90625, 29.201171875, 30.49609375, 31.791015625, 33.0859375, 34.380859375, 35.67578125, 36.970703125, 38.265625, 39.560546875, 40.85546875, 42.150390625, 43.4453125, 44.740234375, 46.03515625, 47.330078125, 48.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 0.0, 6.0, 17.0, 26.0, 45.0, 44.0, 53.0, 75.0, 104.0, 98.0, 92.0, 97.0, 80.0, 63.0, 56.0, 51.0, 29.0, 24.0, 10.0, 13.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.58039093017578, -23.791807174682617, -23.003225326538086, -22.214641571044922, -21.42605972290039, -20.637475967407227, -19.848892211914062, -19.06031036376953, -18.271728515625, -17.483144760131836, -16.694562911987305, -15.90597915649414, -15.11739730834961, -14.328813552856445, -13.540230751037598, -12.75164794921875, -11.963064193725586, -11.174481391906738, -10.38589859008789, -9.597314834594727, -8.808732986450195, -8.020149230957031, -7.231566429138184, -6.442983627319336, -5.654400825500488, -4.865818023681641, -4.077235221862793, -3.288651943206787, -2.5000691413879395, -1.7114863395690918, -0.9229030609130859, -0.13432025909423828, 0.6542606353759766, 1.4428435564041138, 2.231426477432251, 3.0200095176696777, 3.8085923194885254, 4.597175121307373, 5.385758399963379, 6.174341201782227, 6.962924003601074, 7.751506805419922, 8.54008960723877, 9.328672409057617, 10.117256164550781, 10.905838012695312, 11.694421768188477, 12.483004570007324, 13.271587371826172, 14.06017017364502, 14.848752975463867, 15.637336730957031, 16.425918579101562, 17.214502334594727, 18.00308609008789, 18.791667938232422, 19.580249786376953, 20.368833541870117, 21.15741539001465, 21.945999145507812, 22.734580993652344, 23.523164749145508, 24.311748504638672, 25.100330352783203, 25.888914108276367]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 10.0, 9.0, 14.0, 6.0, 18.0, 29.0, 20.0, 17.0, 24.0, 27.0, 32.0, 35.0, 37.0, 56.0, 53.0, 46.0, 44.0, 41.0, 51.0, 52.0, 42.0, 29.0, 37.0, 28.0, 34.0, 35.0, 25.0, 20.0, 22.0, 14.0, 21.0, 8.0, 15.0, 15.0, 8.0, 7.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.19389533996582, -29.341651916503906, -28.48940658569336, -27.637161254882812, -26.7849178314209, -25.932674407958984, -25.080429077148438, -24.22818374633789, -23.375940322875977, -22.523696899414062, -21.671451568603516, -20.81920623779297, -19.966962814331055, -19.11471939086914, -18.262474060058594, -17.410228729248047, -16.557985305786133, -15.705740928649902, -14.853496551513672, -14.001252174377441, -13.149007797241211, -12.29676342010498, -11.44451904296875, -10.59227466583252, -9.740030288696289, -8.887785911560059, -8.035541534423828, -7.183297157287598, -6.331052780151367, -5.478808403015137, -4.626564025878906, -3.774319648742676, -2.922077178955078, -2.0698328018188477, -1.2175884246826172, -0.3653440475463867, 0.48690032958984375, 1.3391447067260742, 2.1913890838623047, 3.043633460998535, 3.8958778381347656, 4.748122215270996, 5.600366592407227, 6.452610969543457, 7.3048553466796875, 8.157099723815918, 9.009344100952148, 9.861588478088379, 10.71383285522461, 11.56607723236084, 12.41832160949707, 13.2705659866333, 14.122810363769531, 14.975054740905762, 15.827299118041992, 16.679542541503906, 17.531787872314453, 18.384033203125, 19.236276626586914, 20.088520050048828, 20.940765380859375, 21.793010711669922, 22.645254135131836, 23.49749755859375, 24.349742889404297]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 1.0, 7.0, 4.0, 7.0, 9.0, 6.0, 8.0, 12.0, 13.0, 15.0, 18.0, 18.0, 25.0, 24.0, 31.0, 26.0, 34.0, 41.0, 41.0, 32.0, 46.0, 41.0, 44.0, 32.0, 42.0, 39.0, 34.0, 33.0, 36.0, 33.0, 26.0, 15.0, 25.0, 17.0, 27.0, 18.0, 18.0, 19.0, 15.0, 17.0, 17.0, 7.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0], "bins": [-4.390625, -4.269561767578125, -4.14849853515625, -4.027435302734375, -3.9063720703125, -3.785308837890625, -3.66424560546875, -3.543182373046875, -3.422119140625, -3.301055908203125, -3.17999267578125, -3.058929443359375, -2.9378662109375, -2.816802978515625, -2.69573974609375, -2.574676513671875, -2.45361328125, -2.332550048828125, -2.21148681640625, -2.090423583984375, -1.9693603515625, -1.848297119140625, -1.72723388671875, -1.606170654296875, -1.485107421875, -1.364044189453125, -1.24298095703125, -1.121917724609375, -1.0008544921875, -0.879791259765625, -0.75872802734375, -0.637664794921875, -0.5166015625, -0.395538330078125, -0.27447509765625, -0.153411865234375, -0.0323486328125, 0.088714599609375, 0.20977783203125, 0.330841064453125, 0.451904296875, 0.572967529296875, 0.69403076171875, 0.815093994140625, 0.9361572265625, 1.057220458984375, 1.17828369140625, 1.299346923828125, 1.42041015625, 1.541473388671875, 1.66253662109375, 1.783599853515625, 1.9046630859375, 2.025726318359375, 2.14678955078125, 2.267852783203125, 2.388916015625, 2.509979248046875, 2.63104248046875, 2.752105712890625, 2.8731689453125, 2.994232177734375, 3.11529541015625, 3.236358642578125, 3.357421875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 11.0, 15.0, 21.0, 31.0, 49.0, 72.0, 119.0, 231.0, 386.0, 754.0, 1343.0, 2454.0, 4491.0, 8800.0, 17420.0, 36397.0, 76222.0, 159768.0, 290082.0, 231193.0, 113020.0, 53489.0, 25551.0, 12552.0, 6528.0, 3350.0, 1788.0, 978.0, 558.0, 350.0, 193.0, 126.0, 76.0, 39.0, 36.0, 18.0, 12.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.73291015625, -0.7124176025390625, -0.691925048828125, -0.6714324951171875, -0.65093994140625, -0.6304473876953125, -0.609954833984375, -0.5894622802734375, -0.5689697265625, -0.5484771728515625, -0.527984619140625, -0.5074920654296875, -0.48699951171875, -0.4665069580078125, -0.446014404296875, -0.4255218505859375, -0.405029296875, -0.3845367431640625, -0.364044189453125, -0.3435516357421875, -0.32305908203125, -0.3025665283203125, -0.282073974609375, -0.2615814208984375, -0.2410888671875, -0.2205963134765625, -0.200103759765625, -0.1796112060546875, -0.15911865234375, -0.1386260986328125, -0.118133544921875, -0.0976409912109375, -0.0771484375, -0.0566558837890625, -0.036163330078125, -0.0156707763671875, 0.00482177734375, 0.0253143310546875, 0.045806884765625, 0.0662994384765625, 0.0867919921875, 0.1072845458984375, 0.127777099609375, 0.1482696533203125, 0.16876220703125, 0.1892547607421875, 0.209747314453125, 0.2302398681640625, 0.250732421875, 0.2712249755859375, 0.291717529296875, 0.3122100830078125, 0.33270263671875, 0.3531951904296875, 0.373687744140625, 0.3941802978515625, 0.4146728515625, 0.4351654052734375, 0.455657958984375, 0.4761505126953125, 0.49664306640625, 0.5171356201171875, 0.537628173828125, 0.5581207275390625, 0.57861328125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 3.0, 3.0, 10.0, 8.0, 5.0, 10.0, 12.0, 14.0, 17.0, 20.0, 30.0, 19.0, 18.0, 27.0, 29.0, 30.0, 32.0, 39.0, 38.0, 38.0, 34.0, 32.0, 1062.0, 37.0, 35.0, 34.0, 36.0, 22.0, 40.0, 35.0, 31.0, 26.0, 34.0, 19.0, 21.0, 11.0, 17.0, 14.0, 14.0, 24.0, 4.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0], "bins": [-2.626953125, -2.550048828125, -2.47314453125, -2.396240234375, -2.3193359375, -2.242431640625, -2.16552734375, -2.088623046875, -2.01171875, -1.934814453125, -1.85791015625, -1.781005859375, -1.7041015625, -1.627197265625, -1.55029296875, -1.473388671875, -1.396484375, -1.319580078125, -1.24267578125, -1.165771484375, -1.0888671875, -1.011962890625, -0.93505859375, -0.858154296875, -0.78125, -0.704345703125, -0.62744140625, -0.550537109375, -0.4736328125, -0.396728515625, -0.31982421875, -0.242919921875, -0.166015625, -0.089111328125, -0.01220703125, 0.064697265625, 0.1416015625, 0.218505859375, 0.29541015625, 0.372314453125, 0.44921875, 0.526123046875, 0.60302734375, 0.679931640625, 0.7568359375, 0.833740234375, 0.91064453125, 0.987548828125, 1.064453125, 1.141357421875, 1.21826171875, 1.295166015625, 1.3720703125, 1.448974609375, 1.52587890625, 1.602783203125, 1.6796875, 1.756591796875, 1.83349609375, 1.910400390625, 1.9873046875, 2.064208984375, 2.14111328125, 2.218017578125, 2.294921875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 13.0, 14.0, 17.0, 35.0, 43.0, 70.0, 80.0, 143.0, 175.0, 270.0, 400.0, 585.0, 770.0, 1223.0, 1782.0, 2562.0, 3807.0, 5770.0, 8941.0, 13541.0, 20788.0, 32601.0, 51060.0, 77353.0, 115157.0, 182800.0, 1186776.0, 130609.0, 90708.0, 58905.0, 38561.0, 24724.0, 15932.0, 10374.0, 6748.0, 4437.0, 3041.0, 2002.0, 1343.0, 903.0, 649.0, 440.0, 310.0, 173.0, 148.0, 106.0, 79.0, 59.0, 35.0, 19.0, 23.0, 16.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0], "bins": [-0.285400390625, -0.2765312194824219, -0.26766204833984375, -0.2587928771972656, -0.2499237060546875, -0.24105453491210938, -0.23218536376953125, -0.22331619262695312, -0.214447021484375, -0.20557785034179688, -0.19670867919921875, -0.18783950805664062, -0.1789703369140625, -0.17010116577148438, -0.16123199462890625, -0.15236282348632812, -0.14349365234375, -0.13462448120117188, -0.12575531005859375, -0.11688613891601562, -0.1080169677734375, -0.09914779663085938, -0.09027862548828125, -0.08140945434570312, -0.072540283203125, -0.06367111206054688, -0.05480194091796875, -0.045932769775390625, -0.0370635986328125, -0.028194427490234375, -0.01932525634765625, -0.010456085205078125, -0.0015869140625, 0.007282257080078125, 0.01615142822265625, 0.025020599365234375, 0.0338897705078125, 0.042758941650390625, 0.05162811279296875, 0.060497283935546875, 0.069366455078125, 0.07823562622070312, 0.08710479736328125, 0.09597396850585938, 0.1048431396484375, 0.11371231079101562, 0.12258148193359375, 0.13145065307617188, 0.14031982421875, 0.14918899536132812, 0.15805816650390625, 0.16692733764648438, 0.1757965087890625, 0.18466567993164062, 0.19353485107421875, 0.20240402221679688, 0.211273193359375, 0.22014236450195312, 0.22901153564453125, 0.23788070678710938, 0.2467498779296875, 0.2556190490722656, 0.26448822021484375, 0.2733573913574219, 0.2822265625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 5.0, 15.0, 22.0, 36.0, 48.0, 39.0, 69.0, 88.0, 142.0, 106.0, 112.0, 83.0, 76.0, 33.0, 23.0, 18.0, 13.0, 10.0, 10.0, 8.0, 5.0, 4.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00782012939453125, -0.007546544075012207, -0.007272958755493164, -0.006999373435974121, -0.006725788116455078, -0.006452202796936035, -0.006178617477416992, -0.005905032157897949, -0.005631446838378906, -0.005357861518859863, -0.00508427619934082, -0.004810690879821777, -0.004537105560302734, -0.004263520240783691, -0.0039899349212646484, -0.0037163496017456055, -0.0034427642822265625, -0.0031691789627075195, -0.0028955936431884766, -0.0026220083236694336, -0.0023484230041503906, -0.0020748376846313477, -0.0018012523651123047, -0.0015276670455932617, -0.0012540817260742188, -0.0009804964065551758, -0.0007069110870361328, -0.00043332576751708984, -0.00015974044799804688, 0.0001138448715209961, 0.00038743019104003906, 0.000661015510559082, 0.000934600830078125, 0.001208186149597168, 0.001481771469116211, 0.001755356788635254, 0.002028942108154297, 0.00230252742767334, 0.002576112747192383, 0.0028496980667114258, 0.0031232833862304688, 0.0033968687057495117, 0.0036704540252685547, 0.003944039344787598, 0.004217624664306641, 0.004491209983825684, 0.0047647953033447266, 0.0050383806228637695, 0.0053119659423828125, 0.0055855512619018555, 0.0058591365814208984, 0.006132721900939941, 0.006406307220458984, 0.006679892539978027, 0.00695347785949707, 0.007227063179016113, 0.007500648498535156, 0.007774233818054199, 0.008047819137573242, 0.008321404457092285, 0.008594989776611328, 0.008868575096130371, 0.009142160415649414, 0.009415745735168457, 0.0096893310546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 14.0, 3.0, 7.0, 6.0, 13.0, 21.0, 20.0, 38.0, 62.0, 64.0, 163.0, 338.0, 1056.0, 782402.0, 262558.0, 1003.0, 286.0, 146.0, 123.0, 60.0, 60.0, 32.0, 18.0, 10.0, 10.0, 8.0, 10.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1964111328125, -0.190948486328125, -0.18548583984375, -0.180023193359375, -0.174560546875, -0.169097900390625, -0.16363525390625, -0.158172607421875, -0.1527099609375, -0.147247314453125, -0.14178466796875, -0.136322021484375, -0.130859375, -0.125396728515625, -0.11993408203125, -0.114471435546875, -0.1090087890625, -0.103546142578125, -0.09808349609375, -0.092620849609375, -0.087158203125, -0.081695556640625, -0.07623291015625, -0.070770263671875, -0.0653076171875, -0.059844970703125, -0.05438232421875, -0.048919677734375, -0.04345703125, -0.037994384765625, -0.03253173828125, -0.027069091796875, -0.0216064453125, -0.016143798828125, -0.01068115234375, -0.005218505859375, 0.000244140625, 0.005706787109375, 0.01116943359375, 0.016632080078125, 0.0220947265625, 0.027557373046875, 0.03302001953125, 0.038482666015625, 0.0439453125, 0.049407958984375, 0.05487060546875, 0.060333251953125, 0.0657958984375, 0.071258544921875, 0.07672119140625, 0.082183837890625, 0.087646484375, 0.093109130859375, 0.09857177734375, 0.104034423828125, 0.1094970703125, 0.114959716796875, 0.12042236328125, 0.125885009765625, 0.13134765625, 0.136810302734375, 0.14227294921875, 0.147735595703125, 0.1531982421875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 22.0, 515.0, 437.0, 34.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06322511285543442, -0.061849094927310944, -0.06047308072447777, -0.05909706652164459, -0.05772104859352112, -0.056345030665397644, -0.05496901646256447, -0.05359300225973129, -0.05221698433160782, -0.050840966403484344, -0.04946495220065117, -0.04808893799781799, -0.04671292006969452, -0.045336902141571045, -0.04396088793873787, -0.042584873735904694, -0.04120885580778122, -0.039832837879657745, -0.03845682367682457, -0.037080809473991394, -0.03570479154586792, -0.034328773617744446, -0.03295275941491127, -0.031576745212078094, -0.03020072728395462, -0.028824711218476295, -0.02744869515299797, -0.026072679087519646, -0.02469666302204132, -0.023320646956562996, -0.02194463089108467, -0.020568614825606346, -0.019192596897482872, -0.017816580832004547, -0.016440564766526222, -0.015064548701047897, -0.013688532635569572, -0.012312516570091248, -0.010936500504612923, -0.009560484439134598, -0.008184468373656273, -0.006808452308177948, -0.005432436242699623, -0.004056420177221298, -0.0026804041117429733, -0.0013043880462646484, 7.162801921367645e-05, 0.0014476440846920013, 0.0028236601501703262, 0.004199676215648651, 0.005575692281126976, 0.006951708346605301, 0.008327724412083626, 0.00970374047756195, 0.011079756543040276, 0.0124557726085186, 0.013831788673996925, 0.01520780473947525, 0.016583820804953575, 0.0179598368704319, 0.019335852935910225, 0.02071186900138855, 0.022087885066866875, 0.0234639011323452, 0.024839917197823524]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 15.0, 4.0, 6.0, 13.0, 9.0, 9.0, 15.0, 24.0, 26.0, 20.0, 31.0, 23.0, 38.0, 35.0, 36.0, 35.0, 42.0, 41.0, 37.0, 39.0, 49.0, 37.0, 40.0, 43.0, 29.0, 37.0, 31.0, 34.0, 24.0, 31.0, 23.0, 19.0, 20.0, 18.0, 17.0, 5.0, 10.0, 12.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003990352153778076, -0.0038534821942448616, -0.003716612234711647, -0.0035797422751784325, -0.003442872315645218, -0.0033060023561120033, -0.0031691323965787888, -0.003032262437045574, -0.0028953924775123596, -0.002758522517979145, -0.0026216525584459305, -0.002484782598912716, -0.0023479126393795013, -0.0022110426798462868, -0.002074172720313072, -0.0019373027607798576, -0.001800432801246643, -0.0016635628417134285, -0.001526692882180214, -0.0013898229226469994, -0.0012529529631137848, -0.0011160830035805702, -0.0009792130440473557, -0.0008423430845141411, -0.0007054731249809265, -0.0005686031654477119, -0.0004317332059144974, -0.0002948632463812828, -0.00015799328684806824, -2.1123327314853668e-05, 0.0001157466322183609, 0.00025261659175157547, 0.00038948655128479004, 0.0005263565108180046, 0.0006632264703512192, 0.0008000964298844337, 0.0009369663894176483, 0.0010738363489508629, 0.0012107063084840775, 0.001347576268017292, 0.0014844462275505066, 0.0016213161870837212, 0.0017581861466169357, 0.0018950561061501503, 0.002031926065683365, 0.0021687960252165794, 0.002305665984749794, 0.0024425359442830086, 0.002579405903816223, 0.0027162758633494377, 0.0028531458228826523, 0.002990015782415867, 0.0031268857419490814, 0.003263755701482296, 0.0034006256610155106, 0.003537495620548725, 0.0036743655800819397, 0.0038112355396151543, 0.003948105499148369, 0.004084975458681583, 0.004221845418214798, 0.0043587153777480125, 0.004495585337281227, 0.004632455296814442, 0.004769325256347656]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 1.0, 7.0, 4.0, 7.0, 9.0, 6.0, 8.0, 12.0, 13.0, 15.0, 18.0, 18.0, 25.0, 24.0, 31.0, 26.0, 34.0, 41.0, 40.0, 33.0, 46.0, 41.0, 44.0, 32.0, 42.0, 39.0, 34.0, 33.0, 36.0, 33.0, 26.0, 15.0, 25.0, 17.0, 27.0, 18.0, 18.0, 19.0, 15.0, 17.0, 17.0, 7.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0], "bins": [-4.390625, -4.269561767578125, -4.14849853515625, -4.027435302734375, -3.9063720703125, -3.785308837890625, -3.66424560546875, -3.543182373046875, -3.422119140625, -3.301055908203125, -3.17999267578125, -3.058929443359375, -2.9378662109375, -2.816802978515625, -2.69573974609375, -2.574676513671875, -2.45361328125, -2.332550048828125, -2.21148681640625, -2.090423583984375, -1.9693603515625, -1.848297119140625, -1.72723388671875, -1.606170654296875, -1.485107421875, -1.364044189453125, -1.24298095703125, -1.121917724609375, -1.0008544921875, -0.879791259765625, -0.75872802734375, -0.637664794921875, -0.5166015625, -0.395538330078125, -0.27447509765625, -0.153411865234375, -0.0323486328125, 0.088714599609375, 0.20977783203125, 0.330841064453125, 0.451904296875, 0.572967529296875, 0.69403076171875, 0.815093994140625, 0.9361572265625, 1.057220458984375, 1.17828369140625, 1.299346923828125, 1.42041015625, 1.541473388671875, 1.66253662109375, 1.783599853515625, 1.9046630859375, 2.025726318359375, 2.14678955078125, 2.267852783203125, 2.388916015625, 2.509979248046875, 2.63104248046875, 2.752105712890625, 2.8731689453125, 2.994232177734375, 3.11529541015625, 3.236358642578125, 3.357421875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 6.0, 12.0, 11.0, 15.0, 20.0, 20.0, 25.0, 37.0, 45.0, 69.0, 96.0, 122.0, 171.0, 286.0, 574.0, 1199.0, 3757.0, 14727.0, 59502.0, 337743.0, 522650.0, 79580.0, 19758.0, 5056.0, 1481.0, 574.0, 291.0, 178.0, 104.0, 90.0, 82.0, 54.0, 43.0, 34.0, 24.0, 22.0, 26.0, 16.0, 10.0, 10.0, 4.0, 8.0, 6.0, 0.0, 3.0, 1.0, 0.0, 5.0], "bins": [-8.3515625, -8.1202392578125, -7.888916015625, -7.6575927734375, -7.42626953125, -7.1949462890625, -6.963623046875, -6.7322998046875, -6.5009765625, -6.2696533203125, -6.038330078125, -5.8070068359375, -5.57568359375, -5.3443603515625, -5.113037109375, -4.8817138671875, -4.650390625, -4.4190673828125, -4.187744140625, -3.9564208984375, -3.72509765625, -3.4937744140625, -3.262451171875, -3.0311279296875, -2.7998046875, -2.5684814453125, -2.337158203125, -2.1058349609375, -1.87451171875, -1.6431884765625, -1.411865234375, -1.1805419921875, -0.94921875, -0.7178955078125, -0.486572265625, -0.2552490234375, -0.02392578125, 0.2073974609375, 0.438720703125, 0.6700439453125, 0.9013671875, 1.1326904296875, 1.364013671875, 1.5953369140625, 1.82666015625, 2.0579833984375, 2.289306640625, 2.5206298828125, 2.751953125, 2.9832763671875, 3.214599609375, 3.4459228515625, 3.67724609375, 3.9085693359375, 4.139892578125, 4.3712158203125, 4.6025390625, 4.8338623046875, 5.065185546875, 5.2965087890625, 5.52783203125, 5.7591552734375, 5.990478515625, 6.2218017578125, 6.453125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 13.0, 12.0, 14.0, 9.0, 15.0, 12.0, 15.0, 17.0, 24.0, 19.0, 29.0, 34.0, 35.0, 54.0, 61.0, 64.0, 102.0, 247.0, 1523.0, 193.0, 88.0, 72.0, 48.0, 45.0, 31.0, 31.0, 26.0, 34.0, 27.0, 26.0, 16.0, 15.0, 14.0, 15.0, 13.0, 10.0, 6.0, 6.0, 0.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1484375, -12.74267578125, -12.3369140625, -11.93115234375, -11.525390625, -11.11962890625, -10.7138671875, -10.30810546875, -9.90234375, -9.49658203125, -9.0908203125, -8.68505859375, -8.279296875, -7.87353515625, -7.4677734375, -7.06201171875, -6.65625, -6.25048828125, -5.8447265625, -5.43896484375, -5.033203125, -4.62744140625, -4.2216796875, -3.81591796875, -3.41015625, -3.00439453125, -2.5986328125, -2.19287109375, -1.787109375, -1.38134765625, -0.9755859375, -0.56982421875, -0.1640625, 0.24169921875, 0.6474609375, 1.05322265625, 1.458984375, 1.86474609375, 2.2705078125, 2.67626953125, 3.08203125, 3.48779296875, 3.8935546875, 4.29931640625, 4.705078125, 5.11083984375, 5.5166015625, 5.92236328125, 6.328125, 6.73388671875, 7.1396484375, 7.54541015625, 7.951171875, 8.35693359375, 8.7626953125, 9.16845703125, 9.57421875, 9.97998046875, 10.3857421875, 10.79150390625, 11.197265625, 11.60302734375, 12.0087890625, 12.41455078125, 12.8203125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 8.0, 3.0, 10.0, 11.0, 9.0, 18.0, 13.0, 16.0, 29.0, 25.0, 47.0, 42.0, 71.0, 74.0, 100.0, 140.0, 278.0, 669.0, 2958.0, 26969.0, 3038349.0, 69595.0, 4399.0, 878.0, 317.0, 166.0, 118.0, 66.0, 52.0, 50.0, 32.0, 30.0, 24.0, 22.0, 23.0, 21.0, 17.0, 14.0, 11.0, 5.0, 7.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-42.9375, -41.66015625, -40.3828125, -39.10546875, -37.828125, -36.55078125, -35.2734375, -33.99609375, -32.71875, -31.44140625, -30.1640625, -28.88671875, -27.609375, -26.33203125, -25.0546875, -23.77734375, -22.5, -21.22265625, -19.9453125, -18.66796875, -17.390625, -16.11328125, -14.8359375, -13.55859375, -12.28125, -11.00390625, -9.7265625, -8.44921875, -7.171875, -5.89453125, -4.6171875, -3.33984375, -2.0625, -0.78515625, 0.4921875, 1.76953125, 3.046875, 4.32421875, 5.6015625, 6.87890625, 8.15625, 9.43359375, 10.7109375, 11.98828125, 13.265625, 14.54296875, 15.8203125, 17.09765625, 18.375, 19.65234375, 20.9296875, 22.20703125, 23.484375, 24.76171875, 26.0390625, 27.31640625, 28.59375, 29.87109375, 31.1484375, 32.42578125, 33.703125, 34.98046875, 36.2578125, 37.53515625, 38.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 17.0, 16.0, 63.0, 105.0, 187.0, 202.0, 182.0, 147.0, 45.0, 22.0, 13.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.219508171081543, -9.132844924926758, -8.046182632446289, -6.959519863128662, -5.872857093811035, -4.786194324493408, -3.6995315551757812, -2.6128687858581543, -1.5262060165405273, -0.4395432472229004, 0.6471195220947266, 1.7337822914123535, 2.8204450607299805, 3.9071078300476074, 4.993770599365234, 6.080433368682861, 7.167096138000488, 8.253759384155273, 9.340421676635742, 10.427083969116211, 11.513747215270996, 12.600410461425781, 13.68707275390625, 14.773735046386719, 15.860398292541504, 16.94706153869629, 18.033723831176758, 19.120386123657227, 20.207050323486328, 21.293712615966797, 22.380374908447266, 23.467037200927734, 24.55370330810547, 25.640365600585938, 26.727027893066406, 27.813692092895508, 28.900354385375977, 29.987016677856445, 31.073680877685547, 32.160343170166016, 33.247005462646484, 34.33366775512695, 35.42033004760742, 36.50699234008789, 37.593658447265625, 38.680320739746094, 39.76698303222656, 40.85364532470703, 41.9403076171875, 43.02696990966797, 44.11363220214844, 45.200294494628906, 46.286956787109375, 47.37362289428711, 48.46028518676758, 49.54694747924805, 50.633609771728516, 51.720272064208984, 52.80693435668945, 53.89359664916992, 54.980262756347656, 56.066925048828125, 57.153587341308594, 58.24024963378906, 59.32691192626953]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 5.0, 12.0, 4.0, 6.0, 10.0, 17.0, 16.0, 18.0, 16.0, 20.0, 30.0, 25.0, 27.0, 33.0, 22.0, 38.0, 35.0, 40.0, 33.0, 45.0, 41.0, 50.0, 42.0, 35.0, 41.0, 36.0, 35.0, 35.0, 27.0, 34.0, 28.0, 17.0, 16.0, 15.0, 17.0, 11.0, 11.0, 9.0, 10.0, 7.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-36.81783676147461, -35.67250061035156, -34.52716064453125, -33.3818244934082, -32.236488342285156, -31.09115219116211, -29.94581413269043, -28.80047607421875, -27.655139923095703, -26.509803771972656, -25.364465713500977, -24.219127655029297, -23.07379150390625, -21.928455352783203, -20.783117294311523, -19.637779235839844, -18.492443084716797, -17.34710693359375, -16.20176887512207, -15.056431770324707, -13.911094665527344, -12.76575756072998, -11.620420455932617, -10.475083351135254, -9.32974624633789, -8.184409141540527, -7.039072036743164, -5.893734931945801, -4.7483978271484375, -3.603060722351074, -2.457723617553711, -1.3123865127563477, -0.16704559326171875, 0.9782915115356445, 2.123628616333008, 3.268965721130371, 4.414302825927734, 5.559639930725098, 6.704977035522461, 7.850314140319824, 8.995651245117188, 10.14098834991455, 11.286325454711914, 12.431662559509277, 13.57699966430664, 14.722336769104004, 15.867673873901367, 17.013011932373047, 18.158348083496094, 19.30368423461914, 20.44902229309082, 21.5943603515625, 22.739696502685547, 23.885032653808594, 25.030370712280273, 26.175708770751953, 27.321044921875, 28.466381072998047, 29.611719131469727, 30.757057189941406, 31.902393341064453, 33.0477294921875, 34.19306945800781, 35.33840560913086, 36.483741760253906]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 7.0, 7.0, 7.0, 8.0, 9.0, 18.0, 19.0, 30.0, 22.0, 19.0, 32.0, 33.0, 28.0, 33.0, 33.0, 46.0, 44.0, 37.0, 55.0, 43.0, 47.0, 35.0, 24.0, 40.0, 33.0, 23.0, 38.0, 30.0, 20.0, 30.0, 18.0, 23.0, 15.0, 23.0, 15.0, 10.0, 11.0, 5.0, 2.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.453125, -4.306396484375, -4.15966796875, -4.012939453125, -3.8662109375, -3.719482421875, -3.57275390625, -3.426025390625, -3.279296875, -3.132568359375, -2.98583984375, -2.839111328125, -2.6923828125, -2.545654296875, -2.39892578125, -2.252197265625, -2.10546875, -1.958740234375, -1.81201171875, -1.665283203125, -1.5185546875, -1.371826171875, -1.22509765625, -1.078369140625, -0.931640625, -0.784912109375, -0.63818359375, -0.491455078125, -0.3447265625, -0.197998046875, -0.05126953125, 0.095458984375, 0.2421875, 0.388916015625, 0.53564453125, 0.682373046875, 0.8291015625, 0.975830078125, 1.12255859375, 1.269287109375, 1.416015625, 1.562744140625, 1.70947265625, 1.856201171875, 2.0029296875, 2.149658203125, 2.29638671875, 2.443115234375, 2.58984375, 2.736572265625, 2.88330078125, 3.030029296875, 3.1767578125, 3.323486328125, 3.47021484375, 3.616943359375, 3.763671875, 3.910400390625, 4.05712890625, 4.203857421875, 4.3505859375, 4.497314453125, 4.64404296875, 4.790771484375, 4.9375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 13.0, 13.0, 8.0, 17.0, 25.0, 30.0, 32.0, 60.0, 73.0, 133.0, 217.0, 384.0, 796.0, 1754.0, 4477.0, 12878.0, 44564.0, 171464.0, 610811.0, 1387844.0, 1275600.0, 496416.0, 133326.0, 35360.0, 10708.0, 3882.0, 1690.0, 726.0, 383.0, 187.0, 128.0, 73.0, 50.0, 36.0, 26.0, 28.0, 17.0, 14.0, 12.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9921875, -4.81951904296875, -4.6468505859375, -4.47418212890625, -4.301513671875, -4.12884521484375, -3.9561767578125, -3.78350830078125, -3.61083984375, -3.43817138671875, -3.2655029296875, -3.09283447265625, -2.920166015625, -2.74749755859375, -2.5748291015625, -2.40216064453125, -2.2294921875, -2.05682373046875, -1.8841552734375, -1.71148681640625, -1.538818359375, -1.36614990234375, -1.1934814453125, -1.02081298828125, -0.84814453125, -0.67547607421875, -0.5028076171875, -0.33013916015625, -0.157470703125, 0.01519775390625, 0.1878662109375, 0.36053466796875, 0.533203125, 0.70587158203125, 0.8785400390625, 1.05120849609375, 1.223876953125, 1.39654541015625, 1.5692138671875, 1.74188232421875, 1.91455078125, 2.08721923828125, 2.2598876953125, 2.43255615234375, 2.605224609375, 2.77789306640625, 2.9505615234375, 3.12322998046875, 3.2958984375, 3.46856689453125, 3.6412353515625, 3.81390380859375, 3.986572265625, 4.15924072265625, 4.3319091796875, 4.50457763671875, 4.67724609375, 4.84991455078125, 5.0225830078125, 5.19525146484375, 5.367919921875, 5.54058837890625, 5.7132568359375, 5.88592529296875, 6.05859375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 17.0, 24.0, 42.0, 30.0, 45.0, 66.0, 90.0, 136.0, 169.0, 242.0, 323.0, 424.0, 470.0, 479.0, 414.0, 298.0, 215.0, 155.0, 118.0, 73.0, 73.0, 47.0, 32.0, 20.0, 12.0, 14.0, 10.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.40625, -10.1246337890625, -9.843017578125, -9.5614013671875, -9.27978515625, -8.9981689453125, -8.716552734375, -8.4349365234375, -8.1533203125, -7.8717041015625, -7.590087890625, -7.3084716796875, -7.02685546875, -6.7452392578125, -6.463623046875, -6.1820068359375, -5.900390625, -5.6187744140625, -5.337158203125, -5.0555419921875, -4.77392578125, -4.4923095703125, -4.210693359375, -3.9290771484375, -3.6474609375, -3.3658447265625, -3.084228515625, -2.8026123046875, -2.52099609375, -2.2393798828125, -1.957763671875, -1.6761474609375, -1.39453125, -1.1129150390625, -0.831298828125, -0.5496826171875, -0.26806640625, 0.0135498046875, 0.295166015625, 0.5767822265625, 0.8583984375, 1.1400146484375, 1.421630859375, 1.7032470703125, 1.98486328125, 2.2664794921875, 2.548095703125, 2.8297119140625, 3.111328125, 3.3929443359375, 3.674560546875, 3.9561767578125, 4.23779296875, 4.5194091796875, 4.801025390625, 5.0826416015625, 5.3642578125, 5.6458740234375, 5.927490234375, 6.2091064453125, 6.49072265625, 6.7723388671875, 7.053955078125, 7.3355712890625, 7.6171875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 8.0, 13.0, 12.0, 15.0, 19.0, 50.0, 74.0, 93.0, 131.0, 236.0, 425.0, 792.0, 2180.0, 44102.0, 3847516.0, 291886.0, 4247.0, 1111.0, 516.0, 315.0, 201.0, 99.0, 56.0, 52.0, 45.0, 28.0, 19.0, 14.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.09375, -28.0791015625, -27.064453125, -26.0498046875, -25.03515625, -24.0205078125, -23.005859375, -21.9912109375, -20.9765625, -19.9619140625, -18.947265625, -17.9326171875, -16.91796875, -15.9033203125, -14.888671875, -13.8740234375, -12.859375, -11.8447265625, -10.830078125, -9.8154296875, -8.80078125, -7.7861328125, -6.771484375, -5.7568359375, -4.7421875, -3.7275390625, -2.712890625, -1.6982421875, -0.68359375, 0.3310546875, 1.345703125, 2.3603515625, 3.375, 4.3896484375, 5.404296875, 6.4189453125, 7.43359375, 8.4482421875, 9.462890625, 10.4775390625, 11.4921875, 12.5068359375, 13.521484375, 14.5361328125, 15.55078125, 16.5654296875, 17.580078125, 18.5947265625, 19.609375, 20.6240234375, 21.638671875, 22.6533203125, 23.66796875, 24.6826171875, 25.697265625, 26.7119140625, 27.7265625, 28.7412109375, 29.755859375, 30.7705078125, 31.78515625, 32.7998046875, 33.814453125, 34.8291015625, 35.84375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 211.0, 758.0, 45.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-397.21319580078125, -388.0487365722656, -378.88427734375, -369.7198486328125, -360.5553894042969, -351.39093017578125, -342.2264709472656, -333.06201171875, -323.8975830078125, -314.7331237792969, -305.56866455078125, -296.40423583984375, -287.2397766113281, -278.0753173828125, -268.9108581542969, -259.74639892578125, -250.58193969726562, -241.41748046875, -232.25303649902344, -223.0885772705078, -213.92413330078125, -204.75967407226562, -195.59521484375, -186.43075561523438, -177.2663116455078, -168.1018524169922, -158.93740844726562, -149.77294921875, -140.60848999023438, -131.4440460205078, -122.27958679199219, -113.1151351928711, -103.95066833496094, -94.78621673583984, -85.62176513671875, -76.45730590820312, -67.29285430908203, -58.12840270996094, -48.96394729614258, -39.79949188232422, -30.635040283203125, -21.4705867767334, -12.306133270263672, -3.1416797637939453, 6.022773742675781, 15.187225341796875, 24.351680755615234, 33.516136169433594, 42.68058776855469, 51.84503936767578, 61.00949478149414, 70.1739501953125, 79.3384017944336, 88.50285339355469, 97.66731262207031, 106.8317642211914, 115.9962158203125, 125.1606674194336, 134.3251190185547, 143.4895782470703, 152.65402221679688, 161.8184814453125, 170.98294067382812, 180.14739990234375, 189.3118438720703]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 5.0, 9.0, 8.0, 16.0, 15.0, 19.0, 17.0, 11.0, 31.0, 31.0, 27.0, 34.0, 28.0, 43.0, 46.0, 43.0, 65.0, 51.0, 58.0, 53.0, 36.0, 44.0, 41.0, 40.0, 34.0, 25.0, 25.0, 32.0, 25.0, 19.0, 23.0, 12.0, 6.0, 10.0, 8.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.778839111328125, -31.794004440307617, -30.80916976928711, -29.824337005615234, -28.839502334594727, -27.85466766357422, -26.869834899902344, -25.885000228881836, -24.900165557861328, -23.91533088684082, -22.930496215820312, -21.945663452148438, -20.96082878112793, -19.975994110107422, -18.991161346435547, -18.00632667541504, -17.02149200439453, -16.036657333374023, -15.051823616027832, -14.06698989868164, -13.082155227661133, -12.097320556640625, -11.112486839294434, -10.127653121948242, -9.142818450927734, -8.157983779907227, -7.173150062561035, -6.1883158683776855, -5.203481674194336, -4.218647480010986, -3.2338132858276367, -2.248979091644287, -1.2641448974609375, -0.2793107032775879, 0.7055234909057617, 1.6903576850891113, 2.675191879272461, 3.6600260734558105, 4.64486026763916, 5.62969446182251, 6.614528656005859, 7.599362850189209, 8.584197044372559, 9.56903076171875, 10.553865432739258, 11.538700103759766, 12.523533821105957, 13.508367538452148, 14.493202209472656, 15.478036880493164, 16.462871551513672, 17.447704315185547, 18.432538986206055, 19.417373657226562, 20.402206420898438, 21.387041091918945, 22.371875762939453, 23.35671043395996, 24.34154510498047, 25.326377868652344, 26.31121253967285, 27.29604721069336, 28.280879974365234, 29.265714645385742, 30.25054931640625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 6.0, 11.0, 9.0, 7.0, 11.0, 6.0, 20.0, 18.0, 25.0, 23.0, 21.0, 27.0, 36.0, 33.0, 46.0, 44.0, 43.0, 50.0, 50.0, 42.0, 39.0, 38.0, 34.0, 37.0, 36.0, 34.0, 42.0, 28.0, 29.0, 26.0, 16.0, 27.0, 13.0, 15.0, 11.0, 8.0, 11.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.6112060546875, -4.464599609375, -4.3179931640625, -4.17138671875, -4.0247802734375, -3.878173828125, -3.7315673828125, -3.5849609375, -3.4383544921875, -3.291748046875, -3.1451416015625, -2.99853515625, -2.8519287109375, -2.705322265625, -2.5587158203125, -2.412109375, -2.2655029296875, -2.118896484375, -1.9722900390625, -1.82568359375, -1.6790771484375, -1.532470703125, -1.3858642578125, -1.2392578125, -1.0926513671875, -0.946044921875, -0.7994384765625, -0.65283203125, -0.5062255859375, -0.359619140625, -0.2130126953125, -0.06640625, 0.0802001953125, 0.226806640625, 0.3734130859375, 0.52001953125, 0.6666259765625, 0.813232421875, 0.9598388671875, 1.1064453125, 1.2530517578125, 1.399658203125, 1.5462646484375, 1.69287109375, 1.8394775390625, 1.986083984375, 2.1326904296875, 2.279296875, 2.4259033203125, 2.572509765625, 2.7191162109375, 2.86572265625, 3.0123291015625, 3.158935546875, 3.3055419921875, 3.4521484375, 3.5987548828125, 3.745361328125, 3.8919677734375, 4.03857421875, 4.1851806640625, 4.331787109375, 4.4783935546875, 4.625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 4.0, 6.0, 8.0, 5.0, 10.0, 19.0, 22.0, 32.0, 38.0, 70.0, 81.0, 128.0, 201.0, 291.0, 426.0, 670.0, 1002.0, 1533.0, 2324.0, 3829.0, 5923.0, 9336.0, 14876.0, 24407.0, 39190.0, 66038.0, 110408.0, 175981.0, 209994.0, 148859.0, 91001.0, 54453.0, 32869.0, 20245.0, 12593.0, 7858.0, 4857.0, 3064.0, 2029.0, 1336.0, 846.0, 546.0, 347.0, 252.0, 170.0, 131.0, 61.0, 55.0, 39.0, 30.0, 27.0, 12.0, 5.0, 8.0, 9.0, 1.0, 8.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.476806640625, -0.461578369140625, -0.44635009765625, -0.431121826171875, -0.4158935546875, -0.400665283203125, -0.38543701171875, -0.370208740234375, -0.35498046875, -0.339752197265625, -0.32452392578125, -0.309295654296875, -0.2940673828125, -0.278839111328125, -0.26361083984375, -0.248382568359375, -0.233154296875, -0.217926025390625, -0.20269775390625, -0.187469482421875, -0.1722412109375, -0.157012939453125, -0.14178466796875, -0.126556396484375, -0.111328125, -0.096099853515625, -0.08087158203125, -0.065643310546875, -0.0504150390625, -0.035186767578125, -0.01995849609375, -0.004730224609375, 0.010498046875, 0.025726318359375, 0.04095458984375, 0.056182861328125, 0.0714111328125, 0.086639404296875, 0.10186767578125, 0.117095947265625, 0.13232421875, 0.147552490234375, 0.16278076171875, 0.178009033203125, 0.1932373046875, 0.208465576171875, 0.22369384765625, 0.238922119140625, 0.254150390625, 0.269378662109375, 0.28460693359375, 0.299835205078125, 0.3150634765625, 0.330291748046875, 0.34552001953125, 0.360748291015625, 0.3759765625, 0.391204833984375, 0.40643310546875, 0.421661376953125, 0.4368896484375, 0.452117919921875, 0.46734619140625, 0.482574462890625, 0.497802734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 7.0, 11.0, 15.0, 11.0, 11.0, 14.0, 25.0, 12.0, 25.0, 26.0, 30.0, 34.0, 38.0, 32.0, 36.0, 29.0, 36.0, 31.0, 40.0, 1059.0, 36.0, 37.0, 29.0, 27.0, 44.0, 33.0, 25.0, 36.0, 22.0, 20.0, 23.0, 23.0, 20.0, 12.0, 19.0, 16.0, 15.0, 10.0, 11.0, 3.0, 7.0, 1.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.515625, -2.4346923828125, -2.353759765625, -2.2728271484375, -2.19189453125, -2.1109619140625, -2.030029296875, -1.9490966796875, -1.8681640625, -1.7872314453125, -1.706298828125, -1.6253662109375, -1.54443359375, -1.4635009765625, -1.382568359375, -1.3016357421875, -1.220703125, -1.1397705078125, -1.058837890625, -0.9779052734375, -0.89697265625, -0.8160400390625, -0.735107421875, -0.6541748046875, -0.5732421875, -0.4923095703125, -0.411376953125, -0.3304443359375, -0.24951171875, -0.1685791015625, -0.087646484375, -0.0067138671875, 0.07421875, 0.1551513671875, 0.236083984375, 0.3170166015625, 0.39794921875, 0.4788818359375, 0.559814453125, 0.6407470703125, 0.7216796875, 0.8026123046875, 0.883544921875, 0.9644775390625, 1.04541015625, 1.1263427734375, 1.207275390625, 1.2882080078125, 1.369140625, 1.4500732421875, 1.531005859375, 1.6119384765625, 1.69287109375, 1.7738037109375, 1.854736328125, 1.9356689453125, 2.0166015625, 2.0975341796875, 2.178466796875, 2.2593994140625, 2.34033203125, 2.4212646484375, 2.502197265625, 2.5831298828125, 2.6640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 8.0, 9.0, 10.0, 12.0, 11.0, 31.0, 44.0, 56.0, 81.0, 110.0, 176.0, 270.0, 411.0, 581.0, 811.0, 1277.0, 1841.0, 2942.0, 4165.0, 6654.0, 10004.0, 15680.0, 24539.0, 38636.0, 60227.0, 92889.0, 136574.0, 1210959.0, 165187.0, 114020.0, 74655.0, 47754.0, 30393.0, 19507.0, 12693.0, 8212.0, 5193.0, 3517.0, 2273.0, 1582.0, 1048.0, 680.0, 478.0, 278.0, 195.0, 138.0, 105.0, 73.0, 49.0, 24.0, 26.0, 12.0, 12.0, 9.0, 6.0, 4.0, 4.0, 2.0, 5.0, 1.0], "bins": [-0.30419921875, -0.29461669921875, -0.2850341796875, -0.27545166015625, -0.265869140625, -0.25628662109375, -0.2467041015625, -0.23712158203125, -0.2275390625, -0.21795654296875, -0.2083740234375, -0.19879150390625, -0.189208984375, -0.17962646484375, -0.1700439453125, -0.16046142578125, -0.15087890625, -0.14129638671875, -0.1317138671875, -0.12213134765625, -0.112548828125, -0.10296630859375, -0.0933837890625, -0.08380126953125, -0.07421875, -0.06463623046875, -0.0550537109375, -0.04547119140625, -0.035888671875, -0.02630615234375, -0.0167236328125, -0.00714111328125, 0.00244140625, 0.01202392578125, 0.0216064453125, 0.03118896484375, 0.040771484375, 0.05035400390625, 0.0599365234375, 0.06951904296875, 0.0791015625, 0.08868408203125, 0.0982666015625, 0.10784912109375, 0.117431640625, 0.12701416015625, 0.1365966796875, 0.14617919921875, 0.15576171875, 0.16534423828125, 0.1749267578125, 0.18450927734375, 0.194091796875, 0.20367431640625, 0.2132568359375, 0.22283935546875, 0.232421875, 0.24200439453125, 0.2515869140625, 0.26116943359375, 0.270751953125, 0.28033447265625, 0.2899169921875, 0.29949951171875, 0.30908203125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 7.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 12.0, 12.0, 18.0, 20.0, 43.0, 69.0, 115.0, 173.0, 159.0, 129.0, 68.0, 45.0, 26.0, 16.0, 11.0, 11.0, 5.0, 6.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0107574462890625, -0.010411262512207031, -0.010065078735351562, -0.009718894958496094, -0.009372711181640625, -0.009026527404785156, -0.008680343627929688, -0.008334159851074219, -0.00798797607421875, -0.007641792297363281, -0.0072956085205078125, -0.006949424743652344, -0.006603240966796875, -0.006257057189941406, -0.0059108734130859375, -0.005564689636230469, -0.005218505859375, -0.004872322082519531, -0.0045261383056640625, -0.004179954528808594, -0.003833770751953125, -0.0034875869750976562, -0.0031414031982421875, -0.0027952194213867188, -0.00244903564453125, -0.0021028518676757812, -0.0017566680908203125, -0.0014104843139648438, -0.001064300537109375, -0.0007181167602539062, -0.0003719329833984375, -2.574920654296875e-05, 0.0003204345703125, 0.0006666183471679688, 0.0010128021240234375, 0.0013589859008789062, 0.001705169677734375, 0.0020513534545898438, 0.0023975372314453125, 0.0027437210083007812, 0.00308990478515625, 0.0034360885620117188, 0.0037822723388671875, 0.004128456115722656, 0.004474639892578125, 0.004820823669433594, 0.0051670074462890625, 0.005513191223144531, 0.005859375, 0.006205558776855469, 0.0065517425537109375, 0.006897926330566406, 0.007244110107421875, 0.007590293884277344, 0.007936477661132812, 0.008282661437988281, 0.00862884521484375, 0.008975028991699219, 0.009321212768554688, 0.009667396545410156, 0.010013580322265625, 0.010359764099121094, 0.010705947875976562, 0.011052131652832031, 0.0113983154296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 5.0, 7.0, 6.0, 8.0, 8.0, 10.0, 11.0, 9.0, 12.0, 31.0, 36.0, 52.0, 74.0, 181.0, 275.0, 1202.0, 530110.0, 514557.0, 1202.0, 292.0, 161.0, 84.0, 47.0, 44.0, 32.0, 20.0, 9.0, 8.0, 14.0, 5.0, 9.0, 6.0, 7.0, 4.0, 6.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20361328125, -0.19744300842285156, -0.19127273559570312, -0.1851024627685547, -0.17893218994140625, -0.1727619171142578, -0.16659164428710938, -0.16042137145996094, -0.1542510986328125, -0.14808082580566406, -0.14191055297851562, -0.1357402801513672, -0.12957000732421875, -0.12339973449707031, -0.11722946166992188, -0.11105918884277344, -0.104888916015625, -0.09871864318847656, -0.09254837036132812, -0.08637809753417969, -0.08020782470703125, -0.07403755187988281, -0.06786727905273438, -0.06169700622558594, -0.0555267333984375, -0.04935646057128906, -0.043186187744140625, -0.03701591491699219, -0.03084564208984375, -0.024675369262695312, -0.018505096435546875, -0.012334823608398438, -0.00616455078125, 5.7220458984375e-06, 0.006175994873046875, 0.012346267700195312, 0.01851654052734375, 0.024686813354492188, 0.030857086181640625, 0.03702735900878906, 0.0431976318359375, 0.04936790466308594, 0.055538177490234375, 0.06170845031738281, 0.06787872314453125, 0.07404899597167969, 0.08021926879882812, 0.08638954162597656, 0.092559814453125, 0.09873008728027344, 0.10490036010742188, 0.11107063293457031, 0.11724090576171875, 0.12341117858886719, 0.12958145141601562, 0.13575172424316406, 0.1419219970703125, 0.14809226989746094, 0.15426254272460938, 0.1604328155517578, 0.16660308837890625, 0.1727733612060547, 0.17894363403320312, 0.18511390686035156, 0.1912841796875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 9.0, 939.0, 67.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.1896173059940338, -0.18638519942760468, -0.18315309286117554, -0.1799209862947464, -0.17668887972831726, -0.17345677316188812, -0.17022466659545898, -0.16699256002902985, -0.1637604534626007, -0.16052834689617157, -0.15729624032974243, -0.1540641337633133, -0.15083202719688416, -0.14759992063045502, -0.14436781406402588, -0.14113570749759674, -0.1379035860300064, -0.13467147946357727, -0.13143937289714813, -0.128207266330719, -0.12497515976428986, -0.12174305319786072, -0.11851094663143158, -0.11527883261442184, -0.1120467334985733, -0.10881462693214417, -0.10558252036571503, -0.10235041379928589, -0.09911830723285675, -0.09588620066642761, -0.09265409409999847, -0.08942198008298874, -0.086189866065979, -0.08295775949954987, -0.07972565293312073, -0.07649354636669159, -0.07326143980026245, -0.07002933323383331, -0.06679722666740417, -0.06356511265039444, -0.0603330098092556, -0.05710090324282646, -0.053868796676397324, -0.05063668638467789, -0.04740457981824875, -0.04417247325181961, -0.04094036668539047, -0.037708260118961334, -0.034476153552532196, -0.031244046986103058, -0.02801193855702877, -0.024779831990599632, -0.021547723561525345, -0.018315616995096207, -0.015083510428667068, -0.011851401999592781, -0.008619293570518494, -0.005387186072766781, -0.0021550790406763554, 0.0010770279914140701, 0.004309135489165783, 0.007541242986917496, 0.010773349553346634, 0.014005457982420921, 0.01723756454885006]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 11.0, 9.0, 12.0, 17.0, 21.0, 28.0, 30.0, 35.0, 52.0, 44.0, 56.0, 41.0, 65.0, 59.0, 58.0, 49.0, 54.0, 46.0, 58.0, 29.0, 44.0, 33.0, 21.0, 23.0, 22.0, 22.0, 13.0, 8.0, 11.0, 12.0, 8.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005301833152770996, -0.005056959576904774, -0.004812086001038551, -0.004567212425172329, -0.004322338849306107, -0.004077465273439884, -0.003832591697573662, -0.0035877181217074394, -0.003342844545841217, -0.0030979709699749947, -0.0028530973941087723, -0.00260822381824255, -0.0023633502423763275, -0.002118476666510105, -0.0018736030906438828, -0.0016287295147776604, -0.001383855938911438, -0.0011389823630452156, -0.0008941087871789932, -0.0006492352113127708, -0.00040436163544654846, -0.00015948805958032608, 8.53855162858963e-05, 0.0003302590921521187, 0.0005751326680183411, 0.0008200062438845634, 0.0010648798197507858, 0.0013097533956170082, 0.0015546269714832306, 0.001799500547349453, 0.0020443741232156754, 0.0022892476990818977, 0.00253412127494812, 0.0027789948508143425, 0.003023868426680565, 0.0032687420025467873, 0.0035136155784130096, 0.003758489154279232, 0.004003362730145454, 0.004248236306011677, 0.004493109881877899, 0.0047379834577441216, 0.004982857033610344, 0.005227730609476566, 0.005472604185342789, 0.005717477761209011, 0.0059623513370752335, 0.006207224912941456, 0.006452098488807678, 0.006696972064673901, 0.006941845640540123, 0.007186719216406345, 0.007431592792272568, 0.00767646636813879, 0.007921339944005013, 0.008166213519871235, 0.008411087095737457, 0.00865596067160368, 0.008900834247469902, 0.009145707823336124, 0.009390581399202347, 0.00963545497506857, 0.009880328550934792, 0.010125202126801014, 0.010370075702667236]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 6.0, 11.0, 9.0, 8.0, 10.0, 7.0, 19.0, 20.0, 23.0, 24.0, 20.0, 30.0, 33.0, 34.0, 47.0, 44.0, 41.0, 51.0, 49.0, 42.0, 39.0, 39.0, 34.0, 37.0, 36.0, 33.0, 42.0, 28.0, 29.0, 26.0, 16.0, 27.0, 13.0, 15.0, 11.0, 8.0, 11.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75390625, -4.60736083984375, -4.4608154296875, -4.31427001953125, -4.167724609375, -4.02117919921875, -3.8746337890625, -3.72808837890625, -3.58154296875, -3.43499755859375, -3.2884521484375, -3.14190673828125, -2.995361328125, -2.84881591796875, -2.7022705078125, -2.55572509765625, -2.4091796875, -2.26263427734375, -2.1160888671875, -1.96954345703125, -1.822998046875, -1.67645263671875, -1.5299072265625, -1.38336181640625, -1.23681640625, -1.09027099609375, -0.9437255859375, -0.79718017578125, -0.650634765625, -0.50408935546875, -0.3575439453125, -0.21099853515625, -0.064453125, 0.08209228515625, 0.2286376953125, 0.37518310546875, 0.521728515625, 0.66827392578125, 0.8148193359375, 0.96136474609375, 1.10791015625, 1.25445556640625, 1.4010009765625, 1.54754638671875, 1.694091796875, 1.84063720703125, 1.9871826171875, 2.13372802734375, 2.2802734375, 2.42681884765625, 2.5733642578125, 2.71990966796875, 2.866455078125, 3.01300048828125, 3.1595458984375, 3.30609130859375, 3.45263671875, 3.59918212890625, 3.7457275390625, 3.89227294921875, 4.038818359375, 4.18536376953125, 4.3319091796875, 4.47845458984375, 4.625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 9.0, 8.0, 13.0, 7.0, 20.0, 38.0, 56.0, 80.0, 142.0, 290.0, 603.0, 1307.0, 2954.0, 6925.0, 16210.0, 37500.0, 97181.0, 278768.0, 369043.0, 144667.0, 53482.0, 22008.0, 9589.0, 4146.0, 1760.0, 817.0, 417.0, 183.0, 113.0, 64.0, 32.0, 28.0, 28.0, 8.0, 7.0, 10.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.124755859375, -4.96044921875, -4.796142578125, -4.6318359375, -4.467529296875, -4.30322265625, -4.138916015625, -3.974609375, -3.810302734375, -3.64599609375, -3.481689453125, -3.3173828125, -3.153076171875, -2.98876953125, -2.824462890625, -2.66015625, -2.495849609375, -2.33154296875, -2.167236328125, -2.0029296875, -1.838623046875, -1.67431640625, -1.510009765625, -1.345703125, -1.181396484375, -1.01708984375, -0.852783203125, -0.6884765625, -0.524169921875, -0.35986328125, -0.195556640625, -0.03125, 0.133056640625, 0.29736328125, 0.461669921875, 0.6259765625, 0.790283203125, 0.95458984375, 1.118896484375, 1.283203125, 1.447509765625, 1.61181640625, 1.776123046875, 1.9404296875, 2.104736328125, 2.26904296875, 2.433349609375, 2.59765625, 2.761962890625, 2.92626953125, 3.090576171875, 3.2548828125, 3.419189453125, 3.58349609375, 3.747802734375, 3.912109375, 4.076416015625, 4.24072265625, 4.405029296875, 4.5693359375, 4.733642578125, 4.89794921875, 5.062255859375, 5.2265625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 5.0, 6.0, 9.0, 14.0, 23.0, 30.0, 18.0, 29.0, 29.0, 32.0, 31.0, 39.0, 42.0, 52.0, 53.0, 113.0, 224.0, 1430.0, 269.0, 131.0, 68.0, 40.0, 54.0, 46.0, 42.0, 33.0, 33.0, 18.0, 17.0, 21.0, 12.0, 12.0, 14.0, 18.0, 5.0, 5.0, 8.0, 4.0, 4.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.14453125, -15.6640625, -15.18359375, -14.703125, -14.22265625, -13.7421875, -13.26171875, -12.78125, -12.30078125, -11.8203125, -11.33984375, -10.859375, -10.37890625, -9.8984375, -9.41796875, -8.9375, -8.45703125, -7.9765625, -7.49609375, -7.015625, -6.53515625, -6.0546875, -5.57421875, -5.09375, -4.61328125, -4.1328125, -3.65234375, -3.171875, -2.69140625, -2.2109375, -1.73046875, -1.25, -0.76953125, -0.2890625, 0.19140625, 0.671875, 1.15234375, 1.6328125, 2.11328125, 2.59375, 3.07421875, 3.5546875, 4.03515625, 4.515625, 4.99609375, 5.4765625, 5.95703125, 6.4375, 6.91796875, 7.3984375, 7.87890625, 8.359375, 8.83984375, 9.3203125, 9.80078125, 10.28125, 10.76171875, 11.2421875, 11.72265625, 12.203125, 12.68359375, 13.1640625, 13.64453125, 14.125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 16.0, 11.0, 13.0, 13.0, 23.0, 26.0, 31.0, 38.0, 78.0, 75.0, 118.0, 217.0, 283.0, 562.0, 1366.0, 7476.0, 1016485.0, 2105467.0, 10259.0, 1515.0, 636.0, 289.0, 181.0, 148.0, 93.0, 69.0, 55.0, 29.0, 24.0, 15.0, 17.0, 12.0, 7.0, 8.0, 11.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-35.0625, -34.062255859375, -33.06201171875, -32.061767578125, -31.0615234375, -30.061279296875, -29.06103515625, -28.060791015625, -27.060546875, -26.060302734375, -25.06005859375, -24.059814453125, -23.0595703125, -22.059326171875, -21.05908203125, -20.058837890625, -19.05859375, -18.058349609375, -17.05810546875, -16.057861328125, -15.0576171875, -14.057373046875, -13.05712890625, -12.056884765625, -11.056640625, -10.056396484375, -9.05615234375, -8.055908203125, -7.0556640625, -6.055419921875, -5.05517578125, -4.054931640625, -3.0546875, -2.054443359375, -1.05419921875, -0.053955078125, 0.9462890625, 1.946533203125, 2.94677734375, 3.947021484375, 4.947265625, 5.947509765625, 6.94775390625, 7.947998046875, 8.9482421875, 9.948486328125, 10.94873046875, 11.948974609375, 12.94921875, 13.949462890625, 14.94970703125, 15.949951171875, 16.9501953125, 17.950439453125, 18.95068359375, 19.950927734375, 20.951171875, 21.951416015625, 22.95166015625, 23.951904296875, 24.9521484375, 25.952392578125, 26.95263671875, 27.952880859375, 28.953125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 22.0, 120.0, 383.0, 354.0, 111.0, 22.0, 2.0, 1.0, 0.0, 1.0], "bins": [-128.77508544921875, -126.50971984863281, -124.24435424804688, -121.97898864746094, -119.713623046875, -117.44825744628906, -115.18289184570312, -112.91753387451172, -110.65216827392578, -108.38680267333984, -106.1214370727539, -103.85607147216797, -101.59070587158203, -99.32534790039062, -97.05998229980469, -94.79461669921875, -92.52925109863281, -90.26388549804688, -87.99851989746094, -85.733154296875, -83.46778869628906, -81.20242309570312, -78.93705749511719, -76.67169952392578, -74.40632629394531, -72.14096069335938, -69.87559509277344, -67.6102294921875, -65.34486389160156, -63.07950210571289, -60.81413650512695, -58.548770904541016, -56.283409118652344, -54.018043518066406, -51.75267791748047, -49.48731231689453, -47.22195053100586, -44.95658493041992, -42.691219329833984, -40.42585372924805, -38.16048812866211, -35.89512252807617, -33.629756927490234, -31.36439323425293, -29.099029541015625, -26.833663940429688, -24.56829833984375, -22.302932739257812, -20.037569046020508, -17.77220344543457, -15.506839752197266, -13.241474151611328, -10.976109504699707, -8.710744857788086, -6.445379257202148, -4.180014610290527, -1.9146499633789062, 0.35071492195129395, 2.616079807281494, 4.881444931030273, 7.1468095779418945, 9.412174224853516, 11.677539825439453, 13.942904472351074, 16.208269119262695]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 9.0, 5.0, 5.0, 12.0, 10.0, 7.0, 11.0, 11.0, 17.0, 15.0, 28.0, 31.0, 31.0, 30.0, 33.0, 33.0, 36.0, 49.0, 36.0, 33.0, 40.0, 35.0, 32.0, 44.0, 44.0, 27.0, 35.0, 35.0, 37.0, 33.0, 26.0, 26.0, 13.0, 23.0, 22.0, 11.0, 13.0, 11.0, 8.0, 6.0, 5.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-36.420597076416016, -35.336246490478516, -34.25189971923828, -33.16754913330078, -32.08319854736328, -30.99884796142578, -29.914499282836914, -28.830150604248047, -27.745800018310547, -26.661449432373047, -25.57710075378418, -24.492752075195312, -23.408401489257812, -22.324050903320312, -21.239702224731445, -20.155353546142578, -19.071002960205078, -17.986652374267578, -16.90230369567871, -15.817954063415527, -14.733604431152344, -13.64925479888916, -12.564905166625977, -11.480555534362793, -10.39620590209961, -9.311856269836426, -8.227506637573242, -7.143157005310059, -6.058807373046875, -4.974457740783691, -3.890108108520508, -2.805758476257324, -1.7214126586914062, -0.6370630264282227, 0.44728660583496094, 1.5316362380981445, 2.615985870361328, 3.7003355026245117, 4.784685134887695, 5.869034767150879, 6.9533843994140625, 8.037734031677246, 9.12208366394043, 10.206433296203613, 11.290782928466797, 12.37513256072998, 13.459482192993164, 14.543831825256348, 15.628181457519531, 16.71253204345703, 17.7968807220459, 18.881229400634766, 19.965579986572266, 21.049930572509766, 22.134279251098633, 23.2186279296875, 24.302978515625, 25.3873291015625, 26.471677780151367, 27.556026458740234, 28.640377044677734, 29.724727630615234, 30.8090763092041, 31.89342498779297, 32.97777557373047]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 2.0, 9.0, 9.0, 16.0, 11.0, 13.0, 21.0, 17.0, 21.0, 28.0, 42.0, 37.0, 33.0, 39.0, 50.0, 35.0, 42.0, 50.0, 53.0, 41.0, 44.0, 42.0, 34.0, 39.0, 32.0, 25.0, 32.0, 33.0, 23.0, 19.0, 20.0, 14.0, 13.0, 11.0, 8.0, 8.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.25390625, -5.09564208984375, -4.9373779296875, -4.77911376953125, -4.620849609375, -4.46258544921875, -4.3043212890625, -4.14605712890625, -3.98779296875, -3.82952880859375, -3.6712646484375, -3.51300048828125, -3.354736328125, -3.19647216796875, -3.0382080078125, -2.87994384765625, -2.7216796875, -2.56341552734375, -2.4051513671875, -2.24688720703125, -2.088623046875, -1.93035888671875, -1.7720947265625, -1.61383056640625, -1.45556640625, -1.29730224609375, -1.1390380859375, -0.98077392578125, -0.822509765625, -0.66424560546875, -0.5059814453125, -0.34771728515625, -0.189453125, -0.03118896484375, 0.1270751953125, 0.28533935546875, 0.443603515625, 0.60186767578125, 0.7601318359375, 0.91839599609375, 1.07666015625, 1.23492431640625, 1.3931884765625, 1.55145263671875, 1.709716796875, 1.86798095703125, 2.0262451171875, 2.18450927734375, 2.3427734375, 2.50103759765625, 2.6593017578125, 2.81756591796875, 2.975830078125, 3.13409423828125, 3.2923583984375, 3.45062255859375, 3.60888671875, 3.76715087890625, 3.9254150390625, 4.08367919921875, 4.241943359375, 4.40020751953125, 4.5584716796875, 4.71673583984375, 4.875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 4.0, 7.0, 3.0, 11.0, 5.0, 7.0, 18.0, 24.0, 11.0, 26.0, 29.0, 39.0, 42.0, 61.0, 81.0, 156.0, 373.0, 1545.0, 9986.0, 131384.0, 1956813.0, 1946742.0, 133866.0, 10468.0, 1606.0, 425.0, 164.0, 85.0, 60.0, 46.0, 28.0, 29.0, 28.0, 20.0, 21.0, 17.0, 8.0, 8.0, 7.0, 8.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.314697265625, -10.94970703125, -10.584716796875, -10.2197265625, -9.854736328125, -9.48974609375, -9.124755859375, -8.759765625, -8.394775390625, -8.02978515625, -7.664794921875, -7.2998046875, -6.934814453125, -6.56982421875, -6.204833984375, -5.83984375, -5.474853515625, -5.10986328125, -4.744873046875, -4.3798828125, -4.014892578125, -3.64990234375, -3.284912109375, -2.919921875, -2.554931640625, -2.18994140625, -1.824951171875, -1.4599609375, -1.094970703125, -0.72998046875, -0.364990234375, 0.0, 0.364990234375, 0.72998046875, 1.094970703125, 1.4599609375, 1.824951171875, 2.18994140625, 2.554931640625, 2.919921875, 3.284912109375, 3.64990234375, 4.014892578125, 4.3798828125, 4.744873046875, 5.10986328125, 5.474853515625, 5.83984375, 6.204833984375, 6.56982421875, 6.934814453125, 7.2998046875, 7.664794921875, 8.02978515625, 8.394775390625, 8.759765625, 9.124755859375, 9.48974609375, 9.854736328125, 10.2197265625, 10.584716796875, 10.94970703125, 11.314697265625, 11.6796875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 10.0, 12.0, 13.0, 17.0, 20.0, 26.0, 43.0, 37.0, 57.0, 77.0, 105.0, 124.0, 173.0, 256.0, 372.0, 388.0, 448.0, 447.0, 353.0, 272.0, 207.0, 138.0, 113.0, 84.0, 66.0, 42.0, 38.0, 28.0, 26.0, 22.0, 9.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.56640625, -7.34814453125, -7.1298828125, -6.91162109375, -6.693359375, -6.47509765625, -6.2568359375, -6.03857421875, -5.8203125, -5.60205078125, -5.3837890625, -5.16552734375, -4.947265625, -4.72900390625, -4.5107421875, -4.29248046875, -4.07421875, -3.85595703125, -3.6376953125, -3.41943359375, -3.201171875, -2.98291015625, -2.7646484375, -2.54638671875, -2.328125, -2.10986328125, -1.8916015625, -1.67333984375, -1.455078125, -1.23681640625, -1.0185546875, -0.80029296875, -0.58203125, -0.36376953125, -0.1455078125, 0.07275390625, 0.291015625, 0.50927734375, 0.7275390625, 0.94580078125, 1.1640625, 1.38232421875, 1.6005859375, 1.81884765625, 2.037109375, 2.25537109375, 2.4736328125, 2.69189453125, 2.91015625, 3.12841796875, 3.3466796875, 3.56494140625, 3.783203125, 4.00146484375, 4.2197265625, 4.43798828125, 4.65625, 4.87451171875, 5.0927734375, 5.31103515625, 5.529296875, 5.74755859375, 5.9658203125, 6.18408203125, 6.40234375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 12.0, 20.0, 24.0, 31.0, 45.0, 66.0, 89.0, 104.0, 140.0, 255.0, 344.0, 679.0, 2541.0, 52063.0, 2939981.0, 1173490.0, 21108.0, 1641.0, 552.0, 331.0, 207.0, 137.0, 101.0, 68.0, 59.0, 43.0, 34.0, 21.0, 12.0, 19.0, 14.0, 4.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.609375, -21.8525390625, -21.095703125, -20.3388671875, -19.58203125, -18.8251953125, -18.068359375, -17.3115234375, -16.5546875, -15.7978515625, -15.041015625, -14.2841796875, -13.52734375, -12.7705078125, -12.013671875, -11.2568359375, -10.5, -9.7431640625, -8.986328125, -8.2294921875, -7.47265625, -6.7158203125, -5.958984375, -5.2021484375, -4.4453125, -3.6884765625, -2.931640625, -2.1748046875, -1.41796875, -0.6611328125, 0.095703125, 0.8525390625, 1.609375, 2.3662109375, 3.123046875, 3.8798828125, 4.63671875, 5.3935546875, 6.150390625, 6.9072265625, 7.6640625, 8.4208984375, 9.177734375, 9.9345703125, 10.69140625, 11.4482421875, 12.205078125, 12.9619140625, 13.71875, 14.4755859375, 15.232421875, 15.9892578125, 16.74609375, 17.5029296875, 18.259765625, 19.0166015625, 19.7734375, 20.5302734375, 21.287109375, 22.0439453125, 22.80078125, 23.5576171875, 24.314453125, 25.0712890625, 25.828125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 10.0, 39.0, 131.0, 253.0, 318.0, 173.0, 72.0, 18.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.6399154663086, -86.26260375976562, -83.88529205322266, -81.50798034667969, -79.13066864013672, -76.75335693359375, -74.37604522705078, -71.99873352050781, -69.62142944335938, -67.2441177368164, -64.86680603027344, -62.48949432373047, -60.1121826171875, -57.73487091064453, -55.35756301879883, -52.98025131225586, -50.602935791015625, -48.225624084472656, -45.84831237792969, -43.47100067138672, -41.09368896484375, -38.71637725830078, -36.33906936645508, -33.96175765991211, -31.58444595336914, -29.207134246826172, -26.829822540283203, -24.452512741088867, -22.0752010345459, -19.69788932800293, -17.320579528808594, -14.943267822265625, -12.565963745117188, -10.188652038574219, -7.811341285705566, -5.434030055999756, -3.0567188262939453, -0.6794071197509766, 1.6979036331176758, 4.075214385986328, 6.452526092529297, 8.829837799072266, 11.207148551940918, 13.58445930480957, 15.961771011352539, 18.339082717895508, 20.716392517089844, 23.093704223632812, 25.47101593017578, 27.84832763671875, 30.22563934326172, 32.60295104980469, 34.980262756347656, 37.357574462890625, 39.73488235473633, 42.1121940612793, 44.489505767822266, 46.866817474365234, 49.2441291809082, 51.62144088745117, 53.998748779296875, 56.376060485839844, 58.75337219238281, 61.13068389892578, 63.50799560546875]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 6.0, 9.0, 7.0, 13.0, 8.0, 15.0, 17.0, 21.0, 21.0, 24.0, 33.0, 21.0, 34.0, 26.0, 36.0, 43.0, 39.0, 49.0, 38.0, 46.0, 38.0, 48.0, 41.0, 38.0, 46.0, 28.0, 40.0, 25.0, 37.0, 19.0, 24.0, 24.0, 17.0, 10.0, 6.0, 12.0, 7.0, 10.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.472126007080078, -24.712486267089844, -23.95284652709961, -23.193206787109375, -22.43356704711914, -21.673927307128906, -20.914287567138672, -20.154647827148438, -19.395008087158203, -18.63536834716797, -17.875728607177734, -17.1160888671875, -16.356449127197266, -15.596809387207031, -14.837169647216797, -14.077529907226562, -13.317890167236328, -12.558250427246094, -11.79861068725586, -11.038970947265625, -10.27933120727539, -9.519691467285156, -8.760051727294922, -8.000411987304688, -7.240772247314453, -6.481132507324219, -5.721492767333984, -4.96185302734375, -4.202213287353516, -3.4425735473632812, -2.682933807373047, -1.9232940673828125, -1.1636543273925781, -0.40401458740234375, 0.3556251525878906, 1.115264892578125, 1.8749046325683594, 2.6345443725585938, 3.394184112548828, 4.1538238525390625, 4.913463592529297, 5.673103332519531, 6.432743072509766, 7.1923828125, 7.952022552490234, 8.711662292480469, 9.471302032470703, 10.230941772460938, 10.990581512451172, 11.750221252441406, 12.50986099243164, 13.269500732421875, 14.02914047241211, 14.788780212402344, 15.548419952392578, 16.308059692382812, 17.067699432373047, 17.82733917236328, 18.586978912353516, 19.34661865234375, 20.106258392333984, 20.86589813232422, 21.625537872314453, 22.385177612304688, 23.144817352294922]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 11.0, 15.0, 12.0, 26.0, 20.0, 23.0, 28.0, 21.0, 40.0, 33.0, 42.0, 37.0, 40.0, 42.0, 44.0, 47.0, 43.0, 45.0, 43.0, 31.0, 42.0, 39.0, 25.0, 35.0, 24.0, 21.0, 19.0, 18.0, 23.0, 15.0, 13.0, 10.0, 12.0, 7.0, 3.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.703125, -4.55908203125, -4.4150390625, -4.27099609375, -4.126953125, -3.98291015625, -3.8388671875, -3.69482421875, -3.55078125, -3.40673828125, -3.2626953125, -3.11865234375, -2.974609375, -2.83056640625, -2.6865234375, -2.54248046875, -2.3984375, -2.25439453125, -2.1103515625, -1.96630859375, -1.822265625, -1.67822265625, -1.5341796875, -1.39013671875, -1.24609375, -1.10205078125, -0.9580078125, -0.81396484375, -0.669921875, -0.52587890625, -0.3818359375, -0.23779296875, -0.09375, 0.05029296875, 0.1943359375, 0.33837890625, 0.482421875, 0.62646484375, 0.7705078125, 0.91455078125, 1.05859375, 1.20263671875, 1.3466796875, 1.49072265625, 1.634765625, 1.77880859375, 1.9228515625, 2.06689453125, 2.2109375, 2.35498046875, 2.4990234375, 2.64306640625, 2.787109375, 2.93115234375, 3.0751953125, 3.21923828125, 3.36328125, 3.50732421875, 3.6513671875, 3.79541015625, 3.939453125, 4.08349609375, 4.2275390625, 4.37158203125, 4.515625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 13.0, 18.0, 18.0, 23.0, 42.0, 63.0, 89.0, 169.0, 191.0, 328.0, 589.0, 971.0, 1563.0, 2624.0, 4482.0, 7968.0, 13795.0, 24434.0, 44600.0, 81900.0, 147439.0, 226588.0, 208116.0, 125901.0, 69598.0, 37734.0, 20909.0, 11785.0, 6788.0, 3880.0, 2259.0, 1358.0, 865.0, 511.0, 350.0, 202.0, 135.0, 102.0, 53.0, 32.0, 23.0, 16.0, 5.0, 8.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.5751953125, -0.5586967468261719, -0.5421981811523438, -0.5256996154785156, -0.5092010498046875, -0.4927024841308594, -0.47620391845703125, -0.4597053527832031, -0.443206787109375, -0.4267082214355469, -0.41020965576171875, -0.3937110900878906, -0.3772125244140625, -0.3607139587402344, -0.34421539306640625, -0.3277168273925781, -0.31121826171875, -0.2947196960449219, -0.27822113037109375, -0.2617225646972656, -0.2452239990234375, -0.22872543334960938, -0.21222686767578125, -0.19572830200195312, -0.179229736328125, -0.16273117065429688, -0.14623260498046875, -0.12973403930664062, -0.1132354736328125, -0.09673690795898438, -0.08023834228515625, -0.06373977661132812, -0.0472412109375, -0.030742645263671875, -0.01424407958984375, 0.002254486083984375, 0.0187530517578125, 0.035251617431640625, 0.05175018310546875, 0.06824874877929688, 0.084747314453125, 0.10124588012695312, 0.11774444580078125, 0.13424301147460938, 0.1507415771484375, 0.16724014282226562, 0.18373870849609375, 0.20023727416992188, 0.21673583984375, 0.23323440551757812, 0.24973297119140625, 0.2662315368652344, 0.2827301025390625, 0.2992286682128906, 0.31572723388671875, 0.3322257995605469, 0.348724365234375, 0.3652229309082031, 0.38172149658203125, 0.3982200622558594, 0.4147186279296875, 0.4312171936035156, 0.44771575927734375, 0.4642143249511719, 0.480712890625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 7.0, 10.0, 11.0, 12.0, 17.0, 20.0, 11.0, 27.0, 23.0, 32.0, 37.0, 31.0, 52.0, 30.0, 38.0, 31.0, 40.0, 41.0, 1058.0, 43.0, 33.0, 44.0, 34.0, 30.0, 35.0, 29.0, 30.0, 36.0, 17.0, 27.0, 16.0, 19.0, 17.0, 15.0, 10.0, 11.0, 8.0, 9.0, 5.0, 9.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.1953125, -3.10491943359375, -3.0145263671875, -2.92413330078125, -2.833740234375, -2.74334716796875, -2.6529541015625, -2.56256103515625, -2.47216796875, -2.38177490234375, -2.2913818359375, -2.20098876953125, -2.110595703125, -2.02020263671875, -1.9298095703125, -1.83941650390625, -1.7490234375, -1.65863037109375, -1.5682373046875, -1.47784423828125, -1.387451171875, -1.29705810546875, -1.2066650390625, -1.11627197265625, -1.02587890625, -0.93548583984375, -0.8450927734375, -0.75469970703125, -0.664306640625, -0.57391357421875, -0.4835205078125, -0.39312744140625, -0.302734375, -0.21234130859375, -0.1219482421875, -0.03155517578125, 0.058837890625, 0.14923095703125, 0.2396240234375, 0.33001708984375, 0.42041015625, 0.51080322265625, 0.6011962890625, 0.69158935546875, 0.781982421875, 0.87237548828125, 0.9627685546875, 1.05316162109375, 1.1435546875, 1.23394775390625, 1.3243408203125, 1.41473388671875, 1.505126953125, 1.59552001953125, 1.6859130859375, 1.77630615234375, 1.86669921875, 1.95709228515625, 2.0474853515625, 2.13787841796875, 2.228271484375, 2.31866455078125, 2.4090576171875, 2.49945068359375, 2.58984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 6.0, 4.0, 20.0, 21.0, 31.0, 50.0, 96.0, 102.0, 177.0, 226.0, 316.0, 436.0, 594.0, 938.0, 1260.0, 1737.0, 2470.0, 3583.0, 5115.0, 7318.0, 10625.0, 15274.0, 22148.0, 32633.0, 47083.0, 67356.0, 93478.0, 124041.0, 1187908.0, 132726.0, 101039.0, 72759.0, 51060.0, 35566.0, 24439.0, 16608.0, 11517.0, 7935.0, 5384.0, 3851.0, 2722.0, 1858.0, 1359.0, 971.0, 653.0, 535.0, 351.0, 254.0, 176.0, 115.0, 80.0, 52.0, 27.0, 25.0, 12.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.252197265625, -0.24422073364257812, -0.23624420166015625, -0.22826766967773438, -0.2202911376953125, -0.21231460571289062, -0.20433807373046875, -0.19636154174804688, -0.188385009765625, -0.18040847778320312, -0.17243194580078125, -0.16445541381835938, -0.1564788818359375, -0.14850234985351562, -0.14052581787109375, -0.13254928588867188, -0.12457275390625, -0.11659622192382812, -0.10861968994140625, -0.10064315795898438, -0.0926666259765625, -0.08469009399414062, -0.07671356201171875, -0.06873703002929688, -0.060760498046875, -0.052783966064453125, -0.04480743408203125, -0.036830902099609375, -0.0288543701171875, -0.020877838134765625, -0.01290130615234375, -0.004924774169921875, 0.0030517578125, 0.011028289794921875, 0.01900482177734375, 0.026981353759765625, 0.0349578857421875, 0.042934417724609375, 0.05091094970703125, 0.058887481689453125, 0.066864013671875, 0.07484054565429688, 0.08281707763671875, 0.09079360961914062, 0.0987701416015625, 0.10674667358398438, 0.11472320556640625, 0.12269973754882812, 0.13067626953125, 0.13865280151367188, 0.14662933349609375, 0.15460586547851562, 0.1625823974609375, 0.17055892944335938, 0.17853546142578125, 0.18651199340820312, 0.194488525390625, 0.20246505737304688, 0.21044158935546875, 0.21841812133789062, 0.2263946533203125, 0.23437118530273438, 0.24234771728515625, 0.2503242492675781, 0.25830078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 7.0, 10.0, 5.0, 10.0, 9.0, 11.0, 14.0, 25.0, 28.0, 50.0, 49.0, 98.0, 104.0, 123.0, 120.0, 70.0, 61.0, 42.0, 25.0, 28.0, 11.0, 10.0, 12.0, 9.0, 10.0, 7.0, 3.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005950927734375, -0.005760610103607178, -0.0055702924728393555, -0.005379974842071533, -0.005189657211303711, -0.004999339580535889, -0.004809021949768066, -0.004618704319000244, -0.004428386688232422, -0.0042380690574646, -0.004047751426696777, -0.003857433795928955, -0.003667116165161133, -0.0034767985343933105, -0.0032864809036254883, -0.003096163272857666, -0.0029058456420898438, -0.0027155280113220215, -0.0025252103805541992, -0.002334892749786377, -0.0021445751190185547, -0.0019542574882507324, -0.0017639398574829102, -0.0015736222267150879, -0.0013833045959472656, -0.0011929869651794434, -0.001002669334411621, -0.0008123517036437988, -0.0006220340728759766, -0.0004317164421081543, -0.00024139881134033203, -5.1081180572509766e-05, 0.0001392364501953125, 0.00032955408096313477, 0.000519871711730957, 0.0007101893424987793, 0.0009005069732666016, 0.0010908246040344238, 0.001281142234802246, 0.0014714598655700684, 0.0016617774963378906, 0.0018520951271057129, 0.002042412757873535, 0.0022327303886413574, 0.0024230480194091797, 0.002613365650177002, 0.0028036832809448242, 0.0029940009117126465, 0.0031843185424804688, 0.003374636173248291, 0.0035649538040161133, 0.0037552714347839355, 0.003945589065551758, 0.00413590669631958, 0.004326224327087402, 0.004516541957855225, 0.004706859588623047, 0.004897177219390869, 0.005087494850158691, 0.005277812480926514, 0.005468130111694336, 0.005658447742462158, 0.0058487653732299805, 0.006039083003997803, 0.006229400634765625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 4.0, 8.0, 16.0, 17.0, 15.0, 22.0, 27.0, 49.0, 48.0, 97.0, 172.0, 281.0, 761.0, 312645.0, 732629.0, 945.0, 293.0, 165.0, 92.0, 47.0, 44.0, 20.0, 29.0, 19.0, 19.0, 13.0, 7.0, 11.0, 9.0, 10.0, 5.0, 2.0, 7.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1400146484375, -0.13590145111083984, -0.1317882537841797, -0.12767505645751953, -0.12356185913085938, -0.11944866180419922, -0.11533546447753906, -0.1112222671508789, -0.10710906982421875, -0.1029958724975586, -0.09888267517089844, -0.09476947784423828, -0.09065628051757812, -0.08654308319091797, -0.08242988586425781, -0.07831668853759766, -0.0742034912109375, -0.07009029388427734, -0.06597709655761719, -0.06186389923095703, -0.057750701904296875, -0.05363750457763672, -0.04952430725097656, -0.045411109924316406, -0.04129791259765625, -0.037184715270996094, -0.03307151794433594, -0.02895832061767578, -0.024845123291015625, -0.02073192596435547, -0.016618728637695312, -0.012505531311035156, -0.008392333984375, -0.004279136657714844, -0.0001659393310546875, 0.003947257995605469, 0.008060455322265625, 0.012173652648925781, 0.016286849975585938, 0.020400047302246094, 0.02451324462890625, 0.028626441955566406, 0.03273963928222656, 0.03685283660888672, 0.040966033935546875, 0.04507923126220703, 0.04919242858886719, 0.053305625915527344, 0.0574188232421875, 0.061532020568847656, 0.06564521789550781, 0.06975841522216797, 0.07387161254882812, 0.07798480987548828, 0.08209800720214844, 0.0862112045288086, 0.09032440185546875, 0.0944375991821289, 0.09855079650878906, 0.10266399383544922, 0.10677719116210938, 0.11089038848876953, 0.11500358581542969, 0.11911678314208984, 0.12322998046875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [10.0, 89.0, 608.0, 271.0, 31.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018283004174008965, -0.0011512056225910783, -0.00047411082778126, 0.00020298396702855825, 0.0008800787618383765, 0.0015571735566481948, 0.002234268467873335, 0.002911363262683153, 0.0035884580574929714, 0.00426555285230279, 0.004942647647112608, 0.005619742441922426, 0.0062968372367322445, 0.006973932031542063, 0.007651026826351881, 0.008328121155500412, 0.00900521595031023, 0.009682310745120049, 0.010359405539929867, 0.011036500334739685, 0.011713595129549503, 0.012390689924359322, 0.01306778471916914, 0.013744879513978958, 0.014421974308788776, 0.015099069103598595, 0.015776164829730988, 0.01645325869321823, 0.017130352556705475, 0.017807448282837868, 0.01848454400897026, 0.019161637872457504, 0.019838731735944748, 0.02051582559943199, 0.021192921325564384, 0.021870017051696777, 0.02254711091518402, 0.023224204778671265, 0.023901300504803658, 0.02457839623093605, 0.025255490094423294, 0.025932583957910538, 0.02660967968404293, 0.027286775410175323, 0.027963869273662567, 0.02864096313714981, 0.029318058863282204, 0.029995154589414597, 0.03067224845290184, 0.031349342316389084, 0.032026439905166626, 0.03270353376865387, 0.03338062763214111, 0.03405772149562836, 0.0347348153591156, 0.03541191294789314, 0.036089006811380386, 0.03676610067486763, 0.03744319826364517, 0.038120292127132416, 0.03879738599061966, 0.0394744798541069, 0.04015157371759415, 0.04082867130637169, 0.04150576516985893]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 8.0, 10.0, 8.0, 16.0, 20.0, 17.0, 16.0, 18.0, 23.0, 25.0, 28.0, 26.0, 36.0, 36.0, 39.0, 34.0, 40.0, 49.0, 29.0, 31.0, 41.0, 47.0, 39.0, 35.0, 43.0, 38.0, 30.0, 36.0, 24.0, 25.0, 17.0, 18.0, 15.0, 21.0, 14.0, 8.0, 7.0, 6.0, 10.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031104683876037598, -0.003012058325111866, -0.0029136482626199722, -0.0028152382001280785, -0.0027168281376361847, -0.002618418075144291, -0.002520008012652397, -0.0024215979501605034, -0.0023231878876686096, -0.002224777825176716, -0.002126367762684822, -0.0020279577001929283, -0.0019295476377010345, -0.0018311375752091408, -0.001732727512717247, -0.0016343174502253532, -0.0015359073877334595, -0.0014374973252415657, -0.001339087262749672, -0.0012406772002577782, -0.0011422671377658844, -0.0010438570752739906, -0.0009454470127820969, -0.0008470369502902031, -0.0007486268877983093, -0.0006502168253064156, -0.0005518067628145218, -0.000453396700322628, -0.00035498663783073425, -0.0002565765753388405, -0.00015816651284694672, -5.975645035505295e-05, 3.865361213684082e-05, 0.0001370636746287346, 0.00023547373712062836, 0.0003338837996125221, 0.0004322938621044159, 0.0005307039245963097, 0.0006291139870882034, 0.0007275240495800972, 0.000825934112071991, 0.0009243441745638847, 0.0010227542370557785, 0.0011211642995476723, 0.001219574362039566, 0.0013179844245314598, 0.0014163944870233536, 0.0015148045495152473, 0.0016132146120071411, 0.0017116246744990349, 0.0018100347369909286, 0.0019084447994828224, 0.002006854861974716, 0.00210526492446661, 0.0022036749869585037, 0.0023020850494503975, 0.0024004951119422913, 0.002498905174434185, 0.002597315236926079, 0.0026957252994179726, 0.0027941353619098663, 0.00289254542440176, 0.002990955486893654, 0.0030893655493855476, 0.0031877756118774414]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 11.0, 15.0, 12.0, 26.0, 20.0, 23.0, 28.0, 21.0, 40.0, 33.0, 42.0, 37.0, 40.0, 42.0, 44.0, 47.0, 43.0, 45.0, 43.0, 31.0, 42.0, 39.0, 25.0, 35.0, 24.0, 21.0, 19.0, 17.0, 24.0, 15.0, 13.0, 10.0, 12.0, 7.0, 3.0, 5.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.703125, -4.55908203125, -4.4150390625, -4.27099609375, -4.126953125, -3.98291015625, -3.8388671875, -3.69482421875, -3.55078125, -3.40673828125, -3.2626953125, -3.11865234375, -2.974609375, -2.83056640625, -2.6865234375, -2.54248046875, -2.3984375, -2.25439453125, -2.1103515625, -1.96630859375, -1.822265625, -1.67822265625, -1.5341796875, -1.39013671875, -1.24609375, -1.10205078125, -0.9580078125, -0.81396484375, -0.669921875, -0.52587890625, -0.3818359375, -0.23779296875, -0.09375, 0.05029296875, 0.1943359375, 0.33837890625, 0.482421875, 0.62646484375, 0.7705078125, 0.91455078125, 1.05859375, 1.20263671875, 1.3466796875, 1.49072265625, 1.634765625, 1.77880859375, 1.9228515625, 2.06689453125, 2.2109375, 2.35498046875, 2.4990234375, 2.64306640625, 2.787109375, 2.93115234375, 3.0751953125, 3.21923828125, 3.36328125, 3.50732421875, 3.6513671875, 3.79541015625, 3.939453125, 4.08349609375, 4.2275390625, 4.37158203125, 4.515625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 7.0, 9.0, 15.0, 16.0, 19.0, 24.0, 35.0, 47.0, 74.0, 65.0, 107.0, 142.0, 205.0, 338.0, 650.0, 1729.0, 6949.0, 31052.0, 176923.0, 640838.0, 152157.0, 27748.0, 6189.0, 1562.0, 558.0, 304.0, 201.0, 136.0, 103.0, 74.0, 58.0, 57.0, 35.0, 26.0, 23.0, 17.0, 10.0, 13.0, 5.0, 6.0, 5.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.125, -8.852294921875, -8.57958984375, -8.306884765625, -8.0341796875, -7.761474609375, -7.48876953125, -7.216064453125, -6.943359375, -6.670654296875, -6.39794921875, -6.125244140625, -5.8525390625, -5.579833984375, -5.30712890625, -5.034423828125, -4.76171875, -4.489013671875, -4.21630859375, -3.943603515625, -3.6708984375, -3.398193359375, -3.12548828125, -2.852783203125, -2.580078125, -2.307373046875, -2.03466796875, -1.761962890625, -1.4892578125, -1.216552734375, -0.94384765625, -0.671142578125, -0.3984375, -0.125732421875, 0.14697265625, 0.419677734375, 0.6923828125, 0.965087890625, 1.23779296875, 1.510498046875, 1.783203125, 2.055908203125, 2.32861328125, 2.601318359375, 2.8740234375, 3.146728515625, 3.41943359375, 3.692138671875, 3.96484375, 4.237548828125, 4.51025390625, 4.782958984375, 5.0556640625, 5.328369140625, 5.60107421875, 5.873779296875, 6.146484375, 6.419189453125, 6.69189453125, 6.964599609375, 7.2373046875, 7.510009765625, 7.78271484375, 8.055419921875, 8.328125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 10.0, 5.0, 3.0, 4.0, 1.0, 6.0, 10.0, 11.0, 8.0, 18.0, 23.0, 21.0, 22.0, 30.0, 26.0, 32.0, 46.0, 40.0, 60.0, 90.0, 189.0, 1491.0, 350.0, 113.0, 74.0, 44.0, 38.0, 47.0, 43.0, 37.0, 21.0, 30.0, 34.0, 20.0, 19.0, 9.0, 13.0, 2.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5, -13.995849609375, -13.49169921875, -12.987548828125, -12.4833984375, -11.979248046875, -11.47509765625, -10.970947265625, -10.466796875, -9.962646484375, -9.45849609375, -8.954345703125, -8.4501953125, -7.946044921875, -7.44189453125, -6.937744140625, -6.43359375, -5.929443359375, -5.42529296875, -4.921142578125, -4.4169921875, -3.912841796875, -3.40869140625, -2.904541015625, -2.400390625, -1.896240234375, -1.39208984375, -0.887939453125, -0.3837890625, 0.120361328125, 0.62451171875, 1.128662109375, 1.6328125, 2.136962890625, 2.64111328125, 3.145263671875, 3.6494140625, 4.153564453125, 4.65771484375, 5.161865234375, 5.666015625, 6.170166015625, 6.67431640625, 7.178466796875, 7.6826171875, 8.186767578125, 8.69091796875, 9.195068359375, 9.69921875, 10.203369140625, 10.70751953125, 11.211669921875, 11.7158203125, 12.219970703125, 12.72412109375, 13.228271484375, 13.732421875, 14.236572265625, 14.74072265625, 15.244873046875, 15.7490234375, 16.253173828125, 16.75732421875, 17.261474609375, 17.765625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 8.0, 13.0, 24.0, 31.0, 28.0, 52.0, 38.0, 50.0, 80.0, 110.0, 150.0, 249.0, 583.0, 1932.0, 26844.0, 3063242.0, 48428.0, 2332.0, 627.0, 275.0, 139.0, 108.0, 65.0, 53.0, 52.0, 28.0, 31.0, 24.0, 20.0, 16.0, 12.0, 6.0, 7.0, 4.0, 8.0, 3.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-38.0, -36.900390625, -35.80078125, -34.701171875, -33.6015625, -32.501953125, -31.40234375, -30.302734375, -29.203125, -28.103515625, -27.00390625, -25.904296875, -24.8046875, -23.705078125, -22.60546875, -21.505859375, -20.40625, -19.306640625, -18.20703125, -17.107421875, -16.0078125, -14.908203125, -13.80859375, -12.708984375, -11.609375, -10.509765625, -9.41015625, -8.310546875, -7.2109375, -6.111328125, -5.01171875, -3.912109375, -2.8125, -1.712890625, -0.61328125, 0.486328125, 1.5859375, 2.685546875, 3.78515625, 4.884765625, 5.984375, 7.083984375, 8.18359375, 9.283203125, 10.3828125, 11.482421875, 12.58203125, 13.681640625, 14.78125, 15.880859375, 16.98046875, 18.080078125, 19.1796875, 20.279296875, 21.37890625, 22.478515625, 23.578125, 24.677734375, 25.77734375, 26.876953125, 27.9765625, 29.076171875, 30.17578125, 31.275390625, 32.375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 9.0, 144.0, 711.0, 149.0, 4.0, 1.0], "bins": [-221.3907928466797, -217.72946166992188, -214.06814575195312, -210.4068145751953, -206.74549865722656, -203.08416748046875, -199.4228515625, -195.7615203857422, -192.10020446777344, -188.43887329101562, -184.77755737304688, -181.11622619628906, -177.4549102783203, -173.7935791015625, -170.13226318359375, -166.47093200683594, -162.80960083007812, -159.1482696533203, -155.48695373535156, -151.82562255859375, -148.164306640625, -144.5029754638672, -140.84165954589844, -137.18032836914062, -133.51901245117188, -129.85768127441406, -126.19636535644531, -122.53504180908203, -118.87371826171875, -115.21238708496094, -111.55107116699219, -107.88973999023438, -104.2284164428711, -100.56709289550781, -96.90576934814453, -93.24444580078125, -89.58312225341797, -85.92179870605469, -82.26046752929688, -78.5991439819336, -74.93782043457031, -71.27649688720703, -67.61517333984375, -63.95384979248047, -60.29252243041992, -56.63119888305664, -52.96987533569336, -49.30854797363281, -45.6472282409668, -41.985904693603516, -38.324581146240234, -34.66325378417969, -31.001930236816406, -27.340606689453125, -23.679283142089844, -20.01795768737793, -16.35663414001465, -12.69530963897705, -9.033985137939453, -5.372661590576172, -1.7113370895385742, 1.9499874114990234, 5.611310958862305, 9.272636413574219, 12.9339599609375]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 10.0, 8.0, 14.0, 16.0, 15.0, 25.0, 28.0, 23.0, 17.0, 31.0, 34.0, 38.0, 27.0, 45.0, 42.0, 44.0, 53.0, 35.0, 44.0, 49.0, 38.0, 50.0, 29.0, 30.0, 28.0, 30.0, 28.0, 28.0, 27.0, 20.0, 19.0, 15.0, 14.0, 9.0, 6.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.35503005981445, -37.15213394165039, -35.949241638183594, -34.74634552001953, -33.54344940185547, -32.34055709838867, -31.13766098022461, -29.93476676940918, -28.73187255859375, -27.52897834777832, -26.32608413696289, -25.123188018798828, -23.9202938079834, -22.71739959716797, -21.514503479003906, -20.311609268188477, -19.108715057373047, -17.905820846557617, -16.702926635742188, -15.500030517578125, -14.297136306762695, -13.094242095947266, -11.89134693145752, -10.688451766967773, -9.485557556152344, -8.282663345336914, -7.079768180847168, -5.87687349319458, -4.673978805541992, -3.4710841178894043, -2.2681894302368164, -1.0652942657470703, 0.13759994506835938, 1.3404946327209473, 2.543389320373535, 3.746284008026123, 4.949178695678711, 6.152073383331299, 7.354968070983887, 8.557863235473633, 9.760757446289062, 10.963651657104492, 12.166546821594238, 13.369441986083984, 14.572336196899414, 15.775230407714844, 16.978126525878906, 18.181020736694336, 19.383914947509766, 20.586809158325195, 21.789703369140625, 22.992599487304688, 24.195493698120117, 25.398387908935547, 26.60128402709961, 27.80417823791504, 29.00707244873047, 30.2099666595459, 31.412860870361328, 32.61575698852539, 33.81864929199219, 35.02154541015625, 36.22444152832031, 37.427337646484375, 38.63022994995117]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 8.0, 7.0, 13.0, 14.0, 13.0, 21.0, 20.0, 25.0, 26.0, 34.0, 40.0, 32.0, 37.0, 43.0, 57.0, 56.0, 47.0, 34.0, 48.0, 49.0, 40.0, 33.0, 35.0, 29.0, 23.0, 31.0, 31.0, 21.0, 24.0, 20.0, 10.0, 14.0, 16.0, 8.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.96484375, -4.80511474609375, -4.6453857421875, -4.48565673828125, -4.325927734375, -4.16619873046875, -4.0064697265625, -3.84674072265625, -3.68701171875, -3.52728271484375, -3.3675537109375, -3.20782470703125, -3.048095703125, -2.88836669921875, -2.7286376953125, -2.56890869140625, -2.4091796875, -2.24945068359375, -2.0897216796875, -1.92999267578125, -1.770263671875, -1.61053466796875, -1.4508056640625, -1.29107666015625, -1.13134765625, -0.97161865234375, -0.8118896484375, -0.65216064453125, -0.492431640625, -0.33270263671875, -0.1729736328125, -0.01324462890625, 0.146484375, 0.30621337890625, 0.4659423828125, 0.62567138671875, 0.785400390625, 0.94512939453125, 1.1048583984375, 1.26458740234375, 1.42431640625, 1.58404541015625, 1.7437744140625, 1.90350341796875, 2.063232421875, 2.22296142578125, 2.3826904296875, 2.54241943359375, 2.7021484375, 2.86187744140625, 3.0216064453125, 3.18133544921875, 3.341064453125, 3.50079345703125, 3.6605224609375, 3.82025146484375, 3.97998046875, 4.13970947265625, 4.2994384765625, 4.45916748046875, 4.618896484375, 4.77862548828125, 4.9383544921875, 5.09808349609375, 5.2578125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 7.0, 8.0, 9.0, 8.0, 12.0, 13.0, 11.0, 30.0, 24.0, 35.0, 58.0, 91.0, 138.0, 299.0, 623.0, 1602.0, 5234.0, 25440.0, 222248.0, 1807983.0, 1862719.0, 233617.0, 26148.0, 5036.0, 1550.0, 633.0, 270.0, 130.0, 82.0, 46.0, 35.0, 22.0, 26.0, 17.0, 13.0, 12.0, 15.0, 13.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4140625, -9.1104736328125, -8.806884765625, -8.5032958984375, -8.19970703125, -7.8961181640625, -7.592529296875, -7.2889404296875, -6.9853515625, -6.6817626953125, -6.378173828125, -6.0745849609375, -5.77099609375, -5.4674072265625, -5.163818359375, -4.8602294921875, -4.556640625, -4.2530517578125, -3.949462890625, -3.6458740234375, -3.34228515625, -3.0386962890625, -2.735107421875, -2.4315185546875, -2.1279296875, -1.8243408203125, -1.520751953125, -1.2171630859375, -0.91357421875, -0.6099853515625, -0.306396484375, -0.0028076171875, 0.30078125, 0.6043701171875, 0.907958984375, 1.2115478515625, 1.51513671875, 1.8187255859375, 2.122314453125, 2.4259033203125, 2.7294921875, 3.0330810546875, 3.336669921875, 3.6402587890625, 3.94384765625, 4.2474365234375, 4.551025390625, 4.8546142578125, 5.158203125, 5.4617919921875, 5.765380859375, 6.0689697265625, 6.37255859375, 6.6761474609375, 6.979736328125, 7.2833251953125, 7.5869140625, 7.8905029296875, 8.194091796875, 8.4976806640625, 8.80126953125, 9.1048583984375, 9.408447265625, 9.7120361328125, 10.015625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 5.0, 11.0, 12.0, 15.0, 18.0, 20.0, 42.0, 55.0, 70.0, 78.0, 134.0, 157.0, 230.0, 295.0, 325.0, 417.0, 486.0, 383.0, 298.0, 255.0, 191.0, 140.0, 107.0, 67.0, 69.0, 44.0, 36.0, 21.0, 21.0, 11.0, 10.0, 8.0, 4.0, 10.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.09375, -7.877685546875, -7.66162109375, -7.445556640625, -7.2294921875, -7.013427734375, -6.79736328125, -6.581298828125, -6.365234375, -6.149169921875, -5.93310546875, -5.717041015625, -5.5009765625, -5.284912109375, -5.06884765625, -4.852783203125, -4.63671875, -4.420654296875, -4.20458984375, -3.988525390625, -3.7724609375, -3.556396484375, -3.34033203125, -3.124267578125, -2.908203125, -2.692138671875, -2.47607421875, -2.260009765625, -2.0439453125, -1.827880859375, -1.61181640625, -1.395751953125, -1.1796875, -0.963623046875, -0.74755859375, -0.531494140625, -0.3154296875, -0.099365234375, 0.11669921875, 0.332763671875, 0.548828125, 0.764892578125, 0.98095703125, 1.197021484375, 1.4130859375, 1.629150390625, 1.84521484375, 2.061279296875, 2.27734375, 2.493408203125, 2.70947265625, 2.925537109375, 3.1416015625, 3.357666015625, 3.57373046875, 3.789794921875, 4.005859375, 4.221923828125, 4.43798828125, 4.654052734375, 4.8701171875, 5.086181640625, 5.30224609375, 5.518310546875, 5.734375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 9.0, 2.0, 7.0, 4.0, 15.0, 4.0, 16.0, 26.0, 38.0, 47.0, 57.0, 80.0, 100.0, 164.0, 221.0, 306.0, 638.0, 1471.0, 5849.0, 49892.0, 948522.0, 2987179.0, 180249.0, 14578.0, 2546.0, 894.0, 435.0, 290.0, 190.0, 142.0, 87.0, 56.0, 41.0, 30.0, 21.0, 16.0, 22.0, 14.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.15625, -13.636474609375, -13.11669921875, -12.596923828125, -12.0771484375, -11.557373046875, -11.03759765625, -10.517822265625, -9.998046875, -9.478271484375, -8.95849609375, -8.438720703125, -7.9189453125, -7.399169921875, -6.87939453125, -6.359619140625, -5.83984375, -5.320068359375, -4.80029296875, -4.280517578125, -3.7607421875, -3.240966796875, -2.72119140625, -2.201416015625, -1.681640625, -1.161865234375, -0.64208984375, -0.122314453125, 0.3974609375, 0.917236328125, 1.43701171875, 1.956787109375, 2.4765625, 2.996337890625, 3.51611328125, 4.035888671875, 4.5556640625, 5.075439453125, 5.59521484375, 6.114990234375, 6.634765625, 7.154541015625, 7.67431640625, 8.194091796875, 8.7138671875, 9.233642578125, 9.75341796875, 10.273193359375, 10.79296875, 11.312744140625, 11.83251953125, 12.352294921875, 12.8720703125, 13.391845703125, 13.91162109375, 14.431396484375, 14.951171875, 15.470947265625, 15.99072265625, 16.510498046875, 17.0302734375, 17.550048828125, 18.06982421875, 18.589599609375, 19.109375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 16.0, 36.0, 133.0, 240.0, 254.0, 190.0, 105.0, 29.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.32569694519043, -17.063838958740234, -14.801979064941406, -12.540121078491211, -10.2782621383667, -8.016403198242188, -5.754545211791992, -3.4926862716674805, -1.2308273315429688, 1.0310313701629639, 3.2928900718688965, 5.55474853515625, 7.816607475280762, 10.078466415405273, 12.340324401855469, 14.60218334197998, 16.864042282104492, 19.125900268554688, 21.387760162353516, 23.64961814880371, 25.911476135253906, 28.173336029052734, 30.43519401550293, 32.697052001953125, 34.95891189575195, 37.22077178955078, 39.482627868652344, 41.74448776245117, 44.00634765625, 46.26820373535156, 48.53006362915039, 50.79192352294922, 53.05378723144531, 55.31564712524414, 57.5775032043457, 59.83936309814453, 62.10122299194336, 64.36308288574219, 66.62493896484375, 68.88679504394531, 71.1486587524414, 73.41051483154297, 75.67237854003906, 77.93423461914062, 80.19609069824219, 82.45795440673828, 84.71981048583984, 86.9816665649414, 89.2435302734375, 91.50538635253906, 93.76725006103516, 96.02910614013672, 98.29096221923828, 100.55282592773438, 102.81468200683594, 105.0765380859375, 107.33839416503906, 109.60025024414062, 111.86211395263672, 114.12397003173828, 116.38582611083984, 118.64768981933594, 120.9095458984375, 123.17140197753906, 125.43326568603516]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 13.0, 4.0, 8.0, 9.0, 11.0, 6.0, 21.0, 17.0, 14.0, 25.0, 29.0, 21.0, 32.0, 25.0, 27.0, 35.0, 38.0, 39.0, 37.0, 40.0, 40.0, 32.0, 41.0, 40.0, 34.0, 36.0, 39.0, 24.0, 47.0, 21.0, 22.0, 24.0, 27.0, 20.0, 17.0, 11.0, 15.0, 9.0, 7.0, 6.0, 9.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.581222534179688, -23.817628860473633, -23.054035186767578, -22.290441513061523, -21.52684783935547, -20.763256072998047, -19.999662399291992, -19.236068725585938, -18.472475051879883, -17.708881378173828, -16.945287704467773, -16.18169403076172, -15.41810131072998, -14.654507637023926, -13.890914916992188, -13.127321243286133, -12.363727569580078, -11.600133895874023, -10.836540222167969, -10.07294750213623, -9.309353828430176, -8.545760154724121, -7.782166957855225, -7.018573760986328, -6.254980087280273, -5.491386413574219, -4.727793216705322, -3.9641997814178467, -3.200606346130371, -2.4370129108428955, -1.67341947555542, -0.9098262786865234, -0.14623260498046875, 0.6173608303070068, 1.3809542655944824, 2.144547700881958, 2.9081411361694336, 3.671734571456909, 4.435328006744385, 5.198921203613281, 5.962514877319336, 6.726108551025391, 7.489701747894287, 8.253294944763184, 9.016888618469238, 9.780482292175293, 10.544075012207031, 11.307668685913086, 12.07126235961914, 12.834856033325195, 13.59844970703125, 14.362042427062988, 15.125636100769043, 15.889229774475098, 16.652822494506836, 17.41641616821289, 18.180009841918945, 18.943603515625, 19.707197189331055, 20.47079086303711, 21.23438262939453, 21.997976303100586, 22.76156997680664, 23.525163650512695, 24.28875732421875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 7.0, 12.0, 14.0, 8.0, 13.0, 11.0, 27.0, 33.0, 30.0, 33.0, 45.0, 36.0, 47.0, 51.0, 46.0, 44.0, 55.0, 45.0, 41.0, 43.0, 30.0, 37.0, 39.0, 28.0, 31.0, 29.0, 25.0, 19.0, 25.0, 13.0, 14.0, 12.0, 15.0, 7.0, 9.0, 2.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.76788330078125, -4.6021728515625, -4.43646240234375, -4.270751953125, -4.10504150390625, -3.9393310546875, -3.77362060546875, -3.60791015625, -3.44219970703125, -3.2764892578125, -3.11077880859375, -2.945068359375, -2.77935791015625, -2.6136474609375, -2.44793701171875, -2.2822265625, -2.11651611328125, -1.9508056640625, -1.78509521484375, -1.619384765625, -1.45367431640625, -1.2879638671875, -1.12225341796875, -0.95654296875, -0.79083251953125, -0.6251220703125, -0.45941162109375, -0.293701171875, -0.12799072265625, 0.0377197265625, 0.20343017578125, 0.369140625, 0.53485107421875, 0.7005615234375, 0.86627197265625, 1.031982421875, 1.19769287109375, 1.3634033203125, 1.52911376953125, 1.69482421875, 1.86053466796875, 2.0262451171875, 2.19195556640625, 2.357666015625, 2.52337646484375, 2.6890869140625, 2.85479736328125, 3.0205078125, 3.18621826171875, 3.3519287109375, 3.51763916015625, 3.683349609375, 3.84906005859375, 4.0147705078125, 4.18048095703125, 4.34619140625, 4.51190185546875, 4.6776123046875, 4.84332275390625, 5.009033203125, 5.17474365234375, 5.3404541015625, 5.50616455078125, 5.671875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 7.0, 10.0, 21.0, 26.0, 34.0, 45.0, 77.0, 95.0, 158.0, 199.0, 284.0, 428.0, 574.0, 862.0, 1136.0, 1690.0, 2361.0, 3445.0, 5007.0, 7273.0, 10819.0, 15982.0, 23783.0, 34650.0, 50966.0, 74511.0, 107442.0, 143696.0, 155304.0, 125652.0, 89036.0, 61879.0, 41860.0, 28563.0, 19081.0, 12978.0, 8877.0, 6146.0, 4136.0, 2853.0, 1957.0, 1337.0, 993.0, 710.0, 463.0, 337.0, 237.0, 187.0, 156.0, 59.0, 67.0, 47.0, 26.0, 18.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 4.0], "bins": [-0.337646484375, -0.3268394470214844, -0.31603240966796875, -0.3052253723144531, -0.2944183349609375, -0.2836112976074219, -0.27280426025390625, -0.2619972229003906, -0.251190185546875, -0.24038314819335938, -0.22957611083984375, -0.21876907348632812, -0.2079620361328125, -0.19715499877929688, -0.18634796142578125, -0.17554092407226562, -0.16473388671875, -0.15392684936523438, -0.14311981201171875, -0.13231277465820312, -0.1215057373046875, -0.11069869995117188, -0.09989166259765625, -0.08908462524414062, -0.078277587890625, -0.06747055053710938, -0.05666351318359375, -0.045856475830078125, -0.0350494384765625, -0.024242401123046875, -0.01343536376953125, -0.002628326416015625, 0.0081787109375, 0.018985748291015625, 0.02979278564453125, 0.040599822998046875, 0.0514068603515625, 0.062213897705078125, 0.07302093505859375, 0.08382797241210938, 0.094635009765625, 0.10544204711914062, 0.11624908447265625, 0.12705612182617188, 0.1378631591796875, 0.14867019653320312, 0.15947723388671875, 0.17028427124023438, 0.18109130859375, 0.19189834594726562, 0.20270538330078125, 0.21351242065429688, 0.2243194580078125, 0.23512649536132812, 0.24593353271484375, 0.2567405700683594, 0.267547607421875, 0.2783546447753906, 0.28916168212890625, 0.2999687194824219, 0.3107757568359375, 0.3215827941894531, 0.33238983154296875, 0.3431968688964844, 0.35400390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 10.0, 5.0, 8.0, 12.0, 10.0, 10.0, 16.0, 18.0, 21.0, 18.0, 20.0, 23.0, 36.0, 22.0, 25.0, 35.0, 50.0, 40.0, 39.0, 39.0, 1076.0, 41.0, 32.0, 34.0, 39.0, 42.0, 25.0, 34.0, 33.0, 39.0, 28.0, 19.0, 17.0, 15.0, 12.0, 20.0, 10.0, 11.0, 10.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.380859375, -3.285308837890625, -3.18975830078125, -3.094207763671875, -2.9986572265625, -2.903106689453125, -2.80755615234375, -2.712005615234375, -2.616455078125, -2.520904541015625, -2.42535400390625, -2.329803466796875, -2.2342529296875, -2.138702392578125, -2.04315185546875, -1.947601318359375, -1.85205078125, -1.756500244140625, -1.66094970703125, -1.565399169921875, -1.4698486328125, -1.374298095703125, -1.27874755859375, -1.183197021484375, -1.087646484375, -0.992095947265625, -0.89654541015625, -0.800994873046875, -0.7054443359375, -0.609893798828125, -0.51434326171875, -0.418792724609375, -0.3232421875, -0.227691650390625, -0.13214111328125, -0.036590576171875, 0.0589599609375, 0.154510498046875, 0.25006103515625, 0.345611572265625, 0.441162109375, 0.536712646484375, 0.63226318359375, 0.727813720703125, 0.8233642578125, 0.918914794921875, 1.01446533203125, 1.110015869140625, 1.20556640625, 1.301116943359375, 1.39666748046875, 1.492218017578125, 1.5877685546875, 1.683319091796875, 1.77886962890625, 1.874420166015625, 1.969970703125, 2.065521240234375, 2.16107177734375, 2.256622314453125, 2.3521728515625, 2.447723388671875, 2.54327392578125, 2.638824462890625, 2.734375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 7.0, 5.0, 8.0, 13.0, 21.0, 19.0, 42.0, 53.0, 90.0, 118.0, 167.0, 269.0, 404.0, 625.0, 852.0, 1274.0, 1901.0, 2875.0, 4167.0, 6156.0, 9181.0, 13829.0, 19996.0, 29396.0, 42261.0, 62362.0, 87626.0, 118922.0, 1155798.0, 174946.0, 109506.0, 79366.0, 55067.0, 38522.0, 26112.0, 18049.0, 12007.0, 8036.0, 5533.0, 3749.0, 2591.0, 1714.0, 1128.0, 762.0, 511.0, 374.0, 229.0, 170.0, 93.0, 76.0, 56.0, 28.0, 24.0, 18.0, 14.0, 9.0, 9.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.259033203125, -0.2509002685546875, -0.242767333984375, -0.2346343994140625, -0.22650146484375, -0.2183685302734375, -0.210235595703125, -0.2021026611328125, -0.1939697265625, -0.1858367919921875, -0.177703857421875, -0.1695709228515625, -0.16143798828125, -0.1533050537109375, -0.145172119140625, -0.1370391845703125, -0.12890625, -0.1207733154296875, -0.112640380859375, -0.1045074462890625, -0.09637451171875, -0.0882415771484375, -0.080108642578125, -0.0719757080078125, -0.0638427734375, -0.0557098388671875, -0.047576904296875, -0.0394439697265625, -0.03131103515625, -0.0231781005859375, -0.015045166015625, -0.0069122314453125, 0.001220703125, 0.0093536376953125, 0.017486572265625, 0.0256195068359375, 0.03375244140625, 0.0418853759765625, 0.050018310546875, 0.0581512451171875, 0.0662841796875, 0.0744171142578125, 0.082550048828125, 0.0906829833984375, 0.09881591796875, 0.1069488525390625, 0.115081787109375, 0.1232147216796875, 0.13134765625, 0.1394805908203125, 0.147613525390625, 0.1557464599609375, 0.16387939453125, 0.1720123291015625, 0.180145263671875, 0.1882781982421875, 0.1964111328125, 0.2045440673828125, 0.212677001953125, 0.2208099365234375, 0.22894287109375, 0.2370758056640625, 0.245208740234375, 0.2533416748046875, 0.261474609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 11.0, 6.0, 6.0, 8.0, 14.0, 13.0, 9.0, 29.0, 27.0, 39.0, 47.0, 56.0, 73.0, 86.0, 91.0, 99.0, 67.0, 55.0, 54.0, 36.0, 33.0, 22.0, 21.0, 17.0, 12.0, 13.0, 7.0, 9.0, 8.0, 3.0, 6.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005779266357421875, -0.005607903003692627, -0.005436539649963379, -0.005265176296234131, -0.005093812942504883, -0.004922449588775635, -0.004751086235046387, -0.004579722881317139, -0.004408359527587891, -0.004236996173858643, -0.0040656328201293945, -0.0038942694664001465, -0.0037229061126708984, -0.0035515427589416504, -0.0033801794052124023, -0.0032088160514831543, -0.0030374526977539062, -0.002866089344024658, -0.00269472599029541, -0.002523362636566162, -0.002351999282836914, -0.002180635929107666, -0.002009272575378418, -0.00183790922164917, -0.0016665458679199219, -0.0014951825141906738, -0.0013238191604614258, -0.0011524558067321777, -0.0009810924530029297, -0.0008097290992736816, -0.0006383657455444336, -0.00046700239181518555, -0.0002956390380859375, -0.00012427568435668945, 4.7087669372558594e-05, 0.00021845102310180664, 0.0003898143768310547, 0.0005611777305603027, 0.0007325410842895508, 0.0009039044380187988, 0.0010752677917480469, 0.001246631145477295, 0.001417994499206543, 0.001589357852935791, 0.001760721206665039, 0.0019320845603942871, 0.002103447914123535, 0.002274811267852783, 0.0024461746215820312, 0.0026175379753112793, 0.0027889013290405273, 0.0029602646827697754, 0.0031316280364990234, 0.0033029913902282715, 0.0034743547439575195, 0.0036457180976867676, 0.0038170814514160156, 0.003988444805145264, 0.004159808158874512, 0.00433117151260376, 0.004502534866333008, 0.004673898220062256, 0.004845261573791504, 0.005016624927520752, 0.00518798828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 6.0, 4.0, 12.0, 11.0, 15.0, 14.0, 30.0, 37.0, 47.0, 37.0, 80.0, 95.0, 159.0, 253.0, 504.0, 2448.0, 973615.0, 69232.0, 861.0, 365.0, 231.0, 128.0, 100.0, 57.0, 45.0, 25.0, 29.0, 29.0, 10.0, 8.0, 11.0, 14.0, 10.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.10546875, -0.10215091705322266, -0.09883308410644531, -0.09551525115966797, -0.09219741821289062, -0.08887958526611328, -0.08556175231933594, -0.0822439193725586, -0.07892608642578125, -0.0756082534790039, -0.07229042053222656, -0.06897258758544922, -0.06565475463867188, -0.06233692169189453, -0.05901908874511719, -0.055701255798339844, -0.0523834228515625, -0.049065589904785156, -0.04574775695800781, -0.04242992401123047, -0.039112091064453125, -0.03579425811767578, -0.03247642517089844, -0.029158592224121094, -0.02584075927734375, -0.022522926330566406, -0.019205093383789062, -0.01588726043701172, -0.012569427490234375, -0.009251594543457031, -0.0059337615966796875, -0.0026159286499023438, 0.000701904296875, 0.004019737243652344, 0.0073375701904296875, 0.010655403137207031, 0.013973236083984375, 0.01729106903076172, 0.020608901977539062, 0.023926734924316406, 0.02724456787109375, 0.030562400817871094, 0.03388023376464844, 0.03719806671142578, 0.040515899658203125, 0.04383373260498047, 0.04715156555175781, 0.050469398498535156, 0.0537872314453125, 0.057105064392089844, 0.06042289733886719, 0.06374073028564453, 0.06705856323242188, 0.07037639617919922, 0.07369422912597656, 0.0770120620727539, 0.08032989501953125, 0.0836477279663086, 0.08696556091308594, 0.09028339385986328, 0.09360122680664062, 0.09691905975341797, 0.10023689270019531, 0.10355472564697266, 0.10687255859375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 44.0, 631.0, 323.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003898837836459279, -0.0030843750573694706, -0.002269912511110306, -0.0014554497320204973, -0.0006409871857613325, 0.0001734753604978323, 0.0009879383724182844, 0.0018024009186774492, 0.002616863464936614, 0.0034313262440264225, 0.004245788790285587, 0.005060251802206039, 0.005874713882803917, 0.006689176894724369, 0.007503639906644821, 0.008318101987242699, 0.00913256499916315, 0.009947028011083603, 0.01076149009168148, 0.011575953103601933, 0.012390416115522385, 0.013204878196120262, 0.014019341208040714, 0.014833804219961166, 0.015648266300559044, 0.01646272838115692, 0.017277192324399948, 0.018091654404997826, 0.018906116485595703, 0.01972058042883873, 0.020535042509436607, 0.021349504590034485, 0.02216396853327751, 0.02297843061387539, 0.023792894557118416, 0.024607356637716293, 0.02542181871831417, 0.02623628079891205, 0.027050744742155075, 0.027865206822752953, 0.02867966890335083, 0.029494130983948708, 0.030308594927191734, 0.031123057007789612, 0.03193752095103264, 0.03275198116898537, 0.033566445112228394, 0.03438090905547142, 0.03519537299871445, 0.036009836941957474, 0.0368242971599102, 0.03763876110315323, 0.038453225046396255, 0.039267685264348984, 0.04008214920759201, 0.04089661315083504, 0.041711073368787766, 0.04252553731203079, 0.04333999752998352, 0.04415446147322655, 0.044968925416469574, 0.0457833856344223, 0.04659784957766533, 0.047412313520908356, 0.048226773738861084]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 10.0, 7.0, 17.0, 11.0, 11.0, 7.0, 12.0, 22.0, 32.0, 35.0, 34.0, 33.0, 44.0, 39.0, 44.0, 57.0, 43.0, 59.0, 46.0, 42.0, 47.0, 48.0, 28.0, 37.0, 47.0, 21.0, 26.0, 39.0, 21.0, 26.0, 13.0, 10.0, 7.0, 8.0, 9.0, 4.0, 2.0, 5.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003369152545928955, -0.0032685473561286926, -0.00316794216632843, -0.0030673369765281677, -0.0029667317867279053, -0.002866126596927643, -0.0027655214071273804, -0.002664916217327118, -0.0025643110275268555, -0.002463705837726593, -0.0023631006479263306, -0.002262495458126068, -0.0021618902683258057, -0.002061285078525543, -0.0019606798887252808, -0.0018600746989250183, -0.0017594695091247559, -0.0016588643193244934, -0.001558259129524231, -0.0014576539397239685, -0.001357048749923706, -0.0012564435601234436, -0.0011558383703231812, -0.0010552331805229187, -0.0009546279907226562, -0.0008540228009223938, -0.0007534176111221313, -0.0006528124213218689, -0.0005522072315216064, -0.000451602041721344, -0.00035099685192108154, -0.0002503916621208191, -0.00014978647232055664, -4.918128252029419e-05, 5.142390727996826e-05, 0.0001520290970802307, 0.00025263428688049316, 0.0003532394766807556, 0.00045384466648101807, 0.0005544498562812805, 0.000655055046081543, 0.0007556602358818054, 0.0008562654256820679, 0.0009568706154823303, 0.0010574758052825928, 0.0011580809950828552, 0.0012586861848831177, 0.0013592913746833801, 0.0014598965644836426, 0.001560501754283905, 0.0016611069440841675, 0.00176171213388443, 0.0018623173236846924, 0.001962922513484955, 0.0020635277032852173, 0.0021641328930854797, 0.002264738082885742, 0.0023653432726860046, 0.002465948462486267, 0.0025665536522865295, 0.002667158842086792, 0.0027677640318870544, 0.002868369221687317, 0.0029689744114875793, 0.003069579601287842]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 7.0, 12.0, 14.0, 8.0, 13.0, 11.0, 27.0, 33.0, 30.0, 33.0, 45.0, 36.0, 47.0, 51.0, 46.0, 44.0, 55.0, 45.0, 41.0, 43.0, 30.0, 37.0, 39.0, 28.0, 31.0, 29.0, 25.0, 19.0, 25.0, 13.0, 14.0, 12.0, 15.0, 7.0, 9.0, 2.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.76788330078125, -4.6021728515625, -4.43646240234375, -4.270751953125, -4.10504150390625, -3.9393310546875, -3.77362060546875, -3.60791015625, -3.44219970703125, -3.2764892578125, -3.11077880859375, -2.945068359375, -2.77935791015625, -2.6136474609375, -2.44793701171875, -2.2822265625, -2.11651611328125, -1.9508056640625, -1.78509521484375, -1.619384765625, -1.45367431640625, -1.2879638671875, -1.12225341796875, -0.95654296875, -0.79083251953125, -0.6251220703125, -0.45941162109375, -0.293701171875, -0.12799072265625, 0.0377197265625, 0.20343017578125, 0.369140625, 0.53485107421875, 0.7005615234375, 0.86627197265625, 1.031982421875, 1.19769287109375, 1.3634033203125, 1.52911376953125, 1.69482421875, 1.86053466796875, 2.0262451171875, 2.19195556640625, 2.357666015625, 2.52337646484375, 2.6890869140625, 2.85479736328125, 3.0205078125, 3.18621826171875, 3.3519287109375, 3.51763916015625, 3.683349609375, 3.84906005859375, 4.0147705078125, 4.18048095703125, 4.34619140625, 4.51190185546875, 4.6776123046875, 4.84332275390625, 5.009033203125, 5.17474365234375, 5.3404541015625, 5.50616455078125, 5.671875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 9.0, 8.0, 13.0, 19.0, 31.0, 26.0, 34.0, 43.0, 64.0, 102.0, 117.0, 189.0, 255.0, 347.0, 484.0, 795.0, 1871.0, 7124.0, 35964.0, 484276.0, 470093.0, 35321.0, 6949.0, 1908.0, 769.0, 456.0, 315.0, 250.0, 165.0, 119.0, 126.0, 78.0, 57.0, 44.0, 35.0, 35.0, 15.0, 15.0, 8.0, 4.0, 8.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2734375, -11.8642578125, -11.455078125, -11.0458984375, -10.63671875, -10.2275390625, -9.818359375, -9.4091796875, -9.0, -8.5908203125, -8.181640625, -7.7724609375, -7.36328125, -6.9541015625, -6.544921875, -6.1357421875, -5.7265625, -5.3173828125, -4.908203125, -4.4990234375, -4.08984375, -3.6806640625, -3.271484375, -2.8623046875, -2.453125, -2.0439453125, -1.634765625, -1.2255859375, -0.81640625, -0.4072265625, 0.001953125, 0.4111328125, 0.8203125, 1.2294921875, 1.638671875, 2.0478515625, 2.45703125, 2.8662109375, 3.275390625, 3.6845703125, 4.09375, 4.5029296875, 4.912109375, 5.3212890625, 5.73046875, 6.1396484375, 6.548828125, 6.9580078125, 7.3671875, 7.7763671875, 8.185546875, 8.5947265625, 9.00390625, 9.4130859375, 9.822265625, 10.2314453125, 10.640625, 11.0498046875, 11.458984375, 11.8681640625, 12.27734375, 12.6865234375, 13.095703125, 13.5048828125, 13.9140625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 14.0, 6.0, 8.0, 19.0, 20.0, 15.0, 20.0, 27.0, 26.0, 18.0, 33.0, 38.0, 47.0, 47.0, 58.0, 92.0, 232.0, 1599.0, 204.0, 78.0, 55.0, 51.0, 38.0, 36.0, 39.0, 37.0, 26.0, 29.0, 18.0, 12.0, 18.0, 11.0, 10.0, 9.0, 14.0, 6.0, 3.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.96875, -14.52099609375, -14.0732421875, -13.62548828125, -13.177734375, -12.72998046875, -12.2822265625, -11.83447265625, -11.38671875, -10.93896484375, -10.4912109375, -10.04345703125, -9.595703125, -9.14794921875, -8.7001953125, -8.25244140625, -7.8046875, -7.35693359375, -6.9091796875, -6.46142578125, -6.013671875, -5.56591796875, -5.1181640625, -4.67041015625, -4.22265625, -3.77490234375, -3.3271484375, -2.87939453125, -2.431640625, -1.98388671875, -1.5361328125, -1.08837890625, -0.640625, -0.19287109375, 0.2548828125, 0.70263671875, 1.150390625, 1.59814453125, 2.0458984375, 2.49365234375, 2.94140625, 3.38916015625, 3.8369140625, 4.28466796875, 4.732421875, 5.18017578125, 5.6279296875, 6.07568359375, 6.5234375, 6.97119140625, 7.4189453125, 7.86669921875, 8.314453125, 8.76220703125, 9.2099609375, 9.65771484375, 10.10546875, 10.55322265625, 11.0009765625, 11.44873046875, 11.896484375, 12.34423828125, 12.7919921875, 13.23974609375, 13.6875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 4.0, 6.0, 10.0, 13.0, 12.0, 13.0, 22.0, 26.0, 20.0, 37.0, 33.0, 55.0, 73.0, 73.0, 131.0, 230.0, 457.0, 1420.0, 16740.0, 3042421.0, 79649.0, 2696.0, 655.0, 290.0, 157.0, 101.0, 69.0, 44.0, 39.0, 38.0, 27.0, 22.0, 27.0, 15.0, 12.0, 14.0, 8.0, 7.0, 7.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-37.03125, -35.82421875, -34.6171875, -33.41015625, -32.203125, -30.99609375, -29.7890625, -28.58203125, -27.375, -26.16796875, -24.9609375, -23.75390625, -22.546875, -21.33984375, -20.1328125, -18.92578125, -17.71875, -16.51171875, -15.3046875, -14.09765625, -12.890625, -11.68359375, -10.4765625, -9.26953125, -8.0625, -6.85546875, -5.6484375, -4.44140625, -3.234375, -2.02734375, -0.8203125, 0.38671875, 1.59375, 2.80078125, 4.0078125, 5.21484375, 6.421875, 7.62890625, 8.8359375, 10.04296875, 11.25, 12.45703125, 13.6640625, 14.87109375, 16.078125, 17.28515625, 18.4921875, 19.69921875, 20.90625, 22.11328125, 23.3203125, 24.52734375, 25.734375, 26.94140625, 28.1484375, 29.35546875, 30.5625, 31.76953125, 32.9765625, 34.18359375, 35.390625, 36.59765625, 37.8046875, 39.01171875, 40.21875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 77.0, 476.0, 413.0, 45.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.42146301269531, -118.77576446533203, -116.13006591796875, -113.48436737060547, -110.83866882324219, -108.1929702758789, -105.54727172851562, -102.90157318115234, -100.25587463378906, -97.61017608642578, -94.9644775390625, -92.31877899169922, -89.67308044433594, -87.02738189697266, -84.38168334960938, -81.7359848022461, -79.09028625488281, -76.44458770751953, -73.79888916015625, -71.15319061279297, -68.50749206542969, -65.8617935180664, -63.216094970703125, -60.570396423339844, -57.92469787597656, -55.27899932861328, -52.63330078125, -49.98760223388672, -47.34190368652344, -44.696205139160156, -42.050506591796875, -39.404808044433594, -36.759117126464844, -34.11341857910156, -31.46772003173828, -28.822021484375, -26.17632293701172, -23.530624389648438, -20.884925842285156, -18.239227294921875, -15.593528747558594, -12.947830200195312, -10.302131652832031, -7.65643310546875, -5.010734558105469, -2.3650360107421875, 0.28066253662109375, 2.926361083984375, 5.572059631347656, 8.217758178710938, 10.863456726074219, 13.5091552734375, 16.15485382080078, 18.800552368164062, 21.446250915527344, 24.091949462890625, 26.737648010253906, 29.383346557617188, 32.02904510498047, 34.67474365234375, 37.32044219970703, 39.96614074707031, 42.611839294433594, 45.257537841796875, 47.903236389160156]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 7.0, 5.0, 10.0, 14.0, 21.0, 21.0, 21.0, 20.0, 31.0, 26.0, 24.0, 37.0, 21.0, 22.0, 37.0, 34.0, 38.0, 46.0, 38.0, 41.0, 36.0, 43.0, 37.0, 33.0, 38.0, 35.0, 33.0, 29.0, 29.0, 19.0, 17.0, 16.0, 12.0, 14.0, 17.0, 16.0, 11.0, 10.0, 9.0, 9.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-38.20920944213867, -37.112247467041016, -36.015281677246094, -34.91831970214844, -33.82135772705078, -32.724395751953125, -31.627431869506836, -30.530467987060547, -29.43350601196289, -28.336544036865234, -27.239580154418945, -26.142616271972656, -25.045654296875, -23.948692321777344, -22.851728439331055, -21.754764556884766, -20.65780258178711, -19.560840606689453, -18.463876724243164, -17.366912841796875, -16.26995086669922, -15.172987937927246, -14.076025009155273, -12.9790620803833, -11.882099151611328, -10.785136222839355, -9.688173294067383, -8.59121036529541, -7.4942474365234375, -6.397284507751465, -5.300321578979492, -4.2033586502075195, -3.1063919067382812, -2.0094289779663086, -0.9124660491943359, 0.18449687957763672, 1.2814598083496094, 2.378422737121582, 3.4753856658935547, 4.572348594665527, 5.6693115234375, 6.766274452209473, 7.863237380981445, 8.960200309753418, 10.05716323852539, 11.154126167297363, 12.251089096069336, 13.348052024841309, 14.445014953613281, 15.541977882385254, 16.638940811157227, 17.735904693603516, 18.832866668701172, 19.929828643798828, 21.026792526245117, 22.123756408691406, 23.220718383789062, 24.31768035888672, 25.414644241333008, 26.511608123779297, 27.608570098876953, 28.70553207397461, 29.8024959564209, 30.899459838867188, 31.996421813964844]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 6.0, 8.0, 7.0, 8.0, 8.0, 14.0, 11.0, 20.0, 18.0, 14.0, 20.0, 34.0, 28.0, 35.0, 35.0, 42.0, 36.0, 46.0, 44.0, 45.0, 47.0, 39.0, 43.0, 33.0, 34.0, 34.0, 29.0, 29.0, 22.0, 22.0, 16.0, 31.0, 27.0, 17.0, 9.0, 22.0, 11.0, 13.0, 8.0, 4.0, 8.0, 8.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-4.95703125, -4.80584716796875, -4.6546630859375, -4.50347900390625, -4.352294921875, -4.20111083984375, -4.0499267578125, -3.89874267578125, -3.74755859375, -3.59637451171875, -3.4451904296875, -3.29400634765625, -3.142822265625, -2.99163818359375, -2.8404541015625, -2.68927001953125, -2.5380859375, -2.38690185546875, -2.2357177734375, -2.08453369140625, -1.933349609375, -1.78216552734375, -1.6309814453125, -1.47979736328125, -1.32861328125, -1.17742919921875, -1.0262451171875, -0.87506103515625, -0.723876953125, -0.57269287109375, -0.4215087890625, -0.27032470703125, -0.119140625, 0.03204345703125, 0.1832275390625, 0.33441162109375, 0.485595703125, 0.63677978515625, 0.7879638671875, 0.93914794921875, 1.09033203125, 1.24151611328125, 1.3927001953125, 1.54388427734375, 1.695068359375, 1.84625244140625, 1.9974365234375, 2.14862060546875, 2.2998046875, 2.45098876953125, 2.6021728515625, 2.75335693359375, 2.904541015625, 3.05572509765625, 3.2069091796875, 3.35809326171875, 3.50927734375, 3.66046142578125, 3.8116455078125, 3.96282958984375, 4.114013671875, 4.26519775390625, 4.4163818359375, 4.56756591796875, 4.71875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 7.0, 7.0, 10.0, 16.0, 14.0, 19.0, 19.0, 47.0, 59.0, 71.0, 72.0, 120.0, 153.0, 267.0, 323.0, 651.0, 1276.0, 2917.0, 7931.0, 27520.0, 124043.0, 567005.0, 1645661.0, 1339602.0, 368409.0, 78861.0, 18635.0, 5781.0, 2141.0, 1012.0, 519.0, 326.0, 204.0, 159.0, 100.0, 73.0, 49.0, 56.0, 30.0, 25.0, 18.0, 16.0, 12.0, 15.0, 6.0, 9.0, 6.0, 9.0, 2.0, 3.0, 0.0, 2.0], "bins": [-6.890625, -6.69293212890625, -6.4952392578125, -6.29754638671875, -6.099853515625, -5.90216064453125, -5.7044677734375, -5.50677490234375, -5.30908203125, -5.11138916015625, -4.9136962890625, -4.71600341796875, -4.518310546875, -4.32061767578125, -4.1229248046875, -3.92523193359375, -3.7275390625, -3.52984619140625, -3.3321533203125, -3.13446044921875, -2.936767578125, -2.73907470703125, -2.5413818359375, -2.34368896484375, -2.14599609375, -1.94830322265625, -1.7506103515625, -1.55291748046875, -1.355224609375, -1.15753173828125, -0.9598388671875, -0.76214599609375, -0.564453125, -0.36676025390625, -0.1690673828125, 0.02862548828125, 0.226318359375, 0.42401123046875, 0.6217041015625, 0.81939697265625, 1.01708984375, 1.21478271484375, 1.4124755859375, 1.61016845703125, 1.807861328125, 2.00555419921875, 2.2032470703125, 2.40093994140625, 2.5986328125, 2.79632568359375, 2.9940185546875, 3.19171142578125, 3.389404296875, 3.58709716796875, 3.7847900390625, 3.98248291015625, 4.18017578125, 4.37786865234375, 4.5755615234375, 4.77325439453125, 4.970947265625, 5.16864013671875, 5.3663330078125, 5.56402587890625, 5.76171875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 9.0, 4.0, 16.0, 13.0, 20.0, 25.0, 29.0, 35.0, 79.0, 77.0, 112.0, 177.0, 183.0, 292.0, 371.0, 437.0, 439.0, 403.0, 344.0, 276.0, 200.0, 124.0, 108.0, 64.0, 40.0, 52.0, 26.0, 30.0, 22.0, 19.0, 10.0, 9.0, 6.0, 2.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.88671875, -6.6602783203125, -6.433837890625, -6.2073974609375, -5.98095703125, -5.7545166015625, -5.528076171875, -5.3016357421875, -5.0751953125, -4.8487548828125, -4.622314453125, -4.3958740234375, -4.16943359375, -3.9429931640625, -3.716552734375, -3.4901123046875, -3.263671875, -3.0372314453125, -2.810791015625, -2.5843505859375, -2.35791015625, -2.1314697265625, -1.905029296875, -1.6785888671875, -1.4521484375, -1.2257080078125, -0.999267578125, -0.7728271484375, -0.54638671875, -0.3199462890625, -0.093505859375, 0.1329345703125, 0.359375, 0.5858154296875, 0.812255859375, 1.0386962890625, 1.26513671875, 1.4915771484375, 1.718017578125, 1.9444580078125, 2.1708984375, 2.3973388671875, 2.623779296875, 2.8502197265625, 3.07666015625, 3.3031005859375, 3.529541015625, 3.7559814453125, 3.982421875, 4.2088623046875, 4.435302734375, 4.6617431640625, 4.88818359375, 5.1146240234375, 5.341064453125, 5.5675048828125, 5.7939453125, 6.0203857421875, 6.246826171875, 6.4732666015625, 6.69970703125, 6.9261474609375, 7.152587890625, 7.3790283203125, 7.60546875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 2.0, 10.0, 14.0, 16.0, 18.0, 29.0, 42.0, 53.0, 86.0, 118.0, 140.0, 218.0, 405.0, 759.0, 1752.0, 9246.0, 125609.0, 2947060.0, 1056855.0, 44349.0, 4732.0, 1185.0, 582.0, 316.0, 217.0, 133.0, 94.0, 66.0, 38.0, 32.0, 24.0, 22.0, 13.0, 15.0, 3.0, 4.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-19.5, -18.92333984375, -18.3466796875, -17.77001953125, -17.193359375, -16.61669921875, -16.0400390625, -15.46337890625, -14.88671875, -14.31005859375, -13.7333984375, -13.15673828125, -12.580078125, -12.00341796875, -11.4267578125, -10.85009765625, -10.2734375, -9.69677734375, -9.1201171875, -8.54345703125, -7.966796875, -7.39013671875, -6.8134765625, -6.23681640625, -5.66015625, -5.08349609375, -4.5068359375, -3.93017578125, -3.353515625, -2.77685546875, -2.2001953125, -1.62353515625, -1.046875, -0.47021484375, 0.1064453125, 0.68310546875, 1.259765625, 1.83642578125, 2.4130859375, 2.98974609375, 3.56640625, 4.14306640625, 4.7197265625, 5.29638671875, 5.873046875, 6.44970703125, 7.0263671875, 7.60302734375, 8.1796875, 8.75634765625, 9.3330078125, 9.90966796875, 10.486328125, 11.06298828125, 11.6396484375, 12.21630859375, 12.79296875, 13.36962890625, 13.9462890625, 14.52294921875, 15.099609375, 15.67626953125, 16.2529296875, 16.82958984375, 17.40625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 18.0, 72.0, 151.0, 221.0, 228.0, 164.0, 104.0, 38.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.307598114013672, -16.325965881347656, -14.344331741333008, -12.362698554992676, -10.381065368652344, -8.399432182312012, -6.41779899597168, -4.436165809631348, -2.4545326232910156, -0.4728994369506836, 1.5087337493896484, 3.4903669357299805, 5.4720001220703125, 7.4536333084106445, 9.435266494750977, 11.416899681091309, 13.39853286743164, 15.380166053771973, 17.361799240112305, 19.343433380126953, 21.32506561279297, 23.306697845458984, 25.288331985473633, 27.26996612548828, 29.251598358154297, 31.233230590820312, 33.214866638183594, 35.19649887084961, 37.178131103515625, 39.15976333618164, 41.141395568847656, 43.12303161621094, 45.10466003417969, 47.0862922668457, 49.06792449951172, 51.049560546875, 53.031192779541016, 55.01282501220703, 56.99446105957031, 58.97609329223633, 60.957725524902344, 62.93935775756836, 64.92098999023438, 66.90262603759766, 68.88426208496094, 70.86589050292969, 72.84752655029297, 74.82915496826172, 76.810791015625, 78.79242706298828, 80.77405548095703, 82.75569152832031, 84.73731994628906, 86.71895599365234, 88.70059204101562, 90.68222045898438, 92.66385650634766, 94.64549255371094, 96.62712097167969, 98.60875701904297, 100.59039306640625, 102.572021484375, 104.55365753173828, 106.53528594970703, 108.51692199707031]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 4.0, 7.0, 10.0, 12.0, 23.0, 14.0, 14.0, 19.0, 16.0, 32.0, 28.0, 36.0, 36.0, 27.0, 42.0, 38.0, 31.0, 37.0, 37.0, 47.0, 46.0, 36.0, 39.0, 24.0, 38.0, 41.0, 27.0, 26.0, 28.0, 17.0, 23.0, 21.0, 17.0, 12.0, 15.0, 12.0, 8.0, 7.0, 8.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-24.549427032470703, -23.84429168701172, -23.139156341552734, -22.434022903442383, -21.7288875579834, -21.023752212524414, -20.318618774414062, -19.613483428955078, -18.908348083496094, -18.20321273803711, -17.498077392578125, -16.792943954467773, -16.08780860900879, -15.382673263549805, -14.677538871765137, -13.972404479980469, -13.267269134521484, -12.5621337890625, -11.856999397277832, -11.151865005493164, -10.44672966003418, -9.741594314575195, -9.036459922790527, -8.33132553100586, -7.626190185546875, -6.921055316925049, -6.215920448303223, -5.5107855796813965, -4.80565071105957, -4.100515842437744, -3.395380973815918, -2.690246105194092, -1.9851112365722656, -1.2799763679504395, -0.5748414993286133, 0.1302933692932129, 0.8354282379150391, 1.5405631065368652, 2.2456979751586914, 2.9508328437805176, 3.6559677124023438, 4.36110258102417, 5.066237449645996, 5.771372318267822, 6.476507186889648, 7.181642055511475, 7.886776924133301, 8.591911315917969, 9.297046661376953, 10.002182006835938, 10.707316398620605, 11.412450790405273, 12.117586135864258, 12.822721481323242, 13.52785587310791, 14.232990264892578, 14.938125610351562, 15.643260955810547, 16.34839630126953, 17.053529739379883, 17.758665084838867, 18.46380043029785, 19.168933868408203, 19.874069213867188, 20.579204559326172]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 6.0, 6.0, 5.0, 12.0, 7.0, 7.0, 14.0, 13.0, 23.0, 20.0, 14.0, 24.0, 36.0, 27.0, 34.0, 31.0, 36.0, 40.0, 48.0, 42.0, 34.0, 47.0, 39.0, 41.0, 45.0, 36.0, 30.0, 33.0, 27.0, 17.0, 26.0, 25.0, 22.0, 20.0, 19.0, 10.0, 17.0, 11.0, 8.0, 11.0, 8.0, 6.0, 6.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.8828125, -4.73370361328125, -4.5845947265625, -4.43548583984375, -4.286376953125, -4.13726806640625, -3.9881591796875, -3.83905029296875, -3.68994140625, -3.54083251953125, -3.3917236328125, -3.24261474609375, -3.093505859375, -2.94439697265625, -2.7952880859375, -2.64617919921875, -2.4970703125, -2.34796142578125, -2.1988525390625, -2.04974365234375, -1.900634765625, -1.75152587890625, -1.6024169921875, -1.45330810546875, -1.30419921875, -1.15509033203125, -1.0059814453125, -0.85687255859375, -0.707763671875, -0.55865478515625, -0.4095458984375, -0.26043701171875, -0.111328125, 0.03778076171875, 0.1868896484375, 0.33599853515625, 0.485107421875, 0.63421630859375, 0.7833251953125, 0.93243408203125, 1.08154296875, 1.23065185546875, 1.3797607421875, 1.52886962890625, 1.677978515625, 1.82708740234375, 1.9761962890625, 2.12530517578125, 2.2744140625, 2.42352294921875, 2.5726318359375, 2.72174072265625, 2.870849609375, 3.01995849609375, 3.1690673828125, 3.31817626953125, 3.46728515625, 3.61639404296875, 3.7655029296875, 3.91461181640625, 4.063720703125, 4.21282958984375, 4.3619384765625, 4.51104736328125, 4.66015625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 10.0, 4.0, 6.0, 26.0, 30.0, 31.0, 44.0, 89.0, 132.0, 191.0, 252.0, 329.0, 463.0, 681.0, 979.0, 1388.0, 1851.0, 2574.0, 3680.0, 5325.0, 7632.0, 11141.0, 16341.0, 24308.0, 36237.0, 54169.0, 81056.0, 114873.0, 150665.0, 152998.0, 120019.0, 84430.0, 56905.0, 38133.0, 25372.0, 17324.0, 11907.0, 7999.0, 5529.0, 3963.0, 2723.0, 1972.0, 1333.0, 1020.0, 680.0, 548.0, 359.0, 254.0, 194.0, 138.0, 65.0, 60.0, 40.0, 45.0, 19.0, 12.0, 10.0, 8.0, 1.0, 1.0, 2.0], "bins": [-0.36865234375, -0.35715484619140625, -0.3456573486328125, -0.33415985107421875, -0.322662353515625, -0.31116485595703125, -0.2996673583984375, -0.28816986083984375, -0.27667236328125, -0.26517486572265625, -0.2536773681640625, -0.24217987060546875, -0.230682373046875, -0.21918487548828125, -0.2076873779296875, -0.19618988037109375, -0.1846923828125, -0.17319488525390625, -0.1616973876953125, -0.15019989013671875, -0.138702392578125, -0.12720489501953125, -0.1157073974609375, -0.10420989990234375, -0.09271240234375, -0.08121490478515625, -0.0697174072265625, -0.05821990966796875, -0.046722412109375, -0.03522491455078125, -0.0237274169921875, -0.01222991943359375, -0.000732421875, 0.01076507568359375, 0.0222625732421875, 0.03376007080078125, 0.045257568359375, 0.05675506591796875, 0.0682525634765625, 0.07975006103515625, 0.09124755859375, 0.10274505615234375, 0.1142425537109375, 0.12574005126953125, 0.137237548828125, 0.14873504638671875, 0.1602325439453125, 0.17173004150390625, 0.1832275390625, 0.19472503662109375, 0.2062225341796875, 0.21772003173828125, 0.229217529296875, 0.24071502685546875, 0.2522125244140625, 0.26371002197265625, 0.27520751953125, 0.28670501708984375, 0.2982025146484375, 0.30970001220703125, 0.321197509765625, 0.33269500732421875, 0.3441925048828125, 0.35569000244140625, 0.3671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 10.0, 4.0, 4.0, 9.0, 10.0, 14.0, 11.0, 19.0, 20.0, 26.0, 26.0, 27.0, 31.0, 37.0, 35.0, 32.0, 39.0, 34.0, 43.0, 43.0, 1059.0, 41.0, 40.0, 43.0, 29.0, 39.0, 35.0, 34.0, 34.0, 32.0, 32.0, 17.0, 20.0, 22.0, 19.0, 17.0, 6.0, 10.0, 3.0, 4.0, 4.0, 0.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-3.716796875, -3.612701416015625, -3.50860595703125, -3.404510498046875, -3.3004150390625, -3.196319580078125, -3.09222412109375, -2.988128662109375, -2.884033203125, -2.779937744140625, -2.67584228515625, -2.571746826171875, -2.4676513671875, -2.363555908203125, -2.25946044921875, -2.155364990234375, -2.05126953125, -1.947174072265625, -1.84307861328125, -1.738983154296875, -1.6348876953125, -1.530792236328125, -1.42669677734375, -1.322601318359375, -1.218505859375, -1.114410400390625, -1.01031494140625, -0.906219482421875, -0.8021240234375, -0.698028564453125, -0.59393310546875, -0.489837646484375, -0.3857421875, -0.281646728515625, -0.17755126953125, -0.073455810546875, 0.0306396484375, 0.134735107421875, 0.23883056640625, 0.342926025390625, 0.447021484375, 0.551116943359375, 0.65521240234375, 0.759307861328125, 0.8634033203125, 0.967498779296875, 1.07159423828125, 1.175689697265625, 1.27978515625, 1.383880615234375, 1.48797607421875, 1.592071533203125, 1.6961669921875, 1.800262451171875, 1.90435791015625, 2.008453369140625, 2.112548828125, 2.216644287109375, 2.32073974609375, 2.424835205078125, 2.5289306640625, 2.633026123046875, 2.73712158203125, 2.841217041015625, 2.9453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [9.0, 6.0, 11.0, 9.0, 22.0, 26.0, 33.0, 64.0, 82.0, 105.0, 166.0, 223.0, 278.0, 426.0, 608.0, 846.0, 1240.0, 1760.0, 2450.0, 3505.0, 5014.0, 7160.0, 10291.0, 14800.0, 21037.0, 30519.0, 42952.0, 61039.0, 83883.0, 110043.0, 986149.0, 323818.0, 107969.0, 81826.0, 59042.0, 42012.0, 29272.0, 20766.0, 14273.0, 10083.0, 6788.0, 4865.0, 3354.0, 2452.0, 1738.0, 1208.0, 857.0, 596.0, 406.0, 338.0, 221.0, 145.0, 113.0, 88.0, 55.0, 50.0, 20.0, 13.0, 12.0, 6.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.2479248046875, -0.2399158477783203, -0.23190689086914062, -0.22389793395996094, -0.21588897705078125, -0.20788002014160156, -0.19987106323242188, -0.1918621063232422, -0.1838531494140625, -0.1758441925048828, -0.16783523559570312, -0.15982627868652344, -0.15181732177734375, -0.14380836486816406, -0.13579940795898438, -0.1277904510498047, -0.119781494140625, -0.11177253723144531, -0.10376358032226562, -0.09575462341308594, -0.08774566650390625, -0.07973670959472656, -0.07172775268554688, -0.06371879577636719, -0.0557098388671875, -0.04770088195800781, -0.039691925048828125, -0.03168296813964844, -0.02367401123046875, -0.015665054321289062, -0.007656097412109375, 0.0003528594970703125, 0.00836181640625, 0.016370773315429688, 0.024379730224609375, 0.03238868713378906, 0.04039764404296875, 0.04840660095214844, 0.056415557861328125, 0.06442451477050781, 0.0724334716796875, 0.08044242858886719, 0.08845138549804688, 0.09646034240722656, 0.10446929931640625, 0.11247825622558594, 0.12048721313476562, 0.1284961700439453, 0.136505126953125, 0.1445140838623047, 0.15252304077148438, 0.16053199768066406, 0.16854095458984375, 0.17654991149902344, 0.18455886840820312, 0.1925678253173828, 0.2005767822265625, 0.2085857391357422, 0.21659469604492188, 0.22460365295410156, 0.23261260986328125, 0.24062156677246094, 0.24863052368164062, 0.2566394805908203, 0.2646484375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 3.0, 2.0, 11.0, 13.0, 9.0, 11.0, 17.0, 16.0, 20.0, 23.0, 20.0, 28.0, 38.0, 58.0, 58.0, 88.0, 85.0, 86.0, 69.0, 60.0, 60.0, 38.0, 37.0, 28.0, 22.0, 22.0, 11.0, 11.0, 7.0, 10.0, 8.0, 4.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.00467681884765625, -0.004553020000457764, -0.004429221153259277, -0.004305422306060791, -0.004181623458862305, -0.004057824611663818, -0.003934025764465332, -0.0038102269172668457, -0.0036864280700683594, -0.003562629222869873, -0.0034388303756713867, -0.0033150315284729004, -0.003191232681274414, -0.0030674338340759277, -0.0029436349868774414, -0.002819836139678955, -0.0026960372924804688, -0.0025722384452819824, -0.002448439598083496, -0.0023246407508850098, -0.0022008419036865234, -0.002077043056488037, -0.0019532442092895508, -0.0018294453620910645, -0.0017056465148925781, -0.0015818476676940918, -0.0014580488204956055, -0.0013342499732971191, -0.0012104511260986328, -0.0010866522789001465, -0.0009628534317016602, -0.0008390545845031738, -0.0007152557373046875, -0.0005914568901062012, -0.00046765804290771484, -0.0003438591957092285, -0.0002200603485107422, -9.626150131225586e-05, 2.753734588623047e-05, 0.0001513361930847168, 0.0002751350402832031, 0.00039893388748168945, 0.0005227327346801758, 0.0006465315818786621, 0.0007703304290771484, 0.0008941292762756348, 0.001017928123474121, 0.0011417269706726074, 0.0012655258178710938, 0.00138932466506958, 0.0015131235122680664, 0.0016369223594665527, 0.001760721206665039, 0.0018845200538635254, 0.0020083189010620117, 0.002132117748260498, 0.0022559165954589844, 0.0023797154426574707, 0.002503514289855957, 0.0026273131370544434, 0.0027511119842529297, 0.002874910831451416, 0.0029987096786499023, 0.0031225085258483887, 0.003246307373046875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 13.0, 8.0, 9.0, 14.0, 14.0, 23.0, 40.0, 28.0, 69.0, 78.0, 126.0, 201.0, 320.0, 665.0, 11600.0, 998411.0, 34953.0, 939.0, 356.0, 203.0, 127.0, 65.0, 60.0, 39.0, 51.0, 23.0, 27.0, 20.0, 16.0, 7.0, 8.0, 8.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06787109375, -0.06541252136230469, -0.06295394897460938, -0.06049537658691406, -0.05803680419921875, -0.05557823181152344, -0.053119659423828125, -0.05066108703613281, -0.0482025146484375, -0.04574394226074219, -0.043285369873046875, -0.04082679748535156, -0.03836822509765625, -0.03590965270996094, -0.033451080322265625, -0.030992507934570312, -0.028533935546875, -0.026075363159179688, -0.023616790771484375, -0.021158218383789062, -0.01869964599609375, -0.016241073608398438, -0.013782501220703125, -0.011323928833007812, -0.0088653564453125, -0.0064067840576171875, -0.003948211669921875, -0.0014896392822265625, 0.00096893310546875, 0.0034275054931640625, 0.005886077880859375, 0.008344650268554688, 0.01080322265625, 0.013261795043945312, 0.015720367431640625, 0.018178939819335938, 0.02063751220703125, 0.023096084594726562, 0.025554656982421875, 0.028013229370117188, 0.0304718017578125, 0.03293037414550781, 0.035388946533203125, 0.03784751892089844, 0.04030609130859375, 0.04276466369628906, 0.045223236083984375, 0.04768180847167969, 0.050140380859375, 0.05259895324707031, 0.055057525634765625, 0.05751609802246094, 0.05997467041015625, 0.06243324279785156, 0.06489181518554688, 0.06735038757324219, 0.0698089599609375, 0.07226753234863281, 0.07472610473632812, 0.07718467712402344, 0.07964324951171875, 0.08210182189941406, 0.08456039428710938, 0.08701896667480469, 0.0894775390625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 153.0, 796.0, 57.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01752881519496441, -0.0166240893304348, -0.01571936532855034, -0.014814639464020729, -0.01390991359949112, -0.013005188666284084, -0.01210046373307705, -0.01119573786854744, -0.010291012935340405, -0.00938628800213337, -0.00848156213760376, -0.007576837204396725, -0.006672111805528402, -0.00576738640666008, -0.004862661473453045, -0.0039579360745847225, -0.0030532106757164, -0.0021484852768480778, -0.001243760110810399, -0.00033903494477272034, 0.000565690454095602, 0.0014704158529639244, 0.0023751407861709595, 0.003279866185039282, 0.004184591583907604, 0.005089316982775927, 0.005994042381644249, 0.006898767314851284, 0.007803492713719606, 0.008708218112587929, 0.009612943045794964, 0.010517667979001999, 0.011422395706176758, 0.012327120639383793, 0.013231846503913403, 0.014136571437120438, 0.015041297301650047, 0.015946023166179657, 0.016850747168064117, 0.017755473032593727, 0.018660198897123337, 0.019564924761652946, 0.020469648763537407, 0.021374374628067017, 0.022279100492596626, 0.023183826357126236, 0.024088550359010696, 0.024993276223540306, 0.025898000225424767, 0.026802726089954376, 0.027707450091838837, 0.028612175956368446, 0.029516901820898056, 0.030421625822782516, 0.031326353549957275, 0.032231077551841736, 0.033135801553726196, 0.03404052555561066, 0.034945253282785416, 0.035849977284669876, 0.03675470128655434, 0.037659429013729095, 0.038564153015613556, 0.039468877017498016, 0.040373604744672775]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 11.0, 7.0, 12.0, 8.0, 14.0, 23.0, 25.0, 36.0, 28.0, 43.0, 42.0, 37.0, 32.0, 46.0, 35.0, 44.0, 45.0, 56.0, 53.0, 45.0, 37.0, 37.0, 40.0, 41.0, 29.0, 26.0, 21.0, 13.0, 14.0, 13.0, 16.0, 10.0, 9.0, 15.0, 7.0, 5.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002440512180328369, -0.0023599201813340187, -0.0022793281823396683, -0.002198736183345318, -0.0021181441843509674, -0.002037552185356617, -0.0019569601863622665, -0.001876368187367916, -0.0017957761883735657, -0.0017151841893792152, -0.0016345921903848648, -0.0015540001913905144, -0.001473408192396164, -0.0013928161934018135, -0.001312224194407463, -0.0012316321954131126, -0.0011510401964187622, -0.0010704481974244118, -0.0009898561984300613, -0.0009092641994357109, -0.0008286722004413605, -0.00074808020144701, -0.0006674882024526596, -0.0005868962034583092, -0.0005063042044639587, -0.0004257122054696083, -0.0003451202064752579, -0.00026452820748090744, -0.000183936208486557, -0.00010334420949220657, -2.275221049785614e-05, 5.783978849649429e-05, 0.00013843178749084473, 0.00021902378648519516, 0.0002996157854795456, 0.000380207784473896, 0.00046079978346824646, 0.0005413917824625969, 0.0006219837814569473, 0.0007025757804512978, 0.0007831677794456482, 0.0008637597784399986, 0.0009443517774343491, 0.0010249437764286995, 0.00110553577542305, 0.0011861277744174004, 0.0012667197734117508, 0.0013473117724061012, 0.0014279037714004517, 0.001508495770394802, 0.0015890877693891525, 0.001669679768383503, 0.0017502717673778534, 0.0018308637663722038, 0.0019114557653665543, 0.0019920477643609047, 0.002072639763355255, 0.0021532317623496056, 0.002233823761343956, 0.0023144157603383064, 0.002395007759332657, 0.0024755997583270073, 0.0025561917573213577, 0.002636783756315708, 0.0027173757553100586]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 6.0, 6.0, 5.0, 12.0, 7.0, 7.0, 14.0, 13.0, 23.0, 20.0, 14.0, 24.0, 36.0, 28.0, 34.0, 30.0, 36.0, 40.0, 48.0, 42.0, 34.0, 47.0, 39.0, 41.0, 45.0, 36.0, 31.0, 32.0, 27.0, 17.0, 26.0, 25.0, 22.0, 20.0, 19.0, 10.0, 17.0, 11.0, 8.0, 11.0, 8.0, 5.0, 7.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.8828125, -4.73370361328125, -4.5845947265625, -4.43548583984375, -4.286376953125, -4.13726806640625, -3.9881591796875, -3.83905029296875, -3.68994140625, -3.54083251953125, -3.3917236328125, -3.24261474609375, -3.093505859375, -2.94439697265625, -2.7952880859375, -2.64617919921875, -2.4970703125, -2.34796142578125, -2.1988525390625, -2.04974365234375, -1.900634765625, -1.75152587890625, -1.6024169921875, -1.45330810546875, -1.30419921875, -1.15509033203125, -1.0059814453125, -0.85687255859375, -0.707763671875, -0.55865478515625, -0.4095458984375, -0.26043701171875, -0.111328125, 0.03778076171875, 0.1868896484375, 0.33599853515625, 0.485107421875, 0.63421630859375, 0.7833251953125, 0.93243408203125, 1.08154296875, 1.23065185546875, 1.3797607421875, 1.52886962890625, 1.677978515625, 1.82708740234375, 1.9761962890625, 2.12530517578125, 2.2744140625, 2.42352294921875, 2.5726318359375, 2.72174072265625, 2.870849609375, 3.01995849609375, 3.1690673828125, 3.31817626953125, 3.46728515625, 3.61639404296875, 3.7655029296875, 3.91461181640625, 4.063720703125, 4.21282958984375, 4.3619384765625, 4.51104736328125, 4.66015625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 9.0, 17.0, 8.0, 21.0, 22.0, 39.0, 52.0, 55.0, 93.0, 104.0, 150.0, 252.0, 370.0, 633.0, 1114.0, 2025.0, 4450.0, 10601.0, 26732.0, 69419.0, 185369.0, 401048.0, 213954.0, 79116.0, 30504.0, 11967.0, 4980.0, 2292.0, 1172.0, 695.0, 400.0, 234.0, 165.0, 99.0, 93.0, 55.0, 56.0, 38.0, 38.0, 30.0, 15.0, 22.0, 12.0, 12.0, 6.0, 3.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.1484375, -5.95965576171875, -5.7708740234375, -5.58209228515625, -5.393310546875, -5.20452880859375, -5.0157470703125, -4.82696533203125, -4.63818359375, -4.44940185546875, -4.2606201171875, -4.07183837890625, -3.883056640625, -3.69427490234375, -3.5054931640625, -3.31671142578125, -3.1279296875, -2.93914794921875, -2.7503662109375, -2.56158447265625, -2.372802734375, -2.18402099609375, -1.9952392578125, -1.80645751953125, -1.61767578125, -1.42889404296875, -1.2401123046875, -1.05133056640625, -0.862548828125, -0.67376708984375, -0.4849853515625, -0.29620361328125, -0.107421875, 0.08135986328125, 0.2701416015625, 0.45892333984375, 0.647705078125, 0.83648681640625, 1.0252685546875, 1.21405029296875, 1.40283203125, 1.59161376953125, 1.7803955078125, 1.96917724609375, 2.157958984375, 2.34674072265625, 2.5355224609375, 2.72430419921875, 2.9130859375, 3.10186767578125, 3.2906494140625, 3.47943115234375, 3.668212890625, 3.85699462890625, 4.0457763671875, 4.23455810546875, 4.42333984375, 4.61212158203125, 4.8009033203125, 4.98968505859375, 5.178466796875, 5.36724853515625, 5.5560302734375, 5.74481201171875, 5.93359375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 8.0, 3.0, 5.0, 3.0, 12.0, 10.0, 16.0, 25.0, 24.0, 23.0, 30.0, 38.0, 37.0, 39.0, 40.0, 63.0, 94.0, 185.0, 1440.0, 354.0, 149.0, 82.0, 47.0, 40.0, 40.0, 42.0, 40.0, 33.0, 23.0, 19.0, 20.0, 15.0, 7.0, 9.0, 12.0, 6.0, 5.0, 8.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8125, -15.315185546875, -14.81787109375, -14.320556640625, -13.8232421875, -13.325927734375, -12.82861328125, -12.331298828125, -11.833984375, -11.336669921875, -10.83935546875, -10.342041015625, -9.8447265625, -9.347412109375, -8.85009765625, -8.352783203125, -7.85546875, -7.358154296875, -6.86083984375, -6.363525390625, -5.8662109375, -5.368896484375, -4.87158203125, -4.374267578125, -3.876953125, -3.379638671875, -2.88232421875, -2.385009765625, -1.8876953125, -1.390380859375, -0.89306640625, -0.395751953125, 0.1015625, 0.598876953125, 1.09619140625, 1.593505859375, 2.0908203125, 2.588134765625, 3.08544921875, 3.582763671875, 4.080078125, 4.577392578125, 5.07470703125, 5.572021484375, 6.0693359375, 6.566650390625, 7.06396484375, 7.561279296875, 8.05859375, 8.555908203125, 9.05322265625, 9.550537109375, 10.0478515625, 10.545166015625, 11.04248046875, 11.539794921875, 12.037109375, 12.534423828125, 13.03173828125, 13.529052734375, 14.0263671875, 14.523681640625, 15.02099609375, 15.518310546875, 16.015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 10.0, 16.0, 10.0, 18.0, 24.0, 21.0, 42.0, 51.0, 59.0, 80.0, 140.0, 175.0, 291.0, 424.0, 821.0, 3620.0, 76529.0, 2807404.0, 245559.0, 7814.0, 1091.0, 485.0, 313.0, 167.0, 158.0, 94.0, 82.0, 59.0, 36.0, 26.0, 16.0, 15.0, 6.0, 10.0, 4.0, 16.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.828125, -21.138427734375, -20.44873046875, -19.759033203125, -19.0693359375, -18.379638671875, -17.68994140625, -17.000244140625, -16.310546875, -15.620849609375, -14.93115234375, -14.241455078125, -13.5517578125, -12.862060546875, -12.17236328125, -11.482666015625, -10.79296875, -10.103271484375, -9.41357421875, -8.723876953125, -8.0341796875, -7.344482421875, -6.65478515625, -5.965087890625, -5.275390625, -4.585693359375, -3.89599609375, -3.206298828125, -2.5166015625, -1.826904296875, -1.13720703125, -0.447509765625, 0.2421875, 0.931884765625, 1.62158203125, 2.311279296875, 3.0009765625, 3.690673828125, 4.38037109375, 5.070068359375, 5.759765625, 6.449462890625, 7.13916015625, 7.828857421875, 8.5185546875, 9.208251953125, 9.89794921875, 10.587646484375, 11.27734375, 11.967041015625, 12.65673828125, 13.346435546875, 14.0361328125, 14.725830078125, 15.41552734375, 16.105224609375, 16.794921875, 17.484619140625, 18.17431640625, 18.864013671875, 19.5537109375, 20.243408203125, 20.93310546875, 21.622802734375, 22.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 450.0, 555.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-298.1723937988281, -292.32733154296875, -286.48223876953125, -280.6371765136719, -274.7921142578125, -268.947021484375, -263.1019592285156, -257.2568664550781, -251.41180419921875, -245.5667266845703, -239.72164916992188, -233.8765869140625, -228.03150939941406, -222.18643188476562, -216.34136962890625, -210.4962921142578, -204.65121459960938, -198.80613708496094, -192.9610595703125, -187.11599731445312, -181.2709197998047, -175.42584228515625, -169.58078002929688, -163.73570251464844, -157.890625, -152.04554748535156, -146.20046997070312, -140.35540771484375, -134.5103302001953, -128.66525268554688, -122.82018280029297, -116.97511291503906, -111.1300277709961, -105.28495788574219, -99.43988037109375, -93.59480285644531, -87.7497329711914, -81.9046630859375, -76.05958557128906, -70.21450805664062, -64.36943817138672, -58.52436447143555, -52.679290771484375, -46.8342170715332, -40.98914337158203, -35.14406967163086, -29.298995971679688, -23.453922271728516, -17.608848571777344, -11.763774871826172, -5.918701171875, -0.07362747192382812, 5.771446228027344, 11.616519927978516, 17.461593627929688, 23.30666732788086, 29.15174102783203, 34.9968147277832, 40.841888427734375, 46.68696212768555, 52.53203582763672, 58.37710952758789, 64.22218322753906, 70.0672607421875, 75.9123306274414]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 13.0, 7.0, 7.0, 10.0, 17.0, 14.0, 21.0, 19.0, 25.0, 22.0, 19.0, 29.0, 25.0, 37.0, 36.0, 43.0, 33.0, 46.0, 40.0, 53.0, 37.0, 37.0, 36.0, 40.0, 39.0, 29.0, 38.0, 36.0, 17.0, 33.0, 19.0, 19.0, 25.0, 8.0, 18.0, 15.0, 7.0, 8.0, 7.0, 3.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.2372989654541, -28.192447662353516, -27.14759635925293, -26.102745056152344, -25.057891845703125, -24.013042449951172, -22.968189239501953, -21.923337936401367, -20.87848663330078, -19.833635330200195, -18.78878402709961, -17.743932723999023, -16.699081420898438, -15.654229164123535, -14.609376907348633, -13.564525604248047, -12.519674301147461, -11.474822998046875, -10.429971694946289, -9.385119438171387, -8.3402681350708, -7.295416831970215, -6.250565052032471, -5.205713272094727, -4.160861968994141, -3.1160104274749756, -2.0711588859558105, -1.0263073444366455, 0.01854419708251953, 1.0633955001831055, 2.1082472801208496, 3.1530990600585938, 4.197948455810547, 5.242799758911133, 6.287651538848877, 7.332503318786621, 8.377354621887207, 9.422205924987793, 10.467058181762695, 11.511909484863281, 12.556760787963867, 13.601612091064453, 14.646463394165039, 15.691315650939941, 16.736167907714844, 17.781017303466797, 18.825870513916016, 19.8707218170166, 20.915573120117188, 21.960424423217773, 23.00527572631836, 24.050127029418945, 25.09497833251953, 26.13983154296875, 27.184682846069336, 28.229534149169922, 29.274385452270508, 30.319236755371094, 31.36408805847168, 32.408939361572266, 33.453792572021484, 34.49864196777344, 35.543495178222656, 36.588348388671875, 37.63319778442383]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 9.0, 6.0, 5.0, 6.0, 19.0, 11.0, 22.0, 31.0, 28.0, 27.0, 41.0, 47.0, 32.0, 39.0, 50.0, 34.0, 52.0, 46.0, 47.0, 48.0, 38.0, 43.0, 37.0, 24.0, 23.0, 40.0, 32.0, 26.0, 19.0, 22.0, 18.0, 20.0, 11.0, 6.0, 9.0, 4.0, 4.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0, -5.82373046875, -5.6474609375, -5.47119140625, -5.294921875, -5.11865234375, -4.9423828125, -4.76611328125, -4.58984375, -4.41357421875, -4.2373046875, -4.06103515625, -3.884765625, -3.70849609375, -3.5322265625, -3.35595703125, -3.1796875, -3.00341796875, -2.8271484375, -2.65087890625, -2.474609375, -2.29833984375, -2.1220703125, -1.94580078125, -1.76953125, -1.59326171875, -1.4169921875, -1.24072265625, -1.064453125, -0.88818359375, -0.7119140625, -0.53564453125, -0.359375, -0.18310546875, -0.0068359375, 0.16943359375, 0.345703125, 0.52197265625, 0.6982421875, 0.87451171875, 1.05078125, 1.22705078125, 1.4033203125, 1.57958984375, 1.755859375, 1.93212890625, 2.1083984375, 2.28466796875, 2.4609375, 2.63720703125, 2.8134765625, 2.98974609375, 3.166015625, 3.34228515625, 3.5185546875, 3.69482421875, 3.87109375, 4.04736328125, 4.2236328125, 4.39990234375, 4.576171875, 4.75244140625, 4.9287109375, 5.10498046875, 5.28125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 7.0, 7.0, 8.0, 14.0, 13.0, 20.0, 23.0, 28.0, 42.0, 80.0, 121.0, 165.0, 320.0, 546.0, 1086.0, 2170.0, 5333.0, 14209.0, 45197.0, 161318.0, 546158.0, 1367435.0, 1337546.0, 507188.0, 142168.0, 40470.0, 13141.0, 4903.0, 2160.0, 1015.0, 543.0, 304.0, 183.0, 97.0, 67.0, 54.0, 31.0, 26.0, 16.0, 18.0, 8.0, 12.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.46875, -5.3028564453125, -5.136962890625, -4.9710693359375, -4.80517578125, -4.6392822265625, -4.473388671875, -4.3074951171875, -4.1416015625, -3.9757080078125, -3.809814453125, -3.6439208984375, -3.47802734375, -3.3121337890625, -3.146240234375, -2.9803466796875, -2.814453125, -2.6485595703125, -2.482666015625, -2.3167724609375, -2.15087890625, -1.9849853515625, -1.819091796875, -1.6531982421875, -1.4873046875, -1.3214111328125, -1.155517578125, -0.9896240234375, -0.82373046875, -0.6578369140625, -0.491943359375, -0.3260498046875, -0.16015625, 0.0057373046875, 0.171630859375, 0.3375244140625, 0.50341796875, 0.6693115234375, 0.835205078125, 1.0010986328125, 1.1669921875, 1.3328857421875, 1.498779296875, 1.6646728515625, 1.83056640625, 1.9964599609375, 2.162353515625, 2.3282470703125, 2.494140625, 2.6600341796875, 2.825927734375, 2.9918212890625, 3.15771484375, 3.3236083984375, 3.489501953125, 3.6553955078125, 3.8212890625, 3.9871826171875, 4.153076171875, 4.3189697265625, 4.48486328125, 4.6507568359375, 4.816650390625, 4.9825439453125, 5.1484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 8.0, 4.0, 4.0, 7.0, 13.0, 18.0, 19.0, 22.0, 24.0, 32.0, 55.0, 68.0, 102.0, 121.0, 171.0, 212.0, 294.0, 368.0, 434.0, 460.0, 377.0, 358.0, 216.0, 174.0, 120.0, 93.0, 77.0, 50.0, 38.0, 32.0, 26.0, 18.0, 12.0, 12.0, 7.0, 6.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.390625, -7.18597412109375, -6.9813232421875, -6.77667236328125, -6.572021484375, -6.36737060546875, -6.1627197265625, -5.95806884765625, -5.75341796875, -5.54876708984375, -5.3441162109375, -5.13946533203125, -4.934814453125, -4.73016357421875, -4.5255126953125, -4.32086181640625, -4.1162109375, -3.91156005859375, -3.7069091796875, -3.50225830078125, -3.297607421875, -3.09295654296875, -2.8883056640625, -2.68365478515625, -2.47900390625, -2.27435302734375, -2.0697021484375, -1.86505126953125, -1.660400390625, -1.45574951171875, -1.2510986328125, -1.04644775390625, -0.841796875, -0.63714599609375, -0.4324951171875, -0.22784423828125, -0.023193359375, 0.18145751953125, 0.3861083984375, 0.59075927734375, 0.79541015625, 1.00006103515625, 1.2047119140625, 1.40936279296875, 1.614013671875, 1.81866455078125, 2.0233154296875, 2.22796630859375, 2.4326171875, 2.63726806640625, 2.8419189453125, 3.04656982421875, 3.251220703125, 3.45587158203125, 3.6605224609375, 3.86517333984375, 4.06982421875, 4.27447509765625, 4.4791259765625, 4.68377685546875, 4.888427734375, 5.09307861328125, 5.2977294921875, 5.50238037109375, 5.70703125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 5.0, 11.0, 9.0, 18.0, 18.0, 32.0, 34.0, 49.0, 63.0, 102.0, 150.0, 260.0, 525.0, 1061.0, 2850.0, 8786.0, 33567.0, 157382.0, 1066187.0, 2408479.0, 414665.0, 73641.0, 17826.0, 5004.0, 1767.0, 748.0, 344.0, 207.0, 142.0, 89.0, 59.0, 51.0, 42.0, 24.0, 26.0, 9.0, 21.0, 13.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.34375, -9.044921875, -8.74609375, -8.447265625, -8.1484375, -7.849609375, -7.55078125, -7.251953125, -6.953125, -6.654296875, -6.35546875, -6.056640625, -5.7578125, -5.458984375, -5.16015625, -4.861328125, -4.5625, -4.263671875, -3.96484375, -3.666015625, -3.3671875, -3.068359375, -2.76953125, -2.470703125, -2.171875, -1.873046875, -1.57421875, -1.275390625, -0.9765625, -0.677734375, -0.37890625, -0.080078125, 0.21875, 0.517578125, 0.81640625, 1.115234375, 1.4140625, 1.712890625, 2.01171875, 2.310546875, 2.609375, 2.908203125, 3.20703125, 3.505859375, 3.8046875, 4.103515625, 4.40234375, 4.701171875, 5.0, 5.298828125, 5.59765625, 5.896484375, 6.1953125, 6.494140625, 6.79296875, 7.091796875, 7.390625, 7.689453125, 7.98828125, 8.287109375, 8.5859375, 8.884765625, 9.18359375, 9.482421875, 9.78125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 22.0, 47.0, 97.0, 150.0, 175.0, 176.0, 140.0, 98.0, 64.0, 21.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.483957290649414, -21.083271026611328, -19.68258285522461, -18.281896591186523, -16.881210327148438, -15.480523109436035, -14.079835891723633, -12.679149627685547, -11.278462409973145, -9.877775192260742, -8.477088928222656, -7.076401710510254, -5.67571496963501, -4.275028228759766, -2.8743410110473633, -1.4736547470092773, -0.072967529296875, 1.3277193307876587, 2.7284061908721924, 4.129093170166016, 5.52977991104126, 6.930466651916504, 8.331153869628906, 9.731840133666992, 11.132527351379395, 12.533214569091797, 13.933900833129883, 15.334588050842285, 16.735275268554688, 18.135961532592773, 19.53664779663086, 20.937335968017578, 22.338024139404297, 23.738710403442383, 25.1393985748291, 26.540084838867188, 27.940771102905273, 29.34145736694336, 30.742145538330078, 32.14282989501953, 33.54351806640625, 34.94420623779297, 36.34489059448242, 37.74557876586914, 39.14626693725586, 40.54695129394531, 41.94763946533203, 43.34832763671875, 44.74901580810547, 46.14970397949219, 47.55038833618164, 48.95107650756836, 50.35176467895508, 51.75244903564453, 53.15313720703125, 54.55382537841797, 55.95450973510742, 57.35519790649414, 58.755882263183594, 60.15657043457031, 61.55725860595703, 62.957942962646484, 64.35862731933594, 65.75931549072266, 67.16000366210938]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 3.0, 3.0, 7.0, 13.0, 8.0, 7.0, 22.0, 10.0, 20.0, 31.0, 27.0, 32.0, 29.0, 44.0, 35.0, 32.0, 35.0, 45.0, 39.0, 40.0, 54.0, 47.0, 51.0, 30.0, 40.0, 43.0, 39.0, 29.0, 29.0, 26.0, 21.0, 21.0, 20.0, 22.0, 11.0, 4.0, 10.0, 6.0, 4.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.14306640625, -23.337657928466797, -22.532249450683594, -21.72684097290039, -20.921430587768555, -20.11602210998535, -19.31061363220215, -18.505205154418945, -17.699796676635742, -16.89438819885254, -16.088979721069336, -15.283570289611816, -14.478161811828613, -13.672752380371094, -12.86734390258789, -12.061935424804688, -11.256525993347168, -10.451117515563965, -9.645708084106445, -8.840299606323242, -8.034891128540039, -7.229482173919678, -6.424073219299316, -5.618664741516113, -4.813255786895752, -4.007846832275391, -3.2024383544921875, -2.397029399871826, -1.591620683670044, -0.7862119674682617, 0.01919698715209961, 0.8246054649353027, 1.630014419555664, 2.4354231357574463, 3.2408318519592285, 4.04624080657959, 4.851649284362793, 5.657058238983154, 6.462467193603516, 7.267875671386719, 8.073284149169922, 8.878692626953125, 9.684102058410645, 10.489510536193848, 11.29491901397705, 12.10032844543457, 12.905736923217773, 13.711145401000977, 14.516554832458496, 15.3219633102417, 16.12737274169922, 16.932781219482422, 17.738189697265625, 18.543598175048828, 19.34900665283203, 20.154415130615234, 20.95982551574707, 21.765233993530273, 22.570642471313477, 23.376052856445312, 24.181461334228516, 24.98686981201172, 25.792278289794922, 26.597686767578125, 27.403095245361328]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 7.0, 6.0, 12.0, 15.0, 13.0, 10.0, 24.0, 41.0, 22.0, 26.0, 29.0, 45.0, 43.0, 28.0, 43.0, 41.0, 43.0, 44.0, 41.0, 40.0, 52.0, 44.0, 34.0, 35.0, 25.0, 30.0, 23.0, 28.0, 22.0, 27.0, 22.0, 22.0, 6.0, 8.0, 5.0, 3.0, 5.0, 8.0, 5.0, 0.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4453125, -5.2796630859375, -5.114013671875, -4.9483642578125, -4.78271484375, -4.6170654296875, -4.451416015625, -4.2857666015625, -4.1201171875, -3.9544677734375, -3.788818359375, -3.6231689453125, -3.45751953125, -3.2918701171875, -3.126220703125, -2.9605712890625, -2.794921875, -2.6292724609375, -2.463623046875, -2.2979736328125, -2.13232421875, -1.9666748046875, -1.801025390625, -1.6353759765625, -1.4697265625, -1.3040771484375, -1.138427734375, -0.9727783203125, -0.80712890625, -0.6414794921875, -0.475830078125, -0.3101806640625, -0.14453125, 0.0211181640625, 0.186767578125, 0.3524169921875, 0.51806640625, 0.6837158203125, 0.849365234375, 1.0150146484375, 1.1806640625, 1.3463134765625, 1.511962890625, 1.6776123046875, 1.84326171875, 2.0089111328125, 2.174560546875, 2.3402099609375, 2.505859375, 2.6715087890625, 2.837158203125, 3.0028076171875, 3.16845703125, 3.3341064453125, 3.499755859375, 3.6654052734375, 3.8310546875, 3.9967041015625, 4.162353515625, 4.3280029296875, 4.49365234375, 4.6593017578125, 4.824951171875, 4.9906005859375, 5.15625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 12.0, 17.0, 30.0, 44.0, 82.0, 92.0, 153.0, 198.0, 253.0, 415.0, 595.0, 834.0, 1262.0, 1845.0, 2717.0, 4155.0, 6419.0, 10109.0, 15758.0, 25307.0, 41876.0, 67661.0, 109760.0, 164801.0, 192905.0, 148457.0, 96006.0, 58628.0, 36178.0, 22049.0, 13788.0, 8770.0, 5822.0, 3793.0, 2409.0, 1703.0, 1165.0, 792.0, 514.0, 346.0, 270.0, 196.0, 125.0, 77.0, 52.0, 36.0, 18.0, 16.0, 21.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.464599609375, -0.4502410888671875, -0.435882568359375, -0.4215240478515625, -0.40716552734375, -0.3928070068359375, -0.378448486328125, -0.3640899658203125, -0.3497314453125, -0.3353729248046875, -0.321014404296875, -0.3066558837890625, -0.29229736328125, -0.2779388427734375, -0.263580322265625, -0.2492218017578125, -0.23486328125, -0.2205047607421875, -0.206146240234375, -0.1917877197265625, -0.17742919921875, -0.1630706787109375, -0.148712158203125, -0.1343536376953125, -0.1199951171875, -0.1056365966796875, -0.091278076171875, -0.0769195556640625, -0.06256103515625, -0.0482025146484375, -0.033843994140625, -0.0194854736328125, -0.005126953125, 0.0092315673828125, 0.023590087890625, 0.0379486083984375, 0.05230712890625, 0.0666656494140625, 0.081024169921875, 0.0953826904296875, 0.1097412109375, 0.1240997314453125, 0.138458251953125, 0.1528167724609375, 0.16717529296875, 0.1815338134765625, 0.195892333984375, 0.2102508544921875, 0.224609375, 0.2389678955078125, 0.253326416015625, 0.2676849365234375, 0.28204345703125, 0.2964019775390625, 0.310760498046875, 0.3251190185546875, 0.3394775390625, 0.3538360595703125, 0.368194580078125, 0.3825531005859375, 0.39691162109375, 0.4112701416015625, 0.425628662109375, 0.4399871826171875, 0.454345703125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 7.0, 14.0, 12.0, 19.0, 12.0, 16.0, 22.0, 22.0, 32.0, 43.0, 42.0, 34.0, 29.0, 53.0, 52.0, 38.0, 1059.0, 45.0, 43.0, 36.0, 44.0, 36.0, 49.0, 27.0, 30.0, 36.0, 25.0, 22.0, 19.0, 14.0, 20.0, 10.0, 10.0, 7.0, 8.0, 5.0, 5.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.34765625, -3.23602294921875, -3.1243896484375, -3.01275634765625, -2.901123046875, -2.78948974609375, -2.6778564453125, -2.56622314453125, -2.45458984375, -2.34295654296875, -2.2313232421875, -2.11968994140625, -2.008056640625, -1.89642333984375, -1.7847900390625, -1.67315673828125, -1.5615234375, -1.44989013671875, -1.3382568359375, -1.22662353515625, -1.114990234375, -1.00335693359375, -0.8917236328125, -0.78009033203125, -0.66845703125, -0.55682373046875, -0.4451904296875, -0.33355712890625, -0.221923828125, -0.11029052734375, 0.0013427734375, 0.11297607421875, 0.224609375, 0.33624267578125, 0.4478759765625, 0.55950927734375, 0.671142578125, 0.78277587890625, 0.8944091796875, 1.00604248046875, 1.11767578125, 1.22930908203125, 1.3409423828125, 1.45257568359375, 1.564208984375, 1.67584228515625, 1.7874755859375, 1.89910888671875, 2.0107421875, 2.12237548828125, 2.2340087890625, 2.34564208984375, 2.457275390625, 2.56890869140625, 2.6805419921875, 2.79217529296875, 2.90380859375, 3.01544189453125, 3.1270751953125, 3.23870849609375, 3.350341796875, 3.46197509765625, 3.5736083984375, 3.68524169921875, 3.796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 5.0, 5.0, 11.0, 20.0, 39.0, 49.0, 90.0, 125.0, 167.0, 272.0, 367.0, 528.0, 775.0, 1109.0, 1614.0, 2397.0, 3528.0, 5231.0, 7978.0, 11929.0, 17874.0, 26136.0, 39201.0, 58110.0, 83427.0, 114928.0, 370263.0, 966440.0, 117183.0, 85076.0, 59572.0, 40443.0, 27327.0, 18127.0, 12000.0, 8014.0, 5386.0, 3719.0, 2483.0, 1572.0, 1113.0, 776.0, 562.0, 400.0, 260.0, 152.0, 117.0, 90.0, 49.0, 39.0, 19.0, 16.0, 13.0, 5.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.308837890625, -0.2994880676269531, -0.29013824462890625, -0.2807884216308594, -0.2714385986328125, -0.2620887756347656, -0.25273895263671875, -0.24338912963867188, -0.234039306640625, -0.22468948364257812, -0.21533966064453125, -0.20598983764648438, -0.1966400146484375, -0.18729019165039062, -0.17794036865234375, -0.16859054565429688, -0.15924072265625, -0.14989089965820312, -0.14054107666015625, -0.13119125366210938, -0.1218414306640625, -0.11249160766601562, -0.10314178466796875, -0.09379196166992188, -0.084442138671875, -0.07509231567382812, -0.06574249267578125, -0.056392669677734375, -0.0470428466796875, -0.037693023681640625, -0.02834320068359375, -0.018993377685546875, -0.0096435546875, -0.000293731689453125, 0.00905609130859375, 0.018405914306640625, 0.0277557373046875, 0.037105560302734375, 0.04645538330078125, 0.055805206298828125, 0.065155029296875, 0.07450485229492188, 0.08385467529296875, 0.09320449829101562, 0.1025543212890625, 0.11190414428710938, 0.12125396728515625, 0.13060379028320312, 0.13995361328125, 0.14930343627929688, 0.15865325927734375, 0.16800308227539062, 0.1773529052734375, 0.18670272827148438, 0.19605255126953125, 0.20540237426757812, 0.214752197265625, 0.22410202026367188, 0.23345184326171875, 0.24280166625976562, 0.2521514892578125, 0.2615013122558594, 0.27085113525390625, 0.2802009582519531, 0.28955078125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 5.0, 3.0, 10.0, 6.0, 14.0, 18.0, 20.0, 25.0, 34.0, 61.0, 66.0, 83.0, 104.0, 99.0, 97.0, 92.0, 76.0, 41.0, 36.0, 35.0, 16.0, 13.0, 11.0, 9.0, 9.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.005168914794921875, -0.005014479160308838, -0.004860043525695801, -0.004705607891082764, -0.0045511722564697266, -0.0043967366218566895, -0.004242300987243652, -0.004087865352630615, -0.003933429718017578, -0.003778994083404541, -0.003624558448791504, -0.003470122814178467, -0.0033156871795654297, -0.0031612515449523926, -0.0030068159103393555, -0.0028523802757263184, -0.0026979446411132812, -0.002543509006500244, -0.002389073371887207, -0.00223463773727417, -0.002080202102661133, -0.0019257664680480957, -0.0017713308334350586, -0.0016168951988220215, -0.0014624595642089844, -0.0013080239295959473, -0.0011535882949829102, -0.000999152660369873, -0.0008447170257568359, -0.0006902813911437988, -0.0005358457565307617, -0.0003814101219177246, -0.0002269744873046875, -7.253885269165039e-05, 8.189678192138672e-05, 0.00023633241653442383, 0.00039076805114746094, 0.000545203685760498, 0.0006996393203735352, 0.0008540749549865723, 0.0010085105895996094, 0.0011629462242126465, 0.0013173818588256836, 0.0014718174934387207, 0.0016262531280517578, 0.001780688762664795, 0.001935124397277832, 0.002089560031890869, 0.0022439956665039062, 0.0023984313011169434, 0.0025528669357299805, 0.0027073025703430176, 0.0028617382049560547, 0.003016173839569092, 0.003170609474182129, 0.003325045108795166, 0.003479480743408203, 0.0036339163780212402, 0.0037883520126342773, 0.0039427876472473145, 0.0040972232818603516, 0.004251658916473389, 0.004406094551086426, 0.004560530185699463, 0.0047149658203125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 3.0, 4.0, 12.0, 13.0, 20.0, 32.0, 39.0, 59.0, 95.0, 132.0, 228.0, 506.0, 4306.0, 991960.0, 49394.0, 889.0, 303.0, 195.0, 90.0, 65.0, 56.0, 30.0, 30.0, 17.0, 12.0, 11.0, 8.0, 5.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0928955078125, -0.08987140655517578, -0.08684730529785156, -0.08382320404052734, -0.08079910278320312, -0.0777750015258789, -0.07475090026855469, -0.07172679901123047, -0.06870269775390625, -0.06567859649658203, -0.06265449523925781, -0.059630393981933594, -0.056606292724609375, -0.053582191467285156, -0.05055809020996094, -0.04753398895263672, -0.0445098876953125, -0.04148578643798828, -0.03846168518066406, -0.035437583923339844, -0.032413482666015625, -0.029389381408691406, -0.026365280151367188, -0.02334117889404297, -0.02031707763671875, -0.01729297637939453, -0.014268875122070312, -0.011244773864746094, -0.008220672607421875, -0.005196571350097656, -0.0021724700927734375, 0.0008516311645507812, 0.003875732421875, 0.006899833679199219, 0.009923934936523438, 0.012948036193847656, 0.015972137451171875, 0.018996238708496094, 0.022020339965820312, 0.02504444122314453, 0.02806854248046875, 0.03109264373779297, 0.03411674499511719, 0.037140846252441406, 0.040164947509765625, 0.043189048767089844, 0.04621315002441406, 0.04923725128173828, 0.0522613525390625, 0.05528545379638672, 0.05830955505371094, 0.061333656311035156, 0.06435775756835938, 0.0673818588256836, 0.07040596008300781, 0.07343006134033203, 0.07645416259765625, 0.07947826385498047, 0.08250236511230469, 0.0855264663696289, 0.08855056762695312, 0.09157466888427734, 0.09459877014160156, 0.09762287139892578, 0.10064697265625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 202.0, 775.0, 34.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053008273243904114, -0.05195494741201401, -0.0509016178548336, -0.0498482920229435, -0.04879496246576309, -0.047741636633872986, -0.04668830707669258, -0.045634981244802475, -0.04458165168762207, -0.043528325855731964, -0.04247499629855156, -0.04142167046666145, -0.04036834090948105, -0.03931501507759094, -0.03826168552041054, -0.03720835968852043, -0.03615503013134003, -0.03510170429944992, -0.034048374742269516, -0.03299504891037941, -0.031941719353199005, -0.03088839165866375, -0.029835063964128494, -0.028781738132238388, -0.027728412300348282, -0.026675084605813026, -0.02562175691127777, -0.024568429216742516, -0.02351510152220726, -0.022461773827672005, -0.02140844613313675, -0.020355120301246643, -0.01930179074406624, -0.018248463049530983, -0.017195135354995728, -0.016141807660460472, -0.015088479965925217, -0.014035152271389961, -0.01298182550817728, -0.011928497813642025, -0.01087517011910677, -0.009821842424571514, -0.008768514730036259, -0.007715187501162291, -0.006661859806627035, -0.00560853211209178, -0.004555204883217812, -0.003501877188682556, -0.0024485494941473007, -0.0013952219160273671, -0.0003418943379074335, 0.0007114331237971783, 0.0017647608183324337, 0.002818088512867689, 0.0038714157417416573, 0.004924743436276913, 0.005978071130812168, 0.0070313988253474236, 0.008084726519882679, 0.00913805328309536, 0.010191380977630615, 0.01124470867216587, 0.012298036366701126, 0.013351364061236382, 0.014404691755771637]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 9.0, 16.0, 23.0, 27.0, 29.0, 28.0, 34.0, 42.0, 54.0, 62.0, 66.0, 56.0, 61.0, 76.0, 68.0, 59.0, 58.0, 26.0, 37.0, 30.0, 31.0, 22.0, 22.0, 19.0, 11.0, 8.0, 8.0, 3.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002965986728668213, -0.002864253707230091, -0.0027625206857919693, -0.0026607876643538475, -0.0025590546429157257, -0.002457321621477604, -0.002355588600039482, -0.0022538555786013603, -0.0021521225571632385, -0.0020503895357251167, -0.001948656514286995, -0.0018469234928488731, -0.0017451904714107513, -0.0016434574499726295, -0.0015417244285345078, -0.001439991407096386, -0.0013382583856582642, -0.0012365253642201424, -0.0011347923427820206, -0.0010330593213438988, -0.000931326299905777, -0.0008295932784676552, -0.0007278602570295334, -0.0006261272355914116, -0.0005243942141532898, -0.000422661192715168, -0.0003209281712770462, -0.0002191951498389244, -0.00011746212840080261, -1.5729106962680817e-05, 8.600391447544098e-05, 0.00018773693591356277, 0.00028946995735168457, 0.00039120297878980637, 0.0004929360002279282, 0.00059466902166605, 0.0006964020431041718, 0.0007981350645422935, 0.0008998680859804153, 0.0010016011074185371, 0.001103334128856659, 0.0012050671502947807, 0.0013068001717329025, 0.0014085331931710243, 0.0015102662146091461, 0.001611999236047268, 0.0017137322574853897, 0.0018154652789235115, 0.0019171983003616333, 0.002018931321799755, 0.002120664343237877, 0.0022223973646759987, 0.0023241303861141205, 0.0024258634075522423, 0.002527596428990364, 0.002629329450428486, 0.0027310624718666077, 0.0028327954933047295, 0.0029345285147428513, 0.003036261536180973, 0.003137994557619095, 0.0032397275790572166, 0.0033414606004953384, 0.0034431936219334602, 0.003544926643371582]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 7.0, 6.0, 12.0, 15.0, 13.0, 10.0, 24.0, 41.0, 22.0, 26.0, 29.0, 45.0, 43.0, 28.0, 43.0, 41.0, 43.0, 45.0, 40.0, 40.0, 52.0, 44.0, 34.0, 35.0, 25.0, 30.0, 23.0, 28.0, 22.0, 27.0, 22.0, 22.0, 6.0, 8.0, 5.0, 3.0, 5.0, 8.0, 5.0, 0.0, 5.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4453125, -5.2796630859375, -5.114013671875, -4.9483642578125, -4.78271484375, -4.6170654296875, -4.451416015625, -4.2857666015625, -4.1201171875, -3.9544677734375, -3.788818359375, -3.6231689453125, -3.45751953125, -3.2918701171875, -3.126220703125, -2.9605712890625, -2.794921875, -2.6292724609375, -2.463623046875, -2.2979736328125, -2.13232421875, -1.9666748046875, -1.801025390625, -1.6353759765625, -1.4697265625, -1.3040771484375, -1.138427734375, -0.9727783203125, -0.80712890625, -0.6414794921875, -0.475830078125, -0.3101806640625, -0.14453125, 0.0211181640625, 0.186767578125, 0.3524169921875, 0.51806640625, 0.6837158203125, 0.849365234375, 1.0150146484375, 1.1806640625, 1.3463134765625, 1.511962890625, 1.6776123046875, 1.84326171875, 2.0089111328125, 2.174560546875, 2.3402099609375, 2.505859375, 2.6715087890625, 2.837158203125, 3.0028076171875, 3.16845703125, 3.3341064453125, 3.499755859375, 3.6654052734375, 3.8310546875, 3.9967041015625, 4.162353515625, 4.3280029296875, 4.49365234375, 4.6593017578125, 4.824951171875, 4.9906005859375, 5.15625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 5.0, 6.0, 11.0, 14.0, 15.0, 23.0, 38.0, 47.0, 75.0, 77.0, 131.0, 151.0, 200.0, 299.0, 479.0, 788.0, 1453.0, 3274.0, 8122.0, 24166.0, 72535.0, 220896.0, 425893.0, 191663.0, 63438.0, 21142.0, 7160.0, 2808.0, 1350.0, 737.0, 464.0, 286.0, 228.0, 145.0, 98.0, 84.0, 66.0, 52.0, 29.0, 26.0, 22.0, 11.0, 14.0, 9.0, 8.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0], "bins": [-7.5390625, -7.3135986328125, -7.088134765625, -6.8626708984375, -6.63720703125, -6.4117431640625, -6.186279296875, -5.9608154296875, -5.7353515625, -5.5098876953125, -5.284423828125, -5.0589599609375, -4.83349609375, -4.6080322265625, -4.382568359375, -4.1571044921875, -3.931640625, -3.7061767578125, -3.480712890625, -3.2552490234375, -3.02978515625, -2.8043212890625, -2.578857421875, -2.3533935546875, -2.1279296875, -1.9024658203125, -1.677001953125, -1.4515380859375, -1.22607421875, -1.0006103515625, -0.775146484375, -0.5496826171875, -0.32421875, -0.0987548828125, 0.126708984375, 0.3521728515625, 0.57763671875, 0.8031005859375, 1.028564453125, 1.2540283203125, 1.4794921875, 1.7049560546875, 1.930419921875, 2.1558837890625, 2.38134765625, 2.6068115234375, 2.832275390625, 3.0577392578125, 3.283203125, 3.5086669921875, 3.734130859375, 3.9595947265625, 4.18505859375, 4.4105224609375, 4.635986328125, 4.8614501953125, 5.0869140625, 5.3123779296875, 5.537841796875, 5.7633056640625, 5.98876953125, 6.2142333984375, 6.439697265625, 6.6651611328125, 6.890625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 6.0, 2.0, 11.0, 8.0, 11.0, 16.0, 23.0, 27.0, 32.0, 28.0, 33.0, 44.0, 48.0, 57.0, 73.0, 104.0, 150.0, 276.0, 1383.0, 174.0, 119.0, 64.0, 57.0, 44.0, 41.0, 30.0, 32.0, 24.0, 24.0, 32.0, 11.0, 14.0, 14.0, 10.0, 9.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.3157958984375, -12.858154296875, -12.4005126953125, -11.94287109375, -11.4852294921875, -11.027587890625, -10.5699462890625, -10.1123046875, -9.6546630859375, -9.197021484375, -8.7393798828125, -8.28173828125, -7.8240966796875, -7.366455078125, -6.9088134765625, -6.451171875, -5.9935302734375, -5.535888671875, -5.0782470703125, -4.62060546875, -4.1629638671875, -3.705322265625, -3.2476806640625, -2.7900390625, -2.3323974609375, -1.874755859375, -1.4171142578125, -0.95947265625, -0.5018310546875, -0.044189453125, 0.4134521484375, 0.87109375, 1.3287353515625, 1.786376953125, 2.2440185546875, 2.70166015625, 3.1593017578125, 3.616943359375, 4.0745849609375, 4.5322265625, 4.9898681640625, 5.447509765625, 5.9051513671875, 6.36279296875, 6.8204345703125, 7.278076171875, 7.7357177734375, 8.193359375, 8.6510009765625, 9.108642578125, 9.5662841796875, 10.02392578125, 10.4815673828125, 10.939208984375, 11.3968505859375, 11.8544921875, 12.3121337890625, 12.769775390625, 13.2274169921875, 13.68505859375, 14.1427001953125, 14.600341796875, 15.0579833984375, 15.515625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 1.0, 6.0, 8.0, 5.0, 20.0, 21.0, 17.0, 37.0, 44.0, 51.0, 84.0, 100.0, 167.0, 260.0, 374.0, 682.0, 1721.0, 23032.0, 2649683.0, 459673.0, 6984.0, 1085.0, 561.0, 316.0, 200.0, 164.0, 112.0, 74.0, 48.0, 55.0, 35.0, 15.0, 19.0, 19.0, 10.0, 9.0, 4.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -28.2734375, -27.4375, -26.6015625, -25.765625, -24.9296875, -24.09375, -23.2578125, -22.421875, -21.5859375, -20.75, -19.9140625, -19.078125, -18.2421875, -17.40625, -16.5703125, -15.734375, -14.8984375, -14.0625, -13.2265625, -12.390625, -11.5546875, -10.71875, -9.8828125, -9.046875, -8.2109375, -7.375, -6.5390625, -5.703125, -4.8671875, -4.03125, -3.1953125, -2.359375, -1.5234375, -0.6875, 0.1484375, 0.984375, 1.8203125, 2.65625, 3.4921875, 4.328125, 5.1640625, 6.0, 6.8359375, 7.671875, 8.5078125, 9.34375, 10.1796875, 11.015625, 11.8515625, 12.6875, 13.5234375, 14.359375, 15.1953125, 16.03125, 16.8671875, 17.703125, 18.5390625, 19.375, 20.2109375, 21.046875, 21.8828125, 22.71875, 23.5546875, 24.390625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 44.0, 897.0, 76.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.91563415527344, -197.97793579101562, -191.04025268554688, -184.10255432128906, -177.1648712158203, -170.2271728515625, -163.28948974609375, -156.35179138183594, -149.41409301757812, -142.4763946533203, -135.53871154785156, -128.60101318359375, -121.663330078125, -114.72563171386719, -107.7879409790039, -100.85025024414062, -93.91256713867188, -86.9748764038086, -80.03718566894531, -73.0994873046875, -66.16180419921875, -59.2241096496582, -52.286415100097656, -45.348724365234375, -38.411033630371094, -31.473342895507812, -24.5356502532959, -17.597957611083984, -10.660266876220703, -3.722576141357422, 3.215118408203125, 10.152809143066406, 17.090484619140625, 24.028175354003906, 30.96586799621582, 37.903560638427734, 44.841251373291016, 51.7789421081543, 58.716636657714844, 65.65432739257812, 72.5920181274414, 79.52970886230469, 86.46739959716797, 93.40509033203125, 100.34278869628906, 107.28047180175781, 114.21817016601562, 121.1558609008789, 128.0935516357422, 135.03125, 141.96893310546875, 148.90663146972656, 155.8443145751953, 162.78201293945312, 169.71969604492188, 176.6573944091797, 183.5950927734375, 190.5327911376953, 197.47047424316406, 204.40817260742188, 211.34585571289062, 218.28355407714844, 225.22125244140625, 232.158935546875, 239.09661865234375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 1.0, 4.0, 4.0, 10.0, 11.0, 12.0, 11.0, 17.0, 20.0, 24.0, 23.0, 28.0, 35.0, 26.0, 32.0, 37.0, 40.0, 42.0, 46.0, 45.0, 39.0, 51.0, 48.0, 51.0, 36.0, 34.0, 25.0, 32.0, 24.0, 21.0, 21.0, 30.0, 22.0, 21.0, 15.0, 8.0, 13.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-33.521141052246094, -32.4847297668457, -31.448320388793945, -30.411911010742188, -29.375499725341797, -28.33909034729004, -27.30268096923828, -26.26626968383789, -25.229860305786133, -24.193450927734375, -23.157039642333984, -22.120630264282227, -21.08422088623047, -20.047809600830078, -19.01140022277832, -17.974990844726562, -16.938579559326172, -15.902169227600098, -14.865758895874023, -13.829349517822266, -12.792939186096191, -11.756528854370117, -10.72011947631836, -9.683709144592285, -8.647298812866211, -7.610888481140137, -6.574478626251221, -5.538068771362305, -4.5016584396362305, -3.4652481079101562, -2.4288382530212402, -1.3924283981323242, -0.35601806640625, 0.6803920269012451, 1.7168021202087402, 2.7532122135162354, 3.7896223068237305, 4.826032638549805, 5.862442493438721, 6.898852348327637, 7.935262680053711, 8.971673011779785, 10.00808334350586, 11.044492721557617, 12.080903053283691, 13.117313385009766, 14.153722763061523, 15.190133094787598, 16.226543426513672, 17.26295280456543, 18.29936408996582, 19.335773468017578, 20.37218475341797, 21.408594131469727, 22.445003509521484, 23.481414794921875, 24.517824172973633, 25.55423355102539, 26.59064483642578, 27.62705421447754, 28.663463592529297, 29.699874877929688, 30.736284255981445, 31.772693634033203, 32.809104919433594]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 8.0, 10.0, 14.0, 14.0, 20.0, 20.0, 36.0, 30.0, 34.0, 29.0, 40.0, 52.0, 42.0, 48.0, 49.0, 52.0, 50.0, 44.0, 32.0, 42.0, 37.0, 40.0, 39.0, 25.0, 38.0, 15.0, 27.0, 19.0, 14.0, 16.0, 11.0, 11.0, 8.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.49493408203125, -5.3062744140625, -5.11761474609375, -4.928955078125, -4.74029541015625, -4.5516357421875, -4.36297607421875, -4.17431640625, -3.98565673828125, -3.7969970703125, -3.60833740234375, -3.419677734375, -3.23101806640625, -3.0423583984375, -2.85369873046875, -2.6650390625, -2.47637939453125, -2.2877197265625, -2.09906005859375, -1.910400390625, -1.72174072265625, -1.5330810546875, -1.34442138671875, -1.15576171875, -0.96710205078125, -0.7784423828125, -0.58978271484375, -0.401123046875, -0.21246337890625, -0.0238037109375, 0.16485595703125, 0.353515625, 0.54217529296875, 0.7308349609375, 0.91949462890625, 1.108154296875, 1.29681396484375, 1.4854736328125, 1.67413330078125, 1.86279296875, 2.05145263671875, 2.2401123046875, 2.42877197265625, 2.617431640625, 2.80609130859375, 2.9947509765625, 3.18341064453125, 3.3720703125, 3.56072998046875, 3.7493896484375, 3.93804931640625, 4.126708984375, 4.31536865234375, 4.5040283203125, 4.69268798828125, 4.88134765625, 5.07000732421875, 5.2586669921875, 5.44732666015625, 5.635986328125, 5.82464599609375, 6.0133056640625, 6.20196533203125, 6.390625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 6.0, 12.0, 7.0, 9.0, 15.0, 15.0, 21.0, 23.0, 29.0, 35.0, 33.0, 55.0, 67.0, 96.0, 122.0, 151.0, 214.0, 246.0, 351.0, 659.0, 22471.0, 4105454.0, 61639.0, 903.0, 384.0, 301.0, 196.0, 149.0, 148.0, 104.0, 61.0, 58.0, 48.0, 31.0, 35.0, 17.0, 15.0, 19.0, 15.0, 14.0, 6.0, 5.0, 10.0, 8.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-44.03125, -42.6796875, -41.328125, -39.9765625, -38.625, -37.2734375, -35.921875, -34.5703125, -33.21875, -31.8671875, -30.515625, -29.1640625, -27.8125, -26.4609375, -25.109375, -23.7578125, -22.40625, -21.0546875, -19.703125, -18.3515625, -17.0, -15.6484375, -14.296875, -12.9453125, -11.59375, -10.2421875, -8.890625, -7.5390625, -6.1875, -4.8359375, -3.484375, -2.1328125, -0.78125, 0.5703125, 1.921875, 3.2734375, 4.625, 5.9765625, 7.328125, 8.6796875, 10.03125, 11.3828125, 12.734375, 14.0859375, 15.4375, 16.7890625, 18.140625, 19.4921875, 20.84375, 22.1953125, 23.546875, 24.8984375, 26.25, 27.6015625, 28.953125, 30.3046875, 31.65625, 33.0078125, 34.359375, 35.7109375, 37.0625, 38.4140625, 39.765625, 41.1171875, 42.46875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 7.0, 4.0, 11.0, 18.0, 19.0, 27.0, 19.0, 33.0, 53.0, 61.0, 92.0, 111.0, 183.0, 307.0, 489.0, 613.0, 601.0, 462.0, 289.0, 214.0, 111.0, 92.0, 63.0, 51.0, 32.0, 16.0, 19.0, 15.0, 15.0, 15.0, 4.0, 4.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.4609375, -8.1790771484375, -7.897216796875, -7.6153564453125, -7.33349609375, -7.0516357421875, -6.769775390625, -6.4879150390625, -6.2060546875, -5.9241943359375, -5.642333984375, -5.3604736328125, -5.07861328125, -4.7967529296875, -4.514892578125, -4.2330322265625, -3.951171875, -3.6693115234375, -3.387451171875, -3.1055908203125, -2.82373046875, -2.5418701171875, -2.260009765625, -1.9781494140625, -1.6962890625, -1.4144287109375, -1.132568359375, -0.8507080078125, -0.56884765625, -0.2869873046875, -0.005126953125, 0.2767333984375, 0.55859375, 0.8404541015625, 1.122314453125, 1.4041748046875, 1.68603515625, 1.9678955078125, 2.249755859375, 2.5316162109375, 2.8134765625, 3.0953369140625, 3.377197265625, 3.6590576171875, 3.94091796875, 4.2227783203125, 4.504638671875, 4.7864990234375, 5.068359375, 5.3502197265625, 5.632080078125, 5.9139404296875, 6.19580078125, 6.4776611328125, 6.759521484375, 7.0413818359375, 7.3232421875, 7.6051025390625, 7.886962890625, 8.1688232421875, 8.45068359375, 8.7325439453125, 9.014404296875, 9.2962646484375, 9.578125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 11.0, 11.0, 25.0, 19.0, 28.0, 44.0, 58.0, 108.0, 251.0, 711.0, 6705.0, 1068312.0, 3104273.0, 12103.0, 936.0, 312.0, 126.0, 62.0, 47.0, 35.0, 24.0, 13.0, 21.0, 14.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.46875, -32.27685546875, -31.0849609375, -29.89306640625, -28.701171875, -27.50927734375, -26.3173828125, -25.12548828125, -23.93359375, -22.74169921875, -21.5498046875, -20.35791015625, -19.166015625, -17.97412109375, -16.7822265625, -15.59033203125, -14.3984375, -13.20654296875, -12.0146484375, -10.82275390625, -9.630859375, -8.43896484375, -7.2470703125, -6.05517578125, -4.86328125, -3.67138671875, -2.4794921875, -1.28759765625, -0.095703125, 1.09619140625, 2.2880859375, 3.47998046875, 4.671875, 5.86376953125, 7.0556640625, 8.24755859375, 9.439453125, 10.63134765625, 11.8232421875, 13.01513671875, 14.20703125, 15.39892578125, 16.5908203125, 17.78271484375, 18.974609375, 20.16650390625, 21.3583984375, 22.55029296875, 23.7421875, 24.93408203125, 26.1259765625, 27.31787109375, 28.509765625, 29.70166015625, 30.8935546875, 32.08544921875, 33.27734375, 34.46923828125, 35.6611328125, 36.85302734375, 38.044921875, 39.23681640625, 40.4287109375, 41.62060546875, 42.8125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 13.0, 22.0, 120.0, 216.0, 278.0, 207.0, 96.0, 42.0, 15.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.4635238647461, -78.320556640625, -76.17758178710938, -74.03461456298828, -71.89164733886719, -69.74867248535156, -67.60570526123047, -65.46273803710938, -63.319766998291016, -61.176795959472656, -59.03382873535156, -56.8908576965332, -54.747886657714844, -52.60491943359375, -50.46194839477539, -48.31897735595703, -46.17601013183594, -44.03303909301758, -41.890071868896484, -39.747100830078125, -37.60413360595703, -35.46116256713867, -33.31819152832031, -31.175222396850586, -29.03225326538086, -26.889284133911133, -24.746315002441406, -22.603343963623047, -20.46037483215332, -18.317405700683594, -16.174434661865234, -14.031465530395508, -11.888500213623047, -9.74553108215332, -7.602560997009277, -5.459591388702393, -3.316621780395508, -1.1736526489257812, 0.9693174362182617, 3.1122875213623047, 5.255256652832031, 7.398226261138916, 9.5411958694458, 11.684165954589844, 13.82713508605957, 15.970104217529297, 18.113075256347656, 20.256044387817383, 22.39901351928711, 24.541982650756836, 26.684951782226562, 28.827922821044922, 30.97089195251465, 33.113861083984375, 35.256832122802734, 37.399803161621094, 39.54277038574219, 41.68574142456055, 43.82870864868164, 45.9716796875, 48.114646911621094, 50.25761795043945, 52.40058898925781, 54.543556213378906, 56.686527252197266]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 3.0, 10.0, 10.0, 7.0, 10.0, 13.0, 11.0, 21.0, 14.0, 28.0, 22.0, 27.0, 26.0, 21.0, 35.0, 27.0, 28.0, 36.0, 39.0, 39.0, 33.0, 29.0, 49.0, 33.0, 33.0, 35.0, 36.0, 42.0, 29.0, 27.0, 25.0, 30.0, 20.0, 32.0, 23.0, 13.0, 11.0, 12.0, 12.0, 7.0, 11.0, 8.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-28.293987274169922, -27.503644943237305, -26.713300704956055, -25.922958374023438, -25.13261604309082, -24.34227180480957, -23.551929473876953, -22.761585235595703, -21.971242904663086, -21.18090057373047, -20.39055633544922, -19.6002140045166, -18.809871673583984, -18.019527435302734, -17.229185104370117, -16.4388427734375, -15.648499488830566, -14.858156204223633, -14.067813873291016, -13.277470588684082, -12.487127304077148, -11.696784973144531, -10.906441688537598, -10.116098403930664, -9.325756072998047, -8.535412788391113, -7.745069980621338, -6.9547271728515625, -6.164383888244629, -5.3740410804748535, -4.583698272705078, -3.7933549880981445, -3.003011703491211, -2.2126686573028564, -1.4223257303237915, -0.6319828033447266, 0.15836024284362793, 0.9487032890319824, 1.7390460968017578, 2.5293893814086914, 3.319732189178467, 4.110074996948242, 4.900418281555176, 5.690761089324951, 6.481103897094727, 7.27144718170166, 8.061790466308594, 8.852132797241211, 9.642476081848145, 10.432819366455078, 11.223161697387695, 12.013504981994629, 12.803848266601562, 13.59419059753418, 14.384533882141113, 15.174877166748047, 15.965219497680664, 16.75556182861328, 17.54590606689453, 18.33624839782715, 19.126590728759766, 19.916934967041016, 20.707277297973633, 21.49761962890625, 22.2879638671875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 6.0, 12.0, 8.0, 12.0, 16.0, 21.0, 21.0, 24.0, 25.0, 29.0, 26.0, 27.0, 42.0, 36.0, 39.0, 32.0, 31.0, 38.0, 37.0, 43.0, 40.0, 34.0, 33.0, 29.0, 32.0, 33.0, 31.0, 22.0, 28.0, 27.0, 25.0, 13.0, 17.0, 16.0, 8.0, 11.0, 11.0, 12.0, 8.0, 2.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.8125, -4.66558837890625, -4.5186767578125, -4.37176513671875, -4.224853515625, -4.07794189453125, -3.9310302734375, -3.78411865234375, -3.63720703125, -3.49029541015625, -3.3433837890625, -3.19647216796875, -3.049560546875, -2.90264892578125, -2.7557373046875, -2.60882568359375, -2.4619140625, -2.31500244140625, -2.1680908203125, -2.02117919921875, -1.874267578125, -1.72735595703125, -1.5804443359375, -1.43353271484375, -1.28662109375, -1.13970947265625, -0.9927978515625, -0.84588623046875, -0.698974609375, -0.55206298828125, -0.4051513671875, -0.25823974609375, -0.111328125, 0.03558349609375, 0.1824951171875, 0.32940673828125, 0.476318359375, 0.62322998046875, 0.7701416015625, 0.91705322265625, 1.06396484375, 1.21087646484375, 1.3577880859375, 1.50469970703125, 1.651611328125, 1.79852294921875, 1.9454345703125, 2.09234619140625, 2.2392578125, 2.38616943359375, 2.5330810546875, 2.67999267578125, 2.826904296875, 2.97381591796875, 3.1207275390625, 3.26763916015625, 3.41455078125, 3.56146240234375, 3.7083740234375, 3.85528564453125, 4.002197265625, 4.14910888671875, 4.2960205078125, 4.44293212890625, 4.58984375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 16.0, 16.0, 30.0, 37.0, 54.0, 85.0, 120.0, 202.0, 306.0, 417.0, 746.0, 1058.0, 1677.0, 2677.0, 4441.0, 7027.0, 11598.0, 18864.0, 30980.0, 51803.0, 87186.0, 145139.0, 207290.0, 183758.0, 117105.0, 69732.0, 41598.0, 25020.0, 15047.0, 9143.0, 5766.0, 3441.0, 2221.0, 1343.0, 895.0, 572.0, 376.0, 270.0, 163.0, 109.0, 65.0, 46.0, 36.0, 28.0, 12.0, 11.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5, -0.48262786865234375, -0.4652557373046875, -0.44788360595703125, -0.430511474609375, -0.41313934326171875, -0.3957672119140625, -0.37839508056640625, -0.36102294921875, -0.34365081787109375, -0.3262786865234375, -0.30890655517578125, -0.291534423828125, -0.27416229248046875, -0.2567901611328125, -0.23941802978515625, -0.2220458984375, -0.20467376708984375, -0.1873016357421875, -0.16992950439453125, -0.152557373046875, -0.13518524169921875, -0.1178131103515625, -0.10044097900390625, -0.08306884765625, -0.06569671630859375, -0.0483245849609375, -0.03095245361328125, -0.013580322265625, 0.00379180908203125, 0.0211639404296875, 0.03853607177734375, 0.055908203125, 0.07328033447265625, 0.0906524658203125, 0.10802459716796875, 0.125396728515625, 0.14276885986328125, 0.1601409912109375, 0.17751312255859375, 0.19488525390625, 0.21225738525390625, 0.2296295166015625, 0.24700164794921875, 0.264373779296875, 0.28174591064453125, 0.2991180419921875, 0.31649017333984375, 0.3338623046875, 0.35123443603515625, 0.3686065673828125, 0.38597869873046875, 0.403350830078125, 0.42072296142578125, 0.4380950927734375, 0.45546722412109375, 0.47283935546875, 0.49021148681640625, 0.5075836181640625, 0.5249557495117188, 0.542327880859375, 0.5597000122070312, 0.5770721435546875, 0.5944442749023438, 0.61181640625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 10.0, 10.0, 10.0, 14.0, 11.0, 15.0, 27.0, 22.0, 36.0, 25.0, 29.0, 38.0, 36.0, 31.0, 48.0, 30.0, 38.0, 38.0, 1074.0, 45.0, 63.0, 33.0, 36.0, 38.0, 45.0, 29.0, 18.0, 21.0, 20.0, 19.0, 24.0, 17.0, 14.0, 12.0, 13.0, 5.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.703125, -3.59765625, -3.4921875, -3.38671875, -3.28125, -3.17578125, -3.0703125, -2.96484375, -2.859375, -2.75390625, -2.6484375, -2.54296875, -2.4375, -2.33203125, -2.2265625, -2.12109375, -2.015625, -1.91015625, -1.8046875, -1.69921875, -1.59375, -1.48828125, -1.3828125, -1.27734375, -1.171875, -1.06640625, -0.9609375, -0.85546875, -0.75, -0.64453125, -0.5390625, -0.43359375, -0.328125, -0.22265625, -0.1171875, -0.01171875, 0.09375, 0.19921875, 0.3046875, 0.41015625, 0.515625, 0.62109375, 0.7265625, 0.83203125, 0.9375, 1.04296875, 1.1484375, 1.25390625, 1.359375, 1.46484375, 1.5703125, 1.67578125, 1.78125, 1.88671875, 1.9921875, 2.09765625, 2.203125, 2.30859375, 2.4140625, 2.51953125, 2.625, 2.73046875, 2.8359375, 2.94140625, 3.046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 11.0, 9.0, 18.0, 18.0, 28.0, 51.0, 77.0, 105.0, 147.0, 183.0, 282.0, 424.0, 617.0, 938.0, 1406.0, 2074.0, 3115.0, 4703.0, 7198.0, 10773.0, 16309.0, 24464.0, 36473.0, 54621.0, 80096.0, 114811.0, 235153.0, 1113356.0, 122663.0, 87252.0, 59554.0, 39981.0, 26921.0, 17926.0, 11813.0, 7924.0, 5216.0, 3413.0, 2253.0, 1575.0, 1053.0, 681.0, 473.0, 313.0, 231.0, 145.0, 94.0, 62.0, 35.0, 36.0, 18.0, 13.0, 8.0, 8.0, 6.0, 8.0, 3.0, 1.0], "bins": [-0.32763671875, -0.31774139404296875, -0.3078460693359375, -0.29795074462890625, -0.288055419921875, -0.27816009521484375, -0.2682647705078125, -0.25836944580078125, -0.24847412109375, -0.23857879638671875, -0.2286834716796875, -0.21878814697265625, -0.208892822265625, -0.19899749755859375, -0.1891021728515625, -0.17920684814453125, -0.1693115234375, -0.15941619873046875, -0.1495208740234375, -0.13962554931640625, -0.129730224609375, -0.11983489990234375, -0.1099395751953125, -0.10004425048828125, -0.09014892578125, -0.08025360107421875, -0.0703582763671875, -0.06046295166015625, -0.050567626953125, -0.04067230224609375, -0.0307769775390625, -0.02088165283203125, -0.010986328125, -0.00109100341796875, 0.0088043212890625, 0.01869964599609375, 0.028594970703125, 0.03849029541015625, 0.0483856201171875, 0.05828094482421875, 0.06817626953125, 0.07807159423828125, 0.0879669189453125, 0.09786224365234375, 0.107757568359375, 0.11765289306640625, 0.1275482177734375, 0.13744354248046875, 0.1473388671875, 0.15723419189453125, 0.1671295166015625, 0.17702484130859375, 0.186920166015625, 0.19681549072265625, 0.2067108154296875, 0.21660614013671875, 0.22650146484375, 0.23639678955078125, 0.2462921142578125, 0.25618743896484375, 0.266082763671875, 0.27597808837890625, 0.2858734130859375, 0.29576873779296875, 0.3056640625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 5.0, 12.0, 9.0, 12.0, 15.0, 24.0, 25.0, 33.0, 34.0, 45.0, 80.0, 74.0, 100.0, 105.0, 99.0, 61.0, 40.0, 37.0, 44.0, 21.0, 19.0, 13.0, 9.0, 10.0, 9.0, 9.0, 10.0, 3.0, 5.0, 5.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0106201171875, -0.01029050350189209, -0.00996088981628418, -0.00963127613067627, -0.00930166244506836, -0.00897204875946045, -0.008642435073852539, -0.008312821388244629, -0.007983207702636719, -0.007653594017028809, -0.0073239803314208984, -0.006994366645812988, -0.006664752960205078, -0.006335139274597168, -0.006005525588989258, -0.005675911903381348, -0.0053462982177734375, -0.005016684532165527, -0.004687070846557617, -0.004357457160949707, -0.004027843475341797, -0.0036982297897338867, -0.0033686161041259766, -0.0030390024185180664, -0.0027093887329101562, -0.002379775047302246, -0.002050161361694336, -0.0017205476760864258, -0.0013909339904785156, -0.0010613203048706055, -0.0007317066192626953, -0.00040209293365478516, -7.2479248046875e-05, 0.00025713443756103516, 0.0005867481231689453, 0.0009163618087768555, 0.0012459754943847656, 0.0015755891799926758, 0.001905202865600586, 0.002234816551208496, 0.0025644302368164062, 0.0028940439224243164, 0.0032236576080322266, 0.0035532712936401367, 0.003882884979248047, 0.004212498664855957, 0.004542112350463867, 0.004871726036071777, 0.0052013397216796875, 0.005530953407287598, 0.005860567092895508, 0.006190180778503418, 0.006519794464111328, 0.006849408149719238, 0.0071790218353271484, 0.007508635520935059, 0.007838249206542969, 0.008167862892150879, 0.008497476577758789, 0.0088270902633667, 0.00915670394897461, 0.00948631763458252, 0.00981593132019043, 0.01014554500579834, 0.01047515869140625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 7.0, 6.0, 7.0, 10.0, 13.0, 16.0, 23.0, 29.0, 23.0, 30.0, 34.0, 67.0, 88.0, 143.0, 176.0, 283.0, 543.0, 2707.0, 983789.0, 58184.0, 1042.0, 462.0, 240.0, 133.0, 123.0, 78.0, 67.0, 43.0, 44.0, 27.0, 19.0, 14.0, 7.0, 10.0, 3.0, 7.0, 12.0, 5.0, 3.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1812744140625, -0.17557334899902344, -0.16987228393554688, -0.1641712188720703, -0.15847015380859375, -0.1527690887451172, -0.14706802368164062, -0.14136695861816406, -0.1356658935546875, -0.12996482849121094, -0.12426376342773438, -0.11856269836425781, -0.11286163330078125, -0.10716056823730469, -0.10145950317382812, -0.09575843811035156, -0.090057373046875, -0.08435630798339844, -0.07865524291992188, -0.07295417785644531, -0.06725311279296875, -0.06155204772949219, -0.055850982666015625, -0.05014991760253906, -0.0444488525390625, -0.03874778747558594, -0.033046722412109375, -0.027345657348632812, -0.02164459228515625, -0.015943527221679688, -0.010242462158203125, -0.0045413970947265625, 0.00115966796875, 0.0068607330322265625, 0.012561798095703125, 0.018262863159179688, 0.02396392822265625, 0.029664993286132812, 0.035366058349609375, 0.04106712341308594, 0.0467681884765625, 0.05246925354003906, 0.058170318603515625, 0.06387138366699219, 0.06957244873046875, 0.07527351379394531, 0.08097457885742188, 0.08667564392089844, 0.092376708984375, 0.09807777404785156, 0.10377883911132812, 0.10947990417480469, 0.11518096923828125, 0.12088203430175781, 0.12658309936523438, 0.13228416442871094, 0.1379852294921875, 0.14368629455566406, 0.14938735961914062, 0.1550884246826172, 0.16078948974609375, 0.1664905548095703, 0.17219161987304688, 0.17789268493652344, 0.18359375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 149.0, 851.0, 17.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022697191685438156, -0.0202452652156353, -0.017793338745832443, -0.015341412276029587, -0.01288948580622673, -0.010437559336423874, -0.007985632866621017, -0.005533706396818161, -0.0030817799270153046, -0.0006298534572124481, 0.0018220730125904083, 0.004273999482393265, 0.006725925952196121, 0.009177852421998978, 0.011629778891801834, 0.01408170536160469, 0.016533631831407547, 0.018985558301210403, 0.02143748477101326, 0.023889411240816116, 0.026341337710618973, 0.02879326418042183, 0.031245190650224686, 0.03369711712002754, 0.0361490435898304, 0.038600970059633255, 0.04105289652943611, 0.04350482299923897, 0.045956749469041824, 0.04840867593884468, 0.05086060240864754, 0.053312528878450394, 0.05576445162296295, 0.05821637809276581, 0.060668304562568665, 0.06312023103237152, 0.06557215750217438, 0.06802408397197723, 0.07047601044178009, 0.07292793691158295, 0.0753798633813858, 0.07783178985118866, 0.08028371632099152, 0.08273564279079437, 0.08518756926059723, 0.08763949573040009, 0.09009142220020294, 0.0925433486700058, 0.09499527513980865, 0.09744720160961151, 0.09989912807941437, 0.10235105454921722, 0.10480298101902008, 0.10725490748882294, 0.1097068339586258, 0.11215876042842865, 0.1146106868982315, 0.11706261336803436, 0.11951453983783722, 0.12196646630764008, 0.12441839277744293, 0.1268703192472458, 0.12932224571704865, 0.1317741721868515, 0.13422609865665436]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 6.0, 2.0, 7.0, 13.0, 9.0, 16.0, 21.0, 25.0, 27.0, 31.0, 36.0, 25.0, 42.0, 55.0, 45.0, 48.0, 53.0, 59.0, 42.0, 49.0, 44.0, 46.0, 39.0, 39.0, 28.0, 30.0, 32.0, 26.0, 27.0, 20.0, 15.0, 10.0, 5.0, 10.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.008723914623260498, -0.008495654910802841, -0.008267395198345184, -0.008039135485887527, -0.007810875773429871, -0.007582616060972214, -0.007354356348514557, -0.0071260966360569, -0.006897836923599243, -0.006669577211141586, -0.0064413174986839294, -0.006213057786226273, -0.005984798073768616, -0.005756538361310959, -0.005528278648853302, -0.005300018936395645, -0.005071759223937988, -0.004843499511480331, -0.0046152397990226746, -0.004386980086565018, -0.004158720374107361, -0.003930460661649704, -0.003702200949192047, -0.0034739412367343903, -0.0032456815242767334, -0.0030174218118190765, -0.0027891620993614197, -0.002560902386903763, -0.002332642674446106, -0.002104382961988449, -0.0018761232495307922, -0.0016478635370731354, -0.0014196038246154785, -0.0011913441121578217, -0.0009630843997001648, -0.0007348246872425079, -0.0005065649747848511, -0.0002783052623271942, -5.0045549869537354e-05, 0.0001782141625881195, 0.00040647387504577637, 0.0006347335875034332, 0.0008629932999610901, 0.001091253012418747, 0.0013195127248764038, 0.0015477724373340607, 0.0017760321497917175, 0.0020042918622493744, 0.0022325515747070312, 0.002460811287164688, 0.002689070999622345, 0.002917330712080002, 0.0031455904245376587, 0.0033738501369953156, 0.0036021098494529724, 0.0038303695619106293, 0.004058629274368286, 0.004286888986825943, 0.0045151486992836, 0.004743408411741257, 0.004971668124198914, 0.0051999278366565704, 0.005428187549114227, 0.005656447261571884, 0.005884706974029541]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 6.0, 13.0, 7.0, 12.0, 16.0, 21.0, 21.0, 25.0, 24.0, 29.0, 27.0, 26.0, 43.0, 35.0, 40.0, 32.0, 30.0, 38.0, 37.0, 44.0, 40.0, 33.0, 33.0, 29.0, 32.0, 33.0, 33.0, 20.0, 29.0, 27.0, 24.0, 14.0, 17.0, 15.0, 8.0, 11.0, 12.0, 11.0, 8.0, 2.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.80859375, -4.66168212890625, -4.5147705078125, -4.36785888671875, -4.220947265625, -4.07403564453125, -3.9271240234375, -3.78021240234375, -3.63330078125, -3.48638916015625, -3.3394775390625, -3.19256591796875, -3.045654296875, -2.89874267578125, -2.7518310546875, -2.60491943359375, -2.4580078125, -2.31109619140625, -2.1641845703125, -2.01727294921875, -1.870361328125, -1.72344970703125, -1.5765380859375, -1.42962646484375, -1.28271484375, -1.13580322265625, -0.9888916015625, -0.84197998046875, -0.695068359375, -0.54815673828125, -0.4012451171875, -0.25433349609375, -0.107421875, 0.03948974609375, 0.1864013671875, 0.33331298828125, 0.480224609375, 0.62713623046875, 0.7740478515625, 0.92095947265625, 1.06787109375, 1.21478271484375, 1.3616943359375, 1.50860595703125, 1.655517578125, 1.80242919921875, 1.9493408203125, 2.09625244140625, 2.2431640625, 2.39007568359375, 2.5369873046875, 2.68389892578125, 2.830810546875, 2.97772216796875, 3.1246337890625, 3.27154541015625, 3.41845703125, 3.56536865234375, 3.7122802734375, 3.85919189453125, 4.006103515625, 4.15301513671875, 4.2999267578125, 4.44683837890625, 4.59375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 4.0, 6.0, 6.0, 5.0, 10.0, 17.0, 12.0, 20.0, 23.0, 30.0, 44.0, 71.0, 92.0, 104.0, 127.0, 163.0, 218.0, 278.0, 383.0, 486.0, 621.0, 825.0, 1197.0, 1887.0, 4153.0, 14596.0, 63164.0, 250795.0, 471102.0, 176484.0, 42376.0, 10042.0, 3233.0, 1629.0, 1083.0, 756.0, 605.0, 424.0, 343.0, 265.0, 197.0, 180.0, 109.0, 96.0, 70.0, 57.0, 48.0, 27.0, 24.0, 20.0, 16.0, 17.0, 10.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8671875, -8.58447265625, -8.3017578125, -8.01904296875, -7.736328125, -7.45361328125, -7.1708984375, -6.88818359375, -6.60546875, -6.32275390625, -6.0400390625, -5.75732421875, -5.474609375, -5.19189453125, -4.9091796875, -4.62646484375, -4.34375, -4.06103515625, -3.7783203125, -3.49560546875, -3.212890625, -2.93017578125, -2.6474609375, -2.36474609375, -2.08203125, -1.79931640625, -1.5166015625, -1.23388671875, -0.951171875, -0.66845703125, -0.3857421875, -0.10302734375, 0.1796875, 0.46240234375, 0.7451171875, 1.02783203125, 1.310546875, 1.59326171875, 1.8759765625, 2.15869140625, 2.44140625, 2.72412109375, 3.0068359375, 3.28955078125, 3.572265625, 3.85498046875, 4.1376953125, 4.42041015625, 4.703125, 4.98583984375, 5.2685546875, 5.55126953125, 5.833984375, 6.11669921875, 6.3994140625, 6.68212890625, 6.96484375, 7.24755859375, 7.5302734375, 7.81298828125, 8.095703125, 8.37841796875, 8.6611328125, 8.94384765625, 9.2265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 10.0, 10.0, 17.0, 20.0, 19.0, 17.0, 22.0, 28.0, 39.0, 48.0, 46.0, 82.0, 107.0, 161.0, 327.0, 1368.0, 179.0, 116.0, 71.0, 60.0, 45.0, 41.0, 28.0, 33.0, 30.0, 22.0, 23.0, 8.0, 9.0, 6.0, 5.0, 8.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.1015625, -13.67529296875, -13.2490234375, -12.82275390625, -12.396484375, -11.97021484375, -11.5439453125, -11.11767578125, -10.69140625, -10.26513671875, -9.8388671875, -9.41259765625, -8.986328125, -8.56005859375, -8.1337890625, -7.70751953125, -7.28125, -6.85498046875, -6.4287109375, -6.00244140625, -5.576171875, -5.14990234375, -4.7236328125, -4.29736328125, -3.87109375, -3.44482421875, -3.0185546875, -2.59228515625, -2.166015625, -1.73974609375, -1.3134765625, -0.88720703125, -0.4609375, -0.03466796875, 0.3916015625, 0.81787109375, 1.244140625, 1.67041015625, 2.0966796875, 2.52294921875, 2.94921875, 3.37548828125, 3.8017578125, 4.22802734375, 4.654296875, 5.08056640625, 5.5068359375, 5.93310546875, 6.359375, 6.78564453125, 7.2119140625, 7.63818359375, 8.064453125, 8.49072265625, 8.9169921875, 9.34326171875, 9.76953125, 10.19580078125, 10.6220703125, 11.04833984375, 11.474609375, 11.90087890625, 12.3271484375, 12.75341796875, 13.1796875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 9.0, 10.0, 19.0, 22.0, 14.0, 40.0, 38.0, 41.0, 78.0, 109.0, 153.0, 260.0, 370.0, 636.0, 1355.0, 6242.0, 3124873.0, 8155.0, 1397.0, 682.0, 359.0, 244.0, 168.0, 103.0, 77.0, 61.0, 41.0, 29.0, 18.0, 17.0, 15.0, 10.0, 8.0, 7.0, 7.0, 5.0, 2.0, 6.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.28125, -46.64599609375, -45.0107421875, -43.37548828125, -41.740234375, -40.10498046875, -38.4697265625, -36.83447265625, -35.19921875, -33.56396484375, -31.9287109375, -30.29345703125, -28.658203125, -27.02294921875, -25.3876953125, -23.75244140625, -22.1171875, -20.48193359375, -18.8466796875, -17.21142578125, -15.576171875, -13.94091796875, -12.3056640625, -10.67041015625, -9.03515625, -7.39990234375, -5.7646484375, -4.12939453125, -2.494140625, -0.85888671875, 0.7763671875, 2.41162109375, 4.046875, 5.68212890625, 7.3173828125, 8.95263671875, 10.587890625, 12.22314453125, 13.8583984375, 15.49365234375, 17.12890625, 18.76416015625, 20.3994140625, 22.03466796875, 23.669921875, 25.30517578125, 26.9404296875, 28.57568359375, 30.2109375, 31.84619140625, 33.4814453125, 35.11669921875, 36.751953125, 38.38720703125, 40.0224609375, 41.65771484375, 43.29296875, 44.92822265625, 46.5634765625, 48.19873046875, 49.833984375, 51.46923828125, 53.1044921875, 54.73974609375, 56.375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 42.0, 146.0, 272.0, 298.0, 165.0, 50.0, 23.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.94337463378906, -49.07318115234375, -47.2029914855957, -45.33279800415039, -43.462608337402344, -41.59241485595703, -39.722225189208984, -37.85203170776367, -35.981842041015625, -34.11164855957031, -32.241458892822266, -30.371267318725586, -28.501075744628906, -26.630882263183594, -24.760692596435547, -22.890499114990234, -21.020307540893555, -19.150115966796875, -17.279924392700195, -15.409732818603516, -13.539541244506836, -11.66934871673584, -9.79915714263916, -7.9289655685424805, -6.058773994445801, -4.188582420349121, -2.3183906078338623, -0.4481987953186035, 1.4219927787780762, 3.292184829711914, 5.162376403808594, 7.032567977905273, 8.902759552001953, 10.772951126098633, 12.643142700195312, 14.513334274291992, 16.383525848388672, 18.253719329833984, 20.12390899658203, 21.994102478027344, 23.86429214477539, 25.73448371887207, 27.60467529296875, 29.47486686706543, 31.34505844116211, 33.21525192260742, 35.08544158935547, 36.95563507080078, 38.825828552246094, 40.696022033691406, 42.56621170043945, 44.436405181884766, 46.30659484863281, 48.176788330078125, 50.04697799682617, 51.917171478271484, 53.78736114501953, 55.657554626464844, 57.52774429321289, 59.3979377746582, 61.26812744140625, 63.13832092285156, 65.00851440429688, 66.87870025634766, 68.74889373779297]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 7.0, 12.0, 14.0, 7.0, 12.0, 12.0, 20.0, 26.0, 22.0, 22.0, 39.0, 35.0, 38.0, 44.0, 38.0, 43.0, 53.0, 45.0, 44.0, 34.0, 37.0, 41.0, 30.0, 33.0, 40.0, 39.0, 43.0, 31.0, 24.0, 19.0, 24.0, 15.0, 16.0, 9.0, 6.0, 10.0, 5.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-41.3906364440918, -40.25326919555664, -39.115901947021484, -37.97853469848633, -36.84116744995117, -35.703800201416016, -34.56643295288086, -33.42906188964844, -32.29169464111328, -31.154327392578125, -30.01696014404297, -28.879592895507812, -27.742225646972656, -26.6048583984375, -25.46748924255371, -24.330121994018555, -23.19275665283203, -22.055389404296875, -20.91802215576172, -19.780654907226562, -18.643287658691406, -17.50592041015625, -16.36855125427246, -15.231184005737305, -14.093816757202148, -12.956449508666992, -11.819082260131836, -10.681714057922363, -9.544346809387207, -8.40697956085205, -7.269611835479736, -6.132244110107422, -4.994876861572266, -3.8575093746185303, -2.720141887664795, -1.5827744007110596, -0.4454069137573242, 0.691960334777832, 1.8293280601501465, 2.966695785522461, 4.104063034057617, 5.241430282592773, 6.378798007965088, 7.516165733337402, 8.653532981872559, 9.790900230407715, 10.928268432617188, 12.065635681152344, 13.2030029296875, 14.340370178222656, 15.477737426757812, 16.61510467529297, 17.752471923828125, 18.88983917236328, 20.02720832824707, 21.164575576782227, 22.301942825317383, 23.43931007385254, 24.576677322387695, 25.71404457092285, 26.85141372680664, 27.988780975341797, 29.126148223876953, 30.26351547241211, 31.400882720947266]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 7.0, 11.0, 7.0, 15.0, 8.0, 11.0, 15.0, 17.0, 22.0, 26.0, 30.0, 31.0, 32.0, 39.0, 40.0, 36.0, 32.0, 43.0, 35.0, 38.0, 38.0, 40.0, 39.0, 30.0, 39.0, 36.0, 24.0, 35.0, 31.0, 24.0, 22.0, 21.0, 22.0, 18.0, 11.0, 21.0, 11.0, 6.0, 5.0, 5.0, 6.0, 5.0, 9.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.15234375, -4.9964599609375, -4.840576171875, -4.6846923828125, -4.52880859375, -4.3729248046875, -4.217041015625, -4.0611572265625, -3.9052734375, -3.7493896484375, -3.593505859375, -3.4376220703125, -3.28173828125, -3.1258544921875, -2.969970703125, -2.8140869140625, -2.658203125, -2.5023193359375, -2.346435546875, -2.1905517578125, -2.03466796875, -1.8787841796875, -1.722900390625, -1.5670166015625, -1.4111328125, -1.2552490234375, -1.099365234375, -0.9434814453125, -0.78759765625, -0.6317138671875, -0.475830078125, -0.3199462890625, -0.1640625, -0.0081787109375, 0.147705078125, 0.3035888671875, 0.45947265625, 0.6153564453125, 0.771240234375, 0.9271240234375, 1.0830078125, 1.2388916015625, 1.394775390625, 1.5506591796875, 1.70654296875, 1.8624267578125, 2.018310546875, 2.1741943359375, 2.330078125, 2.4859619140625, 2.641845703125, 2.7977294921875, 2.95361328125, 3.1094970703125, 3.265380859375, 3.4212646484375, 3.5771484375, 3.7330322265625, 3.888916015625, 4.0447998046875, 4.20068359375, 4.3565673828125, 4.512451171875, 4.6683349609375, 4.82421875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 15.0, 11.0, 28.0, 37.0, 43.0, 64.0, 112.0, 199.0, 302.0, 594.0, 1087.0, 2038.0, 4186.0, 10357.0, 30976.0, 152383.0, 839023.0, 2063722.0, 879344.0, 157613.0, 32730.0, 10672.0, 4291.0, 1926.0, 1076.0, 580.0, 328.0, 205.0, 123.0, 71.0, 44.0, 30.0, 18.0, 19.0, 9.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.515625, -8.26153564453125, -8.0074462890625, -7.75335693359375, -7.499267578125, -7.24517822265625, -6.9910888671875, -6.73699951171875, -6.48291015625, -6.22882080078125, -5.9747314453125, -5.72064208984375, -5.466552734375, -5.21246337890625, -4.9583740234375, -4.70428466796875, -4.4501953125, -4.19610595703125, -3.9420166015625, -3.68792724609375, -3.433837890625, -3.17974853515625, -2.9256591796875, -2.67156982421875, -2.41748046875, -2.16339111328125, -1.9093017578125, -1.65521240234375, -1.401123046875, -1.14703369140625, -0.8929443359375, -0.63885498046875, -0.384765625, -0.13067626953125, 0.1234130859375, 0.37750244140625, 0.631591796875, 0.88568115234375, 1.1397705078125, 1.39385986328125, 1.64794921875, 1.90203857421875, 2.1561279296875, 2.41021728515625, 2.664306640625, 2.91839599609375, 3.1724853515625, 3.42657470703125, 3.6806640625, 3.93475341796875, 4.1888427734375, 4.44293212890625, 4.697021484375, 4.95111083984375, 5.2052001953125, 5.45928955078125, 5.71337890625, 5.96746826171875, 6.2215576171875, 6.47564697265625, 6.729736328125, 6.98382568359375, 7.2379150390625, 7.49200439453125, 7.74609375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 5.0, 9.0, 16.0, 24.0, 26.0, 39.0, 46.0, 55.0, 80.0, 103.0, 129.0, 191.0, 240.0, 297.0, 448.0, 519.0, 459.0, 336.0, 254.0, 159.0, 158.0, 116.0, 85.0, 65.0, 50.0, 39.0, 31.0, 28.0, 16.0, 10.0, 14.0, 7.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.421875, -7.142822265625, -6.86376953125, -6.584716796875, -6.3056640625, -6.026611328125, -5.74755859375, -5.468505859375, -5.189453125, -4.910400390625, -4.63134765625, -4.352294921875, -4.0732421875, -3.794189453125, -3.51513671875, -3.236083984375, -2.95703125, -2.677978515625, -2.39892578125, -2.119873046875, -1.8408203125, -1.561767578125, -1.28271484375, -1.003662109375, -0.724609375, -0.445556640625, -0.16650390625, 0.112548828125, 0.3916015625, 0.670654296875, 0.94970703125, 1.228759765625, 1.5078125, 1.786865234375, 2.06591796875, 2.344970703125, 2.6240234375, 2.903076171875, 3.18212890625, 3.461181640625, 3.740234375, 4.019287109375, 4.29833984375, 4.577392578125, 4.8564453125, 5.135498046875, 5.41455078125, 5.693603515625, 5.97265625, 6.251708984375, 6.53076171875, 6.809814453125, 7.0888671875, 7.367919921875, 7.64697265625, 7.926025390625, 8.205078125, 8.484130859375, 8.76318359375, 9.042236328125, 9.3212890625, 9.600341796875, 9.87939453125, 10.158447265625, 10.4375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 3.0, 3.0, 12.0, 6.0, 19.0, 21.0, 41.0, 56.0, 60.0, 112.0, 178.0, 281.0, 486.0, 805.0, 1669.0, 4903.0, 35532.0, 613371.0, 3251050.0, 261274.0, 18031.0, 3319.0, 1325.0, 645.0, 365.0, 230.0, 156.0, 113.0, 81.0, 55.0, 28.0, 15.0, 11.0, 10.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140625, -16.6417236328125, -16.142822265625, -15.6439208984375, -15.14501953125, -14.6461181640625, -14.147216796875, -13.6483154296875, -13.1494140625, -12.6505126953125, -12.151611328125, -11.6527099609375, -11.15380859375, -10.6549072265625, -10.156005859375, -9.6571044921875, -9.158203125, -8.6593017578125, -8.160400390625, -7.6614990234375, -7.16259765625, -6.6636962890625, -6.164794921875, -5.6658935546875, -5.1669921875, -4.6680908203125, -4.169189453125, -3.6702880859375, -3.17138671875, -2.6724853515625, -2.173583984375, -1.6746826171875, -1.17578125, -0.6768798828125, -0.177978515625, 0.3209228515625, 0.81982421875, 1.3187255859375, 1.817626953125, 2.3165283203125, 2.8154296875, 3.3143310546875, 3.813232421875, 4.3121337890625, 4.81103515625, 5.3099365234375, 5.808837890625, 6.3077392578125, 6.806640625, 7.3055419921875, 7.804443359375, 8.3033447265625, 8.80224609375, 9.3011474609375, 9.800048828125, 10.2989501953125, 10.7978515625, 11.2967529296875, 11.795654296875, 12.2945556640625, 12.79345703125, 13.2923583984375, 13.791259765625, 14.2901611328125, 14.7890625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 213.0, 772.0, 27.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-502.45086669921875, -492.8404541015625, -483.23004150390625, -473.6195983886719, -464.0091857910156, -454.3987731933594, -444.7883605957031, -435.17791748046875, -425.5675048828125, -415.95709228515625, -406.3466796875, -396.7362365722656, -387.1258239746094, -377.5154113769531, -367.9049987792969, -358.2945556640625, -348.68414306640625, -339.07373046875, -329.46331787109375, -319.8528747558594, -310.2424621582031, -300.6320495605469, -291.0216369628906, -281.41119384765625, -271.8008117675781, -262.1903991699219, -252.57997131347656, -242.9695587158203, -233.359130859375, -223.74871826171875, -214.1383056640625, -204.5278778076172, -194.91744995117188, -185.30703735351562, -175.6966094970703, -166.08619689941406, -156.47576904296875, -146.8653564453125, -137.25494384765625, -127.64451599121094, -118.03410339355469, -108.4236831665039, -98.81326293945312, -89.20285034179688, -79.59242248535156, -69.98200988769531, -60.37158966064453, -50.76116943359375, -41.15074920654297, -31.540328979492188, -21.92991065979004, -12.31949234008789, -2.7090721130371094, 6.901348114013672, 16.511764526367188, 26.12218475341797, 35.73260498046875, 45.34302520751953, 54.95344543457031, 64.56385803222656, 74.17428588867188, 83.78469848632812, 93.3951187133789, 103.00553894042969, 112.61595916748047]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 11.0, 4.0, 2.0, 18.0, 12.0, 18.0, 21.0, 19.0, 22.0, 16.0, 28.0, 27.0, 32.0, 32.0, 37.0, 38.0, 45.0, 42.0, 32.0, 42.0, 44.0, 26.0, 25.0, 33.0, 24.0, 42.0, 27.0, 32.0, 40.0, 24.0, 22.0, 22.0, 27.0, 20.0, 15.0, 15.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-30.332887649536133, -29.39901351928711, -28.465139389038086, -27.531265258789062, -26.59739112854004, -25.663516998291016, -24.729644775390625, -23.79576873779297, -22.861896514892578, -21.928022384643555, -20.99414825439453, -20.060274124145508, -19.126399993896484, -18.19252586364746, -17.258651733398438, -16.324779510498047, -15.39090347290039, -14.457029342651367, -13.523155212402344, -12.58928108215332, -11.655406951904297, -10.721532821655273, -9.787659645080566, -8.853785514831543, -7.9199113845825195, -6.986037254333496, -6.052163124084473, -5.118289470672607, -4.184415340423584, -3.2505412101745605, -2.3166675567626953, -1.3827934265136719, -0.4489173889160156, 0.48495662212371826, 1.4188306331634521, 2.3527045249938965, 3.28657865524292, 4.220452785491943, 5.154326438903809, 6.088200569152832, 7.0220746994018555, 7.955948829650879, 8.889822959899902, 9.82369613647461, 10.757570266723633, 11.691444396972656, 12.62531852722168, 13.559192657470703, 14.493066787719727, 15.42694091796875, 16.360815048217773, 17.294689178466797, 18.22856330871582, 19.162437438964844, 20.096309661865234, 21.03018569946289, 21.96405792236328, 22.897932052612305, 23.831806182861328, 24.76568031311035, 25.699554443359375, 26.6334285736084, 27.567302703857422, 28.501174926757812, 29.43505096435547]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 21.0, 15.0, 15.0, 25.0, 23.0, 22.0, 32.0, 36.0, 42.0, 51.0, 36.0, 52.0, 48.0, 60.0, 56.0, 46.0, 31.0, 50.0, 47.0, 40.0, 34.0, 35.0, 35.0, 19.0, 30.0, 11.0, 17.0, 12.0, 9.0, 6.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.1796875, -5.02783203125, -4.8759765625, -4.72412109375, -4.572265625, -4.42041015625, -4.2685546875, -4.11669921875, -3.96484375, -3.81298828125, -3.6611328125, -3.50927734375, -3.357421875, -3.20556640625, -3.0537109375, -2.90185546875, -2.75, -2.59814453125, -2.4462890625, -2.29443359375, -2.142578125, -1.99072265625, -1.8388671875, -1.68701171875, -1.53515625, -1.38330078125, -1.2314453125, -1.07958984375, -0.927734375, -0.77587890625, -0.6240234375, -0.47216796875, -0.3203125, -0.16845703125, -0.0166015625, 0.13525390625, 0.287109375, 0.43896484375, 0.5908203125, 0.74267578125, 0.89453125, 1.04638671875, 1.1982421875, 1.35009765625, 1.501953125, 1.65380859375, 1.8056640625, 1.95751953125, 2.109375, 2.26123046875, 2.4130859375, 2.56494140625, 2.716796875, 2.86865234375, 3.0205078125, 3.17236328125, 3.32421875, 3.47607421875, 3.6279296875, 3.77978515625, 3.931640625, 4.08349609375, 4.2353515625, 4.38720703125, 4.5390625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 6.0, 15.0, 24.0, 33.0, 40.0, 59.0, 86.0, 123.0, 196.0, 269.0, 426.0, 623.0, 1019.0, 1513.0, 2324.0, 3890.0, 6016.0, 9648.0, 15784.0, 26389.0, 44503.0, 76195.0, 130555.0, 199063.0, 201225.0, 133936.0, 78531.0, 45755.0, 27100.0, 16118.0, 10025.0, 6124.0, 3849.0, 2486.0, 1530.0, 1037.0, 664.0, 430.0, 301.0, 173.0, 166.0, 105.0, 58.0, 50.0, 23.0, 15.0, 14.0, 16.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.43359375, -0.4200553894042969, -0.40651702880859375, -0.3929786682128906, -0.3794403076171875, -0.3659019470214844, -0.35236358642578125, -0.3388252258300781, -0.325286865234375, -0.3117485046386719, -0.29821014404296875, -0.2846717834472656, -0.2711334228515625, -0.2575950622558594, -0.24405670166015625, -0.23051834106445312, -0.21697998046875, -0.20344161987304688, -0.18990325927734375, -0.17636489868164062, -0.1628265380859375, -0.14928817749023438, -0.13574981689453125, -0.12221145629882812, -0.108673095703125, -0.09513473510742188, -0.08159637451171875, -0.06805801391601562, -0.0545196533203125, -0.040981292724609375, -0.02744293212890625, -0.013904571533203125, -0.0003662109375, 0.013172149658203125, 0.02671051025390625, 0.040248870849609375, 0.0537872314453125, 0.06732559204101562, 0.08086395263671875, 0.09440231323242188, 0.107940673828125, 0.12147903442382812, 0.13501739501953125, 0.14855575561523438, 0.1620941162109375, 0.17563247680664062, 0.18917083740234375, 0.20270919799804688, 0.21624755859375, 0.22978591918945312, 0.24332427978515625, 0.2568626403808594, 0.2704010009765625, 0.2839393615722656, 0.29747772216796875, 0.3110160827636719, 0.324554443359375, 0.3380928039550781, 0.35163116455078125, 0.3651695251464844, 0.3787078857421875, 0.3922462463378906, 0.40578460693359375, 0.4193229675292969, 0.432861328125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 9.0, 6.0, 10.0, 14.0, 17.0, 25.0, 16.0, 27.0, 30.0, 23.0, 35.0, 35.0, 35.0, 53.0, 44.0, 52.0, 46.0, 1060.0, 37.0, 50.0, 44.0, 60.0, 38.0, 34.0, 25.0, 41.0, 25.0, 27.0, 16.0, 26.0, 14.0, 8.0, 9.0, 6.0, 7.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.55078125, -3.451629638671875, -3.35247802734375, -3.253326416015625, -3.1541748046875, -3.055023193359375, -2.95587158203125, -2.856719970703125, -2.757568359375, -2.658416748046875, -2.55926513671875, -2.460113525390625, -2.3609619140625, -2.261810302734375, -2.16265869140625, -2.063507080078125, -1.96435546875, -1.865203857421875, -1.76605224609375, -1.666900634765625, -1.5677490234375, -1.468597412109375, -1.36944580078125, -1.270294189453125, -1.171142578125, -1.071990966796875, -0.97283935546875, -0.873687744140625, -0.7745361328125, -0.675384521484375, -0.57623291015625, -0.477081298828125, -0.3779296875, -0.278778076171875, -0.17962646484375, -0.080474853515625, 0.0186767578125, 0.117828369140625, 0.21697998046875, 0.316131591796875, 0.415283203125, 0.514434814453125, 0.61358642578125, 0.712738037109375, 0.8118896484375, 0.911041259765625, 1.01019287109375, 1.109344482421875, 1.20849609375, 1.307647705078125, 1.40679931640625, 1.505950927734375, 1.6051025390625, 1.704254150390625, 1.80340576171875, 1.902557373046875, 2.001708984375, 2.100860595703125, 2.20001220703125, 2.299163818359375, 2.3983154296875, 2.497467041015625, 2.59661865234375, 2.695770263671875, 2.794921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 7.0, 6.0, 18.0, 20.0, 26.0, 44.0, 60.0, 74.0, 114.0, 191.0, 274.0, 410.0, 561.0, 805.0, 1161.0, 1691.0, 2413.0, 3517.0, 5120.0, 7295.0, 10727.0, 15748.0, 22775.0, 32962.0, 46819.0, 65056.0, 88727.0, 116395.0, 1172310.0, 142427.0, 101853.0, 75621.0, 55439.0, 38931.0, 27412.0, 18811.0, 12774.0, 8946.0, 6080.0, 4108.0, 2907.0, 1954.0, 1408.0, 932.0, 714.0, 460.0, 330.0, 226.0, 148.0, 106.0, 71.0, 51.0, 30.0, 28.0, 17.0, 14.0, 3.0, 10.0, 4.0, 2.0, 1.0], "bins": [-0.228759765625, -0.22155380249023438, -0.21434783935546875, -0.20714187622070312, -0.1999359130859375, -0.19272994995117188, -0.18552398681640625, -0.17831802368164062, -0.171112060546875, -0.16390609741210938, -0.15670013427734375, -0.14949417114257812, -0.1422882080078125, -0.13508224487304688, -0.12787628173828125, -0.12067031860351562, -0.11346435546875, -0.10625839233398438, -0.09905242919921875, -0.09184646606445312, -0.0846405029296875, -0.07743453979492188, -0.07022857666015625, -0.06302261352539062, -0.055816650390625, -0.048610687255859375, -0.04140472412109375, -0.034198760986328125, -0.0269927978515625, -0.019786834716796875, -0.01258087158203125, -0.005374908447265625, 0.0018310546875, 0.009037017822265625, 0.01624298095703125, 0.023448944091796875, 0.0306549072265625, 0.037860870361328125, 0.04506683349609375, 0.052272796630859375, 0.059478759765625, 0.06668472290039062, 0.07389068603515625, 0.08109664916992188, 0.0883026123046875, 0.09550857543945312, 0.10271453857421875, 0.10992050170898438, 0.11712646484375, 0.12433242797851562, 0.13153839111328125, 0.13874435424804688, 0.1459503173828125, 0.15315628051757812, 0.16036224365234375, 0.16756820678710938, 0.174774169921875, 0.18198013305664062, 0.18918609619140625, 0.19639205932617188, 0.2035980224609375, 0.21080398559570312, 0.21800994873046875, 0.22521591186523438, 0.232421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 1.0, 6.0, 5.0, 6.0, 7.0, 9.0, 9.0, 7.0, 15.0, 16.0, 28.0, 34.0, 36.0, 53.0, 75.0, 83.0, 104.0, 110.0, 78.0, 76.0, 44.0, 34.0, 29.0, 29.0, 29.0, 16.0, 15.0, 10.0, 12.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00537109375, -0.0051937103271484375, -0.005016326904296875, -0.0048389434814453125, -0.00466156005859375, -0.0044841766357421875, -0.004306793212890625, -0.0041294097900390625, -0.0039520263671875, -0.0037746429443359375, -0.003597259521484375, -0.0034198760986328125, -0.00324249267578125, -0.0030651092529296875, -0.002887725830078125, -0.0027103424072265625, -0.002532958984375, -0.0023555755615234375, -0.002178192138671875, -0.0020008087158203125, -0.00182342529296875, -0.0016460418701171875, -0.001468658447265625, -0.0012912750244140625, -0.0011138916015625, -0.0009365081787109375, -0.000759124755859375, -0.0005817413330078125, -0.00040435791015625, -0.0002269744873046875, -4.9591064453125e-05, 0.0001277923583984375, 0.00030517578125, 0.0004825592041015625, 0.000659942626953125, 0.0008373260498046875, 0.00101470947265625, 0.0011920928955078125, 0.001369476318359375, 0.0015468597412109375, 0.0017242431640625, 0.0019016265869140625, 0.002079010009765625, 0.0022563934326171875, 0.00243377685546875, 0.0026111602783203125, 0.002788543701171875, 0.0029659271240234375, 0.003143310546875, 0.0033206939697265625, 0.003498077392578125, 0.0036754608154296875, 0.00385284423828125, 0.0040302276611328125, 0.004207611083984375, 0.0043849945068359375, 0.0045623779296875, 0.0047397613525390625, 0.004917144775390625, 0.0050945281982421875, 0.00527191162109375, 0.0054492950439453125, 0.005626678466796875, 0.0058040618896484375, 0.0059814453125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 11.0, 11.0, 12.0, 21.0, 25.0, 27.0, 57.0, 67.0, 84.0, 111.0, 141.0, 282.0, 606.0, 4394.0, 977582.0, 62715.0, 1167.0, 436.0, 246.0, 148.0, 106.0, 53.0, 52.0, 38.0, 27.0, 19.0, 22.0, 11.0, 17.0, 10.0, 9.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1065673828125, -0.10341072082519531, -0.10025405883789062, -0.09709739685058594, -0.09394073486328125, -0.09078407287597656, -0.08762741088867188, -0.08447074890136719, -0.0813140869140625, -0.07815742492675781, -0.07500076293945312, -0.07184410095214844, -0.06868743896484375, -0.06553077697753906, -0.062374114990234375, -0.05921745300292969, -0.056060791015625, -0.05290412902832031, -0.049747467041015625, -0.04659080505371094, -0.04343414306640625, -0.04027748107910156, -0.037120819091796875, -0.03396415710449219, -0.0308074951171875, -0.027650833129882812, -0.024494171142578125, -0.021337509155273438, -0.01818084716796875, -0.015024185180664062, -0.011867523193359375, -0.008710861206054688, -0.00555419921875, -0.0023975372314453125, 0.000759124755859375, 0.0039157867431640625, 0.00707244873046875, 0.010229110717773438, 0.013385772705078125, 0.016542434692382812, 0.0196990966796875, 0.022855758666992188, 0.026012420654296875, 0.029169082641601562, 0.03232574462890625, 0.03548240661621094, 0.038639068603515625, 0.04179573059082031, 0.044952392578125, 0.04810905456542969, 0.051265716552734375, 0.05442237854003906, 0.05757904052734375, 0.06073570251464844, 0.06389236450195312, 0.06704902648925781, 0.0702056884765625, 0.07336235046386719, 0.07651901245117188, 0.07967567443847656, 0.08283233642578125, 0.08598899841308594, 0.08914566040039062, 0.09230232238769531, 0.095458984375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 113.0, 895.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015621923841536045, -0.013453865423798561, -0.011285806074738503, -0.009117746725678444, -0.00694968830794096, -0.004781628958880901, -0.0026135705411434174, -0.0004455121234059334, 0.0017225472256541252, 0.0038906061090528965, 0.006058664992451668, 0.008226724341511726, 0.01039478275924921, 0.012562842108309269, 0.014730900526046753, 0.01689895987510681, 0.01906701922416687, 0.02123507857322693, 0.023403137922286987, 0.025571195408701897, 0.027739254757761955, 0.029907314106822014, 0.03207537159323692, 0.03424343094229698, 0.03641149029135704, 0.0385795496404171, 0.04074760898947716, 0.042915668338537216, 0.045083723962306976, 0.047251783311367035, 0.049419842660427094, 0.05158790200948715, 0.05375596135854721, 0.05592402070760727, 0.05809208005666733, 0.060260139405727386, 0.062428198754787445, 0.0645962581038475, 0.06676431745290756, 0.06893236935138702, 0.07110042870044708, 0.07326848804950714, 0.0754365473985672, 0.07760460674762726, 0.07977266609668732, 0.08194072544574738, 0.08410878479480743, 0.08627684414386749, 0.08844490349292755, 0.09061296284198761, 0.09278102219104767, 0.09494908154010773, 0.09711714088916779, 0.09928520023822784, 0.1014532595872879, 0.10362131893634796, 0.10578937828540802, 0.10795743763446808, 0.11012549698352814, 0.1122935563325882, 0.11446161568164825, 0.11662967503070831, 0.11879773437976837, 0.12096579372882843, 0.12313384562730789]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 8.0, 11.0, 21.0, 20.0, 19.0, 54.0, 58.0, 54.0, 65.0, 68.0, 79.0, 68.0, 97.0, 87.0, 64.0, 44.0, 52.0, 38.0, 32.0, 17.0, 12.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007954180240631104, -0.007755565457046032, -0.00755695067346096, -0.007358335889875889, -0.007159721106290817, -0.006961106322705746, -0.006762491539120674, -0.006563876755535603, -0.006365261971950531, -0.0061666471883654594, -0.005968032404780388, -0.005769417621195316, -0.005570802837610245, -0.005372188054025173, -0.005173573270440102, -0.00497495848685503, -0.0047763437032699585, -0.004577728919684887, -0.004379114136099815, -0.004180499352514744, -0.003981884568929672, -0.0037832697853446007, -0.003584655001759529, -0.0033860402181744576, -0.003187425434589386, -0.0029888106510043144, -0.002790195867419243, -0.0025915810838341713, -0.0023929663002490997, -0.002194351516664028, -0.0019957367330789566, -0.001797121949493885, -0.0015985071659088135, -0.001399892382323742, -0.0012012775987386703, -0.0010026628151535988, -0.0008040480315685272, -0.0006054332479834557, -0.0004068184643983841, -0.00020820368081331253, -9.588897228240967e-06, 0.0001890258863568306, 0.00038764066994190216, 0.0005862554535269737, 0.0007848702371120453, 0.0009834850206971169, 0.0011820998042821884, 0.00138071458786726, 0.0015793293714523315, 0.001777944155037403, 0.0019765589386224747, 0.0021751737222075462, 0.002373788505792618, 0.0025724032893776894, 0.002771018072962761, 0.0029696328565478325, 0.003168247640132904, 0.0033668624237179756, 0.003565477207303047, 0.0037640919908881187, 0.00396270677447319, 0.004161321558058262, 0.0043599363416433334, 0.004558551125228405, 0.0047571659088134766]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 21.0, 15.0, 15.0, 25.0, 23.0, 22.0, 32.0, 36.0, 42.0, 51.0, 36.0, 52.0, 48.0, 60.0, 56.0, 46.0, 31.0, 50.0, 48.0, 39.0, 34.0, 35.0, 34.0, 20.0, 30.0, 11.0, 17.0, 12.0, 9.0, 6.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.1796875, -5.02783203125, -4.8759765625, -4.72412109375, -4.572265625, -4.42041015625, -4.2685546875, -4.11669921875, -3.96484375, -3.81298828125, -3.6611328125, -3.50927734375, -3.357421875, -3.20556640625, -3.0537109375, -2.90185546875, -2.75, -2.59814453125, -2.4462890625, -2.29443359375, -2.142578125, -1.99072265625, -1.8388671875, -1.68701171875, -1.53515625, -1.38330078125, -1.2314453125, -1.07958984375, -0.927734375, -0.77587890625, -0.6240234375, -0.47216796875, -0.3203125, -0.16845703125, -0.0166015625, 0.13525390625, 0.287109375, 0.43896484375, 0.5908203125, 0.74267578125, 0.89453125, 1.04638671875, 1.1982421875, 1.35009765625, 1.501953125, 1.65380859375, 1.8056640625, 1.95751953125, 2.109375, 2.26123046875, 2.4130859375, 2.56494140625, 2.716796875, 2.86865234375, 3.0205078125, 3.17236328125, 3.32421875, 3.47607421875, 3.6279296875, 3.77978515625, 3.931640625, 4.08349609375, 4.2353515625, 4.38720703125, 4.5390625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 14.0, 13.0, 24.0, 25.0, 25.0, 49.0, 67.0, 96.0, 136.0, 162.0, 246.0, 363.0, 542.0, 817.0, 1134.0, 1657.0, 2459.0, 4586.0, 16460.0, 177026.0, 734871.0, 86537.0, 10402.0, 3809.0, 2188.0, 1507.0, 993.0, 686.0, 474.0, 311.0, 244.0, 182.0, 122.0, 100.0, 66.0, 46.0, 30.0, 26.0, 17.0, 10.0, 5.0, 6.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.491455078125, -11.10009765625, -10.708740234375, -10.3173828125, -9.926025390625, -9.53466796875, -9.143310546875, -8.751953125, -8.360595703125, -7.96923828125, -7.577880859375, -7.1865234375, -6.795166015625, -6.40380859375, -6.012451171875, -5.62109375, -5.229736328125, -4.83837890625, -4.447021484375, -4.0556640625, -3.664306640625, -3.27294921875, -2.881591796875, -2.490234375, -2.098876953125, -1.70751953125, -1.316162109375, -0.9248046875, -0.533447265625, -0.14208984375, 0.249267578125, 0.640625, 1.031982421875, 1.42333984375, 1.814697265625, 2.2060546875, 2.597412109375, 2.98876953125, 3.380126953125, 3.771484375, 4.162841796875, 4.55419921875, 4.945556640625, 5.3369140625, 5.728271484375, 6.11962890625, 6.510986328125, 6.90234375, 7.293701171875, 7.68505859375, 8.076416015625, 8.4677734375, 8.859130859375, 9.25048828125, 9.641845703125, 10.033203125, 10.424560546875, 10.81591796875, 11.207275390625, 11.5986328125, 11.989990234375, 12.38134765625, 12.772705078125, 13.1640625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 11.0, 4.0, 10.0, 10.0, 4.0, 9.0, 7.0, 16.0, 19.0, 20.0, 21.0, 25.0, 28.0, 33.0, 33.0, 38.0, 71.0, 72.0, 134.0, 238.0, 1468.0, 202.0, 104.0, 71.0, 66.0, 45.0, 36.0, 37.0, 29.0, 26.0, 20.0, 18.0, 17.0, 12.0, 19.0, 8.0, 11.0, 9.0, 8.0, 3.0, 7.0, 5.0, 5.0, 2.0, 2.0, 6.0, 2.0, 2.0, 1.0], "bins": [-10.71875, -10.415283203125, -10.11181640625, -9.808349609375, -9.5048828125, -9.201416015625, -8.89794921875, -8.594482421875, -8.291015625, -7.987548828125, -7.68408203125, -7.380615234375, -7.0771484375, -6.773681640625, -6.47021484375, -6.166748046875, -5.86328125, -5.559814453125, -5.25634765625, -4.952880859375, -4.6494140625, -4.345947265625, -4.04248046875, -3.739013671875, -3.435546875, -3.132080078125, -2.82861328125, -2.525146484375, -2.2216796875, -1.918212890625, -1.61474609375, -1.311279296875, -1.0078125, -0.704345703125, -0.40087890625, -0.097412109375, 0.2060546875, 0.509521484375, 0.81298828125, 1.116455078125, 1.419921875, 1.723388671875, 2.02685546875, 2.330322265625, 2.6337890625, 2.937255859375, 3.24072265625, 3.544189453125, 3.84765625, 4.151123046875, 4.45458984375, 4.758056640625, 5.0615234375, 5.364990234375, 5.66845703125, 5.971923828125, 6.275390625, 6.578857421875, 6.88232421875, 7.185791015625, 7.4892578125, 7.792724609375, 8.09619140625, 8.399658203125, 8.703125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 0.0, 7.0, 9.0, 12.0, 12.0, 19.0, 20.0, 18.0, 29.0, 32.0, 42.0, 63.0, 87.0, 120.0, 168.0, 273.0, 439.0, 749.0, 1740.0, 12778.0, 3117465.0, 8122.0, 1553.0, 676.0, 383.0, 227.0, 179.0, 115.0, 76.0, 70.0, 43.0, 31.0, 35.0, 19.0, 16.0, 11.0, 14.0, 5.0, 8.0, 13.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.125, -32.96630859375, -31.8076171875, -30.64892578125, -29.490234375, -28.33154296875, -27.1728515625, -26.01416015625, -24.85546875, -23.69677734375, -22.5380859375, -21.37939453125, -20.220703125, -19.06201171875, -17.9033203125, -16.74462890625, -15.5859375, -14.42724609375, -13.2685546875, -12.10986328125, -10.951171875, -9.79248046875, -8.6337890625, -7.47509765625, -6.31640625, -5.15771484375, -3.9990234375, -2.84033203125, -1.681640625, -0.52294921875, 0.6357421875, 1.79443359375, 2.953125, 4.11181640625, 5.2705078125, 6.42919921875, 7.587890625, 8.74658203125, 9.9052734375, 11.06396484375, 12.22265625, 13.38134765625, 14.5400390625, 15.69873046875, 16.857421875, 18.01611328125, 19.1748046875, 20.33349609375, 21.4921875, 22.65087890625, 23.8095703125, 24.96826171875, 26.126953125, 27.28564453125, 28.4443359375, 29.60302734375, 30.76171875, 31.92041015625, 33.0791015625, 34.23779296875, 35.396484375, 36.55517578125, 37.7138671875, 38.87255859375, 40.03125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 25.0, 69.0, 133.0, 257.0, 254.0, 158.0, 70.0, 21.0, 8.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.35519790649414, -40.84904861450195, -39.34290313720703, -37.836753845214844, -36.33060836791992, -34.824459075927734, -33.31831359863281, -31.812164306640625, -30.30601692199707, -28.799869537353516, -27.29372215270996, -25.787574768066406, -24.28142547607422, -22.775279998779297, -21.26913070678711, -19.762983322143555, -18.2568359375, -16.750688552856445, -15.24454116821289, -13.73839282989502, -12.232245445251465, -10.72609806060791, -9.219949722290039, -7.713802337646484, -6.20765495300293, -4.701507568359375, -3.195359706878662, -1.6892118453979492, -0.18306446075439453, 1.3230829238891602, 2.8292312622070312, 4.335378646850586, 5.841522216796875, 7.34766960144043, 8.853816986083984, 10.359965324401855, 11.86611270904541, 13.372260093688965, 14.878408432006836, 16.38455581665039, 17.890703201293945, 19.3968505859375, 20.902997970581055, 22.40914535522461, 23.915294647216797, 25.42144012451172, 26.927589416503906, 28.43373680114746, 29.939884185791016, 31.44603157043457, 32.952178955078125, 34.45832824707031, 35.964473724365234, 37.47062301635742, 38.976768493652344, 40.48291778564453, 41.98906707763672, 43.495216369628906, 45.00136184692383, 46.507511138916016, 48.01365661621094, 49.519805908203125, 51.02595520019531, 52.532100677490234, 54.038246154785156]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 1.0, 4.0, 11.0, 14.0, 13.0, 12.0, 9.0, 20.0, 20.0, 21.0, 25.0, 21.0, 28.0, 26.0, 34.0, 34.0, 35.0, 41.0, 39.0, 37.0, 35.0, 38.0, 44.0, 43.0, 40.0, 32.0, 31.0, 30.0, 26.0, 25.0, 27.0, 30.0, 26.0, 11.0, 14.0, 21.0, 11.0, 9.0, 12.0, 7.0, 11.0, 7.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.226558685302734, -24.397172927856445, -23.567785263061523, -22.738399505615234, -21.909011840820312, -21.079626083374023, -20.250240325927734, -19.420852661132812, -18.591466903686523, -17.762081146240234, -16.932693481445312, -16.103307723999023, -15.273921012878418, -14.444534301757812, -13.615147590637207, -12.785760879516602, -11.956374168395996, -11.12698745727539, -10.297600746154785, -9.46821403503418, -8.63882827758789, -7.809441566467285, -6.98005485534668, -6.150668621063232, -5.321281909942627, -4.4918951988220215, -3.662508964538574, -2.8331222534179688, -2.0037357807159424, -1.174349308013916, -0.34496259689331055, 0.4844236373901367, 1.3138103485107422, 2.1431968212127686, 2.972583293914795, 3.8019700050354004, 4.631356239318848, 5.460742950439453, 6.290129661560059, 7.119515895843506, 7.948902606964111, 8.778288841247559, 9.607675552368164, 10.43706226348877, 11.266448974609375, 12.095834732055664, 12.925222396850586, 13.754608154296875, 14.58399486541748, 15.413381576538086, 16.242767333984375, 17.072154998779297, 17.901540756225586, 18.730926513671875, 19.560314178466797, 20.389699935913086, 21.219087600708008, 22.048473358154297, 22.87786102294922, 23.707246780395508, 24.53663444519043, 25.36602020263672, 26.19540786743164, 27.02479362487793, 27.85417938232422]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 14.0, 8.0, 11.0, 16.0, 14.0, 22.0, 17.0, 15.0, 21.0, 36.0, 28.0, 28.0, 30.0, 53.0, 40.0, 46.0, 58.0, 45.0, 33.0, 51.0, 39.0, 40.0, 38.0, 37.0, 31.0, 29.0, 38.0, 22.0, 25.0, 19.0, 18.0, 13.0, 10.0, 15.0, 4.0, 8.0, 6.0, 5.0, 6.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3359375, -4.19158935546875, -4.0472412109375, -3.90289306640625, -3.758544921875, -3.61419677734375, -3.4698486328125, -3.32550048828125, -3.18115234375, -3.03680419921875, -2.8924560546875, -2.74810791015625, -2.603759765625, -2.45941162109375, -2.3150634765625, -2.17071533203125, -2.0263671875, -1.88201904296875, -1.7376708984375, -1.59332275390625, -1.448974609375, -1.30462646484375, -1.1602783203125, -1.01593017578125, -0.87158203125, -0.72723388671875, -0.5828857421875, -0.43853759765625, -0.294189453125, -0.14984130859375, -0.0054931640625, 0.13885498046875, 0.283203125, 0.42755126953125, 0.5718994140625, 0.71624755859375, 0.860595703125, 1.00494384765625, 1.1492919921875, 1.29364013671875, 1.43798828125, 1.58233642578125, 1.7266845703125, 1.87103271484375, 2.015380859375, 2.15972900390625, 2.3040771484375, 2.44842529296875, 2.5927734375, 2.73712158203125, 2.8814697265625, 3.02581787109375, 3.170166015625, 3.31451416015625, 3.4588623046875, 3.60321044921875, 3.74755859375, 3.89190673828125, 4.0362548828125, 4.18060302734375, 4.324951171875, 4.46929931640625, 4.6136474609375, 4.75799560546875, 4.90234375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 14.0, 15.0, 21.0, 23.0, 35.0, 58.0, 80.0, 108.0, 143.0, 203.0, 282.0, 427.0, 670.0, 1195.0, 1931.0, 3801.0, 7845.0, 20786.0, 79997.0, 421921.0, 1553060.0, 1561153.0, 424944.0, 78751.0, 20019.0, 7743.0, 3774.0, 2042.0, 1127.0, 701.0, 456.0, 308.0, 176.0, 130.0, 102.0, 66.0, 54.0, 33.0, 20.0, 13.0, 12.0, 9.0, 9.0, 4.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.80859375, -5.6270751953125, -5.445556640625, -5.2640380859375, -5.08251953125, -4.9010009765625, -4.719482421875, -4.5379638671875, -4.3564453125, -4.1749267578125, -3.993408203125, -3.8118896484375, -3.63037109375, -3.4488525390625, -3.267333984375, -3.0858154296875, -2.904296875, -2.7227783203125, -2.541259765625, -2.3597412109375, -2.17822265625, -1.9967041015625, -1.815185546875, -1.6336669921875, -1.4521484375, -1.2706298828125, -1.089111328125, -0.9075927734375, -0.72607421875, -0.5445556640625, -0.363037109375, -0.1815185546875, 0.0, 0.1815185546875, 0.363037109375, 0.5445556640625, 0.72607421875, 0.9075927734375, 1.089111328125, 1.2706298828125, 1.4521484375, 1.6336669921875, 1.815185546875, 1.9967041015625, 2.17822265625, 2.3597412109375, 2.541259765625, 2.7227783203125, 2.904296875, 3.0858154296875, 3.267333984375, 3.4488525390625, 3.63037109375, 3.8118896484375, 3.993408203125, 4.1749267578125, 4.3564453125, 4.5379638671875, 4.719482421875, 4.9010009765625, 5.08251953125, 5.2640380859375, 5.445556640625, 5.6270751953125, 5.80859375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 7.0, 12.0, 36.0, 65.0, 131.0, 244.0, 418.0, 694.0, 851.0, 703.0, 429.0, 217.0, 127.0, 62.0, 26.0, 26.0, 13.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.688720703125, -17.25244140625, -16.816162109375, -16.3798828125, -15.943603515625, -15.50732421875, -15.071044921875, -14.634765625, -14.198486328125, -13.76220703125, -13.325927734375, -12.8896484375, -12.453369140625, -12.01708984375, -11.580810546875, -11.14453125, -10.708251953125, -10.27197265625, -9.835693359375, -9.3994140625, -8.963134765625, -8.52685546875, -8.090576171875, -7.654296875, -7.218017578125, -6.78173828125, -6.345458984375, -5.9091796875, -5.472900390625, -5.03662109375, -4.600341796875, -4.1640625, -3.727783203125, -3.29150390625, -2.855224609375, -2.4189453125, -1.982666015625, -1.54638671875, -1.110107421875, -0.673828125, -0.237548828125, 0.19873046875, 0.635009765625, 1.0712890625, 1.507568359375, 1.94384765625, 2.380126953125, 2.81640625, 3.252685546875, 3.68896484375, 4.125244140625, 4.5615234375, 4.997802734375, 5.43408203125, 5.870361328125, 6.306640625, 6.742919921875, 7.17919921875, 7.615478515625, 8.0517578125, 8.488037109375, 8.92431640625, 9.360595703125, 9.796875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 11.0, 11.0, 21.0, 31.0, 50.0, 173.0, 349.0, 877.0, 3366.0, 223381.0, 3951946.0, 11464.0, 1662.0, 536.0, 208.0, 103.0, 43.0, 26.0, 9.0, 6.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.21875, -20.26513671875, -19.3115234375, -18.35791015625, -17.404296875, -16.45068359375, -15.4970703125, -14.54345703125, -13.58984375, -12.63623046875, -11.6826171875, -10.72900390625, -9.775390625, -8.82177734375, -7.8681640625, -6.91455078125, -5.9609375, -5.00732421875, -4.0537109375, -3.10009765625, -2.146484375, -1.19287109375, -0.2392578125, 0.71435546875, 1.66796875, 2.62158203125, 3.5751953125, 4.52880859375, 5.482421875, 6.43603515625, 7.3896484375, 8.34326171875, 9.296875, 10.25048828125, 11.2041015625, 12.15771484375, 13.111328125, 14.06494140625, 15.0185546875, 15.97216796875, 16.92578125, 17.87939453125, 18.8330078125, 19.78662109375, 20.740234375, 21.69384765625, 22.6474609375, 23.60107421875, 24.5546875, 25.50830078125, 26.4619140625, 27.41552734375, 28.369140625, 29.32275390625, 30.2763671875, 31.22998046875, 32.18359375, 33.13720703125, 34.0908203125, 35.04443359375, 35.998046875, 36.95166015625, 37.9052734375, 38.85888671875, 39.8125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 132.0, 676.0, 193.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.4481506347656, -297.6725769042969, -291.89703369140625, -286.1214599609375, -280.34588623046875, -274.5703430175781, -268.7947692871094, -263.01922607421875, -257.24365234375, -251.4680938720703, -245.69252014160156, -239.91696166992188, -234.1414031982422, -228.3658447265625, -222.59027099609375, -216.81471252441406, -211.03915405273438, -205.2635955810547, -199.48802185058594, -193.71246337890625, -187.93690490722656, -182.16134643554688, -176.38577270507812, -170.61021423339844, -164.8346405029297, -159.05908203125, -153.28350830078125, -147.50794982910156, -141.73239135742188, -135.9568328857422, -130.18125915527344, -124.40570068359375, -118.63013458251953, -112.85456848144531, -107.07901000976562, -101.3034439086914, -95.52788543701172, -89.7523193359375, -83.97676086425781, -78.2011947631836, -72.42562866210938, -66.65006256103516, -60.87450408935547, -55.09893798828125, -49.32337951660156, -43.547813415527344, -37.77225112915039, -31.996688842773438, -26.22113037109375, -20.445568084716797, -14.670004844665527, -8.894441604614258, -3.1188793182373047, 2.6566829681396484, 8.432247161865234, 14.207809448242188, 19.98337173461914, 25.758934020996094, 31.534496307373047, 37.31005859375, 43.08562469482422, 48.861183166503906, 54.636749267578125, 60.41231155395508, 66.18787384033203]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 5.0, 5.0, 4.0, 9.0, 12.0, 12.0, 15.0, 15.0, 15.0, 20.0, 24.0, 19.0, 29.0, 34.0, 40.0, 29.0, 30.0, 30.0, 47.0, 34.0, 37.0, 45.0, 48.0, 45.0, 46.0, 31.0, 43.0, 32.0, 30.0, 32.0, 21.0, 18.0, 19.0, 20.0, 20.0, 15.0, 14.0, 9.0, 4.0, 9.0, 10.0, 5.0, 6.0, 3.0, 0.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-26.45172119140625, -25.59737205505371, -24.743022918701172, -23.888675689697266, -23.034326553344727, -22.179977416992188, -21.32562828063965, -20.47127914428711, -19.616931915283203, -18.762582778930664, -17.908233642578125, -17.05388641357422, -16.19953727722168, -15.34518814086914, -14.490839004516602, -13.636490821838379, -12.78214168548584, -11.9277925491333, -11.073444366455078, -10.219095230102539, -9.364747047424316, -8.510397911071777, -7.6560492515563965, -6.801700592041016, -5.947351932525635, -5.093003273010254, -4.238654613494873, -3.384305715560913, -2.5299570560455322, -1.6756081581115723, -0.8212594985961914, 0.03308916091918945, 0.8874378204345703, 1.7417864799499512, 2.596135139465332, 3.450484037399292, 4.304832458496094, 5.159181594848633, 6.013530254364014, 6.8678789138793945, 7.722227573394775, 8.576576232910156, 9.430925369262695, 10.285273551940918, 11.139622688293457, 11.99397087097168, 12.848320007324219, 13.702669143676758, 14.55701732635498, 15.41136646270752, 16.265714645385742, 17.12006378173828, 17.97441291809082, 18.82876205444336, 19.683109283447266, 20.537458419799805, 21.391807556152344, 22.246156692504883, 23.100505828857422, 23.954853057861328, 24.809202194213867, 25.663551330566406, 26.517900466918945, 27.372249603271484, 28.22659683227539]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 12.0, 17.0, 10.0, 13.0, 26.0, 22.0, 24.0, 26.0, 32.0, 37.0, 31.0, 34.0, 35.0, 51.0, 46.0, 47.0, 46.0, 45.0, 39.0, 34.0, 39.0, 47.0, 23.0, 27.0, 26.0, 24.0, 24.0, 22.0, 20.0, 21.0, 11.0, 15.0, 15.0, 7.0, 4.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.234375, -3.13543701171875, -3.0364990234375, -2.93756103515625, -2.838623046875, -2.73968505859375, -2.6407470703125, -2.54180908203125, -2.44287109375, -2.34393310546875, -2.2449951171875, -2.14605712890625, -2.047119140625, -1.94818115234375, -1.8492431640625, -1.75030517578125, -1.6513671875, -1.55242919921875, -1.4534912109375, -1.35455322265625, -1.255615234375, -1.15667724609375, -1.0577392578125, -0.95880126953125, -0.85986328125, -0.76092529296875, -0.6619873046875, -0.56304931640625, -0.464111328125, -0.36517333984375, -0.2662353515625, -0.16729736328125, -0.068359375, 0.03057861328125, 0.1295166015625, 0.22845458984375, 0.327392578125, 0.42633056640625, 0.5252685546875, 0.62420654296875, 0.72314453125, 0.82208251953125, 0.9210205078125, 1.01995849609375, 1.118896484375, 1.21783447265625, 1.3167724609375, 1.41571044921875, 1.5146484375, 1.61358642578125, 1.7125244140625, 1.81146240234375, 1.910400390625, 2.00933837890625, 2.1082763671875, 2.20721435546875, 2.30615234375, 2.40509033203125, 2.5040283203125, 2.60296630859375, 2.701904296875, 2.80084228515625, 2.8997802734375, 2.99871826171875, 3.09765625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 6.0, 8.0, 16.0, 15.0, 32.0, 40.0, 45.0, 68.0, 136.0, 188.0, 253.0, 367.0, 553.0, 761.0, 1139.0, 1696.0, 2635.0, 3884.0, 5912.0, 9072.0, 14099.0, 22936.0, 36674.0, 59473.0, 95825.0, 148497.0, 198556.0, 162032.0, 106156.0, 66356.0, 40753.0, 25299.0, 15711.0, 10089.0, 6401.0, 4219.0, 2826.0, 1872.0, 1198.0, 907.0, 607.0, 391.0, 272.0, 176.0, 113.0, 90.0, 64.0, 48.0, 29.0, 25.0, 8.0, 12.0, 6.0, 8.0, 6.0, 4.0, 1.0, 3.0], "bins": [-0.306640625, -0.2972373962402344, -0.28783416748046875, -0.2784309387207031, -0.2690277099609375, -0.2596244812011719, -0.25022125244140625, -0.24081802368164062, -0.231414794921875, -0.22201156616210938, -0.21260833740234375, -0.20320510864257812, -0.1938018798828125, -0.18439865112304688, -0.17499542236328125, -0.16559219360351562, -0.15618896484375, -0.14678573608398438, -0.13738250732421875, -0.12797927856445312, -0.1185760498046875, -0.10917282104492188, -0.09976959228515625, -0.09036636352539062, -0.080963134765625, -0.07155990600585938, -0.06215667724609375, -0.052753448486328125, -0.0433502197265625, -0.033946990966796875, -0.02454376220703125, -0.015140533447265625, -0.0057373046875, 0.003665924072265625, 0.01306915283203125, 0.022472381591796875, 0.0318756103515625, 0.041278839111328125, 0.05068206787109375, 0.060085296630859375, 0.069488525390625, 0.07889175415039062, 0.08829498291015625, 0.09769821166992188, 0.1071014404296875, 0.11650466918945312, 0.12590789794921875, 0.13531112670898438, 0.14471435546875, 0.15411758422851562, 0.16352081298828125, 0.17292404174804688, 0.1823272705078125, 0.19173049926757812, 0.20113372802734375, 0.21053695678710938, 0.219940185546875, 0.22934341430664062, 0.23874664306640625, 0.24814987182617188, 0.2575531005859375, 0.2669563293457031, 0.27635955810546875, 0.2857627868652344, 0.295166015625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 16.0, 21.0, 18.0, 14.0, 18.0, 18.0, 27.0, 29.0, 27.0, 23.0, 36.0, 42.0, 44.0, 39.0, 39.0, 48.0, 1064.0, 39.0, 39.0, 38.0, 39.0, 45.0, 35.0, 30.0, 23.0, 27.0, 23.0, 20.0, 18.0, 16.0, 15.0, 16.0, 23.0, 9.0, 4.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.931640625, -1.867034912109375, -1.80242919921875, -1.737823486328125, -1.6732177734375, -1.608612060546875, -1.54400634765625, -1.479400634765625, -1.414794921875, -1.350189208984375, -1.28558349609375, -1.220977783203125, -1.1563720703125, -1.091766357421875, -1.02716064453125, -0.962554931640625, -0.89794921875, -0.833343505859375, -0.76873779296875, -0.704132080078125, -0.6395263671875, -0.574920654296875, -0.51031494140625, -0.445709228515625, -0.381103515625, -0.316497802734375, -0.25189208984375, -0.187286376953125, -0.1226806640625, -0.058074951171875, 0.00653076171875, 0.071136474609375, 0.1357421875, 0.200347900390625, 0.26495361328125, 0.329559326171875, 0.3941650390625, 0.458770751953125, 0.52337646484375, 0.587982177734375, 0.652587890625, 0.717193603515625, 0.78179931640625, 0.846405029296875, 0.9110107421875, 0.975616455078125, 1.04022216796875, 1.104827880859375, 1.16943359375, 1.234039306640625, 1.29864501953125, 1.363250732421875, 1.4278564453125, 1.492462158203125, 1.55706787109375, 1.621673583984375, 1.686279296875, 1.750885009765625, 1.81549072265625, 1.880096435546875, 1.9447021484375, 2.009307861328125, 2.07391357421875, 2.138519287109375, 2.203125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 4.0, 9.0, 14.0, 7.0, 25.0, 23.0, 31.0, 60.0, 117.0, 153.0, 230.0, 332.0, 471.0, 687.0, 961.0, 1397.0, 2031.0, 2916.0, 4265.0, 6215.0, 8884.0, 13221.0, 19171.0, 28317.0, 40882.0, 59233.0, 85300.0, 115815.0, 1100169.0, 233393.0, 111683.0, 81455.0, 56372.0, 38594.0, 26492.0, 18263.0, 12519.0, 8538.0, 5881.0, 3982.0, 2750.0, 1954.0, 1332.0, 903.0, 651.0, 484.0, 307.0, 228.0, 135.0, 98.0, 70.0, 37.0, 31.0, 20.0, 11.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0], "bins": [-0.1951904296875, -0.18907737731933594, -0.18296432495117188, -0.1768512725830078, -0.17073822021484375, -0.1646251678466797, -0.15851211547851562, -0.15239906311035156, -0.1462860107421875, -0.14017295837402344, -0.13405990600585938, -0.1279468536376953, -0.12183380126953125, -0.11572074890136719, -0.10960769653320312, -0.10349464416503906, -0.097381591796875, -0.09126853942871094, -0.08515548706054688, -0.07904243469238281, -0.07292938232421875, -0.06681632995605469, -0.060703277587890625, -0.05459022521972656, -0.0484771728515625, -0.04236412048339844, -0.036251068115234375, -0.030138015747070312, -0.02402496337890625, -0.017911911010742188, -0.011798858642578125, -0.0056858062744140625, 0.00042724609375, 0.0065402984619140625, 0.012653350830078125, 0.018766403198242188, 0.02487945556640625, 0.030992507934570312, 0.037105560302734375, 0.04321861267089844, 0.0493316650390625, 0.05544471740722656, 0.061557769775390625, 0.06767082214355469, 0.07378387451171875, 0.07989692687988281, 0.08600997924804688, 0.09212303161621094, 0.098236083984375, 0.10434913635253906, 0.11046218872070312, 0.11657524108886719, 0.12268829345703125, 0.1288013458251953, 0.13491439819335938, 0.14102745056152344, 0.1471405029296875, 0.15325355529785156, 0.15936660766601562, 0.1654796600341797, 0.17159271240234375, 0.1777057647705078, 0.18381881713867188, 0.18993186950683594, 0.196044921875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 11.0, 11.0, 6.0, 14.0, 22.0, 20.0, 26.0, 47.0, 63.0, 90.0, 92.0, 124.0, 119.0, 93.0, 62.0, 42.0, 29.0, 20.0, 21.0, 11.0, 13.0, 9.0, 10.0, 3.0, 7.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00463104248046875, -0.004510730504989624, -0.004390418529510498, -0.004270106554031372, -0.004149794578552246, -0.00402948260307312, -0.003909170627593994, -0.003788858652114868, -0.003668546676635742, -0.003548234701156616, -0.0034279227256774902, -0.0033076107501983643, -0.0031872987747192383, -0.0030669867992401123, -0.0029466748237609863, -0.0028263628482818604, -0.0027060508728027344, -0.0025857388973236084, -0.0024654269218444824, -0.0023451149463653564, -0.0022248029708862305, -0.0021044909954071045, -0.0019841790199279785, -0.0018638670444488525, -0.0017435550689697266, -0.0016232430934906006, -0.0015029311180114746, -0.0013826191425323486, -0.0012623071670532227, -0.0011419951915740967, -0.0010216832160949707, -0.0009013712406158447, -0.0007810592651367188, -0.0006607472896575928, -0.0005404353141784668, -0.0004201233386993408, -0.00029981136322021484, -0.00017949938774108887, -5.918741226196289e-05, 6.112456321716309e-05, 0.00018143653869628906, 0.00030174851417541504, 0.000422060489654541, 0.000542372465133667, 0.000662684440612793, 0.0007829964160919189, 0.0009033083915710449, 0.001023620367050171, 0.0011439323425292969, 0.0012642443180084229, 0.0013845562934875488, 0.0015048682689666748, 0.0016251802444458008, 0.0017454922199249268, 0.0018658041954040527, 0.0019861161708831787, 0.0021064281463623047, 0.0022267401218414307, 0.0023470520973205566, 0.0024673640727996826, 0.0025876760482788086, 0.0027079880237579346, 0.0028282999992370605, 0.0029486119747161865, 0.0030689239501953125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 24.0, 25.0, 28.0, 33.0, 52.0, 75.0, 113.0, 212.0, 340.0, 805.0, 9883.0, 1026974.0, 8176.0, 776.0, 383.0, 204.0, 115.0, 75.0, 65.0, 29.0, 25.0, 23.0, 25.0, 9.0, 10.0, 12.0, 5.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.05401611328125, -0.05189704895019531, -0.049777984619140625, -0.04765892028808594, -0.04553985595703125, -0.04342079162597656, -0.041301727294921875, -0.03918266296386719, -0.0370635986328125, -0.03494453430175781, -0.032825469970703125, -0.030706405639648438, -0.02858734130859375, -0.026468276977539062, -0.024349212646484375, -0.022230148315429688, -0.020111083984375, -0.017992019653320312, -0.015872955322265625, -0.013753890991210938, -0.01163482666015625, -0.009515762329101562, -0.007396697998046875, -0.0052776336669921875, -0.0031585693359375, -0.0010395050048828125, 0.001079559326171875, 0.0031986236572265625, 0.00531768798828125, 0.0074367523193359375, 0.009555816650390625, 0.011674880981445312, 0.0137939453125, 0.015913009643554688, 0.018032073974609375, 0.020151138305664062, 0.02227020263671875, 0.024389266967773438, 0.026508331298828125, 0.028627395629882812, 0.0307464599609375, 0.03286552429199219, 0.034984588623046875, 0.03710365295410156, 0.03922271728515625, 0.04134178161621094, 0.043460845947265625, 0.04557991027832031, 0.047698974609375, 0.04981803894042969, 0.051937103271484375, 0.05405616760253906, 0.05617523193359375, 0.05829429626464844, 0.060413360595703125, 0.06253242492675781, 0.0646514892578125, 0.06677055358886719, 0.06888961791992188, 0.07100868225097656, 0.07312774658203125, 0.07524681091308594, 0.07736587524414062, 0.07948493957519531, 0.08160400390625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 67.0, 863.0, 81.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01530770305544138, -0.014657065272331238, -0.014006426557898521, -0.01335578877478838, -0.012705150991678238, -0.012054513208568096, -0.011403875425457954, -0.010753236711025238, -0.010102598927915096, -0.009451961144804955, -0.008801322430372238, -0.008150684647262096, -0.007500046864151955, -0.006849409081041813, -0.006198770832270384, -0.005548132583498955, -0.004897494800388813, -0.004246857017278671, -0.003596218768507242, -0.002945580752566457, -0.0022949427366256714, -0.001644304720684886, -0.0009936667047441006, -0.0003430284559726715, 0.00030760932713747025, 0.0009582473430782557, 0.001608885359019041, 0.0022595233749598265, 0.002910161390900612, 0.0035607994068413973, 0.004211437422782183, 0.004862075671553612, 0.005512714385986328, 0.00616335216909647, 0.006813990417867899, 0.007464628666639328, 0.00811526644974947, 0.008765904232859612, 0.009416542947292328, 0.01006718073040247, 0.010717818513512611, 0.011368456296622753, 0.012019094079732895, 0.012669732794165611, 0.013320370577275753, 0.013971008360385895, 0.014621647074818611, 0.015272284857928753, 0.015922922641038895, 0.01657356135547161, 0.017224198207259178, 0.017874836921691895, 0.01852547377347946, 0.019176112487912178, 0.019826751202344894, 0.02047738805413246, 0.021128026768565178, 0.021778665482997894, 0.02242930233478546, 0.023079941049218178, 0.023730579763650894, 0.02438121661543846, 0.025031855329871178, 0.025682494044303894, 0.02633313089609146]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 6.0, 9.0, 9.0, 23.0, 18.0, 26.0, 34.0, 38.0, 34.0, 44.0, 41.0, 59.0, 56.0, 55.0, 62.0, 60.0, 57.0, 50.0, 51.0, 53.0, 49.0, 37.0, 23.0, 20.0, 24.0, 19.0, 14.0, 12.0, 3.0, 9.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0030756592750549316, -0.0029958300292491913, -0.002916000783443451, -0.0028361715376377106, -0.00275634229183197, -0.00267651304602623, -0.0025966838002204895, -0.002516854554414749, -0.002437025308609009, -0.0023571960628032684, -0.002277366816997528, -0.0021975375711917877, -0.0021177083253860474, -0.002037879079580307, -0.0019580498337745667, -0.0018782205879688263, -0.001798391342163086, -0.0017185620963573456, -0.0016387328505516052, -0.0015589036047458649, -0.0014790743589401245, -0.0013992451131343842, -0.0013194158673286438, -0.0012395866215229034, -0.001159757375717163, -0.0010799281299114227, -0.0010000988841056824, -0.000920269638299942, -0.0008404403924942017, -0.0007606111466884613, -0.000680781900882721, -0.0006009526550769806, -0.0005211234092712402, -0.0004412941634654999, -0.0003614649176597595, -0.00028163567185401917, -0.0002018064260482788, -0.00012197718024253845, -4.2147934436798096e-05, 3.768131136894226e-05, 0.00011751055717468262, 0.00019733980298042297, 0.00027716904878616333, 0.0003569982945919037, 0.00043682754039764404, 0.0005166567862033844, 0.0005964860320091248, 0.0006763152778148651, 0.0007561445236206055, 0.0008359737694263458, 0.0009158030152320862, 0.0009956322610378265, 0.001075461506843567, 0.0011552907526493073, 0.0012351199984550476, 0.001314949244260788, 0.0013947784900665283, 0.0014746077358722687, 0.001554436981678009, 0.0016342662274837494, 0.0017140954732894897, 0.00179392471909523, 0.0018737539649009705, 0.001953583210706711, 0.002033412456512451]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 12.0, 17.0, 10.0, 13.0, 26.0, 22.0, 24.0, 26.0, 32.0, 37.0, 31.0, 34.0, 35.0, 50.0, 47.0, 47.0, 46.0, 45.0, 39.0, 34.0, 39.0, 47.0, 23.0, 27.0, 26.0, 24.0, 24.0, 22.0, 20.0, 21.0, 11.0, 15.0, 15.0, 7.0, 4.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.234375, -3.13543701171875, -3.0364990234375, -2.93756103515625, -2.838623046875, -2.73968505859375, -2.6407470703125, -2.54180908203125, -2.44287109375, -2.34393310546875, -2.2449951171875, -2.14605712890625, -2.047119140625, -1.94818115234375, -1.8492431640625, -1.75030517578125, -1.6513671875, -1.55242919921875, -1.4534912109375, -1.35455322265625, -1.255615234375, -1.15667724609375, -1.0577392578125, -0.95880126953125, -0.85986328125, -0.76092529296875, -0.6619873046875, -0.56304931640625, -0.464111328125, -0.36517333984375, -0.2662353515625, -0.16729736328125, -0.068359375, 0.03057861328125, 0.1295166015625, 0.22845458984375, 0.327392578125, 0.42633056640625, 0.5252685546875, 0.62420654296875, 0.72314453125, 0.82208251953125, 0.9210205078125, 1.01995849609375, 1.118896484375, 1.21783447265625, 1.3167724609375, 1.41571044921875, 1.5146484375, 1.61358642578125, 1.7125244140625, 1.81146240234375, 1.910400390625, 2.00933837890625, 2.1082763671875, 2.20721435546875, 2.30615234375, 2.40509033203125, 2.5040283203125, 2.60296630859375, 2.701904296875, 2.80084228515625, 2.8997802734375, 2.99871826171875, 3.09765625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 9.0, 11.0, 20.0, 23.0, 35.0, 50.0, 60.0, 85.0, 139.0, 153.0, 209.0, 285.0, 370.0, 604.0, 954.0, 1658.0, 2998.0, 6954.0, 23355.0, 144343.0, 648618.0, 175293.0, 26558.0, 7602.0, 3276.0, 1709.0, 1014.0, 619.0, 418.0, 289.0, 220.0, 141.0, 105.0, 84.0, 72.0, 54.0, 31.0, 31.0, 31.0, 15.0, 10.0, 11.0, 7.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.99359130859375, -5.8035888671875, -5.61358642578125, -5.423583984375, -5.23358154296875, -5.0435791015625, -4.85357666015625, -4.66357421875, -4.47357177734375, -4.2835693359375, -4.09356689453125, -3.903564453125, -3.71356201171875, -3.5235595703125, -3.33355712890625, -3.1435546875, -2.95355224609375, -2.7635498046875, -2.57354736328125, -2.383544921875, -2.19354248046875, -2.0035400390625, -1.81353759765625, -1.62353515625, -1.43353271484375, -1.2435302734375, -1.05352783203125, -0.863525390625, -0.67352294921875, -0.4835205078125, -0.29351806640625, -0.103515625, 0.08648681640625, 0.2764892578125, 0.46649169921875, 0.656494140625, 0.84649658203125, 1.0364990234375, 1.22650146484375, 1.41650390625, 1.60650634765625, 1.7965087890625, 1.98651123046875, 2.176513671875, 2.36651611328125, 2.5565185546875, 2.74652099609375, 2.9365234375, 3.12652587890625, 3.3165283203125, 3.50653076171875, 3.696533203125, 3.88653564453125, 4.0765380859375, 4.26654052734375, 4.45654296875, 4.64654541015625, 4.8365478515625, 5.02655029296875, 5.216552734375, 5.40655517578125, 5.5965576171875, 5.78656005859375, 5.9765625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 5.0, 8.0, 7.0, 6.0, 10.0, 9.0, 20.0, 18.0, 27.0, 28.0, 30.0, 43.0, 36.0, 37.0, 54.0, 61.0, 159.0, 279.0, 1468.0, 237.0, 111.0, 74.0, 51.0, 47.0, 41.0, 28.0, 27.0, 17.0, 17.0, 18.0, 7.0, 16.0, 6.0, 6.0, 7.0, 7.0, 5.0, 2.0, 2.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-9.8046875, -9.52789306640625, -9.2510986328125, -8.97430419921875, -8.697509765625, -8.42071533203125, -8.1439208984375, -7.86712646484375, -7.59033203125, -7.31353759765625, -7.0367431640625, -6.75994873046875, -6.483154296875, -6.20635986328125, -5.9295654296875, -5.65277099609375, -5.3759765625, -5.09918212890625, -4.8223876953125, -4.54559326171875, -4.268798828125, -3.99200439453125, -3.7152099609375, -3.43841552734375, -3.16162109375, -2.88482666015625, -2.6080322265625, -2.33123779296875, -2.054443359375, -1.77764892578125, -1.5008544921875, -1.22406005859375, -0.947265625, -0.67047119140625, -0.3936767578125, -0.11688232421875, 0.159912109375, 0.43670654296875, 0.7135009765625, 0.99029541015625, 1.26708984375, 1.54388427734375, 1.8206787109375, 2.09747314453125, 2.374267578125, 2.65106201171875, 2.9278564453125, 3.20465087890625, 3.4814453125, 3.75823974609375, 4.0350341796875, 4.31182861328125, 4.588623046875, 4.86541748046875, 5.1422119140625, 5.41900634765625, 5.69580078125, 5.97259521484375, 6.2493896484375, 6.52618408203125, 6.802978515625, 7.07977294921875, 7.3565673828125, 7.63336181640625, 7.91015625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 10.0, 13.0, 14.0, 23.0, 44.0, 73.0, 95.0, 139.0, 213.0, 354.0, 890.0, 5458.0, 3119621.0, 16307.0, 1208.0, 484.0, 231.0, 170.0, 120.0, 80.0, 42.0, 29.0, 17.0, 11.0, 11.0, 11.0, 5.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78125, -20.992431640625, -20.20361328125, -19.414794921875, -18.6259765625, -17.837158203125, -17.04833984375, -16.259521484375, -15.470703125, -14.681884765625, -13.89306640625, -13.104248046875, -12.3154296875, -11.526611328125, -10.73779296875, -9.948974609375, -9.16015625, -8.371337890625, -7.58251953125, -6.793701171875, -6.0048828125, -5.216064453125, -4.42724609375, -3.638427734375, -2.849609375, -2.060791015625, -1.27197265625, -0.483154296875, 0.3056640625, 1.094482421875, 1.88330078125, 2.672119140625, 3.4609375, 4.249755859375, 5.03857421875, 5.827392578125, 6.6162109375, 7.405029296875, 8.19384765625, 8.982666015625, 9.771484375, 10.560302734375, 11.34912109375, 12.137939453125, 12.9267578125, 13.715576171875, 14.50439453125, 15.293212890625, 16.08203125, 16.870849609375, 17.65966796875, 18.448486328125, 19.2373046875, 20.026123046875, 20.81494140625, 21.603759765625, 22.392578125, 23.181396484375, 23.97021484375, 24.759033203125, 25.5478515625, 26.336669921875, 27.12548828125, 27.914306640625, 28.703125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 11.0, 293.0, 645.0, 63.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.00791931152344, -103.30741882324219, -100.6069107055664, -97.90641021728516, -95.2059097290039, -92.50540161132812, -89.80490112304688, -87.10440063476562, -84.40390014648438, -81.70339965820312, -79.00289154052734, -76.3023910522461, -73.60189056396484, -70.90138244628906, -68.20088195800781, -65.50038146972656, -62.79987335205078, -60.099369049072266, -57.398868560791016, -54.6983642578125, -51.99786376953125, -49.297359466552734, -46.59685516357422, -43.89635467529297, -41.19585037231445, -38.49534606933594, -35.79484558105469, -33.09434127807617, -30.39383888244629, -27.693336486816406, -24.99283218383789, -22.292329788208008, -19.591827392578125, -16.891324996948242, -14.190821647644043, -11.490318298339844, -8.789815902709961, -6.089313507080078, -3.3888092041015625, -0.6883068084716797, 2.012195587158203, 4.712698459625244, 7.413201332092285, 10.113704681396484, 12.814207077026367, 15.51470947265625, 18.215213775634766, 20.91571617126465, 23.61621856689453, 26.316720962524414, 29.017223358154297, 31.717727661132812, 34.41822814941406, 37.11873245239258, 39.819236755371094, 42.519737243652344, 45.22024154663086, 47.920745849609375, 50.621246337890625, 53.32175064086914, 56.022254943847656, 58.722755432128906, 61.42325973510742, 64.12376403808594, 66.82426452636719]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 5.0, 4.0, 9.0, 13.0, 11.0, 21.0, 10.0, 23.0, 26.0, 25.0, 29.0, 24.0, 31.0, 33.0, 30.0, 35.0, 51.0, 44.0, 38.0, 43.0, 28.0, 27.0, 36.0, 39.0, 34.0, 32.0, 33.0, 39.0, 24.0, 31.0, 18.0, 28.0, 17.0, 20.0, 15.0, 10.0, 19.0, 7.0, 5.0, 4.0, 7.0, 7.0, 9.0, 2.0, 1.0, 5.0], "bins": [-24.096588134765625, -23.508955001831055, -22.921323776245117, -22.333690643310547, -21.746057510375977, -21.15842628479004, -20.57079315185547, -19.98316192626953, -19.39552879333496, -18.80789566040039, -18.220264434814453, -17.632631301879883, -17.044998168945312, -16.457366943359375, -15.869733810424805, -15.28210163116455, -14.69446849822998, -14.106836318969727, -13.519203186035156, -12.931571006774902, -12.343938827514648, -11.756305694580078, -11.168673515319824, -10.58104133605957, -9.993408203125, -9.405776023864746, -8.818142890930176, -8.230510711669922, -7.642878532409668, -7.055245876312256, -6.467613220214844, -5.87998104095459, -5.292348861694336, -4.704716205596924, -4.11708402633667, -3.529451370239258, -2.941818952560425, -2.354186534881592, -1.7665538787841797, -1.1789216995239258, -0.5912890434265137, -0.0036565661430358887, 0.5839759111404419, 1.1716084480285645, 1.7592408657073975, 2.3468732833862305, 2.9345059394836426, 3.5221381187438965, 4.109770774841309, 4.697403430938721, 5.285035610198975, 5.872668266296387, 6.460300445556641, 7.047933101654053, 7.635565757751465, 8.223197937011719, 8.810831069946289, 9.398463249206543, 9.986096382141113, 10.573728561401367, 11.161360740661621, 11.748992919921875, 12.336626052856445, 12.9242582321167, 13.511890411376953]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 3.0, 6.0, 2.0, 7.0, 10.0, 6.0, 14.0, 18.0, 20.0, 26.0, 27.0, 28.0, 32.0, 33.0, 31.0, 29.0, 36.0, 43.0, 39.0, 44.0, 43.0, 45.0, 41.0, 39.0, 33.0, 39.0, 31.0, 24.0, 32.0, 26.0, 43.0, 23.0, 21.0, 17.0, 19.0, 18.0, 8.0, 9.0, 11.0, 4.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.487945556640625, -3.37237548828125, -3.256805419921875, -3.1412353515625, -3.025665283203125, -2.91009521484375, -2.794525146484375, -2.678955078125, -2.563385009765625, -2.44781494140625, -2.332244873046875, -2.2166748046875, -2.101104736328125, -1.98553466796875, -1.869964599609375, -1.75439453125, -1.638824462890625, -1.52325439453125, -1.407684326171875, -1.2921142578125, -1.176544189453125, -1.06097412109375, -0.945404052734375, -0.829833984375, -0.714263916015625, -0.59869384765625, -0.483123779296875, -0.3675537109375, -0.251983642578125, -0.13641357421875, -0.020843505859375, 0.0947265625, 0.210296630859375, 0.32586669921875, 0.441436767578125, 0.5570068359375, 0.672576904296875, 0.78814697265625, 0.903717041015625, 1.019287109375, 1.134857177734375, 1.25042724609375, 1.365997314453125, 1.4815673828125, 1.597137451171875, 1.71270751953125, 1.828277587890625, 1.94384765625, 2.059417724609375, 2.17498779296875, 2.290557861328125, 2.4061279296875, 2.521697998046875, 2.63726806640625, 2.752838134765625, 2.868408203125, 2.983978271484375, 3.09954833984375, 3.215118408203125, 3.3306884765625, 3.446258544921875, 3.56182861328125, 3.677398681640625, 3.79296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 16.0, 16.0, 12.0, 30.0, 33.0, 35.0, 61.0, 77.0, 97.0, 145.0, 187.0, 280.0, 395.0, 538.0, 808.0, 1625.0, 5724.0, 115048.0, 3516468.0, 535385.0, 11990.0, 2130.0, 953.0, 615.0, 423.0, 307.0, 224.0, 161.0, 123.0, 95.0, 74.0, 40.0, 35.0, 23.0, 22.0, 23.0, 10.0, 7.0, 11.0, 6.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.953125, -17.36767578125, -16.7822265625, -16.19677734375, -15.611328125, -15.02587890625, -14.4404296875, -13.85498046875, -13.26953125, -12.68408203125, -12.0986328125, -11.51318359375, -10.927734375, -10.34228515625, -9.7568359375, -9.17138671875, -8.5859375, -8.00048828125, -7.4150390625, -6.82958984375, -6.244140625, -5.65869140625, -5.0732421875, -4.48779296875, -3.90234375, -3.31689453125, -2.7314453125, -2.14599609375, -1.560546875, -0.97509765625, -0.3896484375, 0.19580078125, 0.78125, 1.36669921875, 1.9521484375, 2.53759765625, 3.123046875, 3.70849609375, 4.2939453125, 4.87939453125, 5.46484375, 6.05029296875, 6.6357421875, 7.22119140625, 7.806640625, 8.39208984375, 8.9775390625, 9.56298828125, 10.1484375, 10.73388671875, 11.3193359375, 11.90478515625, 12.490234375, 13.07568359375, 13.6611328125, 14.24658203125, 14.83203125, 15.41748046875, 16.0029296875, 16.58837890625, 17.173828125, 17.75927734375, 18.3447265625, 18.93017578125, 19.515625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 5.0, 13.0, 18.0, 32.0, 43.0, 63.0, 98.0, 163.0, 235.0, 296.0, 422.0, 546.0, 587.0, 453.0, 330.0, 234.0, 172.0, 103.0, 84.0, 51.0, 37.0, 24.0, 15.0, 9.0, 11.0, 2.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.921875, -7.6905517578125, -7.459228515625, -7.2279052734375, -6.99658203125, -6.7652587890625, -6.533935546875, -6.3026123046875, -6.0712890625, -5.8399658203125, -5.608642578125, -5.3773193359375, -5.14599609375, -4.9146728515625, -4.683349609375, -4.4520263671875, -4.220703125, -3.9893798828125, -3.758056640625, -3.5267333984375, -3.29541015625, -3.0640869140625, -2.832763671875, -2.6014404296875, -2.3701171875, -2.1387939453125, -1.907470703125, -1.6761474609375, -1.44482421875, -1.2135009765625, -0.982177734375, -0.7508544921875, -0.51953125, -0.2882080078125, -0.056884765625, 0.1744384765625, 0.40576171875, 0.6370849609375, 0.868408203125, 1.0997314453125, 1.3310546875, 1.5623779296875, 1.793701171875, 2.0250244140625, 2.25634765625, 2.4876708984375, 2.718994140625, 2.9503173828125, 3.181640625, 3.4129638671875, 3.644287109375, 3.8756103515625, 4.10693359375, 4.3382568359375, 4.569580078125, 4.8009033203125, 5.0322265625, 5.2635498046875, 5.494873046875, 5.7261962890625, 5.95751953125, 6.1888427734375, 6.420166015625, 6.6514892578125, 6.8828125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 4.0, 12.0, 17.0, 23.0, 37.0, 85.0, 155.0, 366.0, 725.0, 1804.0, 5776.0, 27013.0, 266580.0, 2668384.0, 1119628.0, 85902.0, 12340.0, 3295.0, 1173.0, 498.0, 212.0, 137.0, 39.0, 27.0, 11.0, 5.0, 10.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.1171875, -8.85498046875, -8.5927734375, -8.33056640625, -8.068359375, -7.80615234375, -7.5439453125, -7.28173828125, -7.01953125, -6.75732421875, -6.4951171875, -6.23291015625, -5.970703125, -5.70849609375, -5.4462890625, -5.18408203125, -4.921875, -4.65966796875, -4.3974609375, -4.13525390625, -3.873046875, -3.61083984375, -3.3486328125, -3.08642578125, -2.82421875, -2.56201171875, -2.2998046875, -2.03759765625, -1.775390625, -1.51318359375, -1.2509765625, -0.98876953125, -0.7265625, -0.46435546875, -0.2021484375, 0.06005859375, 0.322265625, 0.58447265625, 0.8466796875, 1.10888671875, 1.37109375, 1.63330078125, 1.8955078125, 2.15771484375, 2.419921875, 2.68212890625, 2.9443359375, 3.20654296875, 3.46875, 3.73095703125, 3.9931640625, 4.25537109375, 4.517578125, 4.77978515625, 5.0419921875, 5.30419921875, 5.56640625, 5.82861328125, 6.0908203125, 6.35302734375, 6.615234375, 6.87744140625, 7.1396484375, 7.40185546875, 7.6640625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 6.0, 10.0, 25.0, 27.0, 61.0, 64.0, 78.0, 107.0, 111.0, 105.0, 104.0, 86.0, 60.0, 61.0, 38.0, 24.0, 17.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.49061393737793, -21.953781127929688, -20.416948318481445, -18.880115509033203, -17.343280792236328, -15.806448936462402, -14.269615173339844, -12.732782363891602, -11.19594955444336, -9.659116744995117, -8.122283935546875, -6.585450172424316, -5.048617362976074, -3.511784553527832, -1.9749507904052734, -0.43811798095703125, 1.098714828491211, 2.6355478763580322, 4.1723809242248535, 5.709214210510254, 7.246047019958496, 8.782879829406738, 10.319713592529297, 11.856546401977539, 13.393379211425781, 14.930212020874023, 16.467044830322266, 18.00387954711914, 19.54071044921875, 21.077545166015625, 22.614377975463867, 24.15121078491211, 25.68804168701172, 27.22487449645996, 28.761707305908203, 30.298542022705078, 31.835372924804688, 33.37220764160156, 34.90904235839844, 36.44587326049805, 37.982704162597656, 39.51953887939453, 41.05636978149414, 42.593204498291016, 44.130035400390625, 45.6668701171875, 47.203704833984375, 48.740535736083984, 50.27737045288086, 51.814205169677734, 53.351036071777344, 54.88787078857422, 56.42470169067383, 57.9615364074707, 59.49836730957031, 61.03520202636719, 62.57203674316406, 64.10887145996094, 65.64570617675781, 67.18253326416016, 68.71936798095703, 70.2562026977539, 71.79303741455078, 73.32986450195312, 74.86669921875]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 10.0, 5.0, 12.0, 9.0, 8.0, 11.0, 16.0, 14.0, 23.0, 23.0, 20.0, 22.0, 31.0, 34.0, 36.0, 32.0, 26.0, 33.0, 38.0, 34.0, 37.0, 40.0, 41.0, 33.0, 35.0, 40.0, 39.0, 31.0, 29.0, 30.0, 24.0, 26.0, 23.0, 16.0, 23.0, 15.0, 11.0, 15.0, 10.0, 6.0, 9.0, 2.0, 3.0, 6.0, 3.0, 7.0, 2.0, 6.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.584197998046875, -19.88762855529785, -19.191059112548828, -18.494491577148438, -17.797922134399414, -17.10135269165039, -16.404783248901367, -15.708213806152344, -15.011645317077637, -14.315075874328613, -13.618507385253906, -12.921937942504883, -12.22536849975586, -11.528800010681152, -10.832230567932129, -10.135662078857422, -9.439092636108398, -8.742523193359375, -8.045954704284668, -7.3493852615356445, -6.652816295623779, -5.956247329711914, -5.259677886962891, -4.563108921051025, -3.86653995513916, -3.169970989227295, -2.4734017848968506, -1.7768325805664062, -1.080263614654541, -0.3836946487426758, 0.31287479400634766, 1.009443759918213, 1.706014633178711, 2.402583599090576, 3.0991528034210205, 3.795722007751465, 4.49229097366333, 5.188859939575195, 5.885429382324219, 6.581998348236084, 7.278567314147949, 7.9751362800598145, 8.67170524597168, 9.368274688720703, 10.064844131469727, 10.761412620544434, 11.457982063293457, 12.154550552368164, 12.851119995117188, 13.547689437866211, 14.244257926940918, 14.940827369689941, 15.637395858764648, 16.333965301513672, 17.030534744262695, 17.72710418701172, 18.42367172241211, 19.120241165161133, 19.816810607910156, 20.513378143310547, 21.20994758605957, 21.906517028808594, 22.603086471557617, 23.29965591430664, 23.996225357055664]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 11.0, 11.0, 7.0, 23.0, 16.0, 24.0, 18.0, 20.0, 22.0, 38.0, 28.0, 32.0, 49.0, 31.0, 32.0, 29.0, 42.0, 32.0, 44.0, 54.0, 32.0, 46.0, 36.0, 31.0, 36.0, 39.0, 13.0, 23.0, 22.0, 17.0, 16.0, 11.0, 12.0, 15.0, 8.0, 13.0, 4.0, 4.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.09375, -37.77099609375, -36.4482421875, -35.12548828125, -33.802734375, -32.47998046875, -31.1572265625, -29.83447265625, -28.51171875, -27.18896484375, -25.8662109375, -24.54345703125, -23.220703125, -21.89794921875, -20.5751953125, -19.25244140625, -17.9296875, -16.60693359375, -15.2841796875, -13.96142578125, -12.638671875, -11.31591796875, -9.9931640625, -8.67041015625, -7.34765625, -6.02490234375, -4.7021484375, -3.37939453125, -2.056640625, -0.73388671875, 0.5888671875, 1.91162109375, 3.234375, 4.55712890625, 5.8798828125, 7.20263671875, 8.525390625, 9.84814453125, 11.1708984375, 12.49365234375, 13.81640625, 15.13916015625, 16.4619140625, 17.78466796875, 19.107421875, 20.43017578125, 21.7529296875, 23.07568359375, 24.3984375, 25.72119140625, 27.0439453125, 28.36669921875, 29.689453125, 31.01220703125, 32.3349609375, 33.65771484375, 34.98046875, 36.30322265625, 37.6259765625, 38.94873046875, 40.271484375, 41.59423828125, 42.9169921875, 44.23974609375, 45.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 8.0, 16.0, 11.0, 16.0, 39.0, 54.0, 96.0, 171.0, 268.0, 481.0, 814.0, 1532.0, 2869.0, 5160.0, 9510.0, 17232.0, 32337.0, 60639.0, 112853.0, 196248.0, 241178.0, 167531.0, 92166.0, 49199.0, 26476.0, 14361.0, 7806.0, 4131.0, 2388.0, 1225.0, 737.0, 412.0, 224.0, 131.0, 81.0, 53.0, 33.0, 19.0, 11.0, 10.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.67578125, -4.53118896484375, -4.3865966796875, -4.24200439453125, -4.097412109375, -3.95281982421875, -3.8082275390625, -3.66363525390625, -3.51904296875, -3.37445068359375, -3.2298583984375, -3.08526611328125, -2.940673828125, -2.79608154296875, -2.6514892578125, -2.50689697265625, -2.3623046875, -2.21771240234375, -2.0731201171875, -1.92852783203125, -1.783935546875, -1.63934326171875, -1.4947509765625, -1.35015869140625, -1.20556640625, -1.06097412109375, -0.9163818359375, -0.77178955078125, -0.627197265625, -0.48260498046875, -0.3380126953125, -0.19342041015625, -0.048828125, 0.09576416015625, 0.2403564453125, 0.38494873046875, 0.529541015625, 0.67413330078125, 0.8187255859375, 0.96331787109375, 1.10791015625, 1.25250244140625, 1.3970947265625, 1.54168701171875, 1.686279296875, 1.83087158203125, 1.9754638671875, 2.12005615234375, 2.2646484375, 2.40924072265625, 2.5538330078125, 2.69842529296875, 2.843017578125, 2.98760986328125, 3.1322021484375, 3.27679443359375, 3.42138671875, 3.56597900390625, 3.7105712890625, 3.85516357421875, 3.999755859375, 4.14434814453125, 4.2889404296875, 4.43353271484375, 4.578125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 11.0, 14.0, 11.0, 9.0, 28.0, 14.0, 21.0, 20.0, 24.0, 25.0, 22.0, 23.0, 29.0, 23.0, 39.0, 26.0, 41.0, 40.0, 34.0, 1069.0, 36.0, 47.0, 38.0, 40.0, 31.0, 34.0, 27.0, 33.0, 24.0, 28.0, 20.0, 21.0, 17.0, 18.0, 13.0, 12.0, 11.0, 11.0, 7.0, 8.0, 5.0, 9.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.84375, -23.04052734375, -22.2373046875, -21.43408203125, -20.630859375, -19.82763671875, -19.0244140625, -18.22119140625, -17.41796875, -16.61474609375, -15.8115234375, -15.00830078125, -14.205078125, -13.40185546875, -12.5986328125, -11.79541015625, -10.9921875, -10.18896484375, -9.3857421875, -8.58251953125, -7.779296875, -6.97607421875, -6.1728515625, -5.36962890625, -4.56640625, -3.76318359375, -2.9599609375, -2.15673828125, -1.353515625, -0.55029296875, 0.2529296875, 1.05615234375, 1.859375, 2.66259765625, 3.4658203125, 4.26904296875, 5.072265625, 5.87548828125, 6.6787109375, 7.48193359375, 8.28515625, 9.08837890625, 9.8916015625, 10.69482421875, 11.498046875, 12.30126953125, 13.1044921875, 13.90771484375, 14.7109375, 15.51416015625, 16.3173828125, 17.12060546875, 17.923828125, 18.72705078125, 19.5302734375, 20.33349609375, 21.13671875, 21.93994140625, 22.7431640625, 23.54638671875, 24.349609375, 25.15283203125, 25.9560546875, 26.75927734375, 27.5625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 8.0, 8.0, 13.0, 17.0, 38.0, 45.0, 90.0, 119.0, 167.0, 204.0, 331.0, 510.0, 739.0, 1108.0, 1520.0, 2259.0, 3394.0, 4848.0, 7160.0, 10200.0, 14749.0, 21386.0, 31250.0, 44939.0, 65710.0, 95184.0, 128621.0, 1195652.0, 135511.0, 102049.0, 71631.0, 49300.0, 33685.0, 23248.0, 16190.0, 10930.0, 7661.0, 5272.0, 3658.0, 2475.0, 1722.0, 1100.0, 768.0, 523.0, 387.0, 259.0, 167.0, 109.0, 67.0, 54.0, 33.0, 22.0, 22.0, 15.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.341796875, -2.265289306640625, -2.18878173828125, -2.112274169921875, -2.0357666015625, -1.959259033203125, -1.88275146484375, -1.806243896484375, -1.729736328125, -1.653228759765625, -1.57672119140625, -1.500213623046875, -1.4237060546875, -1.347198486328125, -1.27069091796875, -1.194183349609375, -1.11767578125, -1.041168212890625, -0.96466064453125, -0.888153076171875, -0.8116455078125, -0.735137939453125, -0.65863037109375, -0.582122802734375, -0.505615234375, -0.429107666015625, -0.35260009765625, -0.276092529296875, -0.1995849609375, -0.123077392578125, -0.04656982421875, 0.029937744140625, 0.1064453125, 0.182952880859375, 0.25946044921875, 0.335968017578125, 0.4124755859375, 0.488983154296875, 0.56549072265625, 0.641998291015625, 0.718505859375, 0.795013427734375, 0.87152099609375, 0.948028564453125, 1.0245361328125, 1.101043701171875, 1.17755126953125, 1.254058837890625, 1.33056640625, 1.407073974609375, 1.48358154296875, 1.560089111328125, 1.6365966796875, 1.713104248046875, 1.78961181640625, 1.866119384765625, 1.942626953125, 2.019134521484375, 2.09564208984375, 2.172149658203125, 2.2486572265625, 2.325164794921875, 2.40167236328125, 2.478179931640625, 2.5546875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 7.0, 5.0, 8.0, 10.0, 11.0, 10.0, 15.0, 26.0, 29.0, 39.0, 44.0, 58.0, 69.0, 80.0, 71.0, 67.0, 72.0, 64.0, 56.0, 43.0, 28.0, 26.0, 17.0, 25.0, 18.0, 9.0, 7.0, 17.0, 1.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.050872802734375, -0.049353599548339844, -0.04783439636230469, -0.04631519317626953, -0.044795989990234375, -0.04327678680419922, -0.04175758361816406, -0.040238380432128906, -0.03871917724609375, -0.037199974060058594, -0.03568077087402344, -0.03416156768798828, -0.032642364501953125, -0.03112316131591797, -0.029603958129882812, -0.028084754943847656, -0.0265655517578125, -0.025046348571777344, -0.023527145385742188, -0.02200794219970703, -0.020488739013671875, -0.01896953582763672, -0.017450332641601562, -0.015931129455566406, -0.01441192626953125, -0.012892723083496094, -0.011373519897460938, -0.009854316711425781, -0.008335113525390625, -0.006815910339355469, -0.0052967071533203125, -0.0037775039672851562, -0.00225830078125, -0.0007390975952148438, 0.0007801055908203125, 0.0022993087768554688, 0.003818511962890625, 0.005337715148925781, 0.0068569183349609375, 0.008376121520996094, 0.00989532470703125, 0.011414527893066406, 0.012933731079101562, 0.014452934265136719, 0.015972137451171875, 0.01749134063720703, 0.019010543823242188, 0.020529747009277344, 0.0220489501953125, 0.023568153381347656, 0.025087356567382812, 0.02660655975341797, 0.028125762939453125, 0.02964496612548828, 0.031164169311523438, 0.032683372497558594, 0.03420257568359375, 0.035721778869628906, 0.03724098205566406, 0.03876018524169922, 0.040279388427734375, 0.04179859161376953, 0.04331779479980469, 0.044836997985839844, 0.046356201171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 2.0, 1.0, 11.0, 6.0, 18.0, 21.0, 27.0, 36.0, 40.0, 38.0, 76.0, 97.0, 124.0, 165.0, 284.0, 406.0, 679.0, 1273.0, 2739.0, 6623.0, 19371.0, 66218.0, 238722.0, 461205.0, 175671.0, 49705.0, 14599.0, 5248.0, 2248.0, 1116.0, 575.0, 361.0, 234.0, 120.0, 106.0, 91.0, 79.0, 48.0, 36.0, 31.0, 18.0, 17.0, 19.0, 10.0, 17.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.2393798828125, -0.23150062561035156, -0.22362136840820312, -0.2157421112060547, -0.20786285400390625, -0.1999835968017578, -0.19210433959960938, -0.18422508239746094, -0.1763458251953125, -0.16846656799316406, -0.16058731079101562, -0.1527080535888672, -0.14482879638671875, -0.1369495391845703, -0.12907028198242188, -0.12119102478027344, -0.113311767578125, -0.10543251037597656, -0.09755325317382812, -0.08967399597167969, -0.08179473876953125, -0.07391548156738281, -0.06603622436523438, -0.05815696716308594, -0.0502777099609375, -0.04239845275878906, -0.034519195556640625, -0.026639938354492188, -0.01876068115234375, -0.010881423950195312, -0.003002166748046875, 0.0048770904541015625, 0.01275634765625, 0.020635604858398438, 0.028514862060546875, 0.03639411926269531, 0.04427337646484375, 0.05215263366699219, 0.060031890869140625, 0.06791114807128906, 0.0757904052734375, 0.08366966247558594, 0.09154891967773438, 0.09942817687988281, 0.10730743408203125, 0.11518669128417969, 0.12306594848632812, 0.13094520568847656, 0.138824462890625, 0.14670372009277344, 0.15458297729492188, 0.1624622344970703, 0.17034149169921875, 0.1782207489013672, 0.18610000610351562, 0.19397926330566406, 0.2018585205078125, 0.20973777770996094, 0.21761703491210938, 0.2254962921142578, 0.23337554931640625, 0.2412548065185547, 0.24913406372070312, 0.25701332092285156, 0.264892578125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 18.0, 44.0, 155.0, 248.0, 228.0, 129.0, 68.0, 35.0, 29.0, 12.0, 10.0, 3.0, 5.0, 9.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05374011769890785, -0.04865960776805878, -0.0435790978372097, -0.038498587906360626, -0.03341807797551155, -0.028337568044662476, -0.0232570581138134, -0.018176548182964325, -0.01309603825211525, -0.008015528321266174, -0.002935018390417099, 0.0021454915404319763, 0.007226001471281052, 0.012306511402130127, 0.017387021332979202, 0.022467531263828278, 0.027548041194677353, 0.03262855112552643, 0.037709061056375504, 0.04278957098722458, 0.047870080918073654, 0.05295059084892273, 0.058031100779771805, 0.06311161071062088, 0.06819212436676025, 0.07327263057231903, 0.0783531442284584, 0.08343365788459778, 0.08851416409015656, 0.09359467029571533, 0.0986751839518547, 0.10375569760799408, 0.10883620381355286, 0.11391671001911163, 0.11899722367525101, 0.12407773733139038, 0.12915824353694916, 0.13423874974250793, 0.1393192708492279, 0.14439977705478668, 0.14948028326034546, 0.15456078946590424, 0.159641295671463, 0.16472181677818298, 0.16980232298374176, 0.17488282918930054, 0.1799633502960205, 0.18504385650157928, 0.19012436270713806, 0.19520486891269684, 0.20028537511825562, 0.20536589622497559, 0.21044640243053436, 0.21552690863609314, 0.2206074297428131, 0.2256879359483719, 0.23076844215393066, 0.23584894835948944, 0.24092945456504822, 0.2460099756717682, 0.25109046697616577, 0.25617098808288574, 0.2612515091896057, 0.2663320004940033, 0.27141252160072327]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 6.0, 10.0, 14.0, 19.0, 10.0, 9.0, 22.0, 21.0, 23.0, 28.0, 34.0, 31.0, 38.0, 38.0, 36.0, 31.0, 50.0, 39.0, 49.0, 40.0, 37.0, 40.0, 40.0, 29.0, 31.0, 37.0, 35.0, 28.0, 22.0, 15.0, 29.0, 17.0, 17.0, 19.0, 8.0, 8.0, 9.0, 2.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.06254440546035767, -0.06078276038169861, -0.05902111902832985, -0.05725947767496109, -0.05549783259630203, -0.053736187517642975, -0.051974546164274216, -0.05021290481090546, -0.0484512597322464, -0.04668961465358734, -0.04492797330021858, -0.04316633194684982, -0.041404686868190765, -0.03964304178953171, -0.03788140043616295, -0.03611975908279419, -0.03435811400413513, -0.032596468925476074, -0.030834827572107315, -0.029073184356093407, -0.0273115411400795, -0.02554989792406559, -0.02378825470805168, -0.022026611492037773, -0.020264968276023865, -0.018503325060009956, -0.016741681843996048, -0.01498003862798214, -0.013218395411968231, -0.011456752195954323, -0.009695108979940414, -0.007933465763926506, -0.006171822547912598, -0.004410179331898689, -0.002648536115884781, -0.0008868928998708725, 0.0008747503161430359, 0.0026363935321569443, 0.004398036748170853, 0.006159679964184761, 0.00792132318019867, 0.009682966396212578, 0.011444609612226486, 0.013206252828240395, 0.014967896044254303, 0.01672953926026821, 0.01849118247628212, 0.020252825692296028, 0.022014468908309937, 0.023776112124323845, 0.025537755340337753, 0.02729939855635166, 0.02906104177236557, 0.03082268498837948, 0.03258432820439339, 0.034345969557762146, 0.036107614636421204, 0.03786925971508026, 0.03963090106844902, 0.04139254242181778, 0.04315418750047684, 0.044915832579135895, 0.046677473932504654, 0.04843911528587341, 0.05020076036453247]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 2.0, 7.0, 4.0, 9.0, 12.0, 9.0, 13.0, 8.0, 19.0, 19.0, 23.0, 20.0, 17.0, 24.0, 40.0, 25.0, 31.0, 51.0, 29.0, 35.0, 30.0, 41.0, 29.0, 46.0, 56.0, 33.0, 45.0, 31.0, 31.0, 40.0, 39.0, 13.0, 22.0, 19.0, 21.0, 15.0, 12.0, 9.0, 18.0, 7.0, 13.0, 4.0, 6.0, 5.0, 7.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.09375, -37.771484375, -36.44921875, -35.126953125, -33.8046875, -32.482421875, -31.16015625, -29.837890625, -28.515625, -27.193359375, -25.87109375, -24.548828125, -23.2265625, -21.904296875, -20.58203125, -19.259765625, -17.9375, -16.615234375, -15.29296875, -13.970703125, -12.6484375, -11.326171875, -10.00390625, -8.681640625, -7.359375, -6.037109375, -4.71484375, -3.392578125, -2.0703125, -0.748046875, 0.57421875, 1.896484375, 3.21875, 4.541015625, 5.86328125, 7.185546875, 8.5078125, 9.830078125, 11.15234375, 12.474609375, 13.796875, 15.119140625, 16.44140625, 17.763671875, 19.0859375, 20.408203125, 21.73046875, 23.052734375, 24.375, 25.697265625, 27.01953125, 28.341796875, 29.6640625, 30.986328125, 32.30859375, 33.630859375, 34.953125, 36.275390625, 37.59765625, 38.919921875, 40.2421875, 41.564453125, 42.88671875, 44.208984375, 45.53125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 2.0, 5.0, 2.0, 4.0, 8.0, 9.0, 7.0, 18.0, 11.0, 28.0, 32.0, 48.0, 59.0, 68.0, 105.0, 119.0, 190.0, 252.0, 378.0, 582.0, 886.0, 1392.0, 2632.0, 5519.0, 13063.0, 36342.0, 113747.0, 337116.0, 350781.0, 120586.0, 38402.0, 13480.0, 5702.0, 2680.0, 1501.0, 882.0, 551.0, 374.0, 251.0, 194.0, 138.0, 104.0, 63.0, 47.0, 43.0, 34.0, 33.0, 24.0, 14.0, 10.0, 10.0, 7.0, 8.0, 8.0, 6.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.66796875, -5.47918701171875, -5.2904052734375, -5.10162353515625, -4.912841796875, -4.72406005859375, -4.5352783203125, -4.34649658203125, -4.15771484375, -3.96893310546875, -3.7801513671875, -3.59136962890625, -3.402587890625, -3.21380615234375, -3.0250244140625, -2.83624267578125, -2.6474609375, -2.45867919921875, -2.2698974609375, -2.08111572265625, -1.892333984375, -1.70355224609375, -1.5147705078125, -1.32598876953125, -1.13720703125, -0.94842529296875, -0.7596435546875, -0.57086181640625, -0.382080078125, -0.19329833984375, -0.0045166015625, 0.18426513671875, 0.373046875, 0.56182861328125, 0.7506103515625, 0.93939208984375, 1.128173828125, 1.31695556640625, 1.5057373046875, 1.69451904296875, 1.88330078125, 2.07208251953125, 2.2608642578125, 2.44964599609375, 2.638427734375, 2.82720947265625, 3.0159912109375, 3.20477294921875, 3.3935546875, 3.58233642578125, 3.7711181640625, 3.95989990234375, 4.148681640625, 4.33746337890625, 4.5262451171875, 4.71502685546875, 4.90380859375, 5.09259033203125, 5.2813720703125, 5.47015380859375, 5.658935546875, 5.84771728515625, 6.0364990234375, 6.22528076171875, 6.4140625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 12.0, 13.0, 18.0, 27.0, 34.0, 46.0, 58.0, 54.0, 61.0, 71.0, 535.0, 1688.0, 79.0, 75.0, 60.0, 46.0, 46.0, 41.0, 18.0, 17.0, 13.0, 10.0, 10.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.25, -85.818359375, -82.38671875, -78.955078125, -75.5234375, -72.091796875, -68.66015625, -65.228515625, -61.796875, -58.365234375, -54.93359375, -51.501953125, -48.0703125, -44.638671875, -41.20703125, -37.775390625, -34.34375, -30.912109375, -27.48046875, -24.048828125, -20.6171875, -17.185546875, -13.75390625, -10.322265625, -6.890625, -3.458984375, -0.02734375, 3.404296875, 6.8359375, 10.267578125, 13.69921875, 17.130859375, 20.5625, 23.994140625, 27.42578125, 30.857421875, 34.2890625, 37.720703125, 41.15234375, 44.583984375, 48.015625, 51.447265625, 54.87890625, 58.310546875, 61.7421875, 65.173828125, 68.60546875, 72.037109375, 75.46875, 78.900390625, 82.33203125, 85.763671875, 89.1953125, 92.626953125, 96.05859375, 99.490234375, 102.921875, 106.353515625, 109.78515625, 113.216796875, 116.6484375, 120.080078125, 123.51171875, 126.943359375, 130.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 11.0, 8.0, 12.0, 21.0, 30.0, 42.0, 66.0, 110.0, 157.0, 239.0, 427.0, 796.0, 1726.0, 5848.0, 72782.0, 2939283.0, 112798.0, 7253.0, 1954.0, 947.0, 458.0, 267.0, 172.0, 104.0, 68.0, 36.0, 26.0, 19.0, 15.0, 15.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.58349609375, -17.0263671875, -16.46923828125, -15.912109375, -15.35498046875, -14.7978515625, -14.24072265625, -13.68359375, -13.12646484375, -12.5693359375, -12.01220703125, -11.455078125, -10.89794921875, -10.3408203125, -9.78369140625, -9.2265625, -8.66943359375, -8.1123046875, -7.55517578125, -6.998046875, -6.44091796875, -5.8837890625, -5.32666015625, -4.76953125, -4.21240234375, -3.6552734375, -3.09814453125, -2.541015625, -1.98388671875, -1.4267578125, -0.86962890625, -0.3125, 0.24462890625, 0.8017578125, 1.35888671875, 1.916015625, 2.47314453125, 3.0302734375, 3.58740234375, 4.14453125, 4.70166015625, 5.2587890625, 5.81591796875, 6.373046875, 6.93017578125, 7.4873046875, 8.04443359375, 8.6015625, 9.15869140625, 9.7158203125, 10.27294921875, 10.830078125, 11.38720703125, 11.9443359375, 12.50146484375, 13.05859375, 13.61572265625, 14.1728515625, 14.72998046875, 15.287109375, 15.84423828125, 16.4013671875, 16.95849609375, 17.515625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 12.0, 16.0, 35.0, 137.0, 249.0, 261.0, 159.0, 63.0, 33.0, 11.0, 7.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.87174987792969, -111.63179779052734, -105.391845703125, -99.15188598632812, -92.91193389892578, -86.67198181152344, -80.43202209472656, -74.19207000732422, -67.95211791992188, -61.71216583251953, -55.47220993041992, -49.23225402832031, -42.99230194091797, -36.752349853515625, -30.512393951416016, -24.272438049316406, -18.032485961914062, -11.792531967163086, -5.552577972412109, 0.6873760223388672, 6.927330017089844, 13.16728401184082, 19.407238006591797, 25.647193908691406, 31.88714599609375, 38.127098083496094, 44.3670539855957, 50.60700988769531, 56.846961975097656, 63.0869140625, 69.32687377929688, 75.56682586669922, 81.8067626953125, 88.04671478271484, 94.28666687011719, 100.52662658691406, 106.7665786743164, 113.00653076171875, 119.24649047851562, 125.48644256591797, 131.7263946533203, 137.9663543701172, 144.206298828125, 150.44625854492188, 156.68621826171875, 162.92616271972656, 169.16612243652344, 175.40606689453125, 181.64602661132812, 187.885986328125, 194.1259307861328, 200.3658905029297, 206.6058349609375, 212.84579467773438, 219.08575439453125, 225.32571411132812, 231.56565856933594, 237.8056182861328, 244.04556274414062, 250.2855224609375, 256.5254821777344, 262.76544189453125, 269.00537109375, 275.2453308105469, 281.48529052734375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 9.0, 21.0, 20.0, 19.0, 18.0, 27.0, 26.0, 32.0, 46.0, 53.0, 35.0, 50.0, 45.0, 53.0, 54.0, 42.0, 55.0, 42.0, 53.0, 41.0, 37.0, 35.0, 29.0, 31.0, 24.0, 10.0, 14.0, 11.0, 15.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.05052947998047, -83.86641693115234, -80.68231201171875, -77.49819946289062, -74.3140869140625, -71.12997436523438, -67.94586944580078, -64.76175689697266, -61.5776481628418, -58.39353942871094, -55.20942687988281, -52.02531814575195, -48.841209411621094, -45.65709686279297, -42.47298812866211, -39.28887939453125, -36.104766845703125, -32.920658111572266, -29.73654556274414, -26.55243682861328, -23.36832618713379, -20.184215545654297, -17.000106811523438, -13.815996170043945, -10.631885528564453, -7.447775363922119, -4.263665199279785, -1.0795555114746094, 2.104555130004883, 5.288665771484375, 8.472774505615234, 11.656885147094727, 14.84100341796875, 18.025114059448242, 21.209224700927734, 24.393333435058594, 27.577444076538086, 30.761554718017578, 33.94566345214844, 37.12977600097656, 40.31388473510742, 43.49799346923828, 46.682106018066406, 49.866214752197266, 53.050323486328125, 56.23443603515625, 59.41854476928711, 62.60265350341797, 65.7867660522461, 68.97087860107422, 72.15498352050781, 75.33909606933594, 78.52320861816406, 81.70732116699219, 84.89142608642578, 88.0755386352539, 91.2596435546875, 94.44375610351562, 97.62786102294922, 100.81197357177734, 103.99608612060547, 107.18019104003906, 110.36430358886719, 113.54841613769531, 116.73252868652344]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 6.0, 6.0, 13.0, 9.0, 17.0, 32.0, 37.0, 52.0, 89.0, 107.0, 186.0, 231.0, 335.0, 446.0, 578.0, 860.0, 1168.0, 1648.0, 2166.0, 3041.0, 3792.0, 1018168.0, 4059.0, 3133.0, 2297.0, 1674.0, 1190.0, 872.0, 652.0, 502.0, 346.0, 232.0, 169.0, 132.0, 85.0, 74.0, 51.0, 28.0, 22.0, 14.0, 10.0, 6.0, 9.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.715913772583008, -16.202951431274414, -15.68998908996582, -15.177027702331543, -14.66406536102295, -14.151103019714355, -13.638141632080078, -13.125179290771484, -12.61221694946289, -12.099254608154297, -11.586292266845703, -11.073330879211426, -10.560368537902832, -10.047406196594238, -9.534444808959961, -9.021482467651367, -8.508520126342773, -7.99555778503418, -7.482595920562744, -6.969634056091309, -6.456671714782715, -5.943709373474121, -5.4307475090026855, -4.91778564453125, -4.404823303222656, -3.8918612003326416, -3.378899097442627, -2.8659369945526123, -2.3529748916625977, -1.840012788772583, -1.3270506858825684, -0.8140885829925537, -0.30112457275390625, 0.2118375301361084, 0.724799633026123, 1.2377617359161377, 1.7507238388061523, 2.263685941696167, 2.7766480445861816, 3.2896101474761963, 3.802572250366211, 4.315534591674805, 4.82849645614624, 5.341458320617676, 5.8544206619262695, 6.367383003234863, 6.880344867706299, 7.393306732177734, 7.906269073486328, 8.419231414794922, 8.932193756103516, 9.445155143737793, 9.958117485046387, 10.47107982635498, 10.984041213989258, 11.497003555297852, 12.009965896606445, 12.522928237915039, 13.035890579223633, 13.54885196685791, 14.061814308166504, 14.574776649475098, 15.087738037109375, 15.600700378417969, 16.113662719726562]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 13.0, 13.0, 42.0, 45.0, 79.0, 220.0, 51462328.0, 279.0, 37.0, 23.0, 15.0, 10.0, 9.0, 14.0, 4.0, 6.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3950.024169921875, -3832.3740234375, -3714.723876953125, -3597.07373046875, -3479.423583984375, -3361.7734375, -3244.123291015625, -3126.47314453125, -3008.822998046875, -2891.1728515625, -2773.522705078125, -2655.87255859375, -2538.222412109375, -2420.572265625, -2302.922119140625, -2185.27197265625, -2067.621826171875, -1949.9716796875, -1832.321533203125, -1714.67138671875, -1597.021240234375, -1479.37109375, -1361.720947265625, -1244.07080078125, -1126.420654296875, -1008.7705078125, -891.120361328125, -773.47021484375, -655.820068359375, -538.169921875, -420.519775390625, -302.86962890625, -185.21923828125, -67.569091796875, 50.0810546875, 167.731201171875, 285.38134765625, 403.031494140625, 520.681640625, 638.331787109375, 755.98193359375, 873.632080078125, 991.2822265625, 1108.932373046875, 1226.58251953125, 1344.232666015625, 1461.8828125, 1579.532958984375, 1697.18310546875, 1814.833251953125, 1932.4833984375, 2050.133544921875, 2167.78369140625, 2285.433837890625, 2403.083984375, 2520.734130859375, 2638.38427734375, 2756.034423828125, 2873.6845703125, 2991.334716796875, 3108.98486328125, 3226.635009765625, 3344.28515625, 3461.935302734375, 3579.58544921875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [5.0, 2.0, 10.0, 13.0, 19.0, 20.0, 48.0, 44.0, 98.0, 102.0, 156.0, 250.0, 384.0, 635.0, 873.0, 1407.0, 1975.0, 2891.0, 4386.0, 6686.0, 10199.0, 15661.0, 24655.0, 37671.0, 57893.0, 89095.0, 135667.0, 203810.0, 294215.0, 415767.0, 3460216.0, 530213.0, 326457.0, 227738.0, 153931.0, 101321.0, 65161.0, 42226.0, 27323.0, 17923.0, 11706.0, 7735.0, 4873.0, 3273.0, 2217.0, 1495.0, 1012.0, 636.0, 456.0, 311.0, 179.0, 140.0, 114.0, 61.0, 40.0, 23.0, 10.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 4.0], "bins": [-0.98876953125, -0.9565048217773438, -0.9242401123046875, -0.8919754028320312, -0.859710693359375, -0.8274459838867188, -0.7951812744140625, -0.7629165649414062, -0.73065185546875, -0.6983871459960938, -0.6661224365234375, -0.6338577270507812, -0.601593017578125, -0.5693283081054688, -0.5370635986328125, -0.5047988891601562, -0.4725341796875, -0.44026947021484375, -0.4080047607421875, -0.37574005126953125, -0.343475341796875, -0.31121063232421875, -0.2789459228515625, -0.24668121337890625, -0.21441650390625, -0.18215179443359375, -0.1498870849609375, -0.11762237548828125, -0.085357666015625, -0.05309295654296875, -0.0208282470703125, 0.01143646240234375, 0.043701171875, 0.07596588134765625, 0.1082305908203125, 0.14049530029296875, 0.172760009765625, 0.20502471923828125, 0.2372894287109375, 0.26955413818359375, 0.30181884765625, 0.33408355712890625, 0.3663482666015625, 0.39861297607421875, 0.430877685546875, 0.46314239501953125, 0.4954071044921875, 0.5276718139648438, 0.5599365234375, 0.5922012329101562, 0.6244659423828125, 0.6567306518554688, 0.688995361328125, 0.7212600708007812, 0.7535247802734375, 0.7857894897460938, 0.81805419921875, 0.8503189086914062, 0.8825836181640625, 0.9148483276367188, 0.947113037109375, 0.9793777465820312, 1.0116424560546875, 1.0439071655273438, 1.076171875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 1.0, 5.0, 9.0, 7.0, 10.0, 8.0, 17.0, 16.0, 19.0, 22.0, 33.0, 32.0, 32.0, 31.0, 28.0, 37.0, 33.0, 43.0, 50.0, 235.0, 854.0, 58.0, 32.0, 33.0, 25.0, 38.0, 42.0, 37.0, 33.0, 30.0, 22.0, 26.0, 21.0, 18.0, 19.0, 13.0, 11.0, 7.0, 9.0, 4.0, 3.0, 3.0, 7.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8046875, -10.4908447265625, -10.177001953125, -9.8631591796875, -9.54931640625, -9.2354736328125, -8.921630859375, -8.6077880859375, -8.2939453125, -7.9801025390625, -7.666259765625, -7.3524169921875, -7.03857421875, -6.7247314453125, -6.410888671875, -6.0970458984375, -5.783203125, -5.4693603515625, -5.155517578125, -4.8416748046875, -4.52783203125, -4.2139892578125, -3.900146484375, -3.5863037109375, -3.2724609375, -2.9586181640625, -2.644775390625, -2.3309326171875, -2.01708984375, -1.7032470703125, -1.389404296875, -1.0755615234375, -0.76171875, -0.4478759765625, -0.134033203125, 0.1798095703125, 0.49365234375, 0.8074951171875, 1.121337890625, 1.4351806640625, 1.7490234375, 2.0628662109375, 2.376708984375, 2.6905517578125, 3.00439453125, 3.3182373046875, 3.632080078125, 3.9459228515625, 4.259765625, 4.5736083984375, 4.887451171875, 5.2012939453125, 5.51513671875, 5.8289794921875, 6.142822265625, 6.4566650390625, 6.7705078125, 7.0843505859375, 7.398193359375, 7.7120361328125, 8.02587890625, 8.3397216796875, 8.653564453125, 8.9674072265625, 9.28125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 11.0, 13.0, 18.0, 30.0, 45.0, 55.0, 77.0, 132.0, 171.0, 234.0, 333.0, 531.0, 756.0, 1176.0, 1654.0, 2509.0, 3712.0, 5889.0, 9277.0, 14619.0, 23564.0, 40509.0, 71329.0, 127116.0, 230793.0, 412105.0, 1726458.0, 2624920.0, 430468.0, 241871.0, 133743.0, 74929.0, 43402.0, 25458.0, 15925.0, 9797.0, 6101.0, 3845.0, 2541.0, 1684.0, 1180.0, 799.0, 539.0, 373.0, 242.0, 135.0, 119.0, 80.0, 62.0, 39.0, 26.0, 20.0, 16.0, 4.0, 6.0, 1.0, 1.0, 3.0], "bins": [-1.58203125, -1.534149169921875, -1.48626708984375, -1.438385009765625, -1.3905029296875, -1.342620849609375, -1.29473876953125, -1.246856689453125, -1.198974609375, -1.151092529296875, -1.10321044921875, -1.055328369140625, -1.0074462890625, -0.959564208984375, -0.91168212890625, -0.863800048828125, -0.81591796875, -0.768035888671875, -0.72015380859375, -0.672271728515625, -0.6243896484375, -0.576507568359375, -0.52862548828125, -0.480743408203125, -0.432861328125, -0.384979248046875, -0.33709716796875, -0.289215087890625, -0.2413330078125, -0.193450927734375, -0.14556884765625, -0.097686767578125, -0.0498046875, -0.001922607421875, 0.04595947265625, 0.093841552734375, 0.1417236328125, 0.189605712890625, 0.23748779296875, 0.285369873046875, 0.333251953125, 0.381134033203125, 0.42901611328125, 0.476898193359375, 0.5247802734375, 0.572662353515625, 0.62054443359375, 0.668426513671875, 0.71630859375, 0.764190673828125, 0.81207275390625, 0.859954833984375, 0.9078369140625, 0.955718994140625, 1.00360107421875, 1.051483154296875, 1.099365234375, 1.147247314453125, 1.19512939453125, 1.243011474609375, 1.2908935546875, 1.338775634765625, 1.38665771484375, 1.434539794921875, 1.482421875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 12.0, 15.0, 12.0, 22.0, 18.0, 23.0, 30.0, 27.0, 33.0, 27.0, 43.0, 43.0, 33.0, 64.0, 139.0, 915.0, 94.0, 38.0, 39.0, 43.0, 39.0, 44.0, 40.0, 45.0, 29.0, 35.0, 28.0, 22.0, 17.0, 10.0, 6.0, 4.0, 4.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5546875, -8.266845703125, -7.97900390625, -7.691162109375, -7.4033203125, -7.115478515625, -6.82763671875, -6.539794921875, -6.251953125, -5.964111328125, -5.67626953125, -5.388427734375, -5.1005859375, -4.812744140625, -4.52490234375, -4.237060546875, -3.94921875, -3.661376953125, -3.37353515625, -3.085693359375, -2.7978515625, -2.510009765625, -2.22216796875, -1.934326171875, -1.646484375, -1.358642578125, -1.07080078125, -0.782958984375, -0.4951171875, -0.207275390625, 0.08056640625, 0.368408203125, 0.65625, 0.944091796875, 1.23193359375, 1.519775390625, 1.8076171875, 2.095458984375, 2.38330078125, 2.671142578125, 2.958984375, 3.246826171875, 3.53466796875, 3.822509765625, 4.1103515625, 4.398193359375, 4.68603515625, 4.973876953125, 5.26171875, 5.549560546875, 5.83740234375, 6.125244140625, 6.4130859375, 6.700927734375, 6.98876953125, 7.276611328125, 7.564453125, 7.852294921875, 8.14013671875, 8.427978515625, 8.7158203125, 9.003662109375, 9.29150390625, 9.579345703125, 9.8671875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 13.0, 18.0, 31.0, 48.0, 56.0, 119.0, 170.0, 297.0, 503.0, 852.0, 1556.0, 3234.0, 7772.0, 27150.0, 209948.0, 5960213.0, 57262.0, 12772.0, 4666.0, 2126.0, 1102.0, 557.0, 366.0, 191.0, 160.0, 92.0, 56.0, 35.0, 24.0, 12.0, 8.0, 7.0, 1.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.390625, -12.961669921875, -12.53271484375, -12.103759765625, -11.6748046875, -11.245849609375, -10.81689453125, -10.387939453125, -9.958984375, -9.530029296875, -9.10107421875, -8.672119140625, -8.2431640625, -7.814208984375, -7.38525390625, -6.956298828125, -6.52734375, -6.098388671875, -5.66943359375, -5.240478515625, -4.8115234375, -4.382568359375, -3.95361328125, -3.524658203125, -3.095703125, -2.666748046875, -2.23779296875, -1.808837890625, -1.3798828125, -0.950927734375, -0.52197265625, -0.093017578125, 0.3359375, 0.764892578125, 1.19384765625, 1.622802734375, 2.0517578125, 2.480712890625, 2.90966796875, 3.338623046875, 3.767578125, 4.196533203125, 4.62548828125, 5.054443359375, 5.4833984375, 5.912353515625, 6.34130859375, 6.770263671875, 7.19921875, 7.628173828125, 8.05712890625, 8.486083984375, 8.9150390625, 9.343994140625, 9.77294921875, 10.201904296875, 10.630859375, 11.059814453125, 11.48876953125, 11.917724609375, 12.3466796875, 12.775634765625, 13.20458984375, 13.633544921875, 14.0625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 8.0, 5.0, 9.0, 14.0, 17.0, 16.0, 26.0, 32.0, 34.0, 40.0, 36.0, 41.0, 37.0, 46.0, 62.0, 238.0, 856.0, 74.0, 41.0, 41.0, 52.0, 38.0, 45.0, 31.0, 33.0, 24.0, 19.0, 18.0, 15.0, 10.0, 11.0, 8.0, 7.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.8125, -8.55670166015625, -8.3009033203125, -8.04510498046875, -7.789306640625, -7.53350830078125, -7.2777099609375, -7.02191162109375, -6.76611328125, -6.51031494140625, -6.2545166015625, -5.99871826171875, -5.742919921875, -5.48712158203125, -5.2313232421875, -4.97552490234375, -4.7197265625, -4.46392822265625, -4.2081298828125, -3.95233154296875, -3.696533203125, -3.44073486328125, -3.1849365234375, -2.92913818359375, -2.67333984375, -2.41754150390625, -2.1617431640625, -1.90594482421875, -1.650146484375, -1.39434814453125, -1.1385498046875, -0.88275146484375, -0.626953125, -0.37115478515625, -0.1153564453125, 0.14044189453125, 0.396240234375, 0.65203857421875, 0.9078369140625, 1.16363525390625, 1.41943359375, 1.67523193359375, 1.9310302734375, 2.18682861328125, 2.442626953125, 2.69842529296875, 2.9542236328125, 3.21002197265625, 3.4658203125, 3.72161865234375, 3.9774169921875, 4.23321533203125, 4.489013671875, 4.74481201171875, 5.0006103515625, 5.25640869140625, 5.51220703125, 5.76800537109375, 6.0238037109375, 6.27960205078125, 6.535400390625, 6.79119873046875, 7.0469970703125, 7.30279541015625, 7.55859375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 15.0, 27.0, 105.0, 505.0, 295.0, 45.0, 10.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.380470275878906, -35.396690368652344, -33.41291046142578, -31.429128646850586, -29.44534683227539, -27.461566925048828, -25.477787017822266, -23.494007110595703, -21.510225296020508, -19.526445388793945, -17.54266357421875, -15.558883666992188, -13.575102806091309, -11.59132194519043, -9.607542037963867, -7.623761177062988, -5.639980316162109, -3.6561996936798096, -1.6724190711975098, 0.31136131286621094, 2.29514217376709, 4.278923034667969, 6.262702941894531, 8.24648380279541, 10.230264663696289, 12.214045524597168, 14.197826385498047, 16.18160629272461, 18.165386199951172, 20.149168014526367, 22.13294792175293, 24.116729736328125, 26.100509643554688, 28.08428955078125, 30.068071365356445, 32.051849365234375, 34.0356330871582, 36.019412994384766, 38.00319290161133, 39.98697280883789, 41.97075653076172, 43.95453643798828, 45.938316345214844, 47.922096252441406, 49.905879974365234, 51.8896598815918, 53.87343978881836, 55.85721969604492, 57.840999603271484, 59.82477951049805, 61.80855941772461, 63.79234313964844, 65.776123046875, 67.75990295410156, 69.74368286132812, 71.72746276855469, 73.71124267578125, 75.69502258300781, 77.67880249023438, 79.66258239746094, 81.6463623046875, 83.63014221191406, 85.61392211914062, 87.59770965576172, 89.58148956298828]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 5.0, 7.0, 10.0, 12.0, 17.0, 14.0, 39.0, 37.0, 54.0, 76.0, 76.0, 109.0, 89.0, 86.0, 68.0, 86.0, 54.0, 44.0, 21.0, 29.0, 15.0, 12.0, 14.0, 5.0, 6.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.823284149169922, -26.987491607666016, -26.151697158813477, -25.31590461730957, -24.48011016845703, -23.644317626953125, -22.80852508544922, -21.972732543945312, -21.136938095092773, -20.301145553588867, -19.465351104736328, -18.629558563232422, -17.793766021728516, -16.957971572875977, -16.12217903137207, -15.286385536193848, -14.450592041015625, -13.614798545837402, -12.77900505065918, -11.943212509155273, -11.10741901397705, -10.271625518798828, -9.435832977294922, -8.6000394821167, -7.764245986938477, -6.928452491760254, -6.0926594734191895, -5.256866455078125, -4.421072959899902, -3.5852794647216797, -2.7494864463806152, -1.9136934280395508, -1.0778999328613281, -0.24210667610168457, 0.593686580657959, 1.4294798374176025, 2.265273094177246, 3.1010665893554688, 3.936859607696533, 4.772652626037598, 5.60844612121582, 6.444239616394043, 7.280032634735107, 8.115825653076172, 8.951619148254395, 9.787412643432617, 10.623205184936523, 11.458998680114746, 12.294792175292969, 13.130585670471191, 13.966379165649414, 14.80217170715332, 15.637965202331543, 16.473758697509766, 17.309551239013672, 18.145343780517578, 18.981138229370117, 19.816930770874023, 20.652725219726562, 21.48851776123047, 22.324310302734375, 23.160104751586914, 23.99589729309082, 24.83169174194336, 25.667484283447266]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 8.0, 21.0, 15.0, 30.0, 36.0, 48.0, 85.0, 107.0, 160.0, 226.0, 334.0, 488.0, 843.0, 1529.0, 2899.0, 6189.0, 19250.0, 267553.0, 3848261.0, 28294.0, 8487.0, 3791.0, 1978.0, 1137.0, 755.0, 526.0, 341.0, 227.0, 165.0, 132.0, 86.0, 74.0, 46.0, 47.0, 25.0, 18.0, 14.0, 10.0, 11.0, 4.0, 6.0, 9.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.36572265625, -0.3527069091796875, -0.339691162109375, -0.3266754150390625, -0.31365966796875, -0.3006439208984375, -0.287628173828125, -0.2746124267578125, -0.2615966796875, -0.2485809326171875, -0.235565185546875, -0.2225494384765625, -0.20953369140625, -0.1965179443359375, -0.183502197265625, -0.1704864501953125, -0.157470703125, -0.1444549560546875, -0.131439208984375, -0.1184234619140625, -0.10540771484375, -0.0923919677734375, -0.079376220703125, -0.0663604736328125, -0.0533447265625, -0.0403289794921875, -0.027313232421875, -0.0142974853515625, -0.00128173828125, 0.0117340087890625, 0.024749755859375, 0.0377655029296875, 0.05078125, 0.0637969970703125, 0.076812744140625, 0.0898284912109375, 0.10284423828125, 0.1158599853515625, 0.128875732421875, 0.1418914794921875, 0.1549072265625, 0.1679229736328125, 0.180938720703125, 0.1939544677734375, 0.20697021484375, 0.2199859619140625, 0.233001708984375, 0.2460174560546875, 0.259033203125, 0.2720489501953125, 0.285064697265625, 0.2980804443359375, 0.31109619140625, 0.3241119384765625, 0.337127685546875, 0.3501434326171875, 0.3631591796875, 0.3761749267578125, 0.389190673828125, 0.4022064208984375, 0.41522216796875, 0.4282379150390625, 0.441253662109375, 0.4542694091796875, 0.46728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 9.0, 10.0, 7.0, 10.0, 19.0, 19.0, 215.0, 586.0, 15.0, 15.0, 10.0, 12.0, 12.0, 7.0, 2.0, 5.0, 4.0, 4.0, 2.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08587646484375, -0.08260536193847656, -0.07933425903320312, -0.07606315612792969, -0.07279205322265625, -0.06952095031738281, -0.06624984741210938, -0.06297874450683594, -0.0597076416015625, -0.05643653869628906, -0.053165435791015625, -0.04989433288574219, -0.04662322998046875, -0.04335212707519531, -0.040081024169921875, -0.03680992126464844, -0.033538818359375, -0.030267715454101562, -0.026996612548828125, -0.023725509643554688, -0.02045440673828125, -0.017183303833007812, -0.013912200927734375, -0.010641098022460938, -0.0073699951171875, -0.0040988922119140625, -0.000827789306640625, 0.0024433135986328125, 0.00571441650390625, 0.008985519409179688, 0.012256622314453125, 0.015527725219726562, 0.018798828125, 0.022069931030273438, 0.025341033935546875, 0.028612136840820312, 0.03188323974609375, 0.03515434265136719, 0.038425445556640625, 0.04169654846191406, 0.0449676513671875, 0.04823875427246094, 0.051509857177734375, 0.05478096008300781, 0.05805206298828125, 0.06132316589355469, 0.06459426879882812, 0.06786537170410156, 0.071136474609375, 0.07440757751464844, 0.07767868041992188, 0.08094978332519531, 0.08422088623046875, 0.08749198913574219, 0.09076309204101562, 0.09403419494628906, 0.0973052978515625, 0.10057640075683594, 0.10384750366210938, 0.10711860656738281, 0.11038970947265625, 0.11366081237792969, 0.11693191528320312, 0.12020301818847656, 0.12347412109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 7.0, 9.0, 16.0, 23.0, 22.0, 39.0, 54.0, 85.0, 118.0, 218.0, 338.0, 621.0, 1319.0, 2945.0, 7330.0, 22733.0, 113413.0, 3676197.0, 315887.0, 34448.0, 10277.0, 4192.0, 1839.0, 882.0, 539.0, 277.0, 165.0, 97.0, 47.0, 39.0, 33.0, 16.0, 9.0, 7.0, 8.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.32373046875, -0.31317901611328125, -0.3026275634765625, -0.29207611083984375, -0.281524658203125, -0.27097320556640625, -0.2604217529296875, -0.24987030029296875, -0.23931884765625, -0.22876739501953125, -0.2182159423828125, -0.20766448974609375, -0.197113037109375, -0.18656158447265625, -0.1760101318359375, -0.16545867919921875, -0.1549072265625, -0.14435577392578125, -0.1338043212890625, -0.12325286865234375, -0.112701416015625, -0.10214996337890625, -0.0915985107421875, -0.08104705810546875, -0.07049560546875, -0.05994415283203125, -0.0493927001953125, -0.03884124755859375, -0.028289794921875, -0.01773834228515625, -0.0071868896484375, 0.00336456298828125, 0.013916015625, 0.02446746826171875, 0.0350189208984375, 0.04557037353515625, 0.056121826171875, 0.06667327880859375, 0.0772247314453125, 0.08777618408203125, 0.09832763671875, 0.10887908935546875, 0.1194305419921875, 0.12998199462890625, 0.140533447265625, 0.15108489990234375, 0.1616363525390625, 0.17218780517578125, 0.1827392578125, 0.19329071044921875, 0.2038421630859375, 0.21439361572265625, 0.224945068359375, 0.23549652099609375, 0.2460479736328125, 0.25659942626953125, 0.26715087890625, 0.27770233154296875, 0.2882537841796875, 0.29880523681640625, 0.309356689453125, 0.31990814208984375, 0.3304595947265625, 0.34101104736328125, 0.3515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 11.0, 16.0, 20.0, 23.0, 23.0, 34.0, 68.0, 145.0, 320.0, 1486.0, 1294.0, 295.0, 136.0, 60.0, 35.0, 22.0, 20.0, 7.0, 4.0, 7.0, 4.0, 6.0, 3.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.161865234375, -0.15723419189453125, -0.1526031494140625, -0.14797210693359375, -0.143341064453125, -0.13871002197265625, -0.1340789794921875, -0.12944793701171875, -0.12481689453125, -0.12018585205078125, -0.1155548095703125, -0.11092376708984375, -0.106292724609375, -0.10166168212890625, -0.0970306396484375, -0.09239959716796875, -0.0877685546875, -0.08313751220703125, -0.0785064697265625, -0.07387542724609375, -0.069244384765625, -0.06461334228515625, -0.0599822998046875, -0.05535125732421875, -0.05072021484375, -0.04608917236328125, -0.0414581298828125, -0.03682708740234375, -0.032196044921875, -0.02756500244140625, -0.0229339599609375, -0.01830291748046875, -0.013671875, -0.00904083251953125, -0.0044097900390625, 0.00022125244140625, 0.004852294921875, 0.00948333740234375, 0.0141143798828125, 0.01874542236328125, 0.02337646484375, 0.02800750732421875, 0.0326385498046875, 0.03726959228515625, 0.041900634765625, 0.04653167724609375, 0.0511627197265625, 0.05579376220703125, 0.0604248046875, 0.06505584716796875, 0.0696868896484375, 0.07431793212890625, 0.078948974609375, 0.08358001708984375, 0.0882110595703125, 0.09284210205078125, 0.09747314453125, 0.10210418701171875, 0.1067352294921875, 0.11136627197265625, 0.115997314453125, 0.12062835693359375, 0.1252593994140625, 0.12989044189453125, 0.134521484375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 13.0, 40.0, 212.0, 568.0, 139.0, 26.0, 7.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4585137367248535, -2.405585527420044, -2.3526575565338135, -2.299729347229004, -2.2468013763427734, -2.193873167037964, -2.1409449577331543, -2.088016986846924, -2.0350887775421143, -1.9821606874465942, -1.9292325973510742, -1.8763043880462646, -1.8233762979507446, -1.7704482078552246, -1.7175201177597046, -1.6645920276641846, -1.6116639375686646, -1.5587358474731445, -1.5058077573776245, -1.4528796672821045, -1.399951457977295, -1.347023367881775, -1.2940952777862549, -1.2411671876907349, -1.1882390975952148, -1.1353110074996948, -1.0823829174041748, -1.0294547080993652, -0.9765266180038452, -0.9235985279083252, -0.8706704378128052, -0.8177423477172852, -0.764814019203186, -0.711885929107666, -0.6589577794075012, -0.6060296893119812, -0.5531015396118164, -0.5001734495162964, -0.44724535942077637, -0.39431723952293396, -0.34138911962509155, -0.28846099972724915, -0.23553289473056793, -0.18260478973388672, -0.1296766698360443, -0.0767485499382019, -0.023820459842681885, 0.029107660055160522, 0.08203577995300293, 0.13496389985084534, 0.18789200484752655, 0.24082010984420776, 0.29374822974205017, 0.3466763496398926, 0.3996044397354126, 0.452532559633255, 0.5054606795310974, 0.5583887696266174, 0.6113169193267822, 0.6642450094223022, 0.7171730995178223, 0.7701012492179871, 0.8230293393135071, 0.8759574890136719, 0.9288855791091919]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 2.0, 4.0, 7.0, 6.0, 7.0, 9.0, 8.0, 22.0, 15.0, 28.0, 28.0, 48.0, 33.0, 43.0, 63.0, 66.0, 67.0, 62.0, 60.0, 72.0, 61.0, 61.0, 56.0, 33.0, 25.0, 21.0, 21.0, 16.0, 14.0, 6.0, 9.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4421434998512268, -0.42885932326316833, -0.41557517647743225, -0.4022909998893738, -0.3890068233013153, -0.37572264671325684, -0.36243849992752075, -0.3491543233394623, -0.3358701467514038, -0.32258597016334534, -0.30930182337760925, -0.2960176467895508, -0.2827334702014923, -0.26944929361343384, -0.25616514682769775, -0.24288097023963928, -0.2295968234539032, -0.21631266176700592, -0.20302848517894745, -0.18974432349205017, -0.1764601469039917, -0.16317598521709442, -0.14989182353019714, -0.13660764694213867, -0.1233234852552414, -0.11003931611776352, -0.09675514698028564, -0.08347098529338837, -0.07018681615591049, -0.05690264701843262, -0.04361848533153534, -0.030334316194057465, -0.01705014705657959, -0.0037659797817468643, 0.009518187493085861, 0.022802352905273438, 0.03608652204275131, 0.04937069118022919, 0.06265485286712646, 0.07593902200460434, 0.08922319114208221, 0.10250736027956009, 0.11579152941703796, 0.12907569110393524, 0.14235985279083252, 0.155644029378891, 0.16892819106578827, 0.18221235275268555, 0.19549652934074402, 0.2087806910276413, 0.22206486761569977, 0.23534902930259705, 0.24863320589065552, 0.2619173526763916, 0.2752015292644501, 0.28848570585250854, 0.30176985263824463, 0.3150540292263031, 0.3283381760120392, 0.34162235260009766, 0.35490652918815613, 0.3681907057762146, 0.3814748525619507, 0.39475902915000916, 0.4080432057380676]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 12.0, 22.0, 39.0, 49.0, 79.0, 113.0, 171.0, 259.0, 457.0, 786.0, 1318.0, 2156.0, 3820.0, 7611.0, 15885.0, 41856.0, 888592.0, 49255.0, 17633.0, 8203.0, 4316.0, 2347.0, 1320.0, 809.0, 510.0, 330.0, 220.0, 126.0, 77.0, 42.0, 37.0, 21.0, 25.0, 14.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61962890625, -0.6016998291015625, -0.583770751953125, -0.5658416748046875, -0.54791259765625, -0.5299835205078125, -0.512054443359375, -0.4941253662109375, -0.4761962890625, -0.4582672119140625, -0.440338134765625, -0.4224090576171875, -0.40447998046875, -0.3865509033203125, -0.368621826171875, -0.3506927490234375, -0.332763671875, -0.3148345947265625, -0.296905517578125, -0.2789764404296875, -0.26104736328125, -0.2431182861328125, -0.225189208984375, -0.2072601318359375, -0.1893310546875, -0.1714019775390625, -0.153472900390625, -0.1355438232421875, -0.11761474609375, -0.0996856689453125, -0.081756591796875, -0.0638275146484375, -0.0458984375, -0.0279693603515625, -0.010040283203125, 0.0078887939453125, 0.02581787109375, 0.0437469482421875, 0.061676025390625, 0.0796051025390625, 0.0975341796875, 0.1154632568359375, 0.133392333984375, 0.1513214111328125, 0.16925048828125, 0.1871795654296875, 0.205108642578125, 0.2230377197265625, 0.240966796875, 0.2588958740234375, 0.276824951171875, 0.2947540283203125, 0.31268310546875, 0.3306121826171875, 0.348541259765625, 0.3664703369140625, 0.3843994140625, 0.4023284912109375, 0.420257568359375, 0.4381866455078125, 0.45611572265625, 0.4740447998046875, 0.491973876953125, 0.5099029541015625, 0.52783203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 6.0, 5.0, 9.0, 11.0, 14.0, 14.0, 15.0, 106.0, 572.0, 140.0, 16.0, 18.0, 7.0, 6.0, 11.0, 6.0, 5.0, 9.0, 2.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.07566452026367188, -0.07247161865234375, -0.06927871704101562, -0.0660858154296875, -0.06289291381835938, -0.05970001220703125, -0.056507110595703125, -0.053314208984375, -0.050121307373046875, -0.04692840576171875, -0.043735504150390625, -0.0405426025390625, -0.037349700927734375, -0.03415679931640625, -0.030963897705078125, -0.02777099609375, -0.024578094482421875, -0.02138519287109375, -0.018192291259765625, -0.0149993896484375, -0.011806488037109375, -0.00861358642578125, -0.005420684814453125, -0.002227783203125, 0.000965118408203125, 0.00415802001953125, 0.007350921630859375, 0.0105438232421875, 0.013736724853515625, 0.01692962646484375, 0.020122528076171875, 0.0233154296875, 0.026508331298828125, 0.02970123291015625, 0.032894134521484375, 0.0360870361328125, 0.039279937744140625, 0.04247283935546875, 0.045665740966796875, 0.048858642578125, 0.052051544189453125, 0.05524444580078125, 0.058437347412109375, 0.0616302490234375, 0.06482315063476562, 0.06801605224609375, 0.07120895385742188, 0.07440185546875, 0.07759475708007812, 0.08078765869140625, 0.08398056030273438, 0.0871734619140625, 0.09036636352539062, 0.09355926513671875, 0.09675216674804688, 0.099945068359375, 0.10313796997070312, 0.10633087158203125, 0.10952377319335938, 0.1127166748046875, 0.11590957641601562, 0.11910247802734375, 0.12229537963867188, 0.12548828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 12.0, 22.0, 21.0, 50.0, 62.0, 124.0, 173.0, 348.0, 554.0, 1234.0, 3098.0, 9634.0, 43561.0, 313602.0, 570693.0, 82133.0, 15344.0, 4404.0, 1670.0, 772.0, 386.0, 217.0, 160.0, 93.0, 46.0, 37.0, 24.0, 17.0, 11.0, 13.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43603515625, -0.42108917236328125, -0.4061431884765625, -0.39119720458984375, -0.376251220703125, -0.36130523681640625, -0.3463592529296875, -0.33141326904296875, -0.31646728515625, -0.30152130126953125, -0.2865753173828125, -0.27162933349609375, -0.256683349609375, -0.24173736572265625, -0.2267913818359375, -0.21184539794921875, -0.1968994140625, -0.18195343017578125, -0.1670074462890625, -0.15206146240234375, -0.137115478515625, -0.12216949462890625, -0.1072235107421875, -0.09227752685546875, -0.07733154296875, -0.06238555908203125, -0.0474395751953125, -0.03249359130859375, -0.017547607421875, -0.00260162353515625, 0.0123443603515625, 0.02729034423828125, 0.042236328125, 0.05718231201171875, 0.0721282958984375, 0.08707427978515625, 0.102020263671875, 0.11696624755859375, 0.1319122314453125, 0.14685821533203125, 0.16180419921875, 0.17675018310546875, 0.1916961669921875, 0.20664215087890625, 0.221588134765625, 0.23653411865234375, 0.2514801025390625, 0.26642608642578125, 0.2813720703125, 0.29631805419921875, 0.3112640380859375, 0.32621002197265625, 0.341156005859375, 0.35610198974609375, 0.3710479736328125, 0.38599395751953125, 0.40093994140625, 0.41588592529296875, 0.4308319091796875, 0.44577789306640625, 0.460723876953125, 0.47566986083984375, 0.4906158447265625, 0.5055618286132812, 0.5205078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 8.0, 3.0, 6.0, 6.0, 9.0, 11.0, 11.0, 19.0, 18.0, 27.0, 16.0, 28.0, 30.0, 28.0, 36.0, 25.0, 35.0, 29.0, 38.0, 36.0, 46.0, 35.0, 64.0, 36.0, 54.0, 34.0, 32.0, 38.0, 26.0, 45.0, 31.0, 20.0, 14.0, 21.0, 17.0, 11.0, 6.0, 14.0, 16.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298583984375, -0.28871917724609375, -0.2788543701171875, -0.26898956298828125, -0.259124755859375, -0.24925994873046875, -0.2393951416015625, -0.22953033447265625, -0.21966552734375, -0.20980072021484375, -0.1999359130859375, -0.19007110595703125, -0.180206298828125, -0.17034149169921875, -0.1604766845703125, -0.15061187744140625, -0.1407470703125, -0.13088226318359375, -0.1210174560546875, -0.11115264892578125, -0.101287841796875, -0.09142303466796875, -0.0815582275390625, -0.07169342041015625, -0.06182861328125, -0.05196380615234375, -0.0420989990234375, -0.03223419189453125, -0.022369384765625, -0.01250457763671875, -0.0026397705078125, 0.00722503662109375, 0.01708984375, 0.02695465087890625, 0.0368194580078125, 0.04668426513671875, 0.056549072265625, 0.06641387939453125, 0.0762786865234375, 0.08614349365234375, 0.09600830078125, 0.10587310791015625, 0.1157379150390625, 0.12560272216796875, 0.135467529296875, 0.14533233642578125, 0.1551971435546875, 0.16506195068359375, 0.1749267578125, 0.18479156494140625, 0.1946563720703125, 0.20452117919921875, 0.214385986328125, 0.22425079345703125, 0.2341156005859375, 0.24398040771484375, 0.25384521484375, 0.26371002197265625, 0.2735748291015625, 0.28343963623046875, 0.293304443359375, 0.30316925048828125, 0.3130340576171875, 0.32289886474609375, 0.332763671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 10.0, 13.0, 25.0, 28.0, 50.0, 95.0, 141.0, 270.0, 535.0, 1328.0, 4437.0, 30374.0, 951660.0, 50990.0, 5679.0, 1549.0, 604.0, 318.0, 168.0, 92.0, 50.0, 35.0, 29.0, 11.0, 13.0, 5.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.618682861328125, -0.59625244140625, -0.573822021484375, -0.5513916015625, -0.528961181640625, -0.50653076171875, -0.484100341796875, -0.461669921875, -0.439239501953125, -0.41680908203125, -0.394378662109375, -0.3719482421875, -0.349517822265625, -0.32708740234375, -0.304656982421875, -0.2822265625, -0.259796142578125, -0.23736572265625, -0.214935302734375, -0.1925048828125, -0.170074462890625, -0.14764404296875, -0.125213623046875, -0.102783203125, -0.080352783203125, -0.05792236328125, -0.035491943359375, -0.0130615234375, 0.009368896484375, 0.03179931640625, 0.054229736328125, 0.07666015625, 0.099090576171875, 0.12152099609375, 0.143951416015625, 0.1663818359375, 0.188812255859375, 0.21124267578125, 0.233673095703125, 0.256103515625, 0.278533935546875, 0.30096435546875, 0.323394775390625, 0.3458251953125, 0.368255615234375, 0.39068603515625, 0.413116455078125, 0.435546875, 0.457977294921875, 0.48040771484375, 0.502838134765625, 0.5252685546875, 0.547698974609375, 0.57012939453125, 0.592559814453125, 0.614990234375, 0.637420654296875, 0.65985107421875, 0.682281494140625, 0.7047119140625, 0.727142333984375, 0.74957275390625, 0.772003173828125, 0.79443359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 15.0, 26.0, 43.0, 135.0, 469.0, 161.0, 62.0, 33.0, 15.0, 10.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001132965087890625, -0.0011035650968551636, -0.0010741651058197021, -0.0010447651147842407, -0.0010153651237487793, -0.0009859651327133179, -0.0009565651416778564, -0.000927165150642395, -0.0008977651596069336, -0.0008683651685714722, -0.0008389651775360107, -0.0008095651865005493, -0.0007801651954650879, -0.0007507652044296265, -0.000721365213394165, -0.0006919652223587036, -0.0006625652313232422, -0.0006331652402877808, -0.0006037652492523193, -0.0005743652582168579, -0.0005449652671813965, -0.0005155652761459351, -0.00048616528511047363, -0.0004567652940750122, -0.0004273653030395508, -0.00039796531200408936, -0.00036856532096862793, -0.0003391653299331665, -0.0003097653388977051, -0.00028036534786224365, -0.0002509653568267822, -0.0002215653657913208, -0.00019216537475585938, -0.00016276538372039795, -0.00013336539268493652, -0.0001039654016494751, -7.456541061401367e-05, -4.5165419578552246e-05, -1.576542854309082e-05, 1.3634562492370605e-05, 4.303455352783203e-05, 7.243454456329346e-05, 0.00010183453559875488, 0.0001312345266342163, 0.00016063451766967773, 0.00019003450870513916, 0.00021943449974060059, 0.000248834490776062, 0.00027823448181152344, 0.00030763447284698486, 0.0003370344638824463, 0.0003664344549179077, 0.00039583444595336914, 0.00042523443698883057, 0.000454634428024292, 0.0004840344190597534, 0.0005134344100952148, 0.0005428344011306763, 0.0005722343921661377, 0.0006016343832015991, 0.0006310343742370605, 0.000660434365272522, 0.0006898343563079834, 0.0007192343473434448, 0.0007486343383789062]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 4.0, 9.0, 14.0, 18.0, 22.0, 29.0, 66.0, 75.0, 146.0, 264.0, 457.0, 942.0, 2222.0, 6227.0, 26643.0, 298306.0, 651915.0, 46450.0, 9327.0, 2943.0, 1123.0, 588.0, 310.0, 139.0, 111.0, 65.0, 45.0, 34.0, 20.0, 7.0, 13.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.425048828125, -0.4126014709472656, -0.40015411376953125, -0.3877067565917969, -0.3752593994140625, -0.3628120422363281, -0.35036468505859375, -0.3379173278808594, -0.325469970703125, -0.3130226135253906, -0.30057525634765625, -0.2881278991699219, -0.2756805419921875, -0.2632331848144531, -0.25078582763671875, -0.23833847045898438, -0.22589111328125, -0.21344375610351562, -0.20099639892578125, -0.18854904174804688, -0.1761016845703125, -0.16365432739257812, -0.15120697021484375, -0.13875961303710938, -0.126312255859375, -0.11386489868164062, -0.10141754150390625, -0.08897018432617188, -0.0765228271484375, -0.06407546997070312, -0.05162811279296875, -0.039180755615234375, -0.0267333984375, -0.014286041259765625, -0.00183868408203125, 0.010608673095703125, 0.0230560302734375, 0.035503387451171875, 0.04795074462890625, 0.060398101806640625, 0.072845458984375, 0.08529281616210938, 0.09774017333984375, 0.11018753051757812, 0.1226348876953125, 0.13508224487304688, 0.14752960205078125, 0.15997695922851562, 0.17242431640625, 0.18487167358398438, 0.19731903076171875, 0.20976638793945312, 0.2222137451171875, 0.23466110229492188, 0.24710845947265625, 0.2595558166503906, 0.272003173828125, 0.2844505310058594, 0.29689788818359375, 0.3093452453613281, 0.3217926025390625, 0.3342399597167969, 0.34668731689453125, 0.3591346740722656, 0.37158203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 6.0, 7.0, 14.0, 16.0, 29.0, 36.0, 43.0, 82.0, 112.0, 118.0, 96.0, 86.0, 87.0, 77.0, 46.0, 33.0, 32.0, 19.0, 22.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.44921875, -0.43688201904296875, -0.4245452880859375, -0.41220855712890625, -0.399871826171875, -0.38753509521484375, -0.3751983642578125, -0.36286163330078125, -0.35052490234375, -0.33818817138671875, -0.3258514404296875, -0.31351470947265625, -0.301177978515625, -0.28884124755859375, -0.2765045166015625, -0.26416778564453125, -0.2518310546875, -0.23949432373046875, -0.2271575927734375, -0.21482086181640625, -0.202484130859375, -0.19014739990234375, -0.1778106689453125, -0.16547393798828125, -0.15313720703125, -0.14080047607421875, -0.1284637451171875, -0.11612701416015625, -0.103790283203125, -0.09145355224609375, -0.0791168212890625, -0.06678009033203125, -0.054443359375, -0.04210662841796875, -0.0297698974609375, -0.01743316650390625, -0.005096435546875, 0.00724029541015625, 0.0195770263671875, 0.03191375732421875, 0.04425048828125, 0.05658721923828125, 0.0689239501953125, 0.08126068115234375, 0.093597412109375, 0.10593414306640625, 0.1182708740234375, 0.13060760498046875, 0.1429443359375, 0.15528106689453125, 0.1676177978515625, 0.17995452880859375, 0.192291259765625, 0.20462799072265625, 0.2169647216796875, 0.22930145263671875, 0.24163818359375, 0.25397491455078125, 0.2663116455078125, 0.27864837646484375, 0.290985107421875, 0.30332183837890625, 0.3156585693359375, 0.32799530029296875, 0.34033203125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 11.0, 17.0, 37.0, 69.0, 215.0, 369.0, 175.0, 48.0, 24.0, 10.0, 3.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.021965980529785, -5.831284999847412, -5.640604496002197, -5.449923515319824, -5.259242534637451, -5.068561553955078, -4.877881050109863, -4.68720006942749, -4.496519088745117, -4.305838108062744, -4.115157604217529, -3.9244766235351562, -3.733795642852783, -3.5431149005889893, -3.3524341583251953, -3.1617531776428223, -2.9710726737976074, -2.7803919315338135, -2.5897109508514404, -2.3990302085876465, -2.2083492279052734, -2.0176684856414795, -1.8269877433776855, -1.636306881904602, -1.4456260204315186, -1.254945158958435, -1.0642642974853516, -0.8735835552215576, -0.6829026937484741, -0.4922218322753906, -0.3015410900115967, -0.11086022853851318, 0.07982110977172852, 0.2705019414424896, 0.46118277311325073, 0.6518635749816895, 0.842544436454773, 1.0332252979278564, 1.2239060401916504, 1.4145869016647339, 1.6052677631378174, 1.7959486246109009, 1.9866294860839844, 2.1773102283477783, 2.3679909706115723, 2.5586719512939453, 2.7493526935577393, 2.940033435821533, 3.1307144165039062, 3.3213951587677, 3.5120761394500732, 3.702756881713867, 3.8934378623962402, 4.084118843078613, 4.274799346923828, 4.465480327606201, 4.656161308288574, 4.846842288970947, 5.037522792816162, 5.228203773498535, 5.418884754180908, 5.609565734863281, 5.800246238708496, 5.990927219390869, 6.181607723236084]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 11.0, 1.0, 1.0, 1.0, 7.0, 4.0, 15.0, 10.0, 20.0, 36.0, 55.0, 91.0, 120.0, 126.0, 124.0, 135.0, 82.0, 51.0, 32.0, 11.0, 21.0, 7.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 0.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.942081451416016, -6.730679512023926, -6.519277095794678, -6.307875156402588, -6.09647274017334, -5.88507080078125, -5.673668384552002, -5.462266445159912, -5.250864028930664, -5.039462089538574, -4.828059673309326, -4.616657733917236, -4.405255317687988, -4.193853378295898, -3.9824509620666504, -3.7710490226745605, -3.5596468448638916, -3.3482446670532227, -3.1368424892425537, -2.9254403114318848, -2.714038133621216, -2.502635955810547, -2.291234016418457, -2.079831600189209, -1.8684295415878296, -1.6570273637771606, -1.4456251859664917, -1.2342231273651123, -1.0228209495544434, -0.8114187717437744, -0.6000165939331055, -0.3886144161224365, -0.17721223831176758, 0.03418992459774017, 0.24559208750724792, 0.4569942355155945, 0.6683964133262634, 0.8797985315322876, 1.0912007093429565, 1.3026028871536255, 1.5140050649642944, 1.7254072427749634, 1.9368094205856323, 2.1482114791870117, 2.3596136569976807, 2.5710158348083496, 2.7824180126190186, 2.9938201904296875, 3.2052223682403564, 3.4166245460510254, 3.6280267238616943, 3.8394289016723633, 4.050830841064453, 4.262233257293701, 4.473635196685791, 4.685037612915039, 4.896439552307129, 5.107841491699219, 5.319243907928467, 5.530645847320557, 5.742048263549805, 5.9534502029418945, 6.164852619171143, 6.376254558563232, 6.5876569747924805]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 22.0, 47.0, 95.0, 328.0, 1278.0, 7537.0, 318178.0, 3851336.0, 12527.0, 2172.0, 467.0, 152.0, 42.0, 27.0, 18.0, 11.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0703125, -1.976531982421875, -1.88275146484375, -1.788970947265625, -1.6951904296875, -1.601409912109375, -1.50762939453125, -1.413848876953125, -1.320068359375, -1.226287841796875, -1.13250732421875, -1.038726806640625, -0.9449462890625, -0.851165771484375, -0.75738525390625, -0.663604736328125, -0.56982421875, -0.476043701171875, -0.38226318359375, -0.288482666015625, -0.1947021484375, -0.100921630859375, -0.00714111328125, 0.086639404296875, 0.180419921875, 0.274200439453125, 0.36798095703125, 0.461761474609375, 0.5555419921875, 0.649322509765625, 0.74310302734375, 0.836883544921875, 0.9306640625, 1.024444580078125, 1.11822509765625, 1.212005615234375, 1.3057861328125, 1.399566650390625, 1.49334716796875, 1.587127685546875, 1.680908203125, 1.774688720703125, 1.86846923828125, 1.962249755859375, 2.0560302734375, 2.149810791015625, 2.24359130859375, 2.337371826171875, 2.43115234375, 2.524932861328125, 2.61871337890625, 2.712493896484375, 2.8062744140625, 2.900054931640625, 2.99383544921875, 3.087615966796875, 3.181396484375, 3.275177001953125, 3.36895751953125, 3.462738037109375, 3.5565185546875, 3.650299072265625, 3.74407958984375, 3.837860107421875, 3.931640625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 3.0, 8.0, 11.0, 6.0, 5.0, 8.0, 4.0, 11.0, 16.0, 37.0, 74.0, 190.0, 257.0, 179.0, 80.0, 23.0, 16.0, 7.0, 6.0, 8.0, 7.0, 4.0, 7.0, 3.0, 6.0, 9.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0732421875, -0.07091999053955078, -0.06859779357910156, -0.06627559661865234, -0.06395339965820312, -0.061631202697753906, -0.05930900573730469, -0.05698680877685547, -0.05466461181640625, -0.05234241485595703, -0.05002021789550781, -0.047698020935058594, -0.045375823974609375, -0.043053627014160156, -0.04073143005371094, -0.03840923309326172, -0.0360870361328125, -0.03376483917236328, -0.03144264221191406, -0.029120445251464844, -0.026798248291015625, -0.024476051330566406, -0.022153854370117188, -0.01983165740966797, -0.01750946044921875, -0.015187263488769531, -0.012865066528320312, -0.010542869567871094, -0.008220672607421875, -0.005898475646972656, -0.0035762786865234375, -0.0012540817260742188, 0.001068115234375, 0.0033903121948242188, 0.0057125091552734375, 0.008034706115722656, 0.010356903076171875, 0.012679100036621094, 0.015001296997070312, 0.01732349395751953, 0.01964569091796875, 0.02196788787841797, 0.024290084838867188, 0.026612281799316406, 0.028934478759765625, 0.031256675720214844, 0.03357887268066406, 0.03590106964111328, 0.0382232666015625, 0.04054546356201172, 0.04286766052246094, 0.045189857482910156, 0.047512054443359375, 0.049834251403808594, 0.05215644836425781, 0.05447864532470703, 0.05680084228515625, 0.05912303924560547, 0.06144523620605469, 0.0637674331665039, 0.06608963012695312, 0.06841182708740234, 0.07073402404785156, 0.07305622100830078, 0.07537841796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 8.0, 15.0, 17.0, 18.0, 42.0, 73.0, 82.0, 191.0, 315.0, 543.0, 1137.0, 2507.0, 5992.0, 17145.0, 65612.0, 2041670.0, 1966500.0, 65371.0, 16707.0, 5747.0, 2317.0, 1069.0, 518.0, 275.0, 138.0, 87.0, 79.0, 31.0, 23.0, 22.0, 15.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6688766479492188, -0.6497650146484375, -0.6306533813476562, -0.611541748046875, -0.5924301147460938, -0.5733184814453125, -0.5542068481445312, -0.53509521484375, -0.5159835815429688, -0.4968719482421875, -0.47776031494140625, -0.458648681640625, -0.43953704833984375, -0.4204254150390625, -0.40131378173828125, -0.3822021484375, -0.36309051513671875, -0.3439788818359375, -0.32486724853515625, -0.305755615234375, -0.28664398193359375, -0.2675323486328125, -0.24842071533203125, -0.22930908203125, -0.21019744873046875, -0.1910858154296875, -0.17197418212890625, -0.152862548828125, -0.13375091552734375, -0.1146392822265625, -0.09552764892578125, -0.076416015625, -0.05730438232421875, -0.0381927490234375, -0.01908111572265625, 3.0517578125e-05, 0.01914215087890625, 0.0382537841796875, 0.05736541748046875, 0.07647705078125, 0.09558868408203125, 0.1147003173828125, 0.13381195068359375, 0.152923583984375, 0.17203521728515625, 0.1911468505859375, 0.21025848388671875, 0.2293701171875, 0.24848175048828125, 0.2675933837890625, 0.28670501708984375, 0.305816650390625, 0.32492828369140625, 0.3440399169921875, 0.36315155029296875, 0.38226318359375, 0.40137481689453125, 0.4204864501953125, 0.43959808349609375, 0.458709716796875, 0.47782135009765625, 0.4969329833984375, 0.5160446166992188, 0.53515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 2.0, 4.0, 4.0, 7.0, 8.0, 10.0, 7.0, 12.0, 10.0, 18.0, 18.0, 24.0, 23.0, 22.0, 51.0, 68.0, 87.0, 184.0, 469.0, 1526.0, 721.0, 276.0, 150.0, 93.0, 56.0, 33.0, 39.0, 23.0, 17.0, 22.0, 10.0, 19.0, 4.0, 7.0, 7.0, 3.0, 2.0, 3.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0762939453125, -0.07402801513671875, -0.0717620849609375, -0.06949615478515625, -0.067230224609375, -0.06496429443359375, -0.0626983642578125, -0.06043243408203125, -0.05816650390625, -0.05590057373046875, -0.0536346435546875, -0.05136871337890625, -0.049102783203125, -0.04683685302734375, -0.0445709228515625, -0.04230499267578125, -0.0400390625, -0.03777313232421875, -0.0355072021484375, -0.03324127197265625, -0.030975341796875, -0.02870941162109375, -0.0264434814453125, -0.02417755126953125, -0.02191162109375, -0.01964569091796875, -0.0173797607421875, -0.01511383056640625, -0.012847900390625, -0.01058197021484375, -0.0083160400390625, -0.00605010986328125, -0.0037841796875, -0.00151824951171875, 0.0007476806640625, 0.00301361083984375, 0.005279541015625, 0.00754547119140625, 0.0098114013671875, 0.01207733154296875, 0.01434326171875, 0.01660919189453125, 0.0188751220703125, 0.02114105224609375, 0.023406982421875, 0.02567291259765625, 0.0279388427734375, 0.03020477294921875, 0.032470703125, 0.03473663330078125, 0.0370025634765625, 0.03926849365234375, 0.041534423828125, 0.04380035400390625, 0.0460662841796875, 0.04833221435546875, 0.05059814453125, 0.05286407470703125, 0.0551300048828125, 0.05739593505859375, 0.059661865234375, 0.06192779541015625, 0.0641937255859375, 0.06645965576171875, 0.0687255859375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 16.0, 102.0, 750.0, 105.0, 19.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8531599044799805, -3.7578370571136475, -3.6625144481658936, -3.5671916007995605, -3.4718689918518066, -3.3765461444854736, -3.2812232971191406, -3.1859006881713867, -3.0905778408050537, -2.9952549934387207, -2.899932384490967, -2.804609537124634, -2.70928692817688, -2.613964080810547, -2.518641471862793, -2.42331862449646, -2.327995777130127, -2.232672929763794, -2.13735032081604, -2.042027473449707, -1.9467047452926636, -1.8513820171356201, -1.7560592889785767, -1.6607365608215332, -1.5654139518737793, -1.4700912237167358, -1.3747684955596924, -1.2794456481933594, -1.184122920036316, -1.0888001918792725, -0.993477463722229, -0.8981546759605408, -0.8028318881988525, -0.7075091600418091, -0.6121863722801208, -0.5168636441230774, -0.42154088616371155, -0.3262181282043457, -0.23089540004730225, -0.135572612285614, -0.04024988412857056, 0.05507286638021469, 0.15039561688899994, 0.2457183599472046, 0.34104111790657043, 0.4363638758659363, 0.5316866040229797, 0.627009391784668, 0.7223321199417114, 0.8176548480987549, 0.9129776358604431, 1.0083003044128418, 1.1036231517791748, 1.1989458799362183, 1.2942686080932617, 1.3895914554595947, 1.4849140644073486, 1.580236792564392, 1.6755595207214355, 1.7708823680877686, 1.866205096244812, 1.9615278244018555, 2.0568504333496094, 2.1521732807159424, 2.2474961280822754]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 2.0, 10.0, 8.0, 12.0, 17.0, 13.0, 16.0, 41.0, 47.0, 50.0, 69.0, 76.0, 92.0, 64.0, 72.0, 83.0, 71.0, 51.0, 42.0, 37.0, 27.0, 18.0, 7.0, 12.0, 9.0, 8.0, 9.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5329259634017944, -0.5160823464393616, -0.4992387890815735, -0.4823951721191406, -0.46555158495903015, -0.4487079977989197, -0.4318644106388092, -0.41502082347869873, -0.39817720651626587, -0.3813336193561554, -0.3644900321960449, -0.34764641523361206, -0.3308028280735016, -0.3139592409133911, -0.29711565375328064, -0.28027206659317017, -0.2634284794330597, -0.24658489227294922, -0.22974129021167755, -0.21289770305156708, -0.1960541009902954, -0.17921051383018494, -0.16236692667007446, -0.145523339509964, -0.12867973744869232, -0.11183614283800125, -0.09499254822731018, -0.07814896106719971, -0.061305366456508636, -0.044461771845817566, -0.027618184685707092, -0.010774590075016022, 0.006069004535675049, 0.02291259728372097, 0.03975619003176689, 0.056599780917167664, 0.07344337552785873, 0.0902869701385498, 0.10713055729866028, 0.12397415190935135, 0.14081774652004242, 0.1576613336801529, 0.17450493574142456, 0.19134852290153503, 0.2081921100616455, 0.22503571212291718, 0.24187929928302765, 0.2587229013442993, 0.2755664885044098, 0.29241007566452026, 0.30925366282463074, 0.3260972499847412, 0.3429408669471741, 0.35978445410728455, 0.376628041267395, 0.3934716284275055, 0.41031521558761597, 0.42715880274772644, 0.4440023899078369, 0.4608460068702698, 0.47768959403038025, 0.4945331811904907, 0.5113767385482788, 0.5282203555107117, 0.5450639724731445]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 22.0, 27.0, 20.0, 38.0, 62.0, 83.0, 104.0, 182.0, 253.0, 429.0, 703.0, 1139.0, 1981.0, 3648.0, 7079.0, 15528.0, 49139.0, 546014.0, 356170.0, 38317.0, 13246.0, 6421.0, 3240.0, 1817.0, 1041.0, 677.0, 402.0, 257.0, 153.0, 111.0, 71.0, 52.0, 34.0, 18.0, 19.0, 17.0, 9.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5126953125, -0.4971199035644531, -0.48154449462890625, -0.4659690856933594, -0.4503936767578125, -0.4348182678222656, -0.41924285888671875, -0.4036674499511719, -0.388092041015625, -0.3725166320800781, -0.35694122314453125, -0.3413658142089844, -0.3257904052734375, -0.3102149963378906, -0.29463958740234375, -0.2790641784667969, -0.26348876953125, -0.24791336059570312, -0.23233795166015625, -0.21676254272460938, -0.2011871337890625, -0.18561172485351562, -0.17003631591796875, -0.15446090698242188, -0.138885498046875, -0.12331008911132812, -0.10773468017578125, -0.09215927124023438, -0.0765838623046875, -0.061008453369140625, -0.04543304443359375, -0.029857635498046875, -0.0142822265625, 0.001293182373046875, 0.01686859130859375, 0.032444000244140625, 0.0480194091796875, 0.06359481811523438, 0.07917022705078125, 0.09474563598632812, 0.110321044921875, 0.12589645385742188, 0.14147186279296875, 0.15704727172851562, 0.1726226806640625, 0.18819808959960938, 0.20377349853515625, 0.21934890747070312, 0.23492431640625, 0.2504997253417969, 0.26607513427734375, 0.2816505432128906, 0.2972259521484375, 0.3128013610839844, 0.32837677001953125, 0.3439521789550781, 0.359527587890625, 0.3751029968261719, 0.39067840576171875, 0.4062538146972656, 0.4218292236328125, 0.4374046325683594, 0.45298004150390625, 0.4685554504394531, 0.484130859375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 8.0, 5.0, 8.0, 13.0, 14.0, 41.0, 74.0, 113.0, 163.0, 167.0, 139.0, 88.0, 50.0, 23.0, 16.0, 7.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.066650390625, -0.06465578079223633, -0.06266117095947266, -0.060666561126708984, -0.05867195129394531, -0.05667734146118164, -0.05468273162841797, -0.0526881217956543, -0.050693511962890625, -0.04869890213012695, -0.04670429229736328, -0.04470968246459961, -0.04271507263183594, -0.040720462799072266, -0.038725852966308594, -0.03673124313354492, -0.03473663330078125, -0.03274202346801758, -0.030747413635253906, -0.028752803802490234, -0.026758193969726562, -0.02476358413696289, -0.02276897430419922, -0.020774364471435547, -0.018779754638671875, -0.016785144805908203, -0.014790534973144531, -0.01279592514038086, -0.010801315307617188, -0.008806705474853516, -0.006812095642089844, -0.004817485809326172, -0.0028228759765625, -0.0008282661437988281, 0.0011663436889648438, 0.0031609535217285156, 0.0051555633544921875, 0.007150173187255859, 0.009144783020019531, 0.011139392852783203, 0.013134002685546875, 0.015128612518310547, 0.01712322235107422, 0.01911783218383789, 0.021112442016601562, 0.023107051849365234, 0.025101661682128906, 0.027096271514892578, 0.02909088134765625, 0.031085491180419922, 0.033080101013183594, 0.035074710845947266, 0.03706932067871094, 0.03906393051147461, 0.04105854034423828, 0.04305315017700195, 0.045047760009765625, 0.0470423698425293, 0.04903697967529297, 0.05103158950805664, 0.05302619934082031, 0.055020809173583984, 0.057015419006347656, 0.05901002883911133, 0.061004638671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 4.0, 3.0, 5.0, 14.0, 26.0, 108.0, 386.0, 4096.0, 747898.0, 293398.0, 2182.0, 283.0, 76.0, 22.0, 9.0, 8.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.4762725830078125, -1.425201416015625, -1.3741302490234375, -1.32305908203125, -1.2719879150390625, -1.220916748046875, -1.1698455810546875, -1.1187744140625, -1.0677032470703125, -1.016632080078125, -0.9655609130859375, -0.91448974609375, -0.8634185791015625, -0.812347412109375, -0.7612762451171875, -0.710205078125, -0.6591339111328125, -0.608062744140625, -0.5569915771484375, -0.50592041015625, -0.4548492431640625, -0.403778076171875, -0.3527069091796875, -0.3016357421875, -0.2505645751953125, -0.199493408203125, -0.1484222412109375, -0.09735107421875, -0.0462799072265625, 0.004791259765625, 0.0558624267578125, 0.10693359375, 0.1580047607421875, 0.209075927734375, 0.2601470947265625, 0.31121826171875, 0.3622894287109375, 0.413360595703125, 0.4644317626953125, 0.5155029296875, 0.5665740966796875, 0.617645263671875, 0.6687164306640625, 0.71978759765625, 0.7708587646484375, 0.821929931640625, 0.8730010986328125, 0.924072265625, 0.9751434326171875, 1.026214599609375, 1.0772857666015625, 1.12835693359375, 1.1794281005859375, 1.230499267578125, 1.2815704345703125, 1.3326416015625, 1.3837127685546875, 1.434783935546875, 1.4858551025390625, 1.53692626953125, 1.5879974365234375, 1.639068603515625, 1.6901397705078125, 1.7412109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 6.0, 5.0, 5.0, 7.0, 4.0, 11.0, 17.0, 22.0, 12.0, 23.0, 25.0, 26.0, 31.0, 34.0, 47.0, 58.0, 50.0, 41.0, 49.0, 45.0, 40.0, 49.0, 45.0, 35.0, 28.0, 46.0, 36.0, 21.0, 26.0, 29.0, 20.0, 24.0, 13.0, 15.0, 7.0, 9.0, 9.0, 10.0, 4.0, 9.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2237548828125, -0.21648025512695312, -0.20920562744140625, -0.20193099975585938, -0.1946563720703125, -0.18738174438476562, -0.18010711669921875, -0.17283248901367188, -0.165557861328125, -0.15828323364257812, -0.15100860595703125, -0.14373397827148438, -0.1364593505859375, -0.12918472290039062, -0.12191009521484375, -0.11463546752929688, -0.10736083984375, -0.10008621215820312, -0.09281158447265625, -0.08553695678710938, -0.0782623291015625, -0.07098770141601562, -0.06371307373046875, -0.056438446044921875, -0.049163818359375, -0.041889190673828125, -0.03461456298828125, -0.027339935302734375, -0.0200653076171875, -0.012790679931640625, -0.00551605224609375, 0.001758575439453125, 0.009033203125, 0.016307830810546875, 0.02358245849609375, 0.030857086181640625, 0.0381317138671875, 0.045406341552734375, 0.05268096923828125, 0.059955596923828125, 0.067230224609375, 0.07450485229492188, 0.08177947998046875, 0.08905410766601562, 0.0963287353515625, 0.10360336303710938, 0.11087799072265625, 0.11815261840820312, 0.12542724609375, 0.13270187377929688, 0.13997650146484375, 0.14725112915039062, 0.1545257568359375, 0.16180038452148438, 0.16907501220703125, 0.17634963989257812, 0.183624267578125, 0.19089889526367188, 0.19817352294921875, 0.20544815063476562, 0.2127227783203125, 0.21999740600585938, 0.22727203369140625, 0.23454666137695312, 0.2418212890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 5.0, 10.0, 21.0, 48.0, 133.0, 1137.0, 1024972.0, 21632.0, 426.0, 97.0, 31.0, 17.0, 12.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.421875, -4.29840087890625, -4.1749267578125, -4.05145263671875, -3.927978515625, -3.80450439453125, -3.6810302734375, -3.55755615234375, -3.43408203125, -3.31060791015625, -3.1871337890625, -3.06365966796875, -2.940185546875, -2.81671142578125, -2.6932373046875, -2.56976318359375, -2.4462890625, -2.32281494140625, -2.1993408203125, -2.07586669921875, -1.952392578125, -1.82891845703125, -1.7054443359375, -1.58197021484375, -1.45849609375, -1.33502197265625, -1.2115478515625, -1.08807373046875, -0.964599609375, -0.84112548828125, -0.7176513671875, -0.59417724609375, -0.470703125, -0.34722900390625, -0.2237548828125, -0.10028076171875, 0.023193359375, 0.14666748046875, 0.2701416015625, 0.39361572265625, 0.51708984375, 0.64056396484375, 0.7640380859375, 0.88751220703125, 1.010986328125, 1.13446044921875, 1.2579345703125, 1.38140869140625, 1.5048828125, 1.62835693359375, 1.7518310546875, 1.87530517578125, 1.998779296875, 2.12225341796875, 2.2457275390625, 2.36920166015625, 2.49267578125, 2.61614990234375, 2.7396240234375, 2.86309814453125, 2.986572265625, 3.11004638671875, 3.2335205078125, 3.35699462890625, 3.48046875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 3.0, 5.0, 9.0, 5.0, 9.0, 23.0, 31.0, 40.0, 78.0, 108.0, 265.0, 177.0, 72.0, 54.0, 30.0, 23.0, 15.0, 14.0, 6.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0007991790771484375, -0.0007747560739517212, -0.0007503330707550049, -0.0007259100675582886, -0.0007014870643615723, -0.000677064061164856, -0.0006526410579681396, -0.0006282180547714233, -0.000603795051574707, -0.0005793720483779907, -0.0005549490451812744, -0.0005305260419845581, -0.0005061030387878418, -0.0004816800355911255, -0.0004572570323944092, -0.00043283402919769287, -0.00040841102600097656, -0.00038398802280426025, -0.00035956501960754395, -0.00033514201641082764, -0.00031071901321411133, -0.000286296010017395, -0.0002618730068206787, -0.0002374500036239624, -0.0002130270004272461, -0.00018860399723052979, -0.00016418099403381348, -0.00013975799083709717, -0.00011533498764038086, -9.091198444366455e-05, -6.648898124694824e-05, -4.2065978050231934e-05, -1.7642974853515625e-05, 6.780028343200684e-06, 3.120303153991699e-05, 5.56260347366333e-05, 8.004903793334961e-05, 0.00010447204113006592, 0.00012889504432678223, 0.00015331804752349854, 0.00017774105072021484, 0.00020216405391693115, 0.00022658705711364746, 0.00025101006031036377, 0.0002754330635070801, 0.0002998560667037964, 0.0003242790699005127, 0.000348702073097229, 0.0003731250762939453, 0.0003975480794906616, 0.00042197108268737793, 0.00044639408588409424, 0.00047081708908081055, 0.0004952400922775269, 0.0005196630954742432, 0.0005440860986709595, 0.0005685091018676758, 0.0005929321050643921, 0.0006173551082611084, 0.0006417781114578247, 0.000666201114654541, 0.0006906241178512573, 0.0007150471210479736, 0.0007394701242446899, 0.0007638931274414062]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 6.0, 8.0, 11.0, 23.0, 37.0, 87.0, 190.0, 469.0, 1317.0, 4749.0, 38002.0, 821872.0, 166783.0, 11270.0, 2365.0, 757.0, 301.0, 133.0, 69.0, 33.0, 23.0, 15.0, 8.0, 6.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.5026168823242188, -0.4822845458984375, -0.46195220947265625, -0.441619873046875, -0.42128753662109375, -0.4009552001953125, -0.38062286376953125, -0.36029052734375, -0.33995819091796875, -0.3196258544921875, -0.29929351806640625, -0.278961181640625, -0.25862884521484375, -0.2382965087890625, -0.21796417236328125, -0.1976318359375, -0.17729949951171875, -0.1569671630859375, -0.13663482666015625, -0.116302490234375, -0.09597015380859375, -0.0756378173828125, -0.05530548095703125, -0.03497314453125, -0.01464080810546875, 0.0056915283203125, 0.02602386474609375, 0.046356201171875, 0.06668853759765625, 0.0870208740234375, 0.10735321044921875, 0.127685546875, 0.14801788330078125, 0.1683502197265625, 0.18868255615234375, 0.209014892578125, 0.22934722900390625, 0.2496795654296875, 0.27001190185546875, 0.29034423828125, 0.31067657470703125, 0.3310089111328125, 0.35134124755859375, 0.371673583984375, 0.39200592041015625, 0.4123382568359375, 0.43267059326171875, 0.4530029296875, 0.47333526611328125, 0.4936676025390625, 0.5139999389648438, 0.534332275390625, 0.5546646118164062, 0.5749969482421875, 0.5953292846679688, 0.61566162109375, 0.6359939575195312, 0.6563262939453125, 0.6766586303710938, 0.696990966796875, 0.7173233032226562, 0.7376556396484375, 0.7579879760742188, 0.7783203125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 8.0, 10.0, 15.0, 21.0, 35.0, 47.0, 86.0, 127.0, 152.0, 144.0, 96.0, 86.0, 54.0, 33.0, 25.0, 13.0, 11.0, 8.0, 10.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32568359375, -0.3136024475097656, -0.30152130126953125, -0.2894401550292969, -0.2773590087890625, -0.2652778625488281, -0.25319671630859375, -0.24111557006835938, -0.229034423828125, -0.21695327758789062, -0.20487213134765625, -0.19279098510742188, -0.1807098388671875, -0.16862869262695312, -0.15654754638671875, -0.14446640014648438, -0.13238525390625, -0.12030410766601562, -0.10822296142578125, -0.09614181518554688, -0.0840606689453125, -0.07197952270507812, -0.05989837646484375, -0.047817230224609375, -0.035736083984375, -0.023654937744140625, -0.01157379150390625, 0.000507354736328125, 0.0125885009765625, 0.024669647216796875, 0.03675079345703125, 0.048831939697265625, 0.0609130859375, 0.07299423217773438, 0.08507537841796875, 0.09715652465820312, 0.1092376708984375, 0.12131881713867188, 0.13339996337890625, 0.14548110961914062, 0.157562255859375, 0.16964340209960938, 0.18172454833984375, 0.19380569458007812, 0.2058868408203125, 0.21796798706054688, 0.23004913330078125, 0.24213027954101562, 0.25421142578125, 0.2662925720214844, 0.27837371826171875, 0.2904548645019531, 0.3025360107421875, 0.3146171569824219, 0.32669830322265625, 0.3387794494628906, 0.350860595703125, 0.3629417419433594, 0.37502288818359375, 0.3871040344238281, 0.3991851806640625, 0.4112663269042969, 0.42334747314453125, 0.4354286193847656, 0.447509765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 8.0, 10.0, 22.0, 90.0, 266.0, 371.0, 147.0, 59.0, 16.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.099022388458252, -4.949929237365723, -4.800836563110352, -4.651743412017822, -4.502650260925293, -4.353557586669922, -4.204464435577393, -4.055371284484863, -3.906278610229492, -3.757185697555542, -3.608092784881592, -3.4589996337890625, -3.3099067211151123, -3.160813808441162, -3.011720657348633, -2.8626277446746826, -2.7135348320007324, -2.5644419193267822, -2.415349006652832, -2.2662558555603027, -2.1171629428863525, -1.9680700302124023, -1.8189769983291626, -1.6698839664459229, -1.5207910537719727, -1.3716981410980225, -1.2226051092147827, -1.073512077331543, -0.9244191646575928, -0.7753261923789978, -0.6262332201004028, -0.4771401882171631, -0.3280477523803711, -0.17895478010177612, -0.029861807823181152, 0.11923116445541382, 0.2683241367340088, 0.41741710901260376, 0.5665100812911987, 0.7156031131744385, 0.8646960258483887, 1.0137889385223389, 1.1628819704055786, 1.3119750022888184, 1.4610679149627686, 1.6101608276367188, 1.7592538595199585, 1.9083468914031982, 2.0574398040771484, 2.2065327167510986, 2.355625629425049, 2.504718780517578, 2.6538116931915283, 2.8029046058654785, 2.951997756958008, 3.101090669631958, 3.250183582305908, 3.3992764949798584, 3.5483694076538086, 3.697462558746338, 3.846555471420288, 3.9956483840942383, 4.144741535186768, 4.293834686279297, 4.442927360534668]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 6.0, 9.0, 9.0, 15.0, 31.0, 45.0, 67.0, 96.0, 119.0, 134.0, 115.0, 111.0, 73.0, 60.0, 37.0, 22.0, 11.0, 8.0, 3.0, 1.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.652742624282837, -3.521327018737793, -3.38991117477417, -3.258495569229126, -3.127079963684082, -2.995664358139038, -2.864248752593994, -2.732832908630371, -2.601417303085327, -2.470001697540283, -2.33858585357666, -2.207170248031616, -2.0757546424865723, -1.9443390369415283, -1.8129233121871948, -1.6815075874328613, -1.5500919818878174, -1.4186763763427734, -1.28726065158844, -1.1558449268341064, -1.0244293212890625, -0.8930136561393738, -0.7615979909896851, -0.6301823258399963, -0.4987666606903076, -0.3673509955406189, -0.23593533039093018, -0.10451966524124146, 0.026895999908447266, 0.158311665058136, 0.2897273302078247, 0.4211429953575134, 0.5525588989257812, 0.68397456407547, 0.8153902292251587, 0.9468058943748474, 1.0782215595245361, 1.20963716506958, 1.3410528898239136, 1.472468614578247, 1.603884220123291, 1.735299825668335, 1.8667155504226685, 1.998131275177002, 2.129546880722046, 2.26096248626709, 2.392378330230713, 2.523793935775757, 2.655209541320801, 2.7866251468658447, 2.9180407524108887, 3.0494565963745117, 3.1808722019195557, 3.3122878074645996, 3.4437036514282227, 3.5751192569732666, 3.7065348625183105, 3.8379504680633545, 3.9693660736083984, 4.1007819175720215, 4.2321977615356445, 4.363613128662109, 4.495028972625732, 4.626444339752197, 4.75786018371582]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 11.0, 8.0, 8.0, 10.0, 16.0, 23.0, 18.0, 40.0, 40.0, 54.0, 100.0, 124.0, 210.0, 298.0, 483.0, 792.0, 1421.0, 3765.0, 13737.0, 187080.0, 3943100.0, 31578.0, 6501.0, 2298.0, 1042.0, 559.0, 336.0, 190.0, 123.0, 86.0, 63.0, 45.0, 23.0, 32.0, 19.0, 12.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.5275726318359375, -1.477020263671875, -1.4264678955078125, -1.37591552734375, -1.3253631591796875, -1.274810791015625, -1.2242584228515625, -1.1737060546875, -1.1231536865234375, -1.072601318359375, -1.0220489501953125, -0.97149658203125, -0.9209442138671875, -0.870391845703125, -0.8198394775390625, -0.769287109375, -0.7187347412109375, -0.668182373046875, -0.6176300048828125, -0.56707763671875, -0.5165252685546875, -0.465972900390625, -0.4154205322265625, -0.3648681640625, -0.3143157958984375, -0.263763427734375, -0.2132110595703125, -0.16265869140625, -0.1121063232421875, -0.061553955078125, -0.0110015869140625, 0.03955078125, 0.0901031494140625, 0.140655517578125, 0.1912078857421875, 0.24176025390625, 0.2923126220703125, 0.342864990234375, 0.3934173583984375, 0.4439697265625, 0.4945220947265625, 0.545074462890625, 0.5956268310546875, 0.64617919921875, 0.6967315673828125, 0.747283935546875, 0.7978363037109375, 0.848388671875, 0.8989410400390625, 0.949493408203125, 1.0000457763671875, 1.05059814453125, 1.1011505126953125, 1.151702880859375, 1.2022552490234375, 1.2528076171875, 1.3033599853515625, 1.353912353515625, 1.4044647216796875, 1.45501708984375, 1.5055694580078125, 1.556121826171875, 1.6066741943359375, 1.6572265625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 5.0, 8.0, 7.0, 11.0, 29.0, 47.0, 111.0, 143.0, 177.0, 170.0, 111.0, 75.0, 28.0, 26.0, 11.0, 10.0, 12.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09283447265625, -0.09023857116699219, -0.08764266967773438, -0.08504676818847656, -0.08245086669921875, -0.07985496520996094, -0.07725906372070312, -0.07466316223144531, -0.0720672607421875, -0.06947135925292969, -0.06687545776367188, -0.06427955627441406, -0.06168365478515625, -0.05908775329589844, -0.056491851806640625, -0.05389595031738281, -0.051300048828125, -0.04870414733886719, -0.046108245849609375, -0.04351234436035156, -0.04091644287109375, -0.03832054138183594, -0.035724639892578125, -0.03312873840332031, -0.0305328369140625, -0.027936935424804688, -0.025341033935546875, -0.022745132446289062, -0.02014923095703125, -0.017553329467773438, -0.014957427978515625, -0.012361526489257812, -0.009765625, -0.0071697235107421875, -0.004573822021484375, -0.0019779205322265625, 0.00061798095703125, 0.0032138824462890625, 0.005809783935546875, 0.008405685424804688, 0.0110015869140625, 0.013597488403320312, 0.016193389892578125, 0.018789291381835938, 0.02138519287109375, 0.023981094360351562, 0.026576995849609375, 0.029172897338867188, 0.031768798828125, 0.03436470031738281, 0.036960601806640625, 0.03955650329589844, 0.04215240478515625, 0.04474830627441406, 0.047344207763671875, 0.04994010925292969, 0.0525360107421875, 0.05513191223144531, 0.057727813720703125, 0.06032371520996094, 0.06291961669921875, 0.06551551818847656, 0.06811141967773438, 0.07070732116699219, 0.07330322265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 9.0, 13.0, 9.0, 9.0, 28.0, 27.0, 51.0, 62.0, 135.0, 381.0, 2274.0, 27232.0, 4049153.0, 109291.0, 4463.0, 653.0, 190.0, 94.0, 56.0, 35.0, 24.0, 20.0, 11.0, 8.0, 4.0, 4.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.650390625, -1.596588134765625, -1.54278564453125, -1.488983154296875, -1.4351806640625, -1.381378173828125, -1.32757568359375, -1.273773193359375, -1.219970703125, -1.166168212890625, -1.11236572265625, -1.058563232421875, -1.0047607421875, -0.950958251953125, -0.89715576171875, -0.843353271484375, -0.78955078125, -0.735748291015625, -0.68194580078125, -0.628143310546875, -0.5743408203125, -0.520538330078125, -0.46673583984375, -0.412933349609375, -0.359130859375, -0.305328369140625, -0.25152587890625, -0.197723388671875, -0.1439208984375, -0.090118408203125, -0.03631591796875, 0.017486572265625, 0.0712890625, 0.125091552734375, 0.17889404296875, 0.232696533203125, 0.2864990234375, 0.340301513671875, 0.39410400390625, 0.447906494140625, 0.501708984375, 0.555511474609375, 0.60931396484375, 0.663116455078125, 0.7169189453125, 0.770721435546875, 0.82452392578125, 0.878326416015625, 0.93212890625, 0.985931396484375, 1.03973388671875, 1.093536376953125, 1.1473388671875, 1.201141357421875, 1.25494384765625, 1.308746337890625, 1.362548828125, 1.416351318359375, 1.47015380859375, 1.523956298828125, 1.5777587890625, 1.631561279296875, 1.68536376953125, 1.739166259765625, 1.79296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 10.0, 6.0, 6.0, 7.0, 9.0, 24.0, 17.0, 18.0, 37.0, 52.0, 68.0, 90.0, 187.0, 358.0, 746.0, 1261.0, 515.0, 217.0, 134.0, 87.0, 46.0, 46.0, 34.0, 12.0, 13.0, 14.0, 14.0, 7.0, 6.0, 8.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0870361328125, -0.08434200286865234, -0.08164787292480469, -0.07895374298095703, -0.07625961303710938, -0.07356548309326172, -0.07087135314941406, -0.0681772232055664, -0.06548309326171875, -0.0627889633178711, -0.06009483337402344, -0.05740070343017578, -0.054706573486328125, -0.05201244354248047, -0.04931831359863281, -0.046624183654785156, -0.0439300537109375, -0.041235923767089844, -0.03854179382324219, -0.03584766387939453, -0.033153533935546875, -0.03045940399169922, -0.027765274047851562, -0.025071144104003906, -0.02237701416015625, -0.019682884216308594, -0.016988754272460938, -0.014294624328613281, -0.011600494384765625, -0.008906364440917969, -0.0062122344970703125, -0.0035181045532226562, -0.000823974609375, 0.0018701553344726562, 0.0045642852783203125, 0.007258415222167969, 0.009952545166015625, 0.012646675109863281, 0.015340805053710938, 0.018034934997558594, 0.02072906494140625, 0.023423194885253906, 0.026117324829101562, 0.02881145477294922, 0.031505584716796875, 0.03419971466064453, 0.03689384460449219, 0.039587974548339844, 0.0422821044921875, 0.044976234436035156, 0.04767036437988281, 0.05036449432373047, 0.053058624267578125, 0.05575275421142578, 0.05844688415527344, 0.061141014099121094, 0.06383514404296875, 0.0665292739868164, 0.06922340393066406, 0.07191753387451172, 0.07461166381835938, 0.07730579376220703, 0.07999992370605469, 0.08269405364990234, 0.08538818359375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 35.0, 552.0, 381.0, 26.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9804832935333252, -1.8810842037200928, -1.7816851139068604, -1.682286024093628, -1.5828869342803955, -1.483487844467163, -1.3840886354446411, -1.2846895456314087, -1.1852904558181763, -1.0858913660049438, -0.9864922761917114, -0.8870931267738342, -0.7876940369606018, -0.6882949471473694, -0.5888957977294922, -0.48949670791625977, -0.39009761810302734, -0.2906985282897949, -0.1912994086742401, -0.0919002890586853, 0.007498800754547119, 0.10689789056777954, 0.20629703998565674, 0.30569612979888916, 0.4050952196121216, 0.504494309425354, 0.6038933992385864, 0.7032925486564636, 0.802691638469696, 0.9020907282829285, 1.0014898777008057, 1.100888967514038, 1.2002878189086914, 1.2996869087219238, 1.3990859985351562, 1.4984850883483887, 1.597884178161621, 1.6972832679748535, 1.7966824769973755, 1.896081566810608, 1.9954806566238403, 2.0948798656463623, 2.1942789554595947, 2.293678045272827, 2.3930771350860596, 2.492476224899292, 2.5918753147125244, 2.691274404525757, 2.7906734943389893, 2.8900725841522217, 2.989471673965454, 3.0888707637786865, 3.188269853591919, 3.2876689434051514, 3.387068271636963, 3.4864673614501953, 3.5858664512634277, 3.68526554107666, 3.7846646308898926, 3.884063720703125, 3.9834628105163574, 4.08286190032959, 4.182260990142822, 4.281660079956055, 4.381059169769287]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 10.0, 10.0, 14.0, 18.0, 18.0, 31.0, 42.0, 47.0, 57.0, 68.0, 75.0, 61.0, 94.0, 69.0, 60.0, 70.0, 43.0, 48.0, 33.0, 27.0, 23.0, 12.0, 14.0, 12.0, 8.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4672037363052368, -0.45223161578178406, -0.4372595250606537, -0.4222874045372009, -0.40731531381607056, -0.3923431932926178, -0.37737107276916504, -0.36239898204803467, -0.3474268615245819, -0.33245474100112915, -0.3174826502799988, -0.302510529756546, -0.28753840923309326, -0.2725663185119629, -0.25759419798851013, -0.24262209236621857, -0.227649986743927, -0.21267788112163544, -0.19770577549934387, -0.1827336549758911, -0.16776154935359955, -0.15278944373130798, -0.13781732320785522, -0.12284521758556366, -0.1078731119632721, -0.09290100634098053, -0.07792889326810837, -0.0629567801952362, -0.04798467457294464, -0.033012568950653076, -0.018040455877780914, -0.0030683428049087524, 0.011903762817382812, 0.026875872164964676, 0.04184798151254654, 0.0568200908601284, 0.07179220020771027, 0.08676430583000183, 0.10173641890287399, 0.11670853197574615, 0.13168063759803772, 0.14665274322032928, 0.16162484884262085, 0.1765969693660736, 0.19156907498836517, 0.20654118061065674, 0.2215133011341095, 0.23648540675640106, 0.2514575123786926, 0.2664296329021454, 0.28140172362327576, 0.2963738441467285, 0.3113459348678589, 0.32631805539131165, 0.3412901759147644, 0.3562622666358948, 0.37123438715934753, 0.3862065076828003, 0.40117859840393066, 0.4161507189273834, 0.4311228394508362, 0.44609493017196655, 0.4610670506954193, 0.47603917121887207, 0.49101126194000244]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 1.0, 4.0, 8.0, 5.0, 6.0, 14.0, 23.0, 22.0, 25.0, 48.0, 60.0, 73.0, 129.0, 207.0, 336.0, 701.0, 1604.0, 5694.0, 46333.0, 824743.0, 153594.0, 10429.0, 2396.0, 906.0, 477.0, 240.0, 132.0, 103.0, 63.0, 44.0, 35.0, 20.0, 14.0, 13.0, 18.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74365234375, -0.7167892456054688, -0.6899261474609375, -0.6630630493164062, -0.636199951171875, -0.6093368530273438, -0.5824737548828125, -0.5556106567382812, -0.52874755859375, -0.5018844604492188, -0.4750213623046875, -0.44815826416015625, -0.421295166015625, -0.39443206787109375, -0.3675689697265625, -0.34070587158203125, -0.3138427734375, -0.28697967529296875, -0.2601165771484375, -0.23325347900390625, -0.206390380859375, -0.17952728271484375, -0.1526641845703125, -0.12580108642578125, -0.09893798828125, -0.07207489013671875, -0.0452117919921875, -0.01834869384765625, 0.008514404296875, 0.03537750244140625, 0.0622406005859375, 0.08910369873046875, 0.115966796875, 0.14282989501953125, 0.1696929931640625, 0.19655609130859375, 0.223419189453125, 0.25028228759765625, 0.2771453857421875, 0.30400848388671875, 0.33087158203125, 0.35773468017578125, 0.3845977783203125, 0.41146087646484375, 0.438323974609375, 0.46518707275390625, 0.4920501708984375, 0.5189132690429688, 0.5457763671875, 0.5726394653320312, 0.5995025634765625, 0.6263656616210938, 0.653228759765625, 0.6800918579101562, 0.7069549560546875, 0.7338180541992188, 0.76068115234375, 0.7875442504882812, 0.8144073486328125, 0.8412704467773438, 0.868133544921875, 0.8949966430664062, 0.9218597412109375, 0.9487228393554688, 0.9755859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 0.0, 4.0, 10.0, 18.0, 33.0, 47.0, 90.0, 130.0, 153.0, 156.0, 114.0, 94.0, 54.0, 38.0, 28.0, 11.0, 3.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.07951641082763672, -0.07718467712402344, -0.07485294342041016, -0.07252120971679688, -0.0701894760131836, -0.06785774230957031, -0.06552600860595703, -0.06319427490234375, -0.06086254119873047, -0.05853080749511719, -0.056199073791503906, -0.053867340087890625, -0.051535606384277344, -0.04920387268066406, -0.04687213897705078, -0.0445404052734375, -0.04220867156982422, -0.03987693786621094, -0.037545204162597656, -0.035213470458984375, -0.032881736755371094, -0.030550003051757812, -0.02821826934814453, -0.02588653564453125, -0.02355480194091797, -0.021223068237304688, -0.018891334533691406, -0.016559600830078125, -0.014227867126464844, -0.011896133422851562, -0.009564399719238281, -0.007232666015625, -0.004900932312011719, -0.0025691986083984375, -0.00023746490478515625, 0.002094268798828125, 0.004426002502441406, 0.0067577362060546875, 0.009089469909667969, 0.01142120361328125, 0.013752937316894531, 0.016084671020507812, 0.018416404724121094, 0.020748138427734375, 0.023079872131347656, 0.025411605834960938, 0.02774333953857422, 0.0300750732421875, 0.03240680694580078, 0.03473854064941406, 0.037070274353027344, 0.039402008056640625, 0.041733741760253906, 0.04406547546386719, 0.04639720916748047, 0.04872894287109375, 0.05106067657470703, 0.05339241027832031, 0.055724143981933594, 0.058055877685546875, 0.060387611389160156, 0.06271934509277344, 0.06505107879638672, 0.0673828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 14.0, 18.0, 21.0, 28.0, 37.0, 54.0, 86.0, 146.0, 238.0, 510.0, 1176.0, 3659.0, 15731.0, 95059.0, 565886.0, 310837.0, 42876.0, 8059.0, 2309.0, 868.0, 383.0, 197.0, 110.0, 63.0, 54.0, 33.0, 22.0, 26.0, 16.0, 11.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62646484375, -0.60845947265625, -0.5904541015625, -0.57244873046875, -0.554443359375, -0.53643798828125, -0.5184326171875, -0.50042724609375, -0.482421875, -0.46441650390625, -0.4464111328125, -0.42840576171875, -0.410400390625, -0.39239501953125, -0.3743896484375, -0.35638427734375, -0.33837890625, -0.32037353515625, -0.3023681640625, -0.28436279296875, -0.266357421875, -0.24835205078125, -0.2303466796875, -0.21234130859375, -0.1943359375, -0.17633056640625, -0.1583251953125, -0.14031982421875, -0.122314453125, -0.10430908203125, -0.0863037109375, -0.06829833984375, -0.05029296875, -0.03228759765625, -0.0142822265625, 0.00372314453125, 0.021728515625, 0.03973388671875, 0.0577392578125, 0.07574462890625, 0.09375, 0.11175537109375, 0.1297607421875, 0.14776611328125, 0.165771484375, 0.18377685546875, 0.2017822265625, 0.21978759765625, 0.23779296875, 0.25579833984375, 0.2738037109375, 0.29180908203125, 0.309814453125, 0.32781982421875, 0.3458251953125, 0.36383056640625, 0.3818359375, 0.39984130859375, 0.4178466796875, 0.43585205078125, 0.453857421875, 0.47186279296875, 0.4898681640625, 0.50787353515625, 0.52587890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 14.0, 8.0, 11.0, 13.0, 9.0, 11.0, 19.0, 19.0, 24.0, 35.0, 30.0, 36.0, 39.0, 39.0, 46.0, 38.0, 55.0, 44.0, 37.0, 49.0, 44.0, 53.0, 27.0, 28.0, 33.0, 28.0, 33.0, 24.0, 23.0, 17.0, 23.0, 12.0, 13.0, 8.0, 7.0, 8.0, 9.0, 5.0, 0.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2354736328125, -0.2281360626220703, -0.22079849243164062, -0.21346092224121094, -0.20612335205078125, -0.19878578186035156, -0.19144821166992188, -0.1841106414794922, -0.1767730712890625, -0.1694355010986328, -0.16209793090820312, -0.15476036071777344, -0.14742279052734375, -0.14008522033691406, -0.13274765014648438, -0.1254100799560547, -0.118072509765625, -0.11073493957519531, -0.10339736938476562, -0.09605979919433594, -0.08872222900390625, -0.08138465881347656, -0.07404708862304688, -0.06670951843261719, -0.0593719482421875, -0.05203437805175781, -0.044696807861328125, -0.03735923767089844, -0.03002166748046875, -0.022684097290039062, -0.015346527099609375, -0.008008956909179688, -0.00067138671875, 0.0066661834716796875, 0.014003753662109375, 0.021341323852539062, 0.02867889404296875, 0.03601646423339844, 0.043354034423828125, 0.05069160461425781, 0.0580291748046875, 0.06536674499511719, 0.07270431518554688, 0.08004188537597656, 0.08737945556640625, 0.09471702575683594, 0.10205459594726562, 0.10939216613769531, 0.116729736328125, 0.12406730651855469, 0.13140487670898438, 0.13874244689941406, 0.14608001708984375, 0.15341758728027344, 0.16075515747070312, 0.1680927276611328, 0.1754302978515625, 0.1827678680419922, 0.19010543823242188, 0.19744300842285156, 0.20478057861328125, 0.21211814880371094, 0.21945571899414062, 0.2267932891845703, 0.234130859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 8.0, 11.0, 24.0, 26.0, 69.0, 193.0, 613.0, 2899.0, 487333.0, 553173.0, 3214.0, 629.0, 206.0, 63.0, 37.0, 20.0, 15.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.642852783203125, -1.59722900390625, -1.551605224609375, -1.5059814453125, -1.460357666015625, -1.41473388671875, -1.369110107421875, -1.323486328125, -1.277862548828125, -1.23223876953125, -1.186614990234375, -1.1409912109375, -1.095367431640625, -1.04974365234375, -1.004119873046875, -0.95849609375, -0.912872314453125, -0.86724853515625, -0.821624755859375, -0.7760009765625, -0.730377197265625, -0.68475341796875, -0.639129638671875, -0.593505859375, -0.547882080078125, -0.50225830078125, -0.456634521484375, -0.4110107421875, -0.365386962890625, -0.31976318359375, -0.274139404296875, -0.228515625, -0.182891845703125, -0.13726806640625, -0.091644287109375, -0.0460205078125, -0.000396728515625, 0.04522705078125, 0.090850830078125, 0.136474609375, 0.182098388671875, 0.22772216796875, 0.273345947265625, 0.3189697265625, 0.364593505859375, 0.41021728515625, 0.455841064453125, 0.50146484375, 0.547088623046875, 0.59271240234375, 0.638336181640625, 0.6839599609375, 0.729583740234375, 0.77520751953125, 0.820831298828125, 0.866455078125, 0.912078857421875, 0.95770263671875, 1.003326416015625, 1.0489501953125, 1.094573974609375, 1.14019775390625, 1.185821533203125, 1.2314453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 10.0, 13.0, 10.0, 27.0, 23.0, 23.0, 34.0, 61.0, 62.0, 72.0, 99.0, 112.0, 109.0, 56.0, 56.0, 40.0, 46.0, 21.0, 19.0, 19.0, 16.0, 11.0, 13.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012993812561035156, -0.00012536346912384033, -0.0001207888126373291, -0.00011621415615081787, -0.00011163949966430664, -0.00010706484317779541, -0.00010249018669128418, -9.791553020477295e-05, -9.334087371826172e-05, -8.876621723175049e-05, -8.419156074523926e-05, -7.961690425872803e-05, -7.50422477722168e-05, -7.046759128570557e-05, -6.589293479919434e-05, -6.13182783126831e-05, -5.6743621826171875e-05, -5.2168965339660645e-05, -4.7594308853149414e-05, -4.3019652366638184e-05, -3.844499588012695e-05, -3.387033939361572e-05, -2.9295682907104492e-05, -2.4721026420593262e-05, -2.014636993408203e-05, -1.55717134475708e-05, -1.099705696105957e-05, -6.42240047454834e-06, -1.8477439880371094e-06, 2.726912498474121e-06, 7.3015689849853516e-06, 1.1876225471496582e-05, 1.6450881958007812e-05, 2.1025538444519043e-05, 2.5600194931030273e-05, 3.0174851417541504e-05, 3.4749507904052734e-05, 3.9324164390563965e-05, 4.3898820877075195e-05, 4.8473477363586426e-05, 5.3048133850097656e-05, 5.762279033660889e-05, 6.219744682312012e-05, 6.677210330963135e-05, 7.134675979614258e-05, 7.592141628265381e-05, 8.049607276916504e-05, 8.507072925567627e-05, 8.96453857421875e-05, 9.422004222869873e-05, 9.879469871520996e-05, 0.00010336935520172119, 0.00010794401168823242, 0.00011251866817474365, 0.00011709332466125488, 0.00012166798114776611, 0.00012624263763427734, 0.00013081729412078857, 0.0001353919506072998, 0.00013996660709381104, 0.00014454126358032227, 0.0001491159200668335, 0.00015369057655334473, 0.00015826523303985596, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 12.0, 14.0, 27.0, 40.0, 87.0, 179.0, 445.0, 1241.0, 6435.0, 559971.0, 471827.0, 6111.0, 1263.0, 416.0, 198.0, 99.0, 78.0, 35.0, 29.0, 13.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92724609375, -0.8915634155273438, -0.8558807373046875, -0.8201980590820312, -0.784515380859375, -0.7488327026367188, -0.7131500244140625, -0.6774673461914062, -0.64178466796875, -0.6061019897460938, -0.5704193115234375, -0.5347366333007812, -0.499053955078125, -0.46337127685546875, -0.4276885986328125, -0.39200592041015625, -0.3563232421875, -0.32064056396484375, -0.2849578857421875, -0.24927520751953125, -0.213592529296875, -0.17790985107421875, -0.1422271728515625, -0.10654449462890625, -0.07086181640625, -0.03517913818359375, 0.0005035400390625, 0.03618621826171875, 0.071868896484375, 0.10755157470703125, 0.1432342529296875, 0.17891693115234375, 0.214599609375, 0.25028228759765625, 0.2859649658203125, 0.32164764404296875, 0.357330322265625, 0.39301300048828125, 0.4286956787109375, 0.46437835693359375, 0.50006103515625, 0.5357437133789062, 0.5714263916015625, 0.6071090698242188, 0.642791748046875, 0.6784744262695312, 0.7141571044921875, 0.7498397827148438, 0.7855224609375, 0.8212051391601562, 0.8568878173828125, 0.8925704956054688, 0.928253173828125, 0.9639358520507812, 0.9996185302734375, 1.0353012084960938, 1.07098388671875, 1.1066665649414062, 1.1423492431640625, 1.1780319213867188, 1.213714599609375, 1.2493972778320312, 1.2850799560546875, 1.3207626342773438, 1.3564453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 12.0, 6.0, 22.0, 47.0, 112.0, 305.0, 287.0, 123.0, 49.0, 18.0, 7.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4099082946777344, -0.39037322998046875, -0.3708381652832031, -0.3513031005859375, -0.3317680358886719, -0.31223297119140625, -0.2926979064941406, -0.273162841796875, -0.2536277770996094, -0.23409271240234375, -0.21455764770507812, -0.1950225830078125, -0.17548751831054688, -0.15595245361328125, -0.13641738891601562, -0.11688232421875, -0.09734725952148438, -0.07781219482421875, -0.058277130126953125, -0.0387420654296875, -0.019207000732421875, 0.00032806396484375, 0.019863128662109375, 0.039398193359375, 0.058933258056640625, 0.07846832275390625, 0.09800338745117188, 0.1175384521484375, 0.13707351684570312, 0.15660858154296875, 0.17614364624023438, 0.1956787109375, 0.21521377563476562, 0.23474884033203125, 0.2542839050292969, 0.2738189697265625, 0.2933540344238281, 0.31288909912109375, 0.3324241638183594, 0.351959228515625, 0.3714942932128906, 0.39102935791015625, 0.4105644226074219, 0.4300994873046875, 0.4496345520019531, 0.46916961669921875, 0.4887046813964844, 0.50823974609375, 0.5277748107910156, 0.5473098754882812, 0.5668449401855469, 0.5863800048828125, 0.6059150695800781, 0.6254501342773438, 0.6449851989746094, 0.664520263671875, 0.6840553283691406, 0.7035903930664062, 0.7231254577636719, 0.7426605224609375, 0.7621955871582031, 0.7817306518554688, 0.8012657165527344, 0.82080078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 11.0, 53.0, 684.0, 227.0, 29.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.582576274871826, -2.1321871280670166, -1.6817981004714966, -1.2314090728759766, -0.781019926071167, -0.3306307792663574, 0.11975812911987305, 0.5701472759246826, 1.0205364227294922, 1.4709255695343018, 1.9213145971298218, 2.371703624725342, 2.8220927715301514, 3.272481918334961, 3.7228708267211914, 4.173259735107422, 4.6236491203308105, 5.074038028717041, 5.52442741394043, 5.97481632232666, 6.425205230712891, 6.875594615936279, 7.32598352432251, 7.776372909545898, 8.226761817932129, 8.67715072631836, 9.12753963470459, 9.57792854309082, 10.028318405151367, 10.478707313537598, 10.929096221923828, 11.379485130310059, 11.829874038696289, 12.28026294708252, 12.73065185546875, 13.181041717529297, 13.631430625915527, 14.081819534301758, 14.532208442687988, 14.982597351074219, 15.432987213134766, 15.883376121520996, 16.333765029907227, 16.784154891967773, 17.234542846679688, 17.684932708740234, 18.13532257080078, 18.585710525512695, 19.03609848022461, 19.486488342285156, 19.93687629699707, 20.387266159057617, 20.83765411376953, 21.288043975830078, 21.738433837890625, 22.18882179260254, 22.639211654663086, 23.089601516723633, 23.539989471435547, 23.990379333496094, 24.440767288208008, 24.891157150268555, 25.34154510498047, 25.791934967041016, 26.242324829101562]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 5.0, 12.0, 17.0, 18.0, 21.0, 24.0, 41.0, 46.0, 46.0, 46.0, 53.0, 61.0, 71.0, 59.0, 66.0, 77.0, 53.0, 45.0, 52.0, 42.0, 25.0, 32.0, 23.0, 11.0, 13.0, 14.0, 3.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.796495199203491, -2.7146565914154053, -2.6328182220458984, -2.5509796142578125, -2.4691410064697266, -2.3873026371002197, -2.305464029312134, -2.223625659942627, -2.141787052154541, -2.059948444366455, -1.9781100749969482, -1.8962714672088623, -1.814432978630066, -1.7325944900512695, -1.6507558822631836, -1.5689173936843872, -1.4870789051055908, -1.4052404165267944, -1.323401927947998, -1.241563320159912, -1.1597248315811157, -1.0778863430023193, -0.9960477948188782, -0.914209246635437, -0.8323707580566406, -0.7505322694778442, -0.6686937212944031, -0.5868551731109619, -0.5050166845321655, -0.42317816615104675, -0.341339647769928, -0.2595010995864868, -0.17766261100769043, -0.09582409262657166, -0.01398557424545288, 0.0678529441356659, 0.14969146251678467, 0.23152998089790344, 0.3133684992790222, 0.3952070474624634, 0.47704553604125977, 0.5588840246200562, 0.6407225728034973, 0.7225611209869385, 0.8043996095657349, 0.8862380981445312, 0.9680766463279724, 1.0499151945114136, 1.13175368309021, 1.2135921716690063, 1.2954306602478027, 1.3772692680358887, 1.459107756614685, 1.5409462451934814, 1.6227848529815674, 1.7046233415603638, 1.7864618301391602, 1.8683003187179565, 1.950138807296753, 2.031977415084839, 2.1138157844543457, 2.1956543922424316, 2.2774930000305176, 2.3593316078186035, 2.4411699771881104]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 7.0, 5.0, 19.0, 34.0, 81.0, 171.0, 392.0, 1083.0, 10233.0, 4158523.0, 22225.0, 1044.0, 262.0, 96.0, 41.0, 25.0, 17.0, 11.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4140625, -5.25750732421875, -5.1009521484375, -4.94439697265625, -4.787841796875, -4.63128662109375, -4.4747314453125, -4.31817626953125, -4.16162109375, -4.00506591796875, -3.8485107421875, -3.69195556640625, -3.535400390625, -3.37884521484375, -3.2222900390625, -3.06573486328125, -2.9091796875, -2.75262451171875, -2.5960693359375, -2.43951416015625, -2.282958984375, -2.12640380859375, -1.9698486328125, -1.81329345703125, -1.65673828125, -1.50018310546875, -1.3436279296875, -1.18707275390625, -1.030517578125, -0.87396240234375, -0.7174072265625, -0.56085205078125, -0.404296875, -0.24774169921875, -0.0911865234375, 0.06536865234375, 0.221923828125, 0.37847900390625, 0.5350341796875, 0.69158935546875, 0.84814453125, 1.00469970703125, 1.1612548828125, 1.31781005859375, 1.474365234375, 1.63092041015625, 1.7874755859375, 1.94403076171875, 2.1005859375, 2.25714111328125, 2.4136962890625, 2.57025146484375, 2.726806640625, 2.88336181640625, 3.0399169921875, 3.19647216796875, 3.35302734375, 3.50958251953125, 3.6661376953125, 3.82269287109375, 3.979248046875, 4.13580322265625, 4.2923583984375, 4.44891357421875, 4.60546875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 14.0, 10.0, 27.0, 58.0, 83.0, 114.0, 137.0, 134.0, 133.0, 98.0, 72.0, 44.0, 23.0, 15.0, 13.0, 9.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.1221761703491211, -0.11861991882324219, -0.11506366729736328, -0.11150741577148438, -0.10795116424560547, -0.10439491271972656, -0.10083866119384766, -0.09728240966796875, -0.09372615814208984, -0.09016990661621094, -0.08661365509033203, -0.08305740356445312, -0.07950115203857422, -0.07594490051269531, -0.0723886489868164, -0.0688323974609375, -0.0652761459350586, -0.06171989440917969, -0.05816364288330078, -0.054607391357421875, -0.05105113983154297, -0.04749488830566406, -0.043938636779785156, -0.04038238525390625, -0.036826133728027344, -0.03326988220214844, -0.02971363067626953, -0.026157379150390625, -0.02260112762451172, -0.019044876098632812, -0.015488624572753906, -0.011932373046875, -0.008376121520996094, -0.0048198699951171875, -0.0012636184692382812, 0.002292633056640625, 0.005848884582519531, 0.009405136108398438, 0.012961387634277344, 0.01651763916015625, 0.020073890686035156, 0.023630142211914062, 0.02718639373779297, 0.030742645263671875, 0.03429889678955078, 0.03785514831542969, 0.041411399841308594, 0.0449676513671875, 0.048523902893066406, 0.05208015441894531, 0.05563640594482422, 0.059192657470703125, 0.06274890899658203, 0.06630516052246094, 0.06986141204833984, 0.07341766357421875, 0.07697391510009766, 0.08053016662597656, 0.08408641815185547, 0.08764266967773438, 0.09119892120361328, 0.09475517272949219, 0.0983114242553711, 0.10186767578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 13.0, 10.0, 16.0, 12.0, 27.0, 32.0, 28.0, 45.0, 51.0, 66.0, 91.0, 128.0, 158.0, 251.0, 619.0, 5357.0, 2198501.0, 1979961.0, 7089.0, 862.0, 283.0, 165.0, 129.0, 96.0, 75.0, 49.0, 36.0, 27.0, 19.0, 17.0, 17.0, 12.0, 9.0, 9.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.357421875, -2.2813720703125, -2.205322265625, -2.1292724609375, -2.05322265625, -1.9771728515625, -1.901123046875, -1.8250732421875, -1.7490234375, -1.6729736328125, -1.596923828125, -1.5208740234375, -1.44482421875, -1.3687744140625, -1.292724609375, -1.2166748046875, -1.140625, -1.0645751953125, -0.988525390625, -0.9124755859375, -0.83642578125, -0.7603759765625, -0.684326171875, -0.6082763671875, -0.5322265625, -0.4561767578125, -0.380126953125, -0.3040771484375, -0.22802734375, -0.1519775390625, -0.075927734375, 0.0001220703125, 0.076171875, 0.1522216796875, 0.228271484375, 0.3043212890625, 0.38037109375, 0.4564208984375, 0.532470703125, 0.6085205078125, 0.6845703125, 0.7606201171875, 0.836669921875, 0.9127197265625, 0.98876953125, 1.0648193359375, 1.140869140625, 1.2169189453125, 1.29296875, 1.3690185546875, 1.445068359375, 1.5211181640625, 1.59716796875, 1.6732177734375, 1.749267578125, 1.8253173828125, 1.9013671875, 1.9774169921875, 2.053466796875, 2.1295166015625, 2.20556640625, 2.2816162109375, 2.357666015625, 2.4337158203125, 2.509765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 13.0, 11.0, 24.0, 53.0, 84.0, 219.0, 654.0, 2022.0, 524.0, 180.0, 83.0, 52.0, 50.0, 20.0, 22.0, 9.0, 6.0, 9.0, 12.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.243408203125, -0.23723602294921875, -0.2310638427734375, -0.22489166259765625, -0.218719482421875, -0.21254730224609375, -0.2063751220703125, -0.20020294189453125, -0.19403076171875, -0.18785858154296875, -0.1816864013671875, -0.17551422119140625, -0.169342041015625, -0.16316986083984375, -0.1569976806640625, -0.15082550048828125, -0.1446533203125, -0.13848114013671875, -0.1323089599609375, -0.12613677978515625, -0.119964599609375, -0.11379241943359375, -0.1076202392578125, -0.10144805908203125, -0.09527587890625, -0.08910369873046875, -0.0829315185546875, -0.07675933837890625, -0.070587158203125, -0.06441497802734375, -0.0582427978515625, -0.05207061767578125, -0.0458984375, -0.03972625732421875, -0.0335540771484375, -0.02738189697265625, -0.021209716796875, -0.01503753662109375, -0.0088653564453125, -0.00269317626953125, 0.00347900390625, 0.00965118408203125, 0.0158233642578125, 0.02199554443359375, 0.028167724609375, 0.03433990478515625, 0.0405120849609375, 0.04668426513671875, 0.0528564453125, 0.05902862548828125, 0.0652008056640625, 0.07137298583984375, 0.077545166015625, 0.08371734619140625, 0.0898895263671875, 0.09606170654296875, 0.10223388671875, 0.10840606689453125, 0.1145782470703125, 0.12075042724609375, 0.126922607421875, 0.13309478759765625, 0.1392669677734375, 0.14543914794921875, 0.151611328125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 13.0, 39.0, 116.0, 304.0, 311.0, 125.0, 39.0, 21.0, 15.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.244680643081665, -2.154935598373413, -2.065190553665161, -1.9754453897476196, -1.8857003450393677, -1.7959553003311157, -1.7062101364135742, -1.6164650917053223, -1.5267200469970703, -1.4369750022888184, -1.3472299575805664, -1.257484793663025, -1.167739748954773, -1.077994704246521, -0.9882495999336243, -0.8985044956207275, -0.8087594509124756, -0.7190144062042236, -0.6292693018913269, -0.5395241975784302, -0.4497791528701782, -0.3600340783596039, -0.27028900384902954, -0.1805438995361328, -0.09079885482788086, -0.0010537803173065186, 0.08869129419326782, 0.17843636870384216, 0.2681814432144165, 0.35792651772499084, 0.4476715922355652, 0.5374166965484619, 0.627161979675293, 0.7169070243835449, 0.8066521286964417, 0.8963972330093384, 0.9861422777175903, 1.0758873224258423, 1.1656324863433838, 1.2553775310516357, 1.3451225757598877, 1.4348676204681396, 1.5246126651763916, 1.614357829093933, 1.704102873802185, 1.793847918510437, 1.8835930824279785, 1.9733381271362305, 2.0630831718444824, 2.1528282165527344, 2.2425732612609863, 2.3323183059692383, 2.4220633506774902, 2.5118086338043213, 2.6015536785125732, 2.691298723220825, 2.781043767929077, 2.870788812637329, 2.960533857345581, 3.050278902053833, 3.140024185180664, 3.229769229888916, 3.319514274597168, 3.40925931930542, 3.499004364013672]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 8.0, 6.0, 12.0, 9.0, 22.0, 22.0, 42.0, 39.0, 52.0, 58.0, 56.0, 75.0, 68.0, 81.0, 87.0, 68.0, 61.0, 51.0, 44.0, 29.0, 27.0, 31.0, 14.0, 9.0, 8.0, 6.0, 9.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9387330412864685, -0.9107680320739746, -0.8828029632568359, -0.8548378944396973, -0.8268728852272034, -0.7989078760147095, -0.7709428071975708, -0.7429777383804321, -0.7150127291679382, -0.6870477199554443, -0.6590826511383057, -0.631117582321167, -0.6031525731086731, -0.5751875638961792, -0.5472224950790405, -0.5192574262619019, -0.49129241704940796, -0.4633273780345917, -0.4353623390197754, -0.4073973000049591, -0.3794322609901428, -0.35146722197532654, -0.32350218296051025, -0.29553714394569397, -0.2675721049308777, -0.2396070659160614, -0.21164202690124512, -0.18367698788642883, -0.15571194887161255, -0.12774690985679626, -0.09978187084197998, -0.0718168318271637, -0.04385173320770264, -0.015886694192886353, 0.012078344821929932, 0.040043383836746216, 0.0680084228515625, 0.09597346186637878, 0.12393850088119507, 0.15190353989601135, 0.17986857891082764, 0.20783361792564392, 0.2357986569404602, 0.2637636959552765, 0.2917287349700928, 0.31969377398490906, 0.34765881299972534, 0.3756238520145416, 0.4035888910293579, 0.4315539300441742, 0.4595189690589905, 0.48748400807380676, 0.515449047088623, 0.5434141159057617, 0.5713791251182556, 0.5993441343307495, 0.6273092031478882, 0.6552742719650269, 0.6832392811775208, 0.7112042903900146, 0.7391693592071533, 0.767134428024292, 0.7950994372367859, 0.8230644464492798, 0.8510295152664185]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 9.0, 9.0, 9.0, 2.0, 11.0, 14.0, 13.0, 15.0, 17.0, 42.0, 43.0, 80.0, 99.0, 141.0, 257.0, 423.0, 731.0, 1485.0, 3401.0, 9681.0, 45303.0, 338752.0, 541677.0, 82781.0, 14817.0, 4536.0, 1814.0, 919.0, 530.0, 312.0, 178.0, 114.0, 86.0, 62.0, 37.0, 27.0, 19.0, 20.0, 17.0, 10.0, 7.0, 10.0, 7.0, 8.0, 7.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.75537109375, -0.7325897216796875, -0.709808349609375, -0.6870269775390625, -0.66424560546875, -0.6414642333984375, -0.618682861328125, -0.5959014892578125, -0.5731201171875, -0.5503387451171875, -0.527557373046875, -0.5047760009765625, -0.48199462890625, -0.4592132568359375, -0.436431884765625, -0.4136505126953125, -0.390869140625, -0.3680877685546875, -0.345306396484375, -0.3225250244140625, -0.29974365234375, -0.2769622802734375, -0.254180908203125, -0.2313995361328125, -0.2086181640625, -0.1858367919921875, -0.163055419921875, -0.1402740478515625, -0.11749267578125, -0.0947113037109375, -0.071929931640625, -0.0491485595703125, -0.0263671875, -0.0035858154296875, 0.019195556640625, 0.0419769287109375, 0.06475830078125, 0.0875396728515625, 0.110321044921875, 0.1331024169921875, 0.1558837890625, 0.1786651611328125, 0.201446533203125, 0.2242279052734375, 0.24700927734375, 0.2697906494140625, 0.292572021484375, 0.3153533935546875, 0.338134765625, 0.3609161376953125, 0.383697509765625, 0.4064788818359375, 0.42926025390625, 0.4520416259765625, 0.474822998046875, 0.4976043701171875, 0.5203857421875, 0.5431671142578125, 0.565948486328125, 0.5887298583984375, 0.61151123046875, 0.6342926025390625, 0.657073974609375, 0.6798553466796875, 0.70263671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 10.0, 20.0, 50.0, 54.0, 84.0, 112.0, 119.0, 128.0, 122.0, 82.0, 65.0, 50.0, 28.0, 28.0, 15.0, 10.0, 5.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10821533203125, -0.10505867004394531, -0.10190200805664062, -0.09874534606933594, -0.09558868408203125, -0.09243202209472656, -0.08927536010742188, -0.08611869812011719, -0.0829620361328125, -0.07980537414550781, -0.07664871215820312, -0.07349205017089844, -0.07033538818359375, -0.06717872619628906, -0.06402206420898438, -0.06086540222167969, -0.057708740234375, -0.05455207824707031, -0.051395416259765625, -0.04823875427246094, -0.04508209228515625, -0.04192543029785156, -0.038768768310546875, -0.03561210632324219, -0.0324554443359375, -0.029298782348632812, -0.026142120361328125, -0.022985458374023438, -0.01982879638671875, -0.016672134399414062, -0.013515472412109375, -0.010358810424804688, -0.0072021484375, -0.0040454864501953125, -0.000888824462890625, 0.0022678375244140625, 0.00542449951171875, 0.008581161499023438, 0.011737823486328125, 0.014894485473632812, 0.0180511474609375, 0.021207809448242188, 0.024364471435546875, 0.027521133422851562, 0.03067779541015625, 0.03383445739746094, 0.036991119384765625, 0.04014778137207031, 0.043304443359375, 0.04646110534667969, 0.049617767333984375, 0.05277442932128906, 0.05593109130859375, 0.05908775329589844, 0.062244415283203125, 0.06540107727050781, 0.0685577392578125, 0.07171440124511719, 0.07487106323242188, 0.07802772521972656, 0.08118438720703125, 0.08434104919433594, 0.08749771118164062, 0.09065437316894531, 0.09381103515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 11.0, 18.0, 20.0, 30.0, 33.0, 45.0, 73.0, 157.0, 229.0, 509.0, 1066.0, 3143.0, 12878.0, 80590.0, 534803.0, 355994.0, 46104.0, 8616.0, 2345.0, 884.0, 390.0, 224.0, 106.0, 86.0, 53.0, 29.0, 35.0, 19.0, 15.0, 10.0, 4.0, 7.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.5845718383789062, -0.5656280517578125, -0.5466842651367188, -0.527740478515625, -0.5087966918945312, -0.4898529052734375, -0.47090911865234375, -0.45196533203125, -0.43302154541015625, -0.4140777587890625, -0.39513397216796875, -0.376190185546875, -0.35724639892578125, -0.3383026123046875, -0.31935882568359375, -0.3004150390625, -0.28147125244140625, -0.2625274658203125, -0.24358367919921875, -0.224639892578125, -0.20569610595703125, -0.1867523193359375, -0.16780853271484375, -0.14886474609375, -0.12992095947265625, -0.1109771728515625, -0.09203338623046875, -0.073089599609375, -0.05414581298828125, -0.0352020263671875, -0.01625823974609375, 0.002685546875, 0.02162933349609375, 0.0405731201171875, 0.05951690673828125, 0.078460693359375, 0.09740447998046875, 0.1163482666015625, 0.13529205322265625, 0.15423583984375, 0.17317962646484375, 0.1921234130859375, 0.21106719970703125, 0.230010986328125, 0.24895477294921875, 0.2678985595703125, 0.28684234619140625, 0.3057861328125, 0.32472991943359375, 0.3436737060546875, 0.36261749267578125, 0.381561279296875, 0.40050506591796875, 0.4194488525390625, 0.43839263916015625, 0.45733642578125, 0.47628021240234375, 0.4952239990234375, 0.5141677856445312, 0.533111572265625, 0.5520553588867188, 0.5709991455078125, 0.5899429321289062, 0.60888671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 11.0, 19.0, 12.0, 14.0, 28.0, 25.0, 29.0, 20.0, 25.0, 32.0, 39.0, 28.0, 51.0, 51.0, 49.0, 48.0, 52.0, 38.0, 48.0, 44.0, 42.0, 38.0, 34.0, 25.0, 28.0, 20.0, 20.0, 20.0, 13.0, 18.0, 8.0, 9.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2459716796875, -0.23764991760253906, -0.22932815551757812, -0.2210063934326172, -0.21268463134765625, -0.2043628692626953, -0.19604110717773438, -0.18771934509277344, -0.1793975830078125, -0.17107582092285156, -0.16275405883789062, -0.1544322967529297, -0.14611053466796875, -0.1377887725830078, -0.12946701049804688, -0.12114524841308594, -0.112823486328125, -0.10450172424316406, -0.09617996215820312, -0.08785820007324219, -0.07953643798828125, -0.07121467590332031, -0.06289291381835938, -0.05457115173339844, -0.0462493896484375, -0.03792762756347656, -0.029605865478515625, -0.021284103393554688, -0.01296234130859375, -0.0046405792236328125, 0.003681182861328125, 0.012002944946289062, 0.02032470703125, 0.028646469116210938, 0.036968231201171875, 0.04528999328613281, 0.05361175537109375, 0.06193351745605469, 0.07025527954101562, 0.07857704162597656, 0.0868988037109375, 0.09522056579589844, 0.10354232788085938, 0.11186408996582031, 0.12018585205078125, 0.1285076141357422, 0.13682937622070312, 0.14515113830566406, 0.153472900390625, 0.16179466247558594, 0.17011642456054688, 0.1784381866455078, 0.18675994873046875, 0.1950817108154297, 0.20340347290039062, 0.21172523498535156, 0.2200469970703125, 0.22836875915527344, 0.23669052124023438, 0.2450122833251953, 0.25333404541015625, 0.2616558074951172, 0.2699775695800781, 0.27829933166503906, 0.28662109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 6.0, 9.0, 16.0, 19.0, 66.0, 148.0, 343.0, 2027.0, 49772.0, 985876.0, 9026.0, 866.0, 218.0, 87.0, 43.0, 23.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.951171875, -1.902740478515625, -1.85430908203125, -1.805877685546875, -1.7574462890625, -1.709014892578125, -1.66058349609375, -1.612152099609375, -1.563720703125, -1.515289306640625, -1.46685791015625, -1.418426513671875, -1.3699951171875, -1.321563720703125, -1.27313232421875, -1.224700927734375, -1.17626953125, -1.127838134765625, -1.07940673828125, -1.030975341796875, -0.9825439453125, -0.934112548828125, -0.88568115234375, -0.837249755859375, -0.788818359375, -0.740386962890625, -0.69195556640625, -0.643524169921875, -0.5950927734375, -0.546661376953125, -0.49822998046875, -0.449798583984375, -0.4013671875, -0.352935791015625, -0.30450439453125, -0.256072998046875, -0.2076416015625, -0.159210205078125, -0.11077880859375, -0.062347412109375, -0.013916015625, 0.034515380859375, 0.08294677734375, 0.131378173828125, 0.1798095703125, 0.228240966796875, 0.27667236328125, 0.325103759765625, 0.37353515625, 0.421966552734375, 0.47039794921875, 0.518829345703125, 0.5672607421875, 0.615692138671875, 0.66412353515625, 0.712554931640625, 0.760986328125, 0.809417724609375, 0.85784912109375, 0.906280517578125, 0.9547119140625, 1.003143310546875, 1.05157470703125, 1.100006103515625, 1.1484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 16.0, 12.0, 28.0, 22.0, 39.0, 65.0, 61.0, 127.0, 132.0, 112.0, 99.0, 69.0, 55.0, 32.0, 30.0, 23.0, 10.0, 14.0, 9.0, 8.0, 2.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013816356658935547, -0.0001340806484222412, -0.00012999773025512695, -0.0001259148120880127, -0.00012183189392089844, -0.00011774897575378418, -0.00011366605758666992, -0.00010958313941955566, -0.0001055002212524414, -0.00010141730308532715, -9.733438491821289e-05, -9.325146675109863e-05, -8.916854858398438e-05, -8.508563041687012e-05, -8.100271224975586e-05, -7.69197940826416e-05, -7.283687591552734e-05, -6.875395774841309e-05, -6.467103958129883e-05, -6.058812141418457e-05, -5.650520324707031e-05, -5.2422285079956055e-05, -4.83393669128418e-05, -4.425644874572754e-05, -4.017353057861328e-05, -3.6090612411499023e-05, -3.2007694244384766e-05, -2.7924776077270508e-05, -2.384185791015625e-05, -1.9758939743041992e-05, -1.5676021575927734e-05, -1.1593103408813477e-05, -7.510185241699219e-06, -3.427267074584961e-06, 6.556510925292969e-07, 4.738569259643555e-06, 8.821487426757812e-06, 1.290440559387207e-05, 1.6987323760986328e-05, 2.1070241928100586e-05, 2.5153160095214844e-05, 2.92360782623291e-05, 3.331899642944336e-05, 3.740191459655762e-05, 4.1484832763671875e-05, 4.556775093078613e-05, 4.965066909790039e-05, 5.373358726501465e-05, 5.7816505432128906e-05, 6.189942359924316e-05, 6.598234176635742e-05, 7.006525993347168e-05, 7.414817810058594e-05, 7.82310962677002e-05, 8.231401443481445e-05, 8.639693260192871e-05, 9.047985076904297e-05, 9.456276893615723e-05, 9.864568710327148e-05, 0.00010272860527038574, 0.0001068115234375, 0.00011089444160461426, 0.00011497735977172852, 0.00011906027793884277, 0.00012314319610595703]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 16.0, 25.0, 29.0, 57.0, 75.0, 151.0, 284.0, 694.0, 1878.0, 6137.0, 29552.0, 652911.0, 330191.0, 19332.0, 4668.0, 1442.0, 549.0, 266.0, 103.0, 63.0, 45.0, 20.0, 14.0, 9.0, 3.0, 5.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.4602508544921875, -0.442474365234375, -0.4246978759765625, -0.40692138671875, -0.3891448974609375, -0.371368408203125, -0.3535919189453125, -0.3358154296875, -0.3180389404296875, -0.300262451171875, -0.2824859619140625, -0.26470947265625, -0.2469329833984375, -0.229156494140625, -0.2113800048828125, -0.193603515625, -0.1758270263671875, -0.158050537109375, -0.1402740478515625, -0.12249755859375, -0.1047210693359375, -0.086944580078125, -0.0691680908203125, -0.0513916015625, -0.0336151123046875, -0.015838623046875, 0.0019378662109375, 0.01971435546875, 0.0374908447265625, 0.055267333984375, 0.0730438232421875, 0.0908203125, 0.1085968017578125, 0.126373291015625, 0.1441497802734375, 0.16192626953125, 0.1797027587890625, 0.197479248046875, 0.2152557373046875, 0.2330322265625, 0.2508087158203125, 0.268585205078125, 0.2863616943359375, 0.30413818359375, 0.3219146728515625, 0.339691162109375, 0.3574676513671875, 0.375244140625, 0.3930206298828125, 0.410797119140625, 0.4285736083984375, 0.44635009765625, 0.4641265869140625, 0.481903076171875, 0.4996795654296875, 0.5174560546875, 0.5352325439453125, 0.553009033203125, 0.5707855224609375, 0.58856201171875, 0.6063385009765625, 0.624114990234375, 0.6418914794921875, 0.65966796875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 10.0, 15.0, 19.0, 45.0, 71.0, 84.0, 158.0, 156.0, 141.0, 112.0, 69.0, 35.0, 24.0, 12.0, 4.0, 5.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.330322265625, -0.32177162170410156, -0.3132209777832031, -0.3046703338623047, -0.29611968994140625, -0.2875690460205078, -0.2790184020996094, -0.27046775817871094, -0.2619171142578125, -0.25336647033691406, -0.24481582641601562, -0.2362651824951172, -0.22771453857421875, -0.2191638946533203, -0.21061325073242188, -0.20206260681152344, -0.193511962890625, -0.18496131896972656, -0.17641067504882812, -0.1678600311279297, -0.15930938720703125, -0.1507587432861328, -0.14220809936523438, -0.13365745544433594, -0.1251068115234375, -0.11655616760253906, -0.10800552368164062, -0.09945487976074219, -0.09090423583984375, -0.08235359191894531, -0.07380294799804688, -0.06525230407714844, -0.05670166015625, -0.04815101623535156, -0.039600372314453125, -0.031049728393554688, -0.02249908447265625, -0.013948440551757812, -0.005397796630859375, 0.0031528472900390625, 0.0117034912109375, 0.020254135131835938, 0.028804779052734375, 0.03735542297363281, 0.04590606689453125, 0.05445671081542969, 0.06300735473632812, 0.07155799865722656, 0.080108642578125, 0.08865928649902344, 0.09720993041992188, 0.10576057434082031, 0.11431121826171875, 0.12286186218261719, 0.13141250610351562, 0.13996315002441406, 0.1485137939453125, 0.15706443786621094, 0.16561508178710938, 0.1741657257080078, 0.18271636962890625, 0.1912670135498047, 0.19981765747070312, 0.20836830139160156, 0.2169189453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 20.0, 74.0, 323.0, 441.0, 108.0, 26.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.791337013244629, -13.51680850982666, -13.242279052734375, -12.967750549316406, -12.693221092224121, -12.418692588806152, -12.144163131713867, -11.869634628295898, -11.59510612487793, -11.320577621459961, -11.046048164367676, -10.771519660949707, -10.496990203857422, -10.222461700439453, -9.947932243347168, -9.6734037399292, -9.398874282836914, -9.124345779418945, -8.84981632232666, -8.575287818908691, -8.300758361816406, -8.026229858398438, -7.7517008781433105, -7.477171897888184, -7.202642917633057, -6.92811393737793, -6.653584957122803, -6.379055976867676, -6.104527473449707, -5.829998016357422, -5.555469512939453, -5.280940532684326, -5.006411552429199, -4.731882572174072, -4.457353591918945, -4.182824611663818, -3.9082958698272705, -3.6337668895721436, -3.3592381477355957, -3.0847091674804688, -2.810180425643921, -2.535651445388794, -2.261122703552246, -1.9865937232971191, -1.7120647430419922, -1.4375357627868652, -1.1630069017410278, -0.8884780406951904, -0.6139490604400635, -0.3394201397895813, -0.06489121913909912, 0.20963770151138306, 0.48416662216186523, 0.7586956024169922, 1.0332244634628296, 1.307753324508667, 1.582282304763794, 1.856811285018921, 2.1313400268554688, 2.4058690071105957, 2.6803979873657227, 2.9549269676208496, 3.2294559478759766, 3.5039846897125244, 3.7785136699676514]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 8.0, 15.0, 16.0, 23.0, 25.0, 33.0, 55.0, 42.0, 49.0, 58.0, 56.0, 80.0, 77.0, 65.0, 64.0, 55.0, 45.0, 44.0, 27.0, 36.0, 31.0, 26.0, 18.0, 15.0, 11.0, 5.0, 7.0, 6.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5152783393859863, -2.426679849624634, -2.3380813598632812, -2.2494828701019287, -2.160884380340576, -2.0722861289978027, -1.9836876392364502, -1.8950891494750977, -1.8064906597137451, -1.7178921699523926, -1.62929368019104, -1.540695309638977, -1.4520968198776245, -1.363498330116272, -1.274899959564209, -1.1863014698028564, -1.097702980041504, -1.0091044902801514, -0.9205060601234436, -0.8319076299667358, -0.7433091402053833, -0.6547106504440308, -0.566112220287323, -0.47751379013061523, -0.3889153003692627, -0.30031684041023254, -0.2117183804512024, -0.12311992049217224, -0.03452146053314209, 0.05407699942588806, 0.1426754593849182, 0.23127388954162598, 0.3198723793029785, 0.40847083926200867, 0.4970692992210388, 0.5856677293777466, 0.6742662191390991, 0.7628647089004517, 0.8514631390571594, 0.9400615692138672, 1.0286600589752197, 1.1172585487365723, 1.2058570384979248, 1.2944554090499878, 1.3830538988113403, 1.4716523885726929, 1.5602507591247559, 1.6488492488861084, 1.737447738647461, 1.8260462284088135, 1.914644718170166, 2.0032432079315186, 2.091841697692871, 2.1804399490356445, 2.269038438796997, 2.3576369285583496, 2.446235418319702, 2.5348339080810547, 2.6234323978424072, 2.7120308876037598, 2.800629138946533, 2.8892276287078857, 2.9778261184692383, 3.066424608230591, 3.1550230979919434]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 5.0, 7.0, 7.0, 9.0, 12.0, 12.0, 18.0, 22.0, 34.0, 42.0, 60.0, 82.0, 120.0, 171.0, 271.0, 475.0, 992.0, 2167.0, 6326.0, 28143.0, 375996.0, 3689679.0, 71808.0, 11951.0, 3389.0, 1309.0, 544.0, 238.0, 142.0, 88.0, 60.0, 36.0, 22.0, 14.0, 8.0, 4.0, 5.0, 5.0, 0.0, 2.0, 2.0], "bins": [-1.7431640625, -1.7037429809570312, -1.6643218994140625, -1.6249008178710938, -1.585479736328125, -1.5460586547851562, -1.5066375732421875, -1.4672164916992188, -1.42779541015625, -1.3883743286132812, -1.3489532470703125, -1.3095321655273438, -1.270111083984375, -1.2306900024414062, -1.1912689208984375, -1.1518478393554688, -1.1124267578125, -1.0730056762695312, -1.0335845947265625, -0.9941635131835938, -0.954742431640625, -0.9153213500976562, -0.8759002685546875, -0.8364791870117188, -0.79705810546875, -0.7576370239257812, -0.7182159423828125, -0.6787948608398438, -0.639373779296875, -0.5999526977539062, -0.5605316162109375, -0.5211105346679688, -0.481689453125, -0.44226837158203125, -0.4028472900390625, -0.36342620849609375, -0.324005126953125, -0.28458404541015625, -0.2451629638671875, -0.20574188232421875, -0.16632080078125, -0.12689971923828125, -0.0874786376953125, -0.04805755615234375, -0.008636474609375, 0.03078460693359375, 0.0702056884765625, 0.10962677001953125, 0.1490478515625, 0.18846893310546875, 0.2278900146484375, 0.26731109619140625, 0.306732177734375, 0.34615325927734375, 0.3855743408203125, 0.42499542236328125, 0.46441650390625, 0.5038375854492188, 0.5432586669921875, 0.5826797485351562, 0.622100830078125, 0.6615219116210938, 0.7009429931640625, 0.7403640747070312, 0.77978515625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 2.0, 6.0, 11.0, 18.0, 23.0, 34.0, 44.0, 56.0, 75.0, 83.0, 100.0, 68.0, 106.0, 85.0, 64.0, 58.0, 48.0, 35.0, 17.0, 19.0, 12.0, 9.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10906982421875, -0.10572052001953125, -0.1023712158203125, -0.09902191162109375, -0.095672607421875, -0.09232330322265625, -0.0889739990234375, -0.08562469482421875, -0.082275390625, -0.07892608642578125, -0.0755767822265625, -0.07222747802734375, -0.068878173828125, -0.06552886962890625, -0.0621795654296875, -0.05883026123046875, -0.05548095703125, -0.05213165283203125, -0.0487823486328125, -0.04543304443359375, -0.042083740234375, -0.03873443603515625, -0.0353851318359375, -0.03203582763671875, -0.0286865234375, -0.02533721923828125, -0.0219879150390625, -0.01863861083984375, -0.015289306640625, -0.01194000244140625, -0.0085906982421875, -0.00524139404296875, -0.00189208984375, 0.00145721435546875, 0.0048065185546875, 0.00815582275390625, 0.011505126953125, 0.01485443115234375, 0.0182037353515625, 0.02155303955078125, 0.02490234375, 0.02825164794921875, 0.0316009521484375, 0.03495025634765625, 0.038299560546875, 0.04164886474609375, 0.0449981689453125, 0.04834747314453125, 0.05169677734375, 0.05504608154296875, 0.0583953857421875, 0.06174468994140625, 0.065093994140625, 0.06844329833984375, 0.0717926025390625, 0.07514190673828125, 0.0784912109375, 0.08184051513671875, 0.0851898193359375, 0.08853912353515625, 0.091888427734375, 0.09523773193359375, 0.0985870361328125, 0.10193634033203125, 0.10528564453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 5.0, 10.0, 16.0, 15.0, 22.0, 31.0, 34.0, 50.0, 68.0, 90.0, 135.0, 226.0, 505.0, 1265.0, 5009.0, 196005.0, 3973048.0, 14676.0, 1706.0, 586.0, 296.0, 160.0, 89.0, 67.0, 35.0, 24.0, 19.0, 18.0, 11.0, 11.0, 6.0, 10.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9853515625, -1.9173736572265625, -1.849395751953125, -1.7814178466796875, -1.71343994140625, -1.6454620361328125, -1.577484130859375, -1.5095062255859375, -1.4415283203125, -1.3735504150390625, -1.305572509765625, -1.2375946044921875, -1.16961669921875, -1.1016387939453125, -1.033660888671875, -0.9656829833984375, -0.897705078125, -0.8297271728515625, -0.761749267578125, -0.6937713623046875, -0.62579345703125, -0.5578155517578125, -0.489837646484375, -0.4218597412109375, -0.3538818359375, -0.2859039306640625, -0.217926025390625, -0.1499481201171875, -0.08197021484375, -0.0139923095703125, 0.053985595703125, 0.1219635009765625, 0.18994140625, 0.2579193115234375, 0.325897216796875, 0.3938751220703125, 0.46185302734375, 0.5298309326171875, 0.597808837890625, 0.6657867431640625, 0.7337646484375, 0.8017425537109375, 0.869720458984375, 0.9376983642578125, 1.00567626953125, 1.0736541748046875, 1.141632080078125, 1.2096099853515625, 1.277587890625, 1.3455657958984375, 1.413543701171875, 1.4815216064453125, 1.54949951171875, 1.6174774169921875, 1.685455322265625, 1.7534332275390625, 1.8214111328125, 1.8893890380859375, 1.957366943359375, 2.0253448486328125, 2.09332275390625, 2.1613006591796875, 2.229278564453125, 2.2972564697265625, 2.365234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 7.0, 4.0, 18.0, 21.0, 41.0, 67.0, 153.0, 408.0, 2172.0, 723.0, 231.0, 104.0, 69.0, 24.0, 15.0, 12.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43017578125, -0.4207496643066406, -0.41132354736328125, -0.4018974304199219, -0.3924713134765625, -0.3830451965332031, -0.37361907958984375, -0.3641929626464844, -0.354766845703125, -0.3453407287597656, -0.33591461181640625, -0.3264884948730469, -0.3170623779296875, -0.3076362609863281, -0.29821014404296875, -0.2887840270996094, -0.27935791015625, -0.2699317932128906, -0.26050567626953125, -0.2510795593261719, -0.2416534423828125, -0.23222732543945312, -0.22280120849609375, -0.21337509155273438, -0.203948974609375, -0.19452285766601562, -0.18509674072265625, -0.17567062377929688, -0.1662445068359375, -0.15681838989257812, -0.14739227294921875, -0.13796615600585938, -0.1285400390625, -0.11911392211914062, -0.10968780517578125, -0.10026168823242188, -0.0908355712890625, -0.08140945434570312, -0.07198333740234375, -0.06255722045898438, -0.053131103515625, -0.043704986572265625, -0.03427886962890625, -0.024852752685546875, -0.0154266357421875, -0.006000518798828125, 0.00342559814453125, 0.012851715087890625, 0.02227783203125, 0.031703948974609375, 0.04113006591796875, 0.050556182861328125, 0.0599822998046875, 0.06940841674804688, 0.07883453369140625, 0.08826065063476562, 0.097686767578125, 0.10711288452148438, 0.11653900146484375, 0.12596511840820312, 0.1353912353515625, 0.14481735229492188, 0.15424346923828125, 0.16366958618164062, 0.173095703125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 19.0, 50.0, 113.0, 234.0, 249.0, 168.0, 70.0, 31.0, 15.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6778669357299805, -1.6155760288238525, -1.553285002708435, -1.4909940958023071, -1.4287031888961792, -1.3664121627807617, -1.3041212558746338, -1.2418303489685059, -1.179539442062378, -1.11724853515625, -1.0549575090408325, -0.9926666021347046, -0.9303756952285767, -0.868084728717804, -0.8057937622070312, -0.7435028553009033, -0.6812118887901306, -0.6189209222793579, -0.55663001537323, -0.4943390488624573, -0.43204814195632935, -0.36975717544555664, -0.3074662387371063, -0.245175302028656, -0.1828843653202057, -0.12059342861175537, -0.05830248445272446, 0.0039884597063064575, 0.06627939641475677, 0.1285703480243683, 0.1908612847328186, 0.2531522214412689, 0.31544315814971924, 0.37773409485816956, 0.4400250315666199, 0.5023159980773926, 0.5646069049835205, 0.6268978714942932, 0.6891888380050659, 0.7514797449111938, 0.8137706518173218, 0.8760616183280945, 0.9383525252342224, 1.0006434917449951, 1.062934398651123, 1.125225305557251, 1.1875163316726685, 1.2498072385787964, 1.3120982646942139, 1.3743891716003418, 1.4366801977157593, 1.4989711046218872, 1.5612620115280151, 1.6235530376434326, 1.6858439445495605, 1.7481348514556885, 1.8104257583618164, 1.8727166652679443, 1.9350076913833618, 1.9972985982894897, 2.0595896244049072, 2.121880531311035, 2.184171438217163, 2.246462345123291, 2.308753252029419]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 2.0, 10.0, 11.0, 10.0, 9.0, 9.0, 21.0, 26.0, 24.0, 28.0, 23.0, 22.0, 34.0, 31.0, 55.0, 42.0, 61.0, 40.0, 56.0, 52.0, 41.0, 48.0, 36.0, 37.0, 36.0, 43.0, 33.0, 23.0, 22.0, 21.0, 15.0, 15.0, 10.0, 12.0, 14.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5707749128341675, -0.5530621409416199, -0.5353493094444275, -0.5176365375518799, -0.4999237060546875, -0.4822109341621399, -0.4644981324672699, -0.4467853307723999, -0.4290725290775299, -0.4113597273826599, -0.3936469256877899, -0.3759341239929199, -0.3582213521003723, -0.34050852060317993, -0.3227957487106323, -0.30508294701576233, -0.28737014532089233, -0.26965734362602234, -0.25194454193115234, -0.23423175513744354, -0.21651895344257355, -0.19880615174770355, -0.18109336495399475, -0.16338056325912476, -0.14566776156425476, -0.12795495986938477, -0.11024216562509537, -0.09252937138080597, -0.07481656968593597, -0.05710376799106598, -0.03939097374677658, -0.021678179502487183, -0.0039653778076171875, 0.01374742016196251, 0.031460218131542206, 0.0491730161011219, 0.0668858140707016, 0.0845986157655716, 0.10231141000986099, 0.12002420425415039, 0.13773700594902039, 0.15544980764389038, 0.17316260933876038, 0.19087539613246918, 0.20858819782733917, 0.22630099952220917, 0.24401378631591797, 0.26172658801078796, 0.27943938970565796, 0.29715219140052795, 0.31486499309539795, 0.33257779479026794, 0.35029059648513794, 0.36800336837768555, 0.38571617007255554, 0.40342897176742554, 0.42114177346229553, 0.4388545751571655, 0.4565673768520355, 0.4742801785469055, 0.4919929504394531, 0.5097057819366455, 0.5274185538291931, 0.5451313257217407, 0.5628441572189331]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 4.0, 3.0, 5.0, 14.0, 11.0, 18.0, 20.0, 34.0, 46.0, 65.0, 95.0, 151.0, 221.0, 417.0, 762.0, 1573.0, 4090.0, 13976.0, 82537.0, 571111.0, 319499.0, 39943.0, 8521.0, 2759.0, 1206.0, 557.0, 331.0, 192.0, 126.0, 81.0, 58.0, 36.0, 28.0, 13.0, 14.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.97998046875, -0.9533615112304688, -0.9267425537109375, -0.9001235961914062, -0.873504638671875, -0.8468856811523438, -0.8202667236328125, -0.7936477661132812, -0.76702880859375, -0.7404098510742188, -0.7137908935546875, -0.6871719360351562, -0.660552978515625, -0.6339340209960938, -0.6073150634765625, -0.5806961059570312, -0.5540771484375, -0.5274581909179688, -0.5008392333984375, -0.47422027587890625, -0.447601318359375, -0.42098236083984375, -0.3943634033203125, -0.36774444580078125, -0.34112548828125, -0.31450653076171875, -0.2878875732421875, -0.26126861572265625, -0.234649658203125, -0.20803070068359375, -0.1814117431640625, -0.15479278564453125, -0.128173828125, -0.10155487060546875, -0.0749359130859375, -0.04831695556640625, -0.021697998046875, 0.00492095947265625, 0.0315399169921875, 0.05815887451171875, 0.08477783203125, 0.11139678955078125, 0.1380157470703125, 0.16463470458984375, 0.191253662109375, 0.21787261962890625, 0.2444915771484375, 0.27111053466796875, 0.2977294921875, 0.32434844970703125, 0.3509674072265625, 0.37758636474609375, 0.404205322265625, 0.43082427978515625, 0.4574432373046875, 0.48406219482421875, 0.51068115234375, 0.5373001098632812, 0.5639190673828125, 0.5905380249023438, 0.617156982421875, 0.6437759399414062, 0.6703948974609375, 0.6970138549804688, 0.7236328125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 12.0, 8.0, 20.0, 28.0, 36.0, 51.0, 60.0, 81.0, 74.0, 76.0, 94.0, 95.0, 80.0, 59.0, 56.0, 33.0, 35.0, 31.0, 21.0, 10.0, 8.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10687255859375, -0.10346698760986328, -0.10006141662597656, -0.09665584564208984, -0.09325027465820312, -0.0898447036743164, -0.08643913269042969, -0.08303356170654297, -0.07962799072265625, -0.07622241973876953, -0.07281684875488281, -0.0694112777709961, -0.06600570678710938, -0.06260013580322266, -0.05919456481933594, -0.05578899383544922, -0.0523834228515625, -0.04897785186767578, -0.04557228088378906, -0.042166709899902344, -0.038761138916015625, -0.035355567932128906, -0.03194999694824219, -0.02854442596435547, -0.02513885498046875, -0.02173328399658203, -0.018327713012695312, -0.014922142028808594, -0.011516571044921875, -0.008111000061035156, -0.0047054290771484375, -0.0012998580932617188, 0.002105712890625, 0.005511283874511719, 0.008916854858398438, 0.012322425842285156, 0.015727996826171875, 0.019133567810058594, 0.022539138793945312, 0.02594470977783203, 0.02935028076171875, 0.03275585174560547, 0.03616142272949219, 0.039566993713378906, 0.042972564697265625, 0.046378135681152344, 0.04978370666503906, 0.05318927764892578, 0.0565948486328125, 0.06000041961669922, 0.06340599060058594, 0.06681156158447266, 0.07021713256835938, 0.0736227035522461, 0.07702827453613281, 0.08043384552001953, 0.08383941650390625, 0.08724498748779297, 0.09065055847167969, 0.0940561294555664, 0.09746170043945312, 0.10086727142333984, 0.10427284240722656, 0.10767841339111328, 0.111083984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 10.0, 13.0, 20.0, 18.0, 52.0, 64.0, 109.0, 154.0, 294.0, 514.0, 1135.0, 2956.0, 9347.0, 38819.0, 219569.0, 568778.0, 164318.0, 30161.0, 7441.0, 2499.0, 1042.0, 495.0, 292.0, 143.0, 99.0, 67.0, 33.0, 39.0, 22.0, 21.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5688095092773438, -0.5507049560546875, -0.5326004028320312, -0.514495849609375, -0.49639129638671875, -0.4782867431640625, -0.46018218994140625, -0.44207763671875, -0.42397308349609375, -0.4058685302734375, -0.38776397705078125, -0.369659423828125, -0.35155487060546875, -0.3334503173828125, -0.31534576416015625, -0.2972412109375, -0.27913665771484375, -0.2610321044921875, -0.24292755126953125, -0.224822998046875, -0.20671844482421875, -0.1886138916015625, -0.17050933837890625, -0.15240478515625, -0.13430023193359375, -0.1161956787109375, -0.09809112548828125, -0.079986572265625, -0.06188201904296875, -0.0437774658203125, -0.02567291259765625, -0.007568359375, 0.01053619384765625, 0.0286407470703125, 0.04674530029296875, 0.064849853515625, 0.08295440673828125, 0.1010589599609375, 0.11916351318359375, 0.13726806640625, 0.15537261962890625, 0.1734771728515625, 0.19158172607421875, 0.209686279296875, 0.22779083251953125, 0.2458953857421875, 0.26399993896484375, 0.2821044921875, 0.30020904541015625, 0.3183135986328125, 0.33641815185546875, 0.354522705078125, 0.37262725830078125, 0.3907318115234375, 0.40883636474609375, 0.42694091796875, 0.44504547119140625, 0.4631500244140625, 0.48125457763671875, 0.499359130859375, 0.5174636840820312, 0.5355682373046875, 0.5536727905273438, 0.57177734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 7.0, 10.0, 11.0, 16.0, 17.0, 16.0, 24.0, 26.0, 29.0, 32.0, 40.0, 32.0, 49.0, 57.0, 42.0, 68.0, 67.0, 56.0, 49.0, 59.0, 45.0, 31.0, 39.0, 25.0, 29.0, 20.0, 17.0, 19.0, 14.0, 8.0, 3.0, 8.0, 10.0, 3.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4521484375, -0.4392852783203125, -0.426422119140625, -0.4135589599609375, -0.40069580078125, -0.3878326416015625, -0.374969482421875, -0.3621063232421875, -0.3492431640625, -0.3363800048828125, -0.323516845703125, -0.3106536865234375, -0.29779052734375, -0.2849273681640625, -0.272064208984375, -0.2592010498046875, -0.246337890625, -0.2334747314453125, -0.220611572265625, -0.2077484130859375, -0.19488525390625, -0.1820220947265625, -0.169158935546875, -0.1562957763671875, -0.1434326171875, -0.1305694580078125, -0.117706298828125, -0.1048431396484375, -0.09197998046875, -0.0791168212890625, -0.066253662109375, -0.0533905029296875, -0.04052734375, -0.0276641845703125, -0.014801025390625, -0.0019378662109375, 0.01092529296875, 0.0237884521484375, 0.036651611328125, 0.0495147705078125, 0.0623779296875, 0.0752410888671875, 0.088104248046875, 0.1009674072265625, 0.11383056640625, 0.1266937255859375, 0.139556884765625, 0.1524200439453125, 0.165283203125, 0.1781463623046875, 0.191009521484375, 0.2038726806640625, 0.21673583984375, 0.2295989990234375, 0.242462158203125, 0.2553253173828125, 0.2681884765625, 0.2810516357421875, 0.293914794921875, 0.3067779541015625, 0.31964111328125, 0.3325042724609375, 0.345367431640625, 0.3582305908203125, 0.37109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 7.0, 18.0, 22.0, 44.0, 90.0, 190.0, 424.0, 1028.0, 2953.0, 10804.0, 67947.0, 804678.0, 138006.0, 15832.0, 4122.0, 1345.0, 528.0, 237.0, 108.0, 56.0, 35.0, 20.0, 13.0, 12.0, 3.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447509765625, -0.4333610534667969, -0.41921234130859375, -0.4050636291503906, -0.3909149169921875, -0.3767662048339844, -0.36261749267578125, -0.3484687805175781, -0.334320068359375, -0.3201713562011719, -0.30602264404296875, -0.2918739318847656, -0.2777252197265625, -0.2635765075683594, -0.24942779541015625, -0.23527908325195312, -0.22113037109375, -0.20698165893554688, -0.19283294677734375, -0.17868423461914062, -0.1645355224609375, -0.15038681030273438, -0.13623809814453125, -0.12208938598632812, -0.107940673828125, -0.09379196166992188, -0.07964324951171875, -0.06549453735351562, -0.0513458251953125, -0.037197113037109375, -0.02304840087890625, -0.008899688720703125, 0.0052490234375, 0.019397735595703125, 0.03354644775390625, 0.047695159912109375, 0.0618438720703125, 0.07599258422851562, 0.09014129638671875, 0.10429000854492188, 0.118438720703125, 0.13258743286132812, 0.14673614501953125, 0.16088485717773438, 0.1750335693359375, 0.18918228149414062, 0.20333099365234375, 0.21747970581054688, 0.23162841796875, 0.24577713012695312, 0.25992584228515625, 0.2740745544433594, 0.2882232666015625, 0.3023719787597656, 0.31652069091796875, 0.3306694030761719, 0.344818115234375, 0.3589668273925781, 0.37311553955078125, 0.3872642517089844, 0.4014129638671875, 0.4155616760253906, 0.42971038818359375, 0.4438591003417969, 0.4580078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 8.0, 9.0, 17.0, 17.0, 23.0, 51.0, 63.0, 72.0, 79.0, 89.0, 92.0, 103.0, 72.0, 57.0, 55.0, 57.0, 29.0, 17.0, 14.0, 14.0, 8.0, 12.0, 8.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010842084884643555, -0.00010530184954404831, -0.00010218285024166107, -9.906385093927383e-05, -9.59448516368866e-05, -9.282585233449936e-05, -8.970685303211212e-05, -8.658785372972488e-05, -8.346885442733765e-05, -8.034985512495041e-05, -7.723085582256317e-05, -7.411185652017593e-05, -7.09928572177887e-05, -6.787385791540146e-05, -6.475485861301422e-05, -6.163585931062698e-05, -5.8516860008239746e-05, -5.539786070585251e-05, -5.227886140346527e-05, -4.9159862101078033e-05, -4.6040862798690796e-05, -4.292186349630356e-05, -3.980286419391632e-05, -3.668386489152908e-05, -3.3564865589141846e-05, -3.0445866286754608e-05, -2.732686698436737e-05, -2.4207867681980133e-05, -2.1088868379592896e-05, -1.7969869077205658e-05, -1.485086977481842e-05, -1.1731870472431183e-05, -8.612871170043945e-06, -5.493871867656708e-06, -2.3748725652694702e-06, 7.441267371177673e-07, 3.863126039505005e-06, 6.9821253418922424e-06, 1.010112464427948e-05, 1.3220123946666718e-05, 1.6339123249053955e-05, 1.9458122551441193e-05, 2.257712185382843e-05, 2.5696121156215668e-05, 2.8815120458602905e-05, 3.193411976099014e-05, 3.505311906337738e-05, 3.817211836576462e-05, 4.1291117668151855e-05, 4.441011697053909e-05, 4.752911627292633e-05, 5.064811557531357e-05, 5.3767114877700806e-05, 5.688611418008804e-05, 6.000511348247528e-05, 6.312411278486252e-05, 6.624311208724976e-05, 6.9362111389637e-05, 7.248111069202423e-05, 7.560010999441147e-05, 7.87191092967987e-05, 8.183810859918594e-05, 8.495710790157318e-05, 8.807610720396042e-05, 9.119510650634766e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 5.0, 9.0, 15.0, 24.0, 27.0, 40.0, 62.0, 98.0, 145.0, 264.0, 472.0, 811.0, 1650.0, 3658.0, 9454.0, 29638.0, 169664.0, 687245.0, 108022.0, 23145.0, 7827.0, 3164.0, 1412.0, 681.0, 385.0, 240.0, 134.0, 82.0, 59.0, 36.0, 20.0, 13.0, 15.0, 12.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.282958984375, -0.2733345031738281, -0.26371002197265625, -0.2540855407714844, -0.2444610595703125, -0.23483657836914062, -0.22521209716796875, -0.21558761596679688, -0.205963134765625, -0.19633865356445312, -0.18671417236328125, -0.17708969116210938, -0.1674652099609375, -0.15784072875976562, -0.14821624755859375, -0.13859176635742188, -0.12896728515625, -0.11934280395507812, -0.10971832275390625, -0.10009384155273438, -0.0904693603515625, -0.08084487915039062, -0.07122039794921875, -0.061595916748046875, -0.051971435546875, -0.042346954345703125, -0.03272247314453125, -0.023097991943359375, -0.0134735107421875, -0.003849029541015625, 0.00577545166015625, 0.015399932861328125, 0.0250244140625, 0.034648895263671875, 0.04427337646484375, 0.053897857666015625, 0.0635223388671875, 0.07314682006835938, 0.08277130126953125, 0.09239578247070312, 0.102020263671875, 0.11164474487304688, 0.12126922607421875, 0.13089370727539062, 0.1405181884765625, 0.15014266967773438, 0.15976715087890625, 0.16939163208007812, 0.17901611328125, 0.18864059448242188, 0.19826507568359375, 0.20788955688476562, 0.2175140380859375, 0.22713851928710938, 0.23676300048828125, 0.24638748168945312, 0.256011962890625, 0.2656364440917969, 0.27526092529296875, 0.2848854064941406, 0.2945098876953125, 0.3041343688964844, 0.31375885009765625, 0.3233833312988281, 0.3330078125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 1.0, 5.0, 4.0, 2.0, 9.0, 7.0, 15.0, 31.0, 28.0, 45.0, 59.0, 92.0, 99.0, 142.0, 118.0, 92.0, 73.0, 53.0, 41.0, 25.0, 13.0, 6.0, 6.0, 6.0, 8.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2076416015625, -0.20068740844726562, -0.19373321533203125, -0.18677902221679688, -0.1798248291015625, -0.17287063598632812, -0.16591644287109375, -0.15896224975585938, -0.152008056640625, -0.14505386352539062, -0.13809967041015625, -0.13114547729492188, -0.1241912841796875, -0.11723709106445312, -0.11028289794921875, -0.10332870483398438, -0.09637451171875, -0.08942031860351562, -0.08246612548828125, -0.07551193237304688, -0.0685577392578125, -0.061603546142578125, -0.05464935302734375, -0.047695159912109375, -0.040740966796875, -0.033786773681640625, -0.02683258056640625, -0.019878387451171875, -0.0129241943359375, -0.005970001220703125, 0.00098419189453125, 0.007938385009765625, 0.014892578125, 0.021846771240234375, 0.02880096435546875, 0.035755157470703125, 0.0427093505859375, 0.049663543701171875, 0.05661773681640625, 0.06357192993164062, 0.070526123046875, 0.07748031616210938, 0.08443450927734375, 0.09138870239257812, 0.0983428955078125, 0.10529708862304688, 0.11225128173828125, 0.11920547485351562, 0.12615966796875, 0.13311386108398438, 0.14006805419921875, 0.14702224731445312, 0.1539764404296875, 0.16093063354492188, 0.16788482666015625, 0.17483901977539062, 0.181793212890625, 0.18874740600585938, 0.19570159912109375, 0.20265579223632812, 0.2096099853515625, 0.21656417846679688, 0.22351837158203125, 0.23047256469726562, 0.2374267578125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 9.0, 68.0, 311.0, 423.0, 158.0, 28.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.710105895996094, -13.41294002532959, -13.115774154663086, -12.818608283996582, -12.521442413330078, -12.224276542663574, -11.92711067199707, -11.62994384765625, -11.332778930664062, -11.035613059997559, -10.738447189331055, -10.44128131866455, -10.144115447998047, -9.846949577331543, -9.549783706665039, -9.252616882324219, -8.955451011657715, -8.658285140991211, -8.361119270324707, -8.063953399658203, -7.766787528991699, -7.469621658325195, -7.172455310821533, -6.875289440155029, -6.578123569488525, -6.2809576988220215, -5.983791828155518, -5.686625957489014, -5.389459609985352, -5.092293739318848, -4.795127868652344, -4.49796199798584, -4.2007951736450195, -3.9036293029785156, -3.6064634323120117, -3.3092973232269287, -3.012131452560425, -2.714965581893921, -2.417799472808838, -2.120633602142334, -1.82346773147583, -1.5263018608093262, -1.2291358709335327, -0.931969940662384, -0.6348040103912354, -0.33763813972473145, -0.04047214984893799, 0.25669384002685547, 0.5538597106933594, 0.8510256409645081, 1.1481915712356567, 1.4453575611114502, 1.742523431777954, 2.039689302444458, 2.336855411529541, 2.634021282196045, 2.931187152862549, 3.2283530235290527, 3.5255188941955566, 3.8226850032806396, 4.119851112365723, 4.417016983032227, 4.7141828536987305, 5.011348724365234, 5.308514595031738]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 8.0, 10.0, 14.0, 24.0, 17.0, 22.0, 13.0, 30.0, 37.0, 36.0, 39.0, 54.0, 44.0, 48.0, 55.0, 57.0, 50.0, 46.0, 51.0, 47.0, 47.0, 33.0, 40.0, 29.0, 24.0, 23.0, 14.0, 15.0, 16.0, 12.0, 7.0, 4.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.1682190895080566, -2.0930838584899902, -2.017948865890503, -1.9428136348724365, -1.8676784038543701, -1.7925432920455933, -1.7174081802368164, -1.64227294921875, -1.5671378374099731, -1.4920027256011963, -1.4168674945831299, -1.341732382774353, -1.2665972709655762, -1.1914620399475098, -1.116326928138733, -1.041191816329956, -0.9660565853118896, -0.890921413898468, -0.8157862424850464, -0.7406511306762695, -0.6655159592628479, -0.5903807878494263, -0.5152456760406494, -0.4401105046272278, -0.36497533321380615, -0.2898401618003845, -0.21470502018928528, -0.13956986367702484, -0.0644347071647644, 0.010700464248657227, 0.08583560585975647, 0.1609707474708557, 0.23610591888427734, 0.311241090297699, 0.3863762319087982, 0.46151137351989746, 0.5366465449333191, 0.6117817163467407, 0.6869168281555176, 0.7620519995689392, 0.8371871709823608, 0.9123223423957825, 0.9874575138092041, 1.062592625617981, 1.1377277374267578, 1.2128629684448242, 1.287998080253601, 1.363133192062378, 1.4382684230804443, 1.5134035348892212, 1.5885387659072876, 1.6636738777160645, 1.7388091087341309, 1.8139442205429077, 1.8890793323516846, 1.964214563369751, 2.0393495559692383, 2.1144847869873047, 2.189619779586792, 2.2647550106048584, 2.339890241622925, 2.415025234222412, 2.4901604652404785, 2.565295696258545, 2.6404309272766113]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 6.0, 10.0, 15.0, 8.0, 14.0, 14.0, 13.0, 19.0, 35.0, 44.0, 57.0, 67.0, 83.0, 155.0, 212.0, 339.0, 656.0, 1297.0, 3190.0, 10635.0, 55863.0, 3707325.0, 374808.0, 28233.0, 6775.0, 2288.0, 923.0, 498.0, 269.0, 148.0, 86.0, 51.0, 37.0, 32.0, 25.0, 5.0, 12.0, 8.0, 10.0, 5.0, 3.0, 4.0, 2.0], "bins": [-1.4052734375, -1.3724441528320312, -1.3396148681640625, -1.3067855834960938, -1.273956298828125, -1.2411270141601562, -1.2082977294921875, -1.1754684448242188, -1.14263916015625, -1.1098098754882812, -1.0769805908203125, -1.0441513061523438, -1.011322021484375, -0.9784927368164062, -0.9456634521484375, -0.9128341674804688, -0.8800048828125, -0.8471755981445312, -0.8143463134765625, -0.7815170288085938, -0.748687744140625, -0.7158584594726562, -0.6830291748046875, -0.6501998901367188, -0.61737060546875, -0.5845413208007812, -0.5517120361328125, -0.5188827514648438, -0.486053466796875, -0.45322418212890625, -0.4203948974609375, -0.38756561279296875, -0.354736328125, -0.32190704345703125, -0.2890777587890625, -0.25624847412109375, -0.223419189453125, -0.19058990478515625, -0.1577606201171875, -0.12493133544921875, -0.09210205078125, -0.05927276611328125, -0.0264434814453125, 0.00638580322265625, 0.039215087890625, 0.07204437255859375, 0.1048736572265625, 0.13770294189453125, 0.1705322265625, 0.20336151123046875, 0.2361907958984375, 0.26902008056640625, 0.301849365234375, 0.33467864990234375, 0.3675079345703125, 0.40033721923828125, 0.43316650390625, 0.46599578857421875, 0.4988250732421875, 0.5316543579101562, 0.564483642578125, 0.5973129272460938, 0.6301422119140625, 0.6629714965820312, 0.69580078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 12.0, 13.0, 27.0, 33.0, 50.0, 56.0, 79.0, 85.0, 78.0, 84.0, 85.0, 88.0, 81.0, 78.0, 30.0, 36.0, 20.0, 21.0, 12.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11016845703125, -0.10618114471435547, -0.10219383239746094, -0.0982065200805664, -0.09421920776367188, -0.09023189544677734, -0.08624458312988281, -0.08225727081298828, -0.07826995849609375, -0.07428264617919922, -0.07029533386230469, -0.06630802154541016, -0.062320709228515625, -0.058333396911621094, -0.05434608459472656, -0.05035877227783203, -0.0463714599609375, -0.04238414764404297, -0.03839683532714844, -0.034409523010253906, -0.030422210693359375, -0.026434898376464844, -0.022447586059570312, -0.01846027374267578, -0.01447296142578125, -0.010485649108886719, -0.0064983367919921875, -0.0025110244750976562, 0.001476287841796875, 0.005463600158691406, 0.009450912475585938, 0.013438224792480469, 0.017425537109375, 0.02141284942626953, 0.025400161743164062, 0.029387474060058594, 0.033374786376953125, 0.037362098693847656, 0.04134941101074219, 0.04533672332763672, 0.04932403564453125, 0.05331134796142578, 0.05729866027832031, 0.061285972595214844, 0.06527328491210938, 0.0692605972290039, 0.07324790954589844, 0.07723522186279297, 0.0812225341796875, 0.08520984649658203, 0.08919715881347656, 0.0931844711303711, 0.09717178344726562, 0.10115909576416016, 0.10514640808105469, 0.10913372039794922, 0.11312103271484375, 0.11710834503173828, 0.12109565734863281, 0.12508296966552734, 0.12907028198242188, 0.1330575942993164, 0.13704490661621094, 0.14103221893310547, 0.14501953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 11.0, 24.0, 66.0, 119.0, 224.0, 638.0, 2163.0, 13994.0, 1709350.0, 2450420.0, 13989.0, 2232.0, 611.0, 227.0, 111.0, 33.0, 27.0, 16.0, 7.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.938262939453125, -1.88726806640625, -1.836273193359375, -1.7852783203125, -1.734283447265625, -1.68328857421875, -1.632293701171875, -1.581298828125, -1.530303955078125, -1.47930908203125, -1.428314208984375, -1.3773193359375, -1.326324462890625, -1.27532958984375, -1.224334716796875, -1.17333984375, -1.122344970703125, -1.07135009765625, -1.020355224609375, -0.9693603515625, -0.918365478515625, -0.86737060546875, -0.816375732421875, -0.765380859375, -0.714385986328125, -0.66339111328125, -0.612396240234375, -0.5614013671875, -0.510406494140625, -0.45941162109375, -0.408416748046875, -0.357421875, -0.306427001953125, -0.25543212890625, -0.204437255859375, -0.1534423828125, -0.102447509765625, -0.05145263671875, -0.000457763671875, 0.050537109375, 0.101531982421875, 0.15252685546875, 0.203521728515625, 0.2545166015625, 0.305511474609375, 0.35650634765625, 0.407501220703125, 0.45849609375, 0.509490966796875, 0.56048583984375, 0.611480712890625, 0.6624755859375, 0.713470458984375, 0.76446533203125, 0.815460205078125, 0.866455078125, 0.917449951171875, 0.96844482421875, 1.019439697265625, 1.0704345703125, 1.121429443359375, 1.17242431640625, 1.223419189453125, 1.2744140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 3.0, 9.0, 14.0, 25.0, 30.0, 64.0, 128.0, 343.0, 1747.0, 1188.0, 288.0, 108.0, 50.0, 33.0, 10.0, 11.0, 7.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.360107421875, -0.35190582275390625, -0.3437042236328125, -0.33550262451171875, -0.327301025390625, -0.31909942626953125, -0.3108978271484375, -0.30269622802734375, -0.29449462890625, -0.28629302978515625, -0.2780914306640625, -0.26988983154296875, -0.261688232421875, -0.25348663330078125, -0.2452850341796875, -0.23708343505859375, -0.2288818359375, -0.22068023681640625, -0.2124786376953125, -0.20427703857421875, -0.196075439453125, -0.18787384033203125, -0.1796722412109375, -0.17147064208984375, -0.16326904296875, -0.15506744384765625, -0.1468658447265625, -0.13866424560546875, -0.130462646484375, -0.12226104736328125, -0.1140594482421875, -0.10585784912109375, -0.09765625, -0.08945465087890625, -0.0812530517578125, -0.07305145263671875, -0.064849853515625, -0.05664825439453125, -0.0484466552734375, -0.04024505615234375, -0.03204345703125, -0.02384185791015625, -0.0156402587890625, -0.00743865966796875, 0.000762939453125, 0.00896453857421875, 0.0171661376953125, 0.02536773681640625, 0.0335693359375, 0.04177093505859375, 0.0499725341796875, 0.05817413330078125, 0.066375732421875, 0.07457733154296875, 0.0827789306640625, 0.09098052978515625, 0.09918212890625, 0.10738372802734375, 0.1155853271484375, 0.12378692626953125, 0.131988525390625, 0.14019012451171875, 0.1483917236328125, 0.15659332275390625, 0.164794921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 14.0, 33.0, 141.0, 388.0, 313.0, 88.0, 16.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.229099988937378, -1.1403254270553589, -1.0515507459640503, -0.9627761840820312, -0.8740015625953674, -0.7852269411087036, -0.6964523792266846, -0.6076777577400208, -0.5189031362533569, -0.4301285147666931, -0.3413539230823517, -0.25257933139801025, -0.16380470991134644, -0.07503008842468262, 0.013744473457336426, 0.10251909494400024, 0.19129371643066406, 0.2800683379173279, 0.3688429296016693, 0.45761752128601074, 0.5463921427726746, 0.6351667642593384, 0.7239413261413574, 0.8127159476280212, 0.9014905691146851, 0.9902651906013489, 1.0790398120880127, 1.1678143739700317, 1.2565889358520508, 1.3453636169433594, 1.4341381788253784, 1.5229127407073975, 1.611687183380127, 1.700461745262146, 1.7892364263534546, 1.8780109882354736, 1.9667856693267822, 2.0555601119995117, 2.1443347930908203, 2.233109474182129, 2.3218841552734375, 2.410658836364746, 2.4994332790374756, 2.588207960128784, 2.6769826412200928, 2.7657570838928223, 2.854531764984131, 2.9433064460754395, 3.032080888748169, 3.1208555698394775, 3.209630012512207, 3.2984046936035156, 3.387179374694824, 3.475954055786133, 3.5647284984588623, 3.653503179550171, 3.7422776222229004, 3.831052303314209, 3.9198267459869385, 4.008601188659668, 4.097375869750977, 4.186150550842285, 4.274925231933594, 4.363699913024902, 4.452474594116211]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 12.0, 8.0, 9.0, 14.0, 18.0, 29.0, 29.0, 41.0, 43.0, 55.0, 57.0, 55.0, 57.0, 61.0, 59.0, 51.0, 61.0, 41.0, 52.0, 54.0, 34.0, 24.0, 38.0, 23.0, 17.0, 14.0, 9.0, 9.0, 5.0, 6.0, 2.0, 0.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6174001693725586, -0.597888708114624, -0.5783773064613342, -0.5588658452033997, -0.5393544435501099, -0.5198429822921753, -0.5003315210342407, -0.48082008957862854, -0.46130865812301636, -0.4417972266674042, -0.422285795211792, -0.4027743339538574, -0.38326290249824524, -0.36375147104263306, -0.3442400097846985, -0.3247285783290863, -0.3052171468734741, -0.28570571541786194, -0.26619428396224976, -0.24668282270431519, -0.227171391248703, -0.20765995979309082, -0.18814851343631744, -0.16863706707954407, -0.14912563562393188, -0.1296142041683197, -0.11010275781154633, -0.09059131890535355, -0.07107987999916077, -0.05156844109296799, -0.03205700218677521, -0.012545555830001831, 0.006965935230255127, 0.026477374136447906, 0.045988813042640686, 0.06550025194883347, 0.08501169085502625, 0.10452312976121902, 0.1240345686674118, 0.14354601502418518, 0.16305744647979736, 0.18256887793540955, 0.20208032429218292, 0.2215917706489563, 0.24110320210456848, 0.26061463356018066, 0.28012609481811523, 0.2996375262737274, 0.3191489577293396, 0.3386603891849518, 0.35817182064056396, 0.37768328189849854, 0.3971947133541107, 0.4167061448097229, 0.43621760606765747, 0.45572903752326965, 0.47524046897888184, 0.494751900434494, 0.5142633318901062, 0.5337747931480408, 0.5532861948013306, 0.5727976560592651, 0.5923091173171997, 0.6118205785751343, 0.6313319802284241]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 9.0, 26.0, 36.0, 57.0, 92.0, 146.0, 264.0, 577.0, 1372.0, 3687.0, 14599.0, 128606.0, 726245.0, 150026.0, 16105.0, 3982.0, 1423.0, 592.0, 286.0, 147.0, 109.0, 51.0, 37.0, 19.0, 14.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.103515625, -1.0724563598632812, -1.0413970947265625, -1.0103378295898438, -0.979278564453125, -0.9482192993164062, -0.9171600341796875, -0.8861007690429688, -0.85504150390625, -0.8239822387695312, -0.7929229736328125, -0.7618637084960938, -0.730804443359375, -0.6997451782226562, -0.6686859130859375, -0.6376266479492188, -0.6065673828125, -0.5755081176757812, -0.5444488525390625, -0.5133895874023438, -0.482330322265625, -0.45127105712890625, -0.4202117919921875, -0.38915252685546875, -0.35809326171875, -0.32703399658203125, -0.2959747314453125, -0.26491546630859375, -0.233856201171875, -0.20279693603515625, -0.1717376708984375, -0.14067840576171875, -0.109619140625, -0.07855987548828125, -0.0475006103515625, -0.01644134521484375, 0.014617919921875, 0.04567718505859375, 0.0767364501953125, 0.10779571533203125, 0.13885498046875, 0.16991424560546875, 0.2009735107421875, 0.23203277587890625, 0.263092041015625, 0.29415130615234375, 0.3252105712890625, 0.35626983642578125, 0.3873291015625, 0.41838836669921875, 0.4494476318359375, 0.48050689697265625, 0.511566162109375, 0.5426254272460938, 0.5736846923828125, 0.6047439575195312, 0.63580322265625, 0.6668624877929688, 0.6979217529296875, 0.7289810180664062, 0.760040283203125, 0.7910995483398438, 0.8221588134765625, 0.8532180786132812, 0.88427734375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 11.0, 20.0, 30.0, 39.0, 40.0, 64.0, 63.0, 74.0, 88.0, 94.0, 77.0, 91.0, 86.0, 61.0, 43.0, 25.0, 23.0, 17.0, 12.0, 11.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.11161327362060547, -0.10756492614746094, -0.1035165786743164, -0.09946823120117188, -0.09541988372802734, -0.09137153625488281, -0.08732318878173828, -0.08327484130859375, -0.07922649383544922, -0.07517814636230469, -0.07112979888916016, -0.06708145141601562, -0.0630331039428711, -0.05898475646972656, -0.05493640899658203, -0.0508880615234375, -0.04683971405029297, -0.04279136657714844, -0.038743019104003906, -0.034694671630859375, -0.030646324157714844, -0.026597976684570312, -0.02254962921142578, -0.01850128173828125, -0.014452934265136719, -0.010404586791992188, -0.006356239318847656, -0.002307891845703125, 0.0017404556274414062, 0.0057888031005859375, 0.009837150573730469, 0.013885498046875, 0.01793384552001953, 0.021982192993164062, 0.026030540466308594, 0.030078887939453125, 0.034127235412597656, 0.03817558288574219, 0.04222393035888672, 0.04627227783203125, 0.05032062530517578, 0.05436897277832031, 0.058417320251464844, 0.062465667724609375, 0.0665140151977539, 0.07056236267089844, 0.07461071014404297, 0.0786590576171875, 0.08270740509033203, 0.08675575256347656, 0.0908041000366211, 0.09485244750976562, 0.09890079498291016, 0.10294914245605469, 0.10699748992919922, 0.11104583740234375, 0.11509418487548828, 0.11914253234863281, 0.12319087982177734, 0.12723922729492188, 0.1312875747680664, 0.13533592224121094, 0.13938426971435547, 0.1434326171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 7.0, 12.0, 12.0, 13.0, 29.0, 50.0, 75.0, 102.0, 235.0, 417.0, 819.0, 1923.0, 6106.0, 25630.0, 162382.0, 605198.0, 203736.0, 30748.0, 6923.0, 2202.0, 916.0, 448.0, 215.0, 119.0, 74.0, 59.0, 36.0, 15.0, 15.0, 8.0, 11.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6056671142578125, -0.585845947265625, -0.5660247802734375, -0.54620361328125, -0.5263824462890625, -0.506561279296875, -0.4867401123046875, -0.4669189453125, -0.4470977783203125, -0.427276611328125, -0.4074554443359375, -0.38763427734375, -0.3678131103515625, -0.347991943359375, -0.3281707763671875, -0.308349609375, -0.2885284423828125, -0.268707275390625, -0.2488861083984375, -0.22906494140625, -0.2092437744140625, -0.189422607421875, -0.1696014404296875, -0.1497802734375, -0.1299591064453125, -0.110137939453125, -0.0903167724609375, -0.07049560546875, -0.0506744384765625, -0.030853271484375, -0.0110321044921875, 0.0087890625, 0.0286102294921875, 0.048431396484375, 0.0682525634765625, 0.08807373046875, 0.1078948974609375, 0.127716064453125, 0.1475372314453125, 0.1673583984375, 0.1871795654296875, 0.207000732421875, 0.2268218994140625, 0.24664306640625, 0.2664642333984375, 0.286285400390625, 0.3061065673828125, 0.325927734375, 0.3457489013671875, 0.365570068359375, 0.3853912353515625, 0.40521240234375, 0.4250335693359375, 0.444854736328125, 0.4646759033203125, 0.4844970703125, 0.5043182373046875, 0.524139404296875, 0.5439605712890625, 0.56378173828125, 0.5836029052734375, 0.603424072265625, 0.6232452392578125, 0.64306640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 8.0, 6.0, 7.0, 8.0, 11.0, 8.0, 17.0, 31.0, 31.0, 31.0, 38.0, 65.0, 46.0, 60.0, 61.0, 73.0, 50.0, 70.0, 57.0, 48.0, 54.0, 31.0, 39.0, 26.0, 23.0, 18.0, 15.0, 23.0, 9.0, 7.0, 4.0, 4.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5009765625, -0.48709869384765625, -0.4732208251953125, -0.45934295654296875, -0.445465087890625, -0.43158721923828125, -0.4177093505859375, -0.40383148193359375, -0.38995361328125, -0.37607574462890625, -0.3621978759765625, -0.34832000732421875, -0.334442138671875, -0.32056427001953125, -0.3066864013671875, -0.29280853271484375, -0.2789306640625, -0.26505279541015625, -0.2511749267578125, -0.23729705810546875, -0.223419189453125, -0.20954132080078125, -0.1956634521484375, -0.18178558349609375, -0.16790771484375, -0.15402984619140625, -0.1401519775390625, -0.12627410888671875, -0.112396240234375, -0.09851837158203125, -0.0846405029296875, -0.07076263427734375, -0.056884765625, -0.04300689697265625, -0.0291290283203125, -0.01525115966796875, -0.001373291015625, 0.01250457763671875, 0.0263824462890625, 0.04026031494140625, 0.05413818359375, 0.06801605224609375, 0.0818939208984375, 0.09577178955078125, 0.109649658203125, 0.12352752685546875, 0.1374053955078125, 0.15128326416015625, 0.1651611328125, 0.17903900146484375, 0.1929168701171875, 0.20679473876953125, 0.220672607421875, 0.23455047607421875, 0.2484283447265625, 0.26230621337890625, 0.27618408203125, 0.29006195068359375, 0.3039398193359375, 0.31781768798828125, 0.331695556640625, 0.34557342529296875, 0.3594512939453125, 0.37332916259765625, 0.38720703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 8.0, 8.0, 15.0, 15.0, 32.0, 38.0, 91.0, 159.0, 254.0, 565.0, 1228.0, 3321.0, 10159.0, 46736.0, 426119.0, 489555.0, 52681.0, 11414.0, 3568.0, 1320.0, 590.0, 270.0, 152.0, 94.0, 45.0, 50.0, 17.0, 15.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318115234375, -0.3078651428222656, -0.29761505126953125, -0.2873649597167969, -0.2771148681640625, -0.2668647766113281, -0.25661468505859375, -0.24636459350585938, -0.236114501953125, -0.22586441040039062, -0.21561431884765625, -0.20536422729492188, -0.1951141357421875, -0.18486404418945312, -0.17461395263671875, -0.16436386108398438, -0.15411376953125, -0.14386367797851562, -0.13361358642578125, -0.12336349487304688, -0.1131134033203125, -0.10286331176757812, -0.09261322021484375, -0.08236312866210938, -0.072113037109375, -0.061862945556640625, -0.05161285400390625, -0.041362762451171875, -0.0311126708984375, -0.020862579345703125, -0.01061248779296875, -0.000362396240234375, 0.0098876953125, 0.020137786865234375, 0.03038787841796875, 0.040637969970703125, 0.0508880615234375, 0.061138153076171875, 0.07138824462890625, 0.08163833618164062, 0.091888427734375, 0.10213851928710938, 0.11238861083984375, 0.12263870239257812, 0.1328887939453125, 0.14313888549804688, 0.15338897705078125, 0.16363906860351562, 0.17388916015625, 0.18413925170898438, 0.19438934326171875, 0.20463943481445312, 0.2148895263671875, 0.22513961791992188, 0.23538970947265625, 0.24563980102539062, 0.255889892578125, 0.2661399841308594, 0.27639007568359375, 0.2866401672363281, 0.2968902587890625, 0.3071403503417969, 0.31739044189453125, 0.3276405334472656, 0.337890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 13.0, 14.0, 14.0, 19.0, 24.0, 38.0, 38.0, 69.0, 84.0, 100.0, 117.0, 107.0, 94.0, 68.0, 42.0, 34.0, 31.0, 18.0, 12.0, 10.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00012183189392089844, -0.00011867564171552658, -0.00011551938951015472, -0.00011236313730478287, -0.00010920688509941101, -0.00010605063289403915, -0.0001028943806886673, -9.973812848329544e-05, -9.658187627792358e-05, -9.342562407255173e-05, -9.026937186717987e-05, -8.711311966180801e-05, -8.395686745643616e-05, -8.08006152510643e-05, -7.764436304569244e-05, -7.448811084032059e-05, -7.133185863494873e-05, -6.817560642957687e-05, -6.501935422420502e-05, -6.186310201883316e-05, -5.8706849813461304e-05, -5.555059760808945e-05, -5.239434540271759e-05, -4.9238093197345734e-05, -4.608184099197388e-05, -4.292558878660202e-05, -3.9769336581230164e-05, -3.661308437585831e-05, -3.345683217048645e-05, -3.0300579965114594e-05, -2.7144327759742737e-05, -2.398807555437088e-05, -2.0831823348999023e-05, -1.7675571143627167e-05, -1.451931893825531e-05, -1.1363066732883453e-05, -8.206814527511597e-06, -5.05056232213974e-06, -1.8943101167678833e-06, 1.2619420886039734e-06, 4.41819429397583e-06, 7.574446499347687e-06, 1.0730698704719543e-05, 1.38869509100914e-05, 1.7043203115463257e-05, 2.0199455320835114e-05, 2.335570752620697e-05, 2.6511959731578827e-05, 2.9668211936950684e-05, 3.282446414232254e-05, 3.59807163476944e-05, 3.9136968553066254e-05, 4.229322075843811e-05, 4.544947296380997e-05, 4.8605725169181824e-05, 5.176197737455368e-05, 5.491822957992554e-05, 5.8074481785297394e-05, 6.123073399066925e-05, 6.438698619604111e-05, 6.754323840141296e-05, 7.069949060678482e-05, 7.385574281215668e-05, 7.701199501752853e-05, 8.016824722290039e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 8.0, 9.0, 7.0, 23.0, 25.0, 42.0, 70.0, 88.0, 160.0, 271.0, 521.0, 1053.0, 2436.0, 6909.0, 26744.0, 251382.0, 676568.0, 63349.0, 11930.0, 3756.0, 1508.0, 714.0, 391.0, 215.0, 127.0, 82.0, 58.0, 27.0, 21.0, 16.0, 4.0, 12.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2579383850097656, -0.24683380126953125, -0.23572921752929688, -0.2246246337890625, -0.21352005004882812, -0.20241546630859375, -0.19131088256835938, -0.180206298828125, -0.16910171508789062, -0.15799713134765625, -0.14689254760742188, -0.1357879638671875, -0.12468338012695312, -0.11357879638671875, -0.10247421264648438, -0.09136962890625, -0.08026504516601562, -0.06916046142578125, -0.058055877685546875, -0.0469512939453125, -0.035846710205078125, -0.02474212646484375, -0.013637542724609375, -0.002532958984375, 0.008571624755859375, 0.01967620849609375, 0.030780792236328125, 0.0418853759765625, 0.052989959716796875, 0.06409454345703125, 0.07519912719726562, 0.0863037109375, 0.09740829467773438, 0.10851287841796875, 0.11961746215820312, 0.1307220458984375, 0.14182662963867188, 0.15293121337890625, 0.16403579711914062, 0.175140380859375, 0.18624496459960938, 0.19734954833984375, 0.20845413208007812, 0.2195587158203125, 0.23066329956054688, 0.24176788330078125, 0.2528724670410156, 0.26397705078125, 0.2750816345214844, 0.28618621826171875, 0.2972908020019531, 0.3083953857421875, 0.3194999694824219, 0.33060455322265625, 0.3417091369628906, 0.352813720703125, 0.3639183044433594, 0.37502288818359375, 0.3861274719238281, 0.3972320556640625, 0.4083366394042969, 0.41944122314453125, 0.4305458068847656, 0.441650390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 8.0, 9.0, 11.0, 7.0, 19.0, 27.0, 40.0, 43.0, 59.0, 48.0, 82.0, 81.0, 92.0, 90.0, 85.0, 64.0, 49.0, 33.0, 24.0, 27.0, 22.0, 12.0, 17.0, 8.0, 6.0, 3.0, 5.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1312255859375, -0.1267852783203125, -0.122344970703125, -0.1179046630859375, -0.11346435546875, -0.1090240478515625, -0.104583740234375, -0.1001434326171875, -0.095703125, -0.0912628173828125, -0.086822509765625, -0.0823822021484375, -0.07794189453125, -0.0735015869140625, -0.069061279296875, -0.0646209716796875, -0.0601806640625, -0.0557403564453125, -0.051300048828125, -0.0468597412109375, -0.04241943359375, -0.0379791259765625, -0.033538818359375, -0.0290985107421875, -0.024658203125, -0.0202178955078125, -0.015777587890625, -0.0113372802734375, -0.00689697265625, -0.0024566650390625, 0.001983642578125, 0.0064239501953125, 0.0108642578125, 0.0153045654296875, 0.019744873046875, 0.0241851806640625, 0.02862548828125, 0.0330657958984375, 0.037506103515625, 0.0419464111328125, 0.04638671875, 0.0508270263671875, 0.055267333984375, 0.0597076416015625, 0.06414794921875, 0.0685882568359375, 0.073028564453125, 0.0774688720703125, 0.0819091796875, 0.0863494873046875, 0.090789794921875, 0.0952301025390625, 0.09967041015625, 0.1041107177734375, 0.108551025390625, 0.1129913330078125, 0.117431640625, 0.1218719482421875, 0.126312255859375, 0.1307525634765625, 0.13519287109375, 0.1396331787109375, 0.144073486328125, 0.1485137939453125, 0.1529541015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 6.0, 18.0, 18.0, 42.0, 90.0, 149.0, 150.0, 162.0, 126.0, 91.0, 54.0, 32.0, 17.0, 15.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.038255214691162, -2.9267897605895996, -2.815324306488037, -2.7038588523864746, -2.592393398284912, -2.4809279441833496, -2.369462490081787, -2.2579967975616455, -2.146531343460083, -2.0350658893585205, -1.923600435256958, -1.8121349811553955, -1.7006694078445435, -1.589203953742981, -1.4777384996414185, -1.3662729263305664, -1.2548075914382935, -1.143342137336731, -1.0318766832351685, -0.9204111695289612, -0.8089456558227539, -0.6974802017211914, -0.5860147476196289, -0.47454923391342163, -0.36308377981185913, -0.25161829590797424, -0.14015282690525055, -0.028687357902526855, 0.08277812600135803, 0.19424360990524292, 0.3057090640068054, 0.4171745777130127, 0.5286400318145752, 0.6401054859161377, 0.751570999622345, 0.8630364537239075, 0.9745019674301147, 1.0859674215316772, 1.1974328756332397, 1.3088984489440918, 1.4203639030456543, 1.5318293571472168, 1.6432948112487793, 1.7547602653503418, 1.8662258386611938, 1.9776912927627563, 2.0891566276550293, 2.200622320175171, 2.3120875358581543, 2.423552989959717, 2.5350184440612793, 2.646483898162842, 2.7579493522644043, 2.869414806365967, 2.9808802604675293, 3.092345952987671, 3.2038114070892334, 3.315276861190796, 3.4267423152923584, 3.538207769393921, 3.6496732234954834, 3.761138916015625, 3.8726043701171875, 3.98406982421875, 4.0955352783203125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 4.0, 13.0, 13.0, 11.0, 16.0, 20.0, 25.0, 24.0, 29.0, 41.0, 43.0, 51.0, 48.0, 66.0, 67.0, 75.0, 45.0, 50.0, 52.0, 44.0, 34.0, 44.0, 36.0, 27.0, 24.0, 19.0, 24.0, 11.0, 12.0, 5.0, 5.0, 2.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.997396945953369, -2.919171094894409, -2.840945243835449, -2.76271915435791, -2.68449330329895, -2.6062674522399902, -2.5280416011810303, -2.4498157501220703, -2.3715898990631104, -2.2933640480041504, -2.2151381969451904, -2.1369123458862305, -2.0586862564086914, -1.9804604053497314, -1.9022345542907715, -1.8240087032318115, -1.745782732963562, -1.667556881904602, -1.5893309116363525, -1.5111050605773926, -1.4328792095184326, -1.3546533584594727, -1.2764273881912231, -1.1982015371322632, -1.1199755668640137, -1.0417497158050537, -0.963523805141449, -0.8852978944778442, -0.8070720434188843, -0.7288461327552795, -0.6506202220916748, -0.5723943710327148, -0.4941685199737549, -0.41594263911247253, -0.3377167582511902, -0.25949084758758545, -0.1812649667263031, -0.10303908586502075, -0.024813175201416016, 0.053412675857543945, 0.13163858652114868, 0.20986446738243103, 0.2880903482437134, 0.3663162589073181, 0.44454213976860046, 0.5227680206298828, 0.6009939312934875, 0.6792197823524475, 0.7574456930160522, 0.835671603679657, 0.9138974547386169, 0.9921233654022217, 1.0703492164611816, 1.1485750675201416, 1.2268010377883911, 1.305026888847351, 1.3832528591156006, 1.4614787101745605, 1.53970468044281, 1.61793053150177, 1.69615638256073, 1.7743823528289795, 1.8526082038879395, 1.9308340549468994, 2.0090599060058594]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 4.0, 10.0, 3.0, 4.0, 11.0, 21.0, 20.0, 25.0, 37.0, 42.0, 57.0, 100.0, 128.0, 184.0, 242.0, 394.0, 776.0, 1562.0, 3587.0, 10641.0, 46307.0, 701743.0, 3325839.0, 77429.0, 15901.0, 5036.0, 1975.0, 932.0, 487.0, 307.0, 156.0, 116.0, 66.0, 49.0, 28.0, 24.0, 13.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.3681640625, -1.33489990234375, -1.3016357421875, -1.26837158203125, -1.235107421875, -1.20184326171875, -1.1685791015625, -1.13531494140625, -1.10205078125, -1.06878662109375, -1.0355224609375, -1.00225830078125, -0.968994140625, -0.93572998046875, -0.9024658203125, -0.86920166015625, -0.8359375, -0.80267333984375, -0.7694091796875, -0.73614501953125, -0.702880859375, -0.66961669921875, -0.6363525390625, -0.60308837890625, -0.56982421875, -0.53656005859375, -0.5032958984375, -0.47003173828125, -0.436767578125, -0.40350341796875, -0.3702392578125, -0.33697509765625, -0.3037109375, -0.27044677734375, -0.2371826171875, -0.20391845703125, -0.170654296875, -0.13739013671875, -0.1041259765625, -0.07086181640625, -0.03759765625, -0.00433349609375, 0.0289306640625, 0.06219482421875, 0.095458984375, 0.12872314453125, 0.1619873046875, 0.19525146484375, 0.228515625, 0.26177978515625, 0.2950439453125, 0.32830810546875, 0.361572265625, 0.39483642578125, 0.4281005859375, 0.46136474609375, 0.49462890625, 0.52789306640625, 0.5611572265625, 0.59442138671875, 0.627685546875, 0.66094970703125, 0.6942138671875, 0.72747802734375, 0.7607421875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 14.0, 24.0, 26.0, 32.0, 47.0, 54.0, 68.0, 80.0, 87.0, 100.0, 83.0, 88.0, 63.0, 53.0, 54.0, 42.0, 24.0, 14.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.148193359375, -0.14391517639160156, -0.13963699340820312, -0.1353588104248047, -0.13108062744140625, -0.1268024444580078, -0.12252426147460938, -0.11824607849121094, -0.1139678955078125, -0.10968971252441406, -0.10541152954101562, -0.10113334655761719, -0.09685516357421875, -0.09257698059082031, -0.08829879760742188, -0.08402061462402344, -0.079742431640625, -0.07546424865722656, -0.07118606567382812, -0.06690788269042969, -0.06262969970703125, -0.05835151672363281, -0.054073333740234375, -0.04979515075683594, -0.0455169677734375, -0.04123878479003906, -0.036960601806640625, -0.03268241882324219, -0.02840423583984375, -0.024126052856445312, -0.019847869873046875, -0.015569686889648438, -0.01129150390625, -0.0070133209228515625, -0.002735137939453125, 0.0015430450439453125, 0.00582122802734375, 0.010099411010742188, 0.014377593994140625, 0.018655776977539062, 0.0229339599609375, 0.027212142944335938, 0.031490325927734375, 0.03576850891113281, 0.04004669189453125, 0.04432487487792969, 0.048603057861328125, 0.05288124084472656, 0.057159423828125, 0.06143760681152344, 0.06571578979492188, 0.06999397277832031, 0.07427215576171875, 0.07855033874511719, 0.08282852172851562, 0.08710670471191406, 0.0913848876953125, 0.09566307067871094, 0.09994125366210938, 0.10421943664550781, 0.10849761962890625, 0.11277580261230469, 0.11705398559570312, 0.12133216857910156, 0.1256103515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 7.0, 16.0, 13.0, 26.0, 41.0, 38.0, 69.0, 82.0, 101.0, 199.0, 337.0, 866.0, 2881.0, 22010.0, 4099753.0, 61964.0, 3762.0, 906.0, 408.0, 215.0, 141.0, 109.0, 69.0, 57.0, 49.0, 31.0, 30.0, 12.0, 16.0, 11.0, 10.0, 9.0, 8.0, 3.0, 3.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.796875, -2.711181640625, -2.62548828125, -2.539794921875, -2.4541015625, -2.368408203125, -2.28271484375, -2.197021484375, -2.111328125, -2.025634765625, -1.93994140625, -1.854248046875, -1.7685546875, -1.682861328125, -1.59716796875, -1.511474609375, -1.42578125, -1.340087890625, -1.25439453125, -1.168701171875, -1.0830078125, -0.997314453125, -0.91162109375, -0.825927734375, -0.740234375, -0.654541015625, -0.56884765625, -0.483154296875, -0.3974609375, -0.311767578125, -0.22607421875, -0.140380859375, -0.0546875, 0.031005859375, 0.11669921875, 0.202392578125, 0.2880859375, 0.373779296875, 0.45947265625, 0.545166015625, 0.630859375, 0.716552734375, 0.80224609375, 0.887939453125, 0.9736328125, 1.059326171875, 1.14501953125, 1.230712890625, 1.31640625, 1.402099609375, 1.48779296875, 1.573486328125, 1.6591796875, 1.744873046875, 1.83056640625, 1.916259765625, 2.001953125, 2.087646484375, 2.17333984375, 2.259033203125, 2.3447265625, 2.430419921875, 2.51611328125, 2.601806640625, 2.6875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 8.0, 14.0, 35.0, 104.0, 679.0, 2824.0, 318.0, 63.0, 20.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64697265625, -0.6165847778320312, -0.5861968994140625, -0.5558090209960938, -0.525421142578125, -0.49503326416015625, -0.4646453857421875, -0.43425750732421875, -0.40386962890625, -0.37348175048828125, -0.3430938720703125, -0.31270599365234375, -0.282318115234375, -0.25193023681640625, -0.2215423583984375, -0.19115447998046875, -0.1607666015625, -0.13037872314453125, -0.0999908447265625, -0.06960296630859375, -0.039215087890625, -0.00882720947265625, 0.0215606689453125, 0.05194854736328125, 0.08233642578125, 0.11272430419921875, 0.1431121826171875, 0.17350006103515625, 0.203887939453125, 0.23427581787109375, 0.2646636962890625, 0.29505157470703125, 0.325439453125, 0.35582733154296875, 0.3862152099609375, 0.41660308837890625, 0.446990966796875, 0.47737884521484375, 0.5077667236328125, 0.5381546020507812, 0.56854248046875, 0.5989303588867188, 0.6293182373046875, 0.6597061157226562, 0.690093994140625, 0.7204818725585938, 0.7508697509765625, 0.7812576293945312, 0.8116455078125, 0.8420333862304688, 0.8724212646484375, 0.9028091430664062, 0.933197021484375, 0.9635848999023438, 0.9939727783203125, 1.0243606567382812, 1.05474853515625, 1.0851364135742188, 1.1155242919921875, 1.1459121704101562, 1.176300048828125, 1.2066879272460938, 1.2370758056640625, 1.2674636840820312, 1.2978515625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 10.0, 16.0, 66.0, 165.0, 294.0, 263.0, 99.0, 45.0, 13.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.0675811767578125, -5.928643226623535, -5.7897047996521, -5.650766849517822, -5.511828422546387, -5.372890472412109, -5.233952045440674, -5.0950140953063965, -4.956075668334961, -4.817137718200684, -4.678199291229248, -4.539261341094971, -4.400322914123535, -4.261384963989258, -4.122446537017822, -3.983508586883545, -3.8445706367492676, -3.705632448196411, -3.5666942596435547, -3.4277560710906982, -3.288817882537842, -3.1498799324035645, -3.010941743850708, -2.8720035552978516, -2.733065366744995, -2.5941271781921387, -2.4551889896392822, -2.316250801086426, -2.1773128509521484, -2.038374423980713, -1.8994364738464355, -1.760498285293579, -1.6215603351593018, -1.4826221466064453, -1.3436839580535889, -1.204745888710022, -1.0658077001571655, -0.9268695116043091, -0.7879313826560974, -0.6489932537078857, -0.5100550651550293, -0.37111690640449524, -0.23217874765396118, -0.09324058890342712, 0.045697569847106934, 0.18463575839996338, 0.32357388734817505, 0.4625120162963867, 0.6014502048492432, 0.7403883934020996, 0.8793265223503113, 1.018264651298523, 1.1572028398513794, 1.2961410284042358, 1.4350790977478027, 1.5740172863006592, 1.7129554748535156, 1.851893663406372, 1.9908318519592285, 2.129770040512085, 2.2687082290649414, 2.4076461791992188, 2.546584367752075, 2.6855225563049316, 2.824460744857788]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 13.0, 25.0, 28.0, 22.0, 39.0, 37.0, 42.0, 52.0, 67.0, 56.0, 78.0, 76.0, 67.0, 68.0, 54.0, 50.0, 39.0, 33.0, 31.0, 15.0, 14.0, 14.0, 14.0, 13.0, 11.0, 7.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5844693183898926, -1.5345063209533691, -1.4845434427261353, -1.4345804452896118, -1.3846174478530884, -1.3346545696258545, -1.284691572189331, -1.2347285747528076, -1.1847655773162842, -1.1348025798797607, -1.0848397016525269, -1.0348767042160034, -0.98491370677948, -0.9349507689476013, -0.8849878311157227, -0.8350248336791992, -0.7850619554519653, -0.7350990176200867, -0.6851360201835632, -0.6351730823516846, -0.5852100849151611, -0.5352471470832825, -0.4852842092514038, -0.43532124161720276, -0.3853582739830017, -0.33539530634880066, -0.2854323387145996, -0.23546940088272095, -0.1855064332485199, -0.13554346561431885, -0.08558052778244019, -0.035617560148239136, 0.014345407485961914, 0.06430836766958237, 0.11427132785320282, 0.16423428058624268, 0.21419724822044373, 0.2641602158546448, 0.31412315368652344, 0.3640861213207245, 0.41404908895492554, 0.4640120565891266, 0.5139750242233276, 0.5639379620552063, 0.613900899887085, 0.6638638973236084, 0.7138268351554871, 0.7637897729873657, 0.8137527704238892, 0.8637157082557678, 0.9136787056922913, 0.9636416435241699, 1.0136046409606934, 1.0635676383972168, 1.1135305166244507, 1.1634935140609741, 1.213456392288208, 1.2634193897247314, 1.3133822679519653, 1.3633452653884888, 1.4133082628250122, 1.463271141052246, 1.5132341384887695, 1.563197135925293, 1.6131601333618164]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 15.0, 6.0, 17.0, 23.0, 46.0, 48.0, 64.0, 65.0, 102.0, 146.0, 234.0, 297.0, 457.0, 683.0, 975.0, 1597.0, 2796.0, 5607.0, 13141.0, 41889.0, 170146.0, 479220.0, 240897.0, 57614.0, 17085.0, 6778.0, 3233.0, 1884.0, 1024.0, 765.0, 476.0, 350.0, 222.0, 177.0, 121.0, 90.0, 58.0, 52.0, 37.0, 32.0, 15.0, 18.0, 8.0, 5.0, 4.0, 11.0, 5.0, 2.0, 1.0, 4.0, 1.0], "bins": [-0.654296875, -0.6353988647460938, -0.6165008544921875, -0.5976028442382812, -0.578704833984375, -0.5598068237304688, -0.5409088134765625, -0.5220108032226562, -0.50311279296875, -0.48421478271484375, -0.4653167724609375, -0.44641876220703125, -0.427520751953125, -0.40862274169921875, -0.3897247314453125, -0.37082672119140625, -0.3519287109375, -0.33303070068359375, -0.3141326904296875, -0.29523468017578125, -0.276336669921875, -0.25743865966796875, -0.2385406494140625, -0.21964263916015625, -0.20074462890625, -0.18184661865234375, -0.1629486083984375, -0.14405059814453125, -0.125152587890625, -0.10625457763671875, -0.0873565673828125, -0.06845855712890625, -0.049560546875, -0.03066253662109375, -0.0117645263671875, 0.00713348388671875, 0.026031494140625, 0.04492950439453125, 0.0638275146484375, 0.08272552490234375, 0.10162353515625, 0.12052154541015625, 0.1394195556640625, 0.15831756591796875, 0.177215576171875, 0.19611358642578125, 0.2150115966796875, 0.23390960693359375, 0.2528076171875, 0.27170562744140625, 0.2906036376953125, 0.30950164794921875, 0.328399658203125, 0.34729766845703125, 0.3661956787109375, 0.38509368896484375, 0.40399169921875, 0.42288970947265625, 0.4417877197265625, 0.46068572998046875, 0.479583740234375, 0.49848175048828125, 0.5173797607421875, 0.5362777709960938, 0.55517578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 13.0, 31.0, 31.0, 43.0, 73.0, 83.0, 95.0, 126.0, 117.0, 113.0, 82.0, 55.0, 46.0, 28.0, 12.0, 8.0, 10.0, 3.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.223388671875, -0.217315673828125, -0.21124267578125, -0.205169677734375, -0.1990966796875, -0.193023681640625, -0.18695068359375, -0.180877685546875, -0.1748046875, -0.168731689453125, -0.16265869140625, -0.156585693359375, -0.1505126953125, -0.144439697265625, -0.13836669921875, -0.132293701171875, -0.126220703125, -0.120147705078125, -0.11407470703125, -0.108001708984375, -0.1019287109375, -0.095855712890625, -0.08978271484375, -0.083709716796875, -0.07763671875, -0.071563720703125, -0.06549072265625, -0.059417724609375, -0.0533447265625, -0.047271728515625, -0.04119873046875, -0.035125732421875, -0.029052734375, -0.022979736328125, -0.01690673828125, -0.010833740234375, -0.0047607421875, 0.001312255859375, 0.00738525390625, 0.013458251953125, 0.01953125, 0.025604248046875, 0.03167724609375, 0.037750244140625, 0.0438232421875, 0.049896240234375, 0.05596923828125, 0.062042236328125, 0.068115234375, 0.074188232421875, 0.08026123046875, 0.086334228515625, 0.0924072265625, 0.098480224609375, 0.10455322265625, 0.110626220703125, 0.11669921875, 0.122772216796875, 0.12884521484375, 0.134918212890625, 0.1409912109375, 0.147064208984375, 0.15313720703125, 0.159210205078125, 0.165283203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 8.0, 12.0, 18.0, 17.0, 30.0, 36.0, 51.0, 97.0, 126.0, 232.0, 379.0, 783.0, 1748.0, 4679.0, 15188.0, 55436.0, 224157.0, 478543.0, 197401.0, 48876.0, 13146.0, 4232.0, 1679.0, 733.0, 357.0, 226.0, 106.0, 64.0, 48.0, 42.0, 24.0, 20.0, 16.0, 9.0, 9.0, 8.0, 5.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.399993896484375, -0.38641357421875, -0.372833251953125, -0.3592529296875, -0.345672607421875, -0.33209228515625, -0.318511962890625, -0.304931640625, -0.291351318359375, -0.27777099609375, -0.264190673828125, -0.2506103515625, -0.237030029296875, -0.22344970703125, -0.209869384765625, -0.1962890625, -0.182708740234375, -0.16912841796875, -0.155548095703125, -0.1419677734375, -0.128387451171875, -0.11480712890625, -0.101226806640625, -0.087646484375, -0.074066162109375, -0.06048583984375, -0.046905517578125, -0.0333251953125, -0.019744873046875, -0.00616455078125, 0.007415771484375, 0.02099609375, 0.034576416015625, 0.04815673828125, 0.061737060546875, 0.0753173828125, 0.088897705078125, 0.10247802734375, 0.116058349609375, 0.129638671875, 0.143218994140625, 0.15679931640625, 0.170379638671875, 0.1839599609375, 0.197540283203125, 0.21112060546875, 0.224700927734375, 0.23828125, 0.251861572265625, 0.26544189453125, 0.279022216796875, 0.2926025390625, 0.306182861328125, 0.31976318359375, 0.333343505859375, 0.346923828125, 0.360504150390625, 0.37408447265625, 0.387664794921875, 0.4012451171875, 0.414825439453125, 0.42840576171875, 0.441986083984375, 0.45556640625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 6.0, 3.0, 8.0, 13.0, 9.0, 14.0, 13.0, 17.0, 12.0, 24.0, 21.0, 20.0, 22.0, 34.0, 38.0, 36.0, 40.0, 46.0, 39.0, 40.0, 57.0, 45.0, 43.0, 37.0, 35.0, 39.0, 37.0, 48.0, 31.0, 33.0, 26.0, 10.0, 18.0, 11.0, 10.0, 14.0, 10.0, 7.0, 7.0, 4.0, 8.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.2774620056152344, -0.26732635498046875, -0.2571907043457031, -0.2470550537109375, -0.23691940307617188, -0.22678375244140625, -0.21664810180664062, -0.206512451171875, -0.19637680053710938, -0.18624114990234375, -0.17610549926757812, -0.1659698486328125, -0.15583419799804688, -0.14569854736328125, -0.13556289672851562, -0.12542724609375, -0.11529159545898438, -0.10515594482421875, -0.09502029418945312, -0.0848846435546875, -0.07474899291992188, -0.06461334228515625, -0.054477691650390625, -0.044342041015625, -0.034206390380859375, -0.02407073974609375, -0.013935089111328125, -0.0037994384765625, 0.006336212158203125, 0.01647186279296875, 0.026607513427734375, 0.0367431640625, 0.046878814697265625, 0.05701446533203125, 0.06715011596679688, 0.0772857666015625, 0.08742141723632812, 0.09755706787109375, 0.10769271850585938, 0.117828369140625, 0.12796401977539062, 0.13809967041015625, 0.14823532104492188, 0.1583709716796875, 0.16850662231445312, 0.17864227294921875, 0.18877792358398438, 0.19891357421875, 0.20904922485351562, 0.21918487548828125, 0.22932052612304688, 0.2394561767578125, 0.24959182739257812, 0.25972747802734375, 0.2698631286621094, 0.279998779296875, 0.2901344299316406, 0.30027008056640625, 0.3104057312011719, 0.3205413818359375, 0.3306770324707031, 0.34081268310546875, 0.3509483337402344, 0.361083984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 5.0, 5.0, 4.0, 14.0, 16.0, 22.0, 41.0, 53.0, 95.0, 197.0, 365.0, 811.0, 1965.0, 5590.0, 19272.0, 100785.0, 642828.0, 228688.0, 34061.0, 8673.0, 2898.0, 1088.0, 490.0, 249.0, 145.0, 68.0, 46.0, 30.0, 14.0, 13.0, 5.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3447265625, -0.3347892761230469, -0.32485198974609375, -0.3149147033691406, -0.3049774169921875, -0.2950401306152344, -0.28510284423828125, -0.2751655578613281, -0.265228271484375, -0.2552909851074219, -0.24535369873046875, -0.23541641235351562, -0.2254791259765625, -0.21554183959960938, -0.20560455322265625, -0.19566726684570312, -0.18572998046875, -0.17579269409179688, -0.16585540771484375, -0.15591812133789062, -0.1459808349609375, -0.13604354858398438, -0.12610626220703125, -0.11616897583007812, -0.106231689453125, -0.09629440307617188, -0.08635711669921875, -0.07641983032226562, -0.0664825439453125, -0.056545257568359375, -0.04660797119140625, -0.036670684814453125, -0.0267333984375, -0.016796112060546875, -0.00685882568359375, 0.003078460693359375, 0.0130157470703125, 0.022953033447265625, 0.03289031982421875, 0.042827606201171875, 0.052764892578125, 0.06270217895507812, 0.07263946533203125, 0.08257675170898438, 0.0925140380859375, 0.10245132446289062, 0.11238861083984375, 0.12232589721679688, 0.13226318359375, 0.14220046997070312, 0.15213775634765625, 0.16207504272460938, 0.1720123291015625, 0.18194961547851562, 0.19188690185546875, 0.20182418823242188, 0.211761474609375, 0.22169876098632812, 0.23163604736328125, 0.24157333374023438, 0.2515106201171875, 0.2614479064941406, 0.27138519287109375, 0.2813224792480469, 0.291259765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 10.0, 11.0, 16.0, 23.0, 39.0, 32.0, 66.0, 67.0, 95.0, 126.0, 120.0, 104.0, 72.0, 56.0, 42.0, 31.0, 22.0, 16.0, 12.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171796798706055e-05, -7.890630513429642e-05, -7.609464228153229e-05, -7.328297942876816e-05, -7.047131657600403e-05, -6.76596537232399e-05, -6.484799087047577e-05, -6.203632801771164e-05, -5.922466516494751e-05, -5.641300231218338e-05, -5.360133945941925e-05, -5.078967660665512e-05, -4.797801375389099e-05, -4.516635090112686e-05, -4.235468804836273e-05, -3.95430251955986e-05, -3.673136234283447e-05, -3.391969949007034e-05, -3.110803663730621e-05, -2.8296373784542084e-05, -2.5484710931777954e-05, -2.2673048079013824e-05, -1.9861385226249695e-05, -1.7049722373485565e-05, -1.4238059520721436e-05, -1.1426396667957306e-05, -8.614733815193176e-06, -5.803070962429047e-06, -2.991408109664917e-06, -1.7974525690078735e-07, 2.6319175958633423e-06, 5.443580448627472e-06, 8.255243301391602e-06, 1.1066906154155731e-05, 1.387856900691986e-05, 1.669023185968399e-05, 1.950189471244812e-05, 2.231355756521225e-05, 2.512522041797638e-05, 2.793688327074051e-05, 3.074854612350464e-05, 3.356020897626877e-05, 3.63718718290329e-05, 3.918353468179703e-05, 4.199519753456116e-05, 4.480686038732529e-05, 4.7618523240089417e-05, 5.0430186092853546e-05, 5.3241848945617676e-05, 5.6053511798381805e-05, 5.8865174651145935e-05, 6.167683750391006e-05, 6.44885003566742e-05, 6.730016320943832e-05, 7.011182606220245e-05, 7.292348891496658e-05, 7.573515176773071e-05, 7.854681462049484e-05, 8.135847747325897e-05, 8.41701403260231e-05, 8.698180317878723e-05, 8.979346603155136e-05, 9.260512888431549e-05, 9.541679173707962e-05, 9.822845458984375e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 16.0, 16.0, 32.0, 60.0, 86.0, 133.0, 286.0, 684.0, 1489.0, 4428.0, 14838.0, 71256.0, 595927.0, 305539.0, 39146.0, 9489.0, 2951.0, 1178.0, 495.0, 233.0, 105.0, 53.0, 41.0, 25.0, 11.0, 11.0, 10.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41259765625, -0.4016914367675781, -0.39078521728515625, -0.3798789978027344, -0.3689727783203125, -0.3580665588378906, -0.34716033935546875, -0.3362541198730469, -0.325347900390625, -0.3144416809082031, -0.30353546142578125, -0.2926292419433594, -0.2817230224609375, -0.2708168029785156, -0.25991058349609375, -0.24900436401367188, -0.23809814453125, -0.22719192504882812, -0.21628570556640625, -0.20537948608398438, -0.1944732666015625, -0.18356704711914062, -0.17266082763671875, -0.16175460815429688, -0.150848388671875, -0.13994216918945312, -0.12903594970703125, -0.11812973022460938, -0.1072235107421875, -0.09631729125976562, -0.08541107177734375, -0.07450485229492188, -0.0635986328125, -0.052692413330078125, -0.04178619384765625, -0.030879974365234375, -0.0199737548828125, -0.009067535400390625, 0.00183868408203125, 0.012744903564453125, 0.023651123046875, 0.034557342529296875, 0.04546356201171875, 0.056369781494140625, 0.0672760009765625, 0.07818222045898438, 0.08908843994140625, 0.09999465942382812, 0.11090087890625, 0.12180709838867188, 0.13271331787109375, 0.14361953735351562, 0.1545257568359375, 0.16543197631835938, 0.17633819580078125, 0.18724441528320312, 0.198150634765625, 0.20905685424804688, 0.21996307373046875, 0.23086929321289062, 0.2417755126953125, 0.2526817321777344, 0.26358795166015625, 0.2744941711425781, 0.285400390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 7.0, 4.0, 7.0, 8.0, 4.0, 7.0, 7.0, 10.0, 18.0, 19.0, 18.0, 23.0, 41.0, 46.0, 51.0, 70.0, 77.0, 84.0, 79.0, 68.0, 68.0, 47.0, 42.0, 38.0, 23.0, 32.0, 25.0, 14.0, 9.0, 12.0, 7.0, 10.0, 4.0, 4.0, 7.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1729736328125, -0.1678619384765625, -0.162750244140625, -0.1576385498046875, -0.15252685546875, -0.1474151611328125, -0.142303466796875, -0.1371917724609375, -0.132080078125, -0.1269683837890625, -0.121856689453125, -0.1167449951171875, -0.11163330078125, -0.1065216064453125, -0.101409912109375, -0.0962982177734375, -0.0911865234375, -0.0860748291015625, -0.080963134765625, -0.0758514404296875, -0.07073974609375, -0.0656280517578125, -0.060516357421875, -0.0554046630859375, -0.05029296875, -0.0451812744140625, -0.040069580078125, -0.0349578857421875, -0.02984619140625, -0.0247344970703125, -0.019622802734375, -0.0145111083984375, -0.0093994140625, -0.0042877197265625, 0.000823974609375, 0.0059356689453125, 0.01104736328125, 0.0161590576171875, 0.021270751953125, 0.0263824462890625, 0.031494140625, 0.0366058349609375, 0.041717529296875, 0.0468292236328125, 0.05194091796875, 0.0570526123046875, 0.062164306640625, 0.0672760009765625, 0.0723876953125, 0.0774993896484375, 0.082611083984375, 0.0877227783203125, 0.09283447265625, 0.0979461669921875, 0.103057861328125, 0.1081695556640625, 0.11328125, 0.1183929443359375, 0.123504638671875, 0.1286163330078125, 0.13372802734375, 0.1388397216796875, 0.143951416015625, 0.1490631103515625, 0.1541748046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 22.0, 52.0, 86.0, 180.0, 219.0, 186.0, 132.0, 63.0, 24.0, 22.0, 9.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.021912097930908, -5.873057842254639, -5.724203586578369, -5.575348854064941, -5.426494598388672, -5.277640342712402, -5.128786087036133, -4.979931831359863, -4.831077575683594, -4.682223320007324, -4.533369064331055, -4.384514331817627, -4.235660076141357, -4.086805820465088, -3.9379515647888184, -3.789097309112549, -3.640242576599121, -3.4913883209228516, -3.342533826828003, -3.1936795711517334, -3.0448250770568848, -2.8959708213806152, -2.7471165657043457, -2.598262310028076, -2.4494078159332275, -2.300553560256958, -2.1516990661621094, -2.00284481048584, -1.8539904356002808, -1.7051360607147217, -1.5562818050384521, -1.407427430152893, -1.2585735321044922, -1.109719157218933, -0.9608648419380188, -0.8120105266571045, -0.6631561517715454, -0.5143017768859863, -0.365447461605072, -0.21659314632415771, -0.06773877143859863, 0.08111557364463806, 0.22996991872787476, 0.37882426381111145, 0.5276786088943481, 0.6765329837799072, 0.8253872990608215, 0.9742416143417358, 1.123095989227295, 1.271950364112854, 1.420804738998413, 1.5696589946746826, 1.7185133695602417, 1.8673677444458008, 2.0162220001220703, 2.16507625579834, 2.3139307498931885, 2.462785005569458, 2.6116394996643066, 2.760493755340576, 2.9093480110168457, 3.0582025051116943, 3.207056760787964, 3.3559112548828125, 3.504765510559082]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 5.0, 9.0, 5.0, 8.0, 10.0, 17.0, 15.0, 15.0, 21.0, 20.0, 33.0, 37.0, 29.0, 30.0, 39.0, 43.0, 48.0, 48.0, 33.0, 53.0, 37.0, 44.0, 50.0, 40.0, 39.0, 29.0, 25.0, 24.0, 25.0, 19.0, 19.0, 17.0, 20.0, 16.0, 9.0, 13.0, 16.0, 9.0, 8.0, 7.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.0773415565490723, -2.0180912017822266, -1.9588409662246704, -1.8995906114578247, -1.840340256690979, -1.7810900211334229, -1.7218396663665771, -1.6625893115997314, -1.6033389568328857, -1.54408860206604, -1.4848383665084839, -1.4255880117416382, -1.3663376569747925, -1.3070874214172363, -1.2478370666503906, -1.188586711883545, -1.1293364763259888, -1.070086121559143, -1.010835886001587, -0.9515855312347412, -0.8923351764678955, -0.8330848813056946, -0.7738345861434937, -0.714584231376648, -0.655333936214447, -0.5960836410522461, -0.5368332862854004, -0.47758299112319946, -0.41833266615867615, -0.35908234119415283, -0.2998320460319519, -0.2405817210674286, -0.18133139610290527, -0.12208107858896255, -0.06283076107501984, -0.003580451011657715, 0.0556698739528656, 0.11492019891738892, 0.17417049407958984, 0.23342081904411316, 0.2926711440086365, 0.3519214689731598, 0.4111717939376831, 0.47042208909988403, 0.529672384262085, 0.5889227390289307, 0.6481730341911316, 0.7074233293533325, 0.7666736841201782, 0.8259239792823792, 0.8851743340492249, 0.9444246292114258, 1.0036749839782715, 1.0629253387451172, 1.1221755743026733, 1.181425929069519, 1.2406761646270752, 1.299926519393921, 1.359176754951477, 1.4184271097183228, 1.4776774644851685, 1.5369277000427246, 1.5961780548095703, 1.655428409576416, 1.7146787643432617]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 17.0, 13.0, 15.0, 16.0, 26.0, 34.0, 52.0, 62.0, 103.0, 128.0, 199.0, 307.0, 500.0, 937.0, 1714.0, 4156.0, 12997.0, 79860.0, 3873505.0, 187265.0, 21336.0, 6079.0, 2345.0, 1127.0, 601.0, 314.0, 157.0, 107.0, 83.0, 55.0, 31.0, 29.0, 25.0, 15.0, 12.0, 13.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.041015625, -1.0109710693359375, -0.980926513671875, -0.9508819580078125, -0.92083740234375, -0.8907928466796875, -0.860748291015625, -0.8307037353515625, -0.8006591796875, -0.7706146240234375, -0.740570068359375, -0.7105255126953125, -0.68048095703125, -0.6504364013671875, -0.620391845703125, -0.5903472900390625, -0.560302734375, -0.5302581787109375, -0.500213623046875, -0.4701690673828125, -0.44012451171875, -0.4100799560546875, -0.380035400390625, -0.3499908447265625, -0.3199462890625, -0.2899017333984375, -0.259857177734375, -0.2298126220703125, -0.19976806640625, -0.1697235107421875, -0.139678955078125, -0.1096343994140625, -0.07958984375, -0.0495452880859375, -0.019500732421875, 0.0105438232421875, 0.04058837890625, 0.0706329345703125, 0.100677490234375, 0.1307220458984375, 0.1607666015625, 0.1908111572265625, 0.220855712890625, 0.2509002685546875, 0.28094482421875, 0.3109893798828125, 0.341033935546875, 0.3710784912109375, 0.401123046875, 0.4311676025390625, 0.461212158203125, 0.4912567138671875, 0.52130126953125, 0.5513458251953125, 0.581390380859375, 0.6114349365234375, 0.6414794921875, 0.6715240478515625, 0.701568603515625, 0.7316131591796875, 0.76165771484375, 0.7917022705078125, 0.821746826171875, 0.8517913818359375, 0.8818359375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 4.0, 7.0, 3.0, 16.0, 12.0, 28.0, 44.0, 46.0, 72.0, 110.0, 99.0, 98.0, 104.0, 86.0, 77.0, 71.0, 46.0, 26.0, 14.0, 8.0, 6.0, 7.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.215087890625, -0.2092113494873047, -0.20333480834960938, -0.19745826721191406, -0.19158172607421875, -0.18570518493652344, -0.17982864379882812, -0.1739521026611328, -0.1680755615234375, -0.1621990203857422, -0.15632247924804688, -0.15044593811035156, -0.14456939697265625, -0.13869285583496094, -0.13281631469726562, -0.1269397735595703, -0.121063232421875, -0.11518669128417969, -0.10931015014648438, -0.10343360900878906, -0.09755706787109375, -0.09168052673339844, -0.08580398559570312, -0.07992744445800781, -0.0740509033203125, -0.06817436218261719, -0.062297821044921875, -0.05642127990722656, -0.05054473876953125, -0.04466819763183594, -0.038791656494140625, -0.03291511535644531, -0.02703857421875, -0.021162033081054688, -0.015285491943359375, -0.009408950805664062, -0.00353240966796875, 0.0023441314697265625, 0.008220672607421875, 0.014097213745117188, 0.0199737548828125, 0.025850296020507812, 0.031726837158203125, 0.03760337829589844, 0.04347991943359375, 0.04935646057128906, 0.055233001708984375, 0.06110954284667969, 0.066986083984375, 0.07286262512207031, 0.07873916625976562, 0.08461570739746094, 0.09049224853515625, 0.09636878967285156, 0.10224533081054688, 0.10812187194824219, 0.1139984130859375, 0.11987495422363281, 0.12575149536132812, 0.13162803649902344, 0.13750457763671875, 0.14338111877441406, 0.14925765991210938, 0.1551342010498047, 0.1610107421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 9.0, 7.0, 12.0, 14.0, 23.0, 25.0, 19.0, 28.0, 42.0, 68.0, 123.0, 289.0, 853.0, 3681.0, 23061.0, 628259.0, 3492849.0, 37733.0, 5142.0, 1163.0, 407.0, 112.0, 72.0, 48.0, 49.0, 34.0, 24.0, 25.0, 18.0, 16.0, 15.0, 15.0, 5.0, 4.0, 9.0, 10.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.16015625, -1.1271133422851562, -1.0940704345703125, -1.0610275268554688, -1.027984619140625, -0.9949417114257812, -0.9618988037109375, -0.9288558959960938, -0.89581298828125, -0.8627700805664062, -0.8297271728515625, -0.7966842651367188, -0.763641357421875, -0.7305984497070312, -0.6975555419921875, -0.6645126342773438, -0.6314697265625, -0.5984268188476562, -0.5653839111328125, -0.5323410034179688, -0.499298095703125, -0.46625518798828125, -0.4332122802734375, -0.40016937255859375, -0.36712646484375, -0.33408355712890625, -0.3010406494140625, -0.26799774169921875, -0.234954833984375, -0.20191192626953125, -0.1688690185546875, -0.13582611083984375, -0.102783203125, -0.06974029541015625, -0.0366973876953125, -0.00365447998046875, 0.029388427734375, 0.06243133544921875, 0.0954742431640625, 0.12851715087890625, 0.16156005859375, 0.19460296630859375, 0.2276458740234375, 0.26068878173828125, 0.293731689453125, 0.32677459716796875, 0.3598175048828125, 0.39286041259765625, 0.4259033203125, 0.45894622802734375, 0.4919891357421875, 0.5250320434570312, 0.558074951171875, 0.5911178588867188, 0.6241607666015625, 0.6572036743164062, 0.69024658203125, 0.7232894897460938, 0.7563323974609375, 0.7893753051757812, 0.822418212890625, 0.8554611206054688, 0.8885040283203125, 0.9215469360351562, 0.95458984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 21.0, 20.0, 46.0, 102.0, 249.0, 1317.0, 1844.0, 253.0, 106.0, 52.0, 32.0, 8.0, 10.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.175537109375, -0.16304397583007812, -0.15055084228515625, -0.13805770874023438, -0.1255645751953125, -0.11307144165039062, -0.10057830810546875, -0.08808517456054688, -0.075592041015625, -0.06309890747070312, -0.05060577392578125, -0.038112640380859375, -0.0256195068359375, -0.013126373291015625, -0.00063323974609375, 0.011859893798828125, 0.02435302734375, 0.036846160888671875, 0.04933929443359375, 0.061832427978515625, 0.0743255615234375, 0.08681869506835938, 0.09931182861328125, 0.11180496215820312, 0.124298095703125, 0.13679122924804688, 0.14928436279296875, 0.16177749633789062, 0.1742706298828125, 0.18676376342773438, 0.19925689697265625, 0.21175003051757812, 0.2242431640625, 0.23673629760742188, 0.24922943115234375, 0.2617225646972656, 0.2742156982421875, 0.2867088317871094, 0.29920196533203125, 0.3116950988769531, 0.324188232421875, 0.3366813659667969, 0.34917449951171875, 0.3616676330566406, 0.3741607666015625, 0.3866539001464844, 0.39914703369140625, 0.4116401672363281, 0.42413330078125, 0.4366264343261719, 0.44911956787109375, 0.4616127014160156, 0.4741058349609375, 0.4865989685058594, 0.49909210205078125, 0.5115852355957031, 0.524078369140625, 0.5365715026855469, 0.5490646362304688, 0.5615577697753906, 0.5740509033203125, 0.5865440368652344, 0.5990371704101562, 0.6115303039550781, 0.6240234375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 3.0, 4.0, 20.0, 34.0, 85.0, 179.0, 236.0, 182.0, 131.0, 60.0, 27.0, 8.0, 10.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3731882572174072, -2.3117642402648926, -2.250340223312378, -2.1889162063598633, -2.1274919509887695, -2.066067934036255, -2.0046439170837402, -1.9432199001312256, -1.881795883178711, -1.8203718662261963, -1.7589478492736816, -1.6975237131118774, -1.6360996961593628, -1.5746756792068481, -1.513251543045044, -1.4518275260925293, -1.3904035091400146, -1.3289794921875, -1.2675554752349854, -1.2061313390731812, -1.1447073221206665, -1.0832833051681519, -1.0218591690063477, -0.960435152053833, -0.8990111351013184, -0.8375871181488037, -0.7761630415916443, -0.7147389650344849, -0.6533149480819702, -0.5918909311294556, -0.5304668545722961, -0.4690428078174591, -0.4076188802719116, -0.3461948335170746, -0.28477078676223755, -0.2233467400074005, -0.16192269325256348, -0.10049864649772644, -0.039074599742889404, 0.022349447011947632, 0.08377349376678467, 0.1451975405216217, 0.20662158727645874, 0.2680456340312958, 0.3294696807861328, 0.39089372754096985, 0.4523177742958069, 0.5137418508529663, 0.575165867805481, 0.6365898847579956, 0.698013961315155, 0.7594380378723145, 0.8208620548248291, 0.8822860717773438, 0.9437101483345032, 1.0051342248916626, 1.0665582418441772, 1.127982258796692, 1.189406394958496, 1.2508304119110107, 1.3122544288635254, 1.37367844581604, 1.4351024627685547, 1.4965265989303589, 1.5579506158828735]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 7.0, 6.0, 20.0, 19.0, 31.0, 38.0, 49.0, 72.0, 70.0, 74.0, 80.0, 72.0, 93.0, 89.0, 58.0, 59.0, 46.0, 31.0, 32.0, 19.0, 11.0, 8.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3341453075408936, -1.2963017225265503, -1.258458137512207, -1.2206144332885742, -1.182770848274231, -1.1449272632598877, -1.1070836782455444, -1.0692400932312012, -1.0313963890075684, -0.9935528039932251, -0.9557091593742371, -0.9178655743598938, -0.8800219297409058, -0.8421783447265625, -0.8043347597122192, -0.7664911150932312, -0.7286475300788879, -0.6908039450645447, -0.6529603004455566, -0.6151167154312134, -0.5772730708122253, -0.5394294857978821, -0.501585841178894, -0.4637422561645508, -0.42589864134788513, -0.3880550265312195, -0.35021141171455383, -0.3123677968978882, -0.2745242118835449, -0.23668058216571808, -0.19883698225021362, -0.16099336743354797, -0.12314975261688232, -0.08530613780021667, -0.04746253043413162, -0.00961892306804657, 0.02822469174861908, 0.06606830656528473, 0.10391190648078918, 0.14175552129745483, 0.17959913611412048, 0.21744275093078613, 0.2552863657474518, 0.29312998056411743, 0.3309735655784607, 0.36881721019744873, 0.406660795211792, 0.44450441002845764, 0.4823480248451233, 0.5201916098594666, 0.5580352544784546, 0.5958788394927979, 0.6337224841117859, 0.6715660691261292, 0.7094097137451172, 0.7472532987594604, 0.7850968837738037, 0.822940468788147, 0.860784113407135, 0.8986276984214783, 0.9364713430404663, 0.9743149280548096, 1.0121585130691528, 1.050002098083496, 1.087845802307129]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 2.0, 6.0, 11.0, 6.0, 12.0, 21.0, 35.0, 46.0, 71.0, 106.0, 170.0, 265.0, 408.0, 674.0, 1124.0, 2062.0, 4698.0, 12620.0, 45812.0, 234993.0, 544810.0, 151321.0, 31689.0, 9486.0, 3751.0, 1806.0, 966.0, 625.0, 336.0, 218.0, 143.0, 87.0, 65.0, 38.0, 20.0, 15.0, 12.0, 5.0, 7.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6908340454101562, -0.6673126220703125, -0.6437911987304688, -0.620269775390625, -0.5967483520507812, -0.5732269287109375, -0.5497055053710938, -0.52618408203125, -0.5026626586914062, -0.4791412353515625, -0.45561981201171875, -0.432098388671875, -0.40857696533203125, -0.3850555419921875, -0.36153411865234375, -0.3380126953125, -0.31449127197265625, -0.2909698486328125, -0.26744842529296875, -0.243927001953125, -0.22040557861328125, -0.1968841552734375, -0.17336273193359375, -0.14984130859375, -0.12631988525390625, -0.1027984619140625, -0.07927703857421875, -0.055755615234375, -0.03223419189453125, -0.0087127685546875, 0.01480865478515625, 0.038330078125, 0.06185150146484375, 0.0853729248046875, 0.10889434814453125, 0.132415771484375, 0.15593719482421875, 0.1794586181640625, 0.20298004150390625, 0.22650146484375, 0.25002288818359375, 0.2735443115234375, 0.29706573486328125, 0.320587158203125, 0.34410858154296875, 0.3676300048828125, 0.39115142822265625, 0.4146728515625, 0.43819427490234375, 0.4617156982421875, 0.48523712158203125, 0.508758544921875, 0.5322799682617188, 0.5558013916015625, 0.5793228149414062, 0.60284423828125, 0.6263656616210938, 0.6498870849609375, 0.6734085083007812, 0.696929931640625, 0.7204513549804688, 0.7439727783203125, 0.7674942016601562, 0.791015625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 7.0, 18.0, 18.0, 26.0, 44.0, 58.0, 78.0, 104.0, 111.0, 102.0, 90.0, 89.0, 75.0, 55.0, 42.0, 21.0, 16.0, 9.0, 8.0, 3.0, 5.0, 1.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.22607421875, -0.21984481811523438, -0.21361541748046875, -0.20738601684570312, -0.2011566162109375, -0.19492721557617188, -0.18869781494140625, -0.18246841430664062, -0.176239013671875, -0.17000961303710938, -0.16378021240234375, -0.15755081176757812, -0.1513214111328125, -0.14509201049804688, -0.13886260986328125, -0.13263320922851562, -0.12640380859375, -0.12017440795898438, -0.11394500732421875, -0.10771560668945312, -0.1014862060546875, -0.09525680541992188, -0.08902740478515625, -0.08279800415039062, -0.076568603515625, -0.07033920288085938, -0.06410980224609375, -0.057880401611328125, -0.0516510009765625, -0.045421600341796875, -0.03919219970703125, -0.032962799072265625, -0.0267333984375, -0.020503997802734375, -0.01427459716796875, -0.008045196533203125, -0.0018157958984375, 0.004413604736328125, 0.01064300537109375, 0.016872406005859375, 0.023101806640625, 0.029331207275390625, 0.03556060791015625, 0.041790008544921875, 0.0480194091796875, 0.054248809814453125, 0.06047821044921875, 0.06670761108398438, 0.07293701171875, 0.07916641235351562, 0.08539581298828125, 0.09162521362304688, 0.0978546142578125, 0.10408401489257812, 0.11031341552734375, 0.11654281616210938, 0.122772216796875, 0.12900161743164062, 0.13523101806640625, 0.14146041870117188, 0.1476898193359375, 0.15391921997070312, 0.16014862060546875, 0.16637802124023438, 0.172607421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 12.0, 6.0, 14.0, 14.0, 20.0, 39.0, 49.0, 87.0, 85.0, 186.0, 298.0, 553.0, 1197.0, 3265.0, 10887.0, 51064.0, 278714.0, 524447.0, 140922.0, 26280.0, 6397.0, 2074.0, 841.0, 447.0, 230.0, 127.0, 88.0, 51.0, 29.0, 30.0, 26.0, 22.0, 16.0, 10.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54638671875, -0.528350830078125, -0.51031494140625, -0.492279052734375, -0.4742431640625, -0.456207275390625, -0.43817138671875, -0.420135498046875, -0.402099609375, -0.384063720703125, -0.36602783203125, -0.347991943359375, -0.3299560546875, -0.311920166015625, -0.29388427734375, -0.275848388671875, -0.2578125, -0.239776611328125, -0.22174072265625, -0.203704833984375, -0.1856689453125, -0.167633056640625, -0.14959716796875, -0.131561279296875, -0.113525390625, -0.095489501953125, -0.07745361328125, -0.059417724609375, -0.0413818359375, -0.023345947265625, -0.00531005859375, 0.012725830078125, 0.03076171875, 0.048797607421875, 0.06683349609375, 0.084869384765625, 0.1029052734375, 0.120941162109375, 0.13897705078125, 0.157012939453125, 0.175048828125, 0.193084716796875, 0.21112060546875, 0.229156494140625, 0.2471923828125, 0.265228271484375, 0.28326416015625, 0.301300048828125, 0.3193359375, 0.337371826171875, 0.35540771484375, 0.373443603515625, 0.3914794921875, 0.409515380859375, 0.42755126953125, 0.445587158203125, 0.463623046875, 0.481658935546875, 0.49969482421875, 0.517730712890625, 0.5357666015625, 0.553802490234375, 0.57183837890625, 0.589874267578125, 0.60791015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 8.0, 4.0, 10.0, 7.0, 6.0, 19.0, 19.0, 12.0, 33.0, 24.0, 36.0, 34.0, 40.0, 45.0, 41.0, 39.0, 44.0, 43.0, 47.0, 43.0, 52.0, 52.0, 46.0, 45.0, 33.0, 41.0, 28.0, 32.0, 33.0, 17.0, 14.0, 16.0, 10.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42822265625, -0.41469573974609375, -0.4011688232421875, -0.38764190673828125, -0.374114990234375, -0.36058807373046875, -0.3470611572265625, -0.33353424072265625, -0.32000732421875, -0.30648040771484375, -0.2929534912109375, -0.27942657470703125, -0.265899658203125, -0.25237274169921875, -0.2388458251953125, -0.22531890869140625, -0.2117919921875, -0.19826507568359375, -0.1847381591796875, -0.17121124267578125, -0.157684326171875, -0.14415740966796875, -0.1306304931640625, -0.11710357666015625, -0.10357666015625, -0.09004974365234375, -0.0765228271484375, -0.06299591064453125, -0.049468994140625, -0.03594207763671875, -0.0224151611328125, -0.00888824462890625, 0.004638671875, 0.01816558837890625, 0.0316925048828125, 0.04521942138671875, 0.058746337890625, 0.07227325439453125, 0.0858001708984375, 0.09932708740234375, 0.11285400390625, 0.12638092041015625, 0.1399078369140625, 0.15343475341796875, 0.166961669921875, 0.18048858642578125, 0.1940155029296875, 0.20754241943359375, 0.2210693359375, 0.23459625244140625, 0.2481231689453125, 0.26165008544921875, 0.275177001953125, 0.28870391845703125, 0.3022308349609375, 0.31575775146484375, 0.32928466796875, 0.34281158447265625, 0.3563385009765625, 0.36986541748046875, 0.383392333984375, 0.39691925048828125, 0.4104461669921875, 0.42397308349609375, 0.4375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 1.0, 4.0, 8.0, 6.0, 9.0, 21.0, 18.0, 24.0, 48.0, 50.0, 90.0, 140.0, 228.0, 432.0, 885.0, 2199.0, 6141.0, 22992.0, 151949.0, 669502.0, 159574.0, 23658.0, 6353.0, 2196.0, 923.0, 425.0, 228.0, 147.0, 99.0, 59.0, 48.0, 26.0, 23.0, 20.0, 6.0, 8.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.2949104309082031, -0.28610992431640625, -0.2773094177246094, -0.2685089111328125, -0.2597084045410156, -0.25090789794921875, -0.24210739135742188, -0.233306884765625, -0.22450637817382812, -0.21570587158203125, -0.20690536499023438, -0.1981048583984375, -0.18930435180664062, -0.18050384521484375, -0.17170333862304688, -0.16290283203125, -0.15410232543945312, -0.14530181884765625, -0.13650131225585938, -0.1277008056640625, -0.11890029907226562, -0.11009979248046875, -0.10129928588867188, -0.092498779296875, -0.08369827270507812, -0.07489776611328125, -0.06609725952148438, -0.0572967529296875, -0.048496246337890625, -0.03969573974609375, -0.030895233154296875, -0.0220947265625, -0.013294219970703125, -0.00449371337890625, 0.004306793212890625, 0.0131072998046875, 0.021907806396484375, 0.03070831298828125, 0.039508819580078125, 0.048309326171875, 0.057109832763671875, 0.06591033935546875, 0.07471084594726562, 0.0835113525390625, 0.09231185913085938, 0.10111236572265625, 0.10991287231445312, 0.11871337890625, 0.12751388549804688, 0.13631439208984375, 0.14511489868164062, 0.1539154052734375, 0.16271591186523438, 0.17151641845703125, 0.18031692504882812, 0.189117431640625, 0.19791793823242188, 0.20671844482421875, 0.21551895141601562, 0.2243194580078125, 0.23311996459960938, 0.24192047119140625, 0.2507209777832031, 0.259521484375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 8.0, 10.0, 8.0, 14.0, 25.0, 24.0, 32.0, 26.0, 48.0, 41.0, 75.0, 72.0, 82.0, 79.0, 73.0, 51.0, 52.0, 40.0, 28.0, 34.0, 17.0, 21.0, 17.0, 7.0, 13.0, 17.0, 6.0, 11.0, 6.0, 3.0, 4.0, 3.0, 2.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.799531936645508e-05, -5.5985525250434875e-05, -5.397573113441467e-05, -5.196593701839447e-05, -4.995614290237427e-05, -4.7946348786354065e-05, -4.593655467033386e-05, -4.392676055431366e-05, -4.191696643829346e-05, -3.9907172322273254e-05, -3.789737820625305e-05, -3.588758409023285e-05, -3.3877789974212646e-05, -3.1867995858192444e-05, -2.985820174217224e-05, -2.784840762615204e-05, -2.5838613510131836e-05, -2.3828819394111633e-05, -2.181902527809143e-05, -1.9809231162071228e-05, -1.7799437046051025e-05, -1.5789642930030823e-05, -1.377984881401062e-05, -1.1770054697990417e-05, -9.760260581970215e-06, -7.750466465950012e-06, -5.7406723499298096e-06, -3.730878233909607e-06, -1.7210841178894043e-06, 2.8870999813079834e-07, 2.298504114151001e-06, 4.308298230171204e-06, 6.318092346191406e-06, 8.327886462211609e-06, 1.0337680578231812e-05, 1.2347474694252014e-05, 1.4357268810272217e-05, 1.636706292629242e-05, 1.8376857042312622e-05, 2.0386651158332825e-05, 2.2396445274353027e-05, 2.440623939037323e-05, 2.6416033506393433e-05, 2.8425827622413635e-05, 3.0435621738433838e-05, 3.244541585445404e-05, 3.445520997047424e-05, 3.6465004086494446e-05, 3.847479820251465e-05, 4.048459231853485e-05, 4.2494386434555054e-05, 4.4504180550575256e-05, 4.651397466659546e-05, 4.852376878261566e-05, 5.0533562898635864e-05, 5.254335701465607e-05, 5.455315113067627e-05, 5.656294524669647e-05, 5.8572739362716675e-05, 6.058253347873688e-05, 6.259232759475708e-05, 6.460212171077728e-05, 6.661191582679749e-05, 6.862170994281769e-05, 7.063150405883789e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 12.0, 15.0, 25.0, 41.0, 56.0, 111.0, 201.0, 403.0, 974.0, 2866.0, 14976.0, 218912.0, 750399.0, 50452.0, 6220.0, 1549.0, 640.0, 305.0, 154.0, 100.0, 57.0, 18.0, 23.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35595703125, -0.34336090087890625, -0.3307647705078125, -0.31816864013671875, -0.305572509765625, -0.29297637939453125, -0.2803802490234375, -0.26778411865234375, -0.25518798828125, -0.24259185791015625, -0.2299957275390625, -0.21739959716796875, -0.204803466796875, -0.19220733642578125, -0.1796112060546875, -0.16701507568359375, -0.1544189453125, -0.14182281494140625, -0.1292266845703125, -0.11663055419921875, -0.104034423828125, -0.09143829345703125, -0.0788421630859375, -0.06624603271484375, -0.05364990234375, -0.04105377197265625, -0.0284576416015625, -0.01586151123046875, -0.003265380859375, 0.00933074951171875, 0.0219268798828125, 0.03452301025390625, 0.047119140625, 0.05971527099609375, 0.0723114013671875, 0.08490753173828125, 0.097503662109375, 0.11009979248046875, 0.1226959228515625, 0.13529205322265625, 0.14788818359375, 0.16048431396484375, 0.1730804443359375, 0.18567657470703125, 0.198272705078125, 0.21086883544921875, 0.2234649658203125, 0.23606109619140625, 0.2486572265625, 0.26125335693359375, 0.2738494873046875, 0.28644561767578125, 0.299041748046875, 0.31163787841796875, 0.3242340087890625, 0.33683013916015625, 0.34942626953125, 0.36202239990234375, 0.3746185302734375, 0.38721466064453125, 0.399810791015625, 0.41240692138671875, 0.4250030517578125, 0.43759918212890625, 0.4501953125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 12.0, 20.0, 21.0, 37.0, 41.0, 60.0, 69.0, 106.0, 95.0, 107.0, 105.0, 72.0, 74.0, 58.0, 28.0, 34.0, 13.0, 20.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12646484375, -0.11955642700195312, -0.11264801025390625, -0.10573959350585938, -0.0988311767578125, -0.09192276000976562, -0.08501434326171875, -0.07810592651367188, -0.071197509765625, -0.06428909301757812, -0.05738067626953125, -0.050472259521484375, -0.0435638427734375, -0.036655426025390625, -0.02974700927734375, -0.022838592529296875, -0.01593017578125, -0.009021759033203125, -0.00211334228515625, 0.004795074462890625, 0.0117034912109375, 0.018611907958984375, 0.02552032470703125, 0.032428741455078125, 0.039337158203125, 0.046245574951171875, 0.05315399169921875, 0.060062408447265625, 0.0669708251953125, 0.07387924194335938, 0.08078765869140625, 0.08769607543945312, 0.0946044921875, 0.10151290893554688, 0.10842132568359375, 0.11532974243164062, 0.1222381591796875, 0.12914657592773438, 0.13605499267578125, 0.14296340942382812, 0.149871826171875, 0.15678024291992188, 0.16368865966796875, 0.17059707641601562, 0.1775054931640625, 0.18441390991210938, 0.19132232666015625, 0.19823074340820312, 0.20513916015625, 0.21204757690429688, 0.21895599365234375, 0.22586441040039062, 0.2327728271484375, 0.23968124389648438, 0.24658966064453125, 0.2534980773925781, 0.260406494140625, 0.2673149108886719, 0.27422332763671875, 0.2811317443847656, 0.2880401611328125, 0.2949485778808594, 0.30185699462890625, 0.3087654113769531, 0.315673828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 17.0, 19.0, 56.0, 111.0, 155.0, 233.0, 165.0, 111.0, 63.0, 32.0, 14.0, 11.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.191426753997803, -4.038639545440674, -3.885852575302124, -3.733065366744995, -3.5802783966064453, -3.4274911880493164, -3.2747039794921875, -3.1219170093536377, -2.969130039215088, -2.816342830657959, -2.663555860519409, -2.5107686519622803, -2.3579816818237305, -2.2051944732666016, -2.0524072647094727, -1.8996202945709229, -1.746833086013794, -1.5940459966659546, -1.4412589073181152, -1.2884716987609863, -1.1356847286224365, -0.9828975796699524, -0.8301104307174683, -0.6773233413696289, -0.5245362520217896, -0.3717491626739502, -0.21896204352378845, -0.06617492437362671, 0.08661216497421265, 0.239399254322052, 0.39218640327453613, 0.5449734926223755, 0.6977605819702148, 0.8505476713180542, 1.0033347606658936, 1.1561219692230225, 1.3089089393615723, 1.4616961479187012, 1.6144832372665405, 1.7672703266143799, 1.9200574159622192, 2.0728445053100586, 2.2256317138671875, 2.3784186840057373, 2.531205892562866, 2.683992862701416, 2.836780071258545, 2.989567279815674, 3.1423542499542236, 3.2951414585113525, 3.4479284286499023, 3.6007156372070312, 3.753502607345581, 3.90628981590271, 4.05907678604126, 4.211863994598389, 4.364651203155518, 4.5174384117126465, 4.670225620269775, 4.823012351989746, 4.975799560546875, 5.128586769104004, 5.281373977661133, 5.434161186218262, 5.586947917938232]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 8.0, 8.0, 8.0, 14.0, 13.0, 16.0, 21.0, 23.0, 28.0, 38.0, 34.0, 42.0, 47.0, 46.0, 45.0, 28.0, 49.0, 46.0, 49.0, 48.0, 48.0, 47.0, 43.0, 36.0, 22.0, 23.0, 24.0, 24.0, 26.0, 13.0, 15.0, 12.0, 11.0, 11.0, 10.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1554758548736572, -2.0817110538482666, -2.007946014404297, -1.9341812133789062, -1.8604164123535156, -1.7866514921188354, -1.7128865718841553, -1.6391217708587646, -1.5653568506240845, -1.4915919303894043, -1.4178271293640137, -1.3440622091293335, -1.2702972888946533, -1.1965324878692627, -1.1227675676345825, -1.0490026473999023, -0.9752378463745117, -0.9014729857444763, -0.8277081251144409, -0.7539432048797607, -0.6801783442497253, -0.6064134836196899, -0.5326485633850098, -0.45888370275497437, -0.38511884212493896, -0.31135398149490356, -0.23758909106254578, -0.16382421553134918, -0.09005934000015259, -0.016294479370117188, 0.0574704110622406, 0.1312353014945984, 0.2049999237060547, 0.2787647843360901, 0.3525296747684479, 0.42629456520080566, 0.5000594258308411, 0.5738242864608765, 0.6475892066955566, 0.721354067325592, 0.7951189279556274, 0.8688837885856628, 0.9426486492156982, 1.0164135694503784, 1.0901784896850586, 1.1639432907104492, 1.2377082109451294, 1.3114731311798096, 1.3852379322052002, 1.4590028524398804, 1.532767653465271, 1.6065325736999512, 1.6802973747253418, 1.754062294960022, 1.8278272151947021, 1.9015920162200928, 1.975356936454773, 2.049121856689453, 2.1228866577148438, 2.1966514587402344, 2.270416498184204, 2.3441812992095947, 2.4179461002349854, 2.491711139678955, 2.5654759407043457]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 9.0, 15.0, 34.0, 42.0, 62.0, 84.0, 142.0, 212.0, 337.0, 496.0, 1025.0, 2290.0, 6557.0, 28797.0, 477184.0, 3613937.0, 47457.0, 9776.0, 3171.0, 1263.0, 585.0, 296.0, 172.0, 122.0, 77.0, 44.0, 32.0, 20.0, 7.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.0642852783203125, -1.028961181640625, -0.9936370849609375, -0.95831298828125, -0.9229888916015625, -0.887664794921875, -0.8523406982421875, -0.8170166015625, -0.7816925048828125, -0.746368408203125, -0.7110443115234375, -0.67572021484375, -0.6403961181640625, -0.605072021484375, -0.5697479248046875, -0.534423828125, -0.4990997314453125, -0.463775634765625, -0.4284515380859375, -0.39312744140625, -0.3578033447265625, -0.322479248046875, -0.2871551513671875, -0.2518310546875, -0.2165069580078125, -0.181182861328125, -0.1458587646484375, -0.11053466796875, -0.0752105712890625, -0.039886474609375, -0.0045623779296875, 0.03076171875, 0.0660858154296875, 0.101409912109375, 0.1367340087890625, 0.17205810546875, 0.2073822021484375, 0.242706298828125, 0.2780303955078125, 0.3133544921875, 0.3486785888671875, 0.384002685546875, 0.4193267822265625, 0.45465087890625, 0.4899749755859375, 0.525299072265625, 0.5606231689453125, 0.595947265625, 0.6312713623046875, 0.666595458984375, 0.7019195556640625, 0.73724365234375, 0.7725677490234375, 0.807891845703125, 0.8432159423828125, 0.8785400390625, 0.9138641357421875, 0.949188232421875, 0.9845123291015625, 1.01983642578125, 1.0551605224609375, 1.090484619140625, 1.1258087158203125, 1.1611328125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 9.0, 22.0, 18.0, 33.0, 44.0, 69.0, 82.0, 92.0, 100.0, 101.0, 84.0, 95.0, 74.0, 62.0, 33.0, 25.0, 17.0, 13.0, 7.0, 1.0, 2.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2469482421875, -0.24013900756835938, -0.23332977294921875, -0.22652053833007812, -0.2197113037109375, -0.21290206909179688, -0.20609283447265625, -0.19928359985351562, -0.192474365234375, -0.18566513061523438, -0.17885589599609375, -0.17204666137695312, -0.1652374267578125, -0.15842819213867188, -0.15161895751953125, -0.14480972290039062, -0.13800048828125, -0.13119125366210938, -0.12438201904296875, -0.11757278442382812, -0.1107635498046875, -0.10395431518554688, -0.09714508056640625, -0.09033584594726562, -0.083526611328125, -0.07671737670898438, -0.06990814208984375, -0.06309890747070312, -0.0562896728515625, -0.049480438232421875, -0.04267120361328125, -0.035861968994140625, -0.029052734375, -0.022243499755859375, -0.01543426513671875, -0.008625030517578125, -0.0018157958984375, 0.004993438720703125, 0.01180267333984375, 0.018611907958984375, 0.025421142578125, 0.032230377197265625, 0.03903961181640625, 0.045848846435546875, 0.0526580810546875, 0.059467315673828125, 0.06627655029296875, 0.07308578491210938, 0.07989501953125, 0.08670425415039062, 0.09351348876953125, 0.10032272338867188, 0.1071319580078125, 0.11394119262695312, 0.12075042724609375, 0.12755966186523438, 0.134368896484375, 0.14117813110351562, 0.14798736572265625, 0.15479660034179688, 0.1616058349609375, 0.16841506958007812, 0.17522430419921875, 0.18203353881835938, 0.1888427734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 2.0, 10.0, 7.0, 12.0, 10.0, 23.0, 25.0, 38.0, 40.0, 74.0, 117.0, 175.0, 336.0, 643.0, 1345.0, 3054.0, 8001.0, 24568.0, 109648.0, 3042572.0, 898884.0, 74372.0, 18743.0, 6517.0, 2560.0, 1134.0, 605.0, 299.0, 163.0, 94.0, 60.0, 38.0, 25.0, 21.0, 14.0, 14.0, 5.0, 10.0, 5.0, 4.0, 3.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.52349853515625, -0.5059814453125, -0.48846435546875, -0.470947265625, -0.45343017578125, -0.4359130859375, -0.41839599609375, -0.40087890625, -0.38336181640625, -0.3658447265625, -0.34832763671875, -0.330810546875, -0.31329345703125, -0.2957763671875, -0.27825927734375, -0.2607421875, -0.24322509765625, -0.2257080078125, -0.20819091796875, -0.190673828125, -0.17315673828125, -0.1556396484375, -0.13812255859375, -0.12060546875, -0.10308837890625, -0.0855712890625, -0.06805419921875, -0.050537109375, -0.03302001953125, -0.0155029296875, 0.00201416015625, 0.01953125, 0.03704833984375, 0.0545654296875, 0.07208251953125, 0.089599609375, 0.10711669921875, 0.1246337890625, 0.14215087890625, 0.15966796875, 0.17718505859375, 0.1947021484375, 0.21221923828125, 0.229736328125, 0.24725341796875, 0.2647705078125, 0.28228759765625, 0.2998046875, 0.31732177734375, 0.3348388671875, 0.35235595703125, 0.369873046875, 0.38739013671875, 0.4049072265625, 0.42242431640625, 0.43994140625, 0.45745849609375, 0.4749755859375, 0.49249267578125, 0.510009765625, 0.52752685546875, 0.5450439453125, 0.56256103515625, 0.580078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 7.0, 4.0, 7.0, 9.0, 10.0, 20.0, 30.0, 38.0, 65.0, 89.0, 167.0, 357.0, 1143.0, 1384.0, 303.0, 156.0, 85.0, 45.0, 38.0, 24.0, 30.0, 21.0, 10.0, 14.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939453125, -0.28578758239746094, -0.2776298522949219, -0.2694721221923828, -0.26131439208984375, -0.2531566619873047, -0.24499893188476562, -0.23684120178222656, -0.2286834716796875, -0.22052574157714844, -0.21236801147460938, -0.2042102813720703, -0.19605255126953125, -0.1878948211669922, -0.17973709106445312, -0.17157936096191406, -0.163421630859375, -0.15526390075683594, -0.14710617065429688, -0.1389484405517578, -0.13079071044921875, -0.12263298034667969, -0.11447525024414062, -0.10631752014160156, -0.0981597900390625, -0.09000205993652344, -0.08184432983398438, -0.07368659973144531, -0.06552886962890625, -0.05737113952636719, -0.049213409423828125, -0.04105567932128906, -0.03289794921875, -0.024740219116210938, -0.016582489013671875, -0.008424758911132812, -0.00026702880859375, 0.007890701293945312, 0.016048431396484375, 0.024206161499023438, 0.0323638916015625, 0.04052162170410156, 0.048679351806640625, 0.05683708190917969, 0.06499481201171875, 0.07315254211425781, 0.08131027221679688, 0.08946800231933594, 0.097625732421875, 0.10578346252441406, 0.11394119262695312, 0.12209892272949219, 0.13025665283203125, 0.1384143829345703, 0.14657211303710938, 0.15472984313964844, 0.1628875732421875, 0.17104530334472656, 0.17920303344726562, 0.1873607635498047, 0.19551849365234375, 0.2036762237548828, 0.21183395385742188, 0.21999168395996094, 0.2281494140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 10.0, 5.0, 30.0, 93.0, 167.0, 276.0, 221.0, 115.0, 38.0, 23.0, 11.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66354501247406, -1.5745261907577515, -1.4855072498321533, -1.3964884281158447, -1.3074696063995361, -1.2184507846832275, -1.1294318437576294, -1.0404130220413208, -0.9513941407203674, -0.8623752593994141, -0.7733564376831055, -0.6843375563621521, -0.5953186750411987, -0.5062998533248901, -0.41728097200393677, -0.3282621502876282, -0.2392432689666748, -0.15022441744804382, -0.06120555102825165, 0.027813315391540527, 0.11683216691017151, 0.2058510184288025, 0.29486989974975586, 0.38388872146606445, 0.4729076027870178, 0.5619264841079712, 0.6509453058242798, 0.7399641871452332, 0.8289830684661865, 0.9180018901824951, 1.0070207118988037, 1.0960395336151123, 1.185058355331421, 1.2740771770477295, 1.3630961179733276, 1.4521149396896362, 1.5411337614059448, 1.630152702331543, 1.7191715240478516, 1.8081903457641602, 1.8972091674804688, 1.9862279891967773, 2.075246810913086, 2.1642656326293945, 2.2532846927642822, 2.342303514480591, 2.4313223361968994, 2.520341157913208, 2.6093602180480957, 2.6983790397644043, 2.787397861480713, 2.8764166831970215, 2.965435743331909, 3.0544545650482178, 3.1434733867645264, 3.232492208480835, 3.3215110301971436, 3.410529851913452, 3.4995486736297607, 3.5885677337646484, 3.677586555480957, 3.7666053771972656, 3.855624198913574, 3.944643020629883, 4.033661842346191]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 1.0, 5.0, 11.0, 10.0, 6.0, 13.0, 12.0, 24.0, 27.0, 27.0, 50.0, 45.0, 48.0, 41.0, 59.0, 59.0, 55.0, 52.0, 57.0, 59.0, 42.0, 48.0, 44.0, 31.0, 37.0, 25.0, 25.0, 18.0, 12.0, 16.0, 14.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8086709380149841, -0.7789427042007446, -0.7492144703865051, -0.7194862365722656, -0.6897580027580261, -0.6600297689437866, -0.6303015947341919, -0.6005733013153076, -0.5708451271057129, -0.5411168932914734, -0.5113886594772339, -0.4816604256629944, -0.4519321918487549, -0.4222039580345154, -0.39247575402259827, -0.36274752020835876, -0.3330192565917969, -0.3032910227775574, -0.27356278896331787, -0.24383457005023956, -0.21410633623600006, -0.18437810242176056, -0.15464988350868225, -0.12492164969444275, -0.09519341588020325, -0.06546518206596375, -0.03573695570230484, -0.006008729338645935, 0.023719504475593567, 0.05344773828983307, 0.08317595720291138, 0.11290419101715088, 0.1426323652267456, 0.1723605990409851, 0.2020888328552246, 0.23181705176830292, 0.2615453004837036, 0.2912735342979431, 0.32100173830986023, 0.35072997212409973, 0.38045820593833923, 0.41018643975257874, 0.43991467356681824, 0.46964287757873535, 0.49937111139297485, 0.5290993452072144, 0.5588275790214539, 0.5885558128356934, 0.6182840466499329, 0.6480122804641724, 0.6777405142784119, 0.7074687480926514, 0.7371969819068909, 0.7669252157211304, 0.7966533899307251, 0.8263816833496094, 0.8561098575592041, 0.8858380913734436, 0.9155663251876831, 0.9452945590019226, 0.9750227928161621, 1.0047509670257568, 1.0344792604446411, 1.0642074346542358, 1.0939357280731201]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 14.0, 9.0, 13.0, 26.0, 33.0, 50.0, 68.0, 114.0, 165.0, 229.0, 417.0, 748.0, 1463.0, 3252.0, 8688.0, 32391.0, 188988.0, 638882.0, 134575.0, 25350.0, 7324.0, 2773.0, 1306.0, 629.0, 386.0, 221.0, 162.0, 91.0, 54.0, 36.0, 24.0, 19.0, 15.0, 14.0, 11.0, 5.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.82470703125, -0.7984542846679688, -0.7722015380859375, -0.7459487915039062, -0.719696044921875, -0.6934432983398438, -0.6671905517578125, -0.6409378051757812, -0.61468505859375, -0.5884323120117188, -0.5621795654296875, -0.5359268188476562, -0.509674072265625, -0.48342132568359375, -0.4571685791015625, -0.43091583251953125, -0.4046630859375, -0.37841033935546875, -0.3521575927734375, -0.32590484619140625, -0.299652099609375, -0.27339935302734375, -0.2471466064453125, -0.22089385986328125, -0.19464111328125, -0.16838836669921875, -0.1421356201171875, -0.11588287353515625, -0.089630126953125, -0.06337738037109375, -0.0371246337890625, -0.01087188720703125, 0.015380859375, 0.04163360595703125, 0.0678863525390625, 0.09413909912109375, 0.120391845703125, 0.14664459228515625, 0.1728973388671875, 0.19915008544921875, 0.22540283203125, 0.25165557861328125, 0.2779083251953125, 0.30416107177734375, 0.330413818359375, 0.35666656494140625, 0.3829193115234375, 0.40917205810546875, 0.4354248046875, 0.46167755126953125, 0.4879302978515625, 0.5141830444335938, 0.540435791015625, 0.5666885375976562, 0.5929412841796875, 0.6191940307617188, 0.64544677734375, 0.6716995239257812, 0.6979522705078125, 0.7242050170898438, 0.750457763671875, 0.7767105102539062, 0.8029632568359375, 0.8292160034179688, 0.85546875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 14.0, 19.0, 31.0, 32.0, 59.0, 94.0, 90.0, 127.0, 121.0, 97.0, 95.0, 68.0, 47.0, 38.0, 27.0, 10.0, 5.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271240234375, -0.2635459899902344, -0.25585174560546875, -0.24815750122070312, -0.2404632568359375, -0.23276901245117188, -0.22507476806640625, -0.21738052368164062, -0.209686279296875, -0.20199203491210938, -0.19429779052734375, -0.18660354614257812, -0.1789093017578125, -0.17121505737304688, -0.16352081298828125, -0.15582656860351562, -0.14813232421875, -0.14043807983398438, -0.13274383544921875, -0.12504959106445312, -0.1173553466796875, -0.10966110229492188, -0.10196685791015625, -0.09427261352539062, -0.086578369140625, -0.07888412475585938, -0.07118988037109375, -0.06349563598632812, -0.0558013916015625, -0.048107147216796875, -0.04041290283203125, -0.032718658447265625, -0.0250244140625, -0.017330169677734375, -0.00963592529296875, -0.001941680908203125, 0.0057525634765625, 0.013446807861328125, 0.02114105224609375, 0.028835296630859375, 0.036529541015625, 0.044223785400390625, 0.05191802978515625, 0.059612274169921875, 0.0673065185546875, 0.07500076293945312, 0.08269500732421875, 0.09038925170898438, 0.09808349609375, 0.10577774047851562, 0.11347198486328125, 0.12116622924804688, 0.1288604736328125, 0.13655471801757812, 0.14424896240234375, 0.15194320678710938, 0.159637451171875, 0.16733169555664062, 0.17502593994140625, 0.18272018432617188, 0.1904144287109375, 0.19810867309570312, 0.20580291748046875, 0.21349716186523438, 0.22119140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 10.0, 19.0, 11.0, 20.0, 29.0, 24.0, 44.0, 51.0, 88.0, 156.0, 211.0, 372.0, 695.0, 1586.0, 4449.0, 15950.0, 82879.0, 484444.0, 377301.0, 60997.0, 12683.0, 3562.0, 1379.0, 616.0, 321.0, 203.0, 118.0, 100.0, 55.0, 40.0, 42.0, 22.0, 13.0, 9.0, 15.0, 7.0, 6.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.61572265625, -0.5964279174804688, -0.5771331787109375, -0.5578384399414062, -0.538543701171875, -0.5192489624023438, -0.4999542236328125, -0.48065948486328125, -0.46136474609375, -0.44207000732421875, -0.4227752685546875, -0.40348052978515625, -0.384185791015625, -0.36489105224609375, -0.3455963134765625, -0.32630157470703125, -0.3070068359375, -0.28771209716796875, -0.2684173583984375, -0.24912261962890625, -0.229827880859375, -0.21053314208984375, -0.1912384033203125, -0.17194366455078125, -0.15264892578125, -0.13335418701171875, -0.1140594482421875, -0.09476470947265625, -0.075469970703125, -0.05617523193359375, -0.0368804931640625, -0.01758575439453125, 0.001708984375, 0.02100372314453125, 0.0402984619140625, 0.05959320068359375, 0.078887939453125, 0.09818267822265625, 0.1174774169921875, 0.13677215576171875, 0.15606689453125, 0.17536163330078125, 0.1946563720703125, 0.21395111083984375, 0.233245849609375, 0.25254058837890625, 0.2718353271484375, 0.29113006591796875, 0.3104248046875, 0.32971954345703125, 0.3490142822265625, 0.36830902099609375, 0.387603759765625, 0.40689849853515625, 0.4261932373046875, 0.44548797607421875, 0.46478271484375, 0.48407745361328125, 0.5033721923828125, 0.5226669311523438, 0.541961669921875, 0.5612564086914062, 0.5805511474609375, 0.5998458862304688, 0.619140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 9.0, 8.0, 17.0, 9.0, 19.0, 17.0, 16.0, 29.0, 19.0, 15.0, 27.0, 37.0, 34.0, 43.0, 41.0, 35.0, 50.0, 38.0, 54.0, 45.0, 46.0, 54.0, 40.0, 32.0, 37.0, 33.0, 33.0, 29.0, 24.0, 22.0, 18.0, 20.0, 10.0, 12.0, 5.0, 10.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37890625, -0.3653297424316406, -0.35175323486328125, -0.3381767272949219, -0.3246002197265625, -0.3110237121582031, -0.29744720458984375, -0.2838706970214844, -0.270294189453125, -0.2567176818847656, -0.24314117431640625, -0.22956466674804688, -0.2159881591796875, -0.20241165161132812, -0.18883514404296875, -0.17525863647460938, -0.16168212890625, -0.14810562133789062, -0.13452911376953125, -0.12095260620117188, -0.1073760986328125, -0.09379959106445312, -0.08022308349609375, -0.06664657592773438, -0.053070068359375, -0.039493560791015625, -0.02591705322265625, -0.012340545654296875, 0.0012359619140625, 0.014812469482421875, 0.02838897705078125, 0.041965484619140625, 0.0555419921875, 0.06911849975585938, 0.08269500732421875, 0.09627151489257812, 0.1098480224609375, 0.12342453002929688, 0.13700103759765625, 0.15057754516601562, 0.164154052734375, 0.17773056030273438, 0.19130706787109375, 0.20488357543945312, 0.2184600830078125, 0.23203659057617188, 0.24561309814453125, 0.2591896057128906, 0.27276611328125, 0.2863426208496094, 0.29991912841796875, 0.3134956359863281, 0.3270721435546875, 0.3406486511230469, 0.35422515869140625, 0.3678016662597656, 0.381378173828125, 0.3949546813964844, 0.40853118896484375, 0.4221076965332031, 0.4356842041015625, 0.4492607116699219, 0.46283721923828125, 0.4764137268066406, 0.489990234375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 4.0, 6.0, 11.0, 20.0, 32.0, 97.0, 159.0, 651.0, 5306.0, 1008243.0, 32193.0, 1308.0, 323.0, 97.0, 47.0, 26.0, 11.0, 7.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.078125, -1.0345001220703125, -0.990875244140625, -0.9472503662109375, -0.90362548828125, -0.8600006103515625, -0.816375732421875, -0.7727508544921875, -0.7291259765625, -0.6855010986328125, -0.641876220703125, -0.5982513427734375, -0.55462646484375, -0.5110015869140625, -0.467376708984375, -0.4237518310546875, -0.380126953125, -0.3365020751953125, -0.292877197265625, -0.2492523193359375, -0.20562744140625, -0.1620025634765625, -0.118377685546875, -0.0747528076171875, -0.0311279296875, 0.0124969482421875, 0.056121826171875, 0.0997467041015625, 0.14337158203125, 0.1869964599609375, 0.230621337890625, 0.2742462158203125, 0.31787109375, 0.3614959716796875, 0.405120849609375, 0.4487457275390625, 0.49237060546875, 0.5359954833984375, 0.579620361328125, 0.6232452392578125, 0.6668701171875, 0.7104949951171875, 0.754119873046875, 0.7977447509765625, 0.84136962890625, 0.8849945068359375, 0.928619384765625, 0.9722442626953125, 1.015869140625, 1.0594940185546875, 1.103118896484375, 1.1467437744140625, 1.19036865234375, 1.2339935302734375, 1.277618408203125, 1.3212432861328125, 1.3648681640625, 1.4084930419921875, 1.452117919921875, 1.4957427978515625, 1.53936767578125, 1.5829925537109375, 1.626617431640625, 1.6702423095703125, 1.7138671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 9.0, 17.0, 30.0, 62.0, 88.0, 213.0, 265.0, 163.0, 74.0, 27.0, 14.0, 18.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019884109497070312, -0.0001941230148077011, -0.0001894049346446991, -0.00018468685448169708, -0.00017996877431869507, -0.00017525069415569305, -0.00017053261399269104, -0.00016581453382968903, -0.000161096453666687, -0.000156378373503685, -0.00015166029334068298, -0.00014694221317768097, -0.00014222413301467896, -0.00013750605285167694, -0.00013278797268867493, -0.0001280698925256729, -0.0001233518123626709, -0.00011863373219966888, -0.00011391565203666687, -0.00010919757187366486, -0.00010447949171066284, -9.976141154766083e-05, -9.504333138465881e-05, -9.03252512216568e-05, -8.560717105865479e-05, -8.088909089565277e-05, -7.617101073265076e-05, -7.145293056964874e-05, -6.673485040664673e-05, -6.201677024364471e-05, -5.72986900806427e-05, -5.2580609917640686e-05, -4.786252975463867e-05, -4.314444959163666e-05, -3.8426369428634644e-05, -3.370828926563263e-05, -2.8990209102630615e-05, -2.42721289396286e-05, -1.9554048776626587e-05, -1.4835968613624573e-05, -1.0117888450622559e-05, -5.3998082876205444e-06, -6.817281246185303e-07, 4.036352038383484e-06, 8.754432201385498e-06, 1.3472512364387512e-05, 1.8190592527389526e-05, 2.290867269039154e-05, 2.7626752853393555e-05, 3.234483301639557e-05, 3.706291317939758e-05, 4.17809933423996e-05, 4.649907350540161e-05, 5.1217153668403625e-05, 5.593523383140564e-05, 6.0653313994407654e-05, 6.537139415740967e-05, 7.008947432041168e-05, 7.48075544834137e-05, 7.952563464641571e-05, 8.424371480941772e-05, 8.896179497241974e-05, 9.367987513542175e-05, 9.839795529842377e-05, 0.00010311603546142578]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 13.0, 24.0, 27.0, 80.0, 173.0, 411.0, 2444.0, 841682.0, 201377.0, 1663.0, 329.0, 162.0, 79.0, 36.0, 15.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7578125, -1.7102203369140625, -1.662628173828125, -1.6150360107421875, -1.56744384765625, -1.5198516845703125, -1.472259521484375, -1.4246673583984375, -1.3770751953125, -1.3294830322265625, -1.281890869140625, -1.2342987060546875, -1.18670654296875, -1.1391143798828125, -1.091522216796875, -1.0439300537109375, -0.996337890625, -0.9487457275390625, -0.901153564453125, -0.8535614013671875, -0.80596923828125, -0.7583770751953125, -0.710784912109375, -0.6631927490234375, -0.6156005859375, -0.5680084228515625, -0.520416259765625, -0.4728240966796875, -0.42523193359375, -0.3776397705078125, -0.330047607421875, -0.2824554443359375, -0.23486328125, -0.1872711181640625, -0.139678955078125, -0.0920867919921875, -0.04449462890625, 0.0030975341796875, 0.050689697265625, 0.0982818603515625, 0.1458740234375, 0.1934661865234375, 0.241058349609375, 0.2886505126953125, 0.33624267578125, 0.3838348388671875, 0.431427001953125, 0.4790191650390625, 0.526611328125, 0.5742034912109375, 0.621795654296875, 0.6693878173828125, 0.71697998046875, 0.7645721435546875, 0.812164306640625, 0.8597564697265625, 0.9073486328125, 0.9549407958984375, 1.002532958984375, 1.0501251220703125, 1.09771728515625, 1.1453094482421875, 1.192901611328125, 1.2404937744140625, 1.2880859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 13.0, 17.0, 63.0, 171.0, 440.0, 202.0, 66.0, 18.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8994140625, -0.874786376953125, -0.85015869140625, -0.825531005859375, -0.8009033203125, -0.776275634765625, -0.75164794921875, -0.727020263671875, -0.702392578125, -0.677764892578125, -0.65313720703125, -0.628509521484375, -0.6038818359375, -0.579254150390625, -0.55462646484375, -0.529998779296875, -0.50537109375, -0.480743408203125, -0.45611572265625, -0.431488037109375, -0.4068603515625, -0.382232666015625, -0.35760498046875, -0.332977294921875, -0.308349609375, -0.283721923828125, -0.25909423828125, -0.234466552734375, -0.2098388671875, -0.185211181640625, -0.16058349609375, -0.135955810546875, -0.111328125, -0.086700439453125, -0.06207275390625, -0.037445068359375, -0.0128173828125, 0.011810302734375, 0.03643798828125, 0.061065673828125, 0.085693359375, 0.110321044921875, 0.13494873046875, 0.159576416015625, 0.1842041015625, 0.208831787109375, 0.23345947265625, 0.258087158203125, 0.28271484375, 0.307342529296875, 0.33197021484375, 0.356597900390625, 0.3812255859375, 0.405853271484375, 0.43048095703125, 0.455108642578125, 0.479736328125, 0.504364013671875, 0.52899169921875, 0.553619384765625, 0.5782470703125, 0.602874755859375, 0.62750244140625, 0.652130126953125, 0.6767578125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 11.0, 22.0, 102.0, 303.0, 319.0, 182.0, 46.0, 13.0, 4.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.225072860717773, -9.93333625793457, -9.641600608825684, -9.34986400604248, -9.058128356933594, -8.76639175415039, -8.474655151367188, -8.1829195022583, -7.891182899475098, -7.599446773529053, -7.307710647583008, -7.015974044799805, -6.72423791885376, -6.432501792907715, -6.14076566696167, -5.849029541015625, -5.55729341506958, -5.265557289123535, -4.97382116317749, -4.682085037231445, -4.390348434448242, -4.098612308502197, -3.8068761825561523, -3.5151398181915283, -3.2234036922454834, -2.9316675662994385, -2.6399312019348145, -2.3481950759887695, -2.0564589500427246, -1.7647225856781006, -1.4729864597320557, -1.1812500953674316, -0.8895139694213867, -0.5977777242660522, -0.30604153871536255, -0.014305353164672852, 0.2774308919906616, 0.5691671371459961, 0.860903263092041, 1.152639627456665, 1.44437575340271, 1.7361119985580444, 2.027848243713379, 2.319584369659424, 2.6113204956054688, 2.9030568599700928, 3.1947929859161377, 3.4865293502807617, 3.7782654762268066, 4.070001602172852, 4.3617377281188965, 4.653473854064941, 4.9452104568481445, 5.2369465827941895, 5.528682708740234, 5.8204193115234375, 6.112154960632324, 6.403891086578369, 6.695627212524414, 6.987363815307617, 7.279099941253662, 7.570836067199707, 7.862572193145752, 8.154308319091797, 8.446044921875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 3.0, 6.0, 8.0, 16.0, 16.0, 12.0, 12.0, 25.0, 19.0, 16.0, 18.0, 27.0, 32.0, 37.0, 45.0, 35.0, 49.0, 34.0, 40.0, 49.0, 42.0, 41.0, 33.0, 46.0, 44.0, 37.0, 29.0, 30.0, 35.0, 28.0, 22.0, 22.0, 14.0, 16.0, 11.0, 11.0, 6.0, 10.0, 7.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.5423927307128906, -2.471569538116455, -2.4007463455200195, -2.329922914505005, -2.2590997219085693, -2.188276529312134, -2.1174533367156982, -2.0466301441192627, -1.9758068323135376, -1.904983639717102, -1.834160327911377, -1.7633371353149414, -1.6925139427185059, -1.6216906309127808, -1.5508674383163452, -1.4800441265106201, -1.4092209339141846, -1.338397741317749, -1.267574429512024, -1.1967512369155884, -1.1259279251098633, -1.0551047325134277, -0.9842815399169922, -0.9134582877159119, -0.8426350355148315, -0.7718117833137512, -0.7009885311126709, -0.6301653385162354, -0.559342086315155, -0.4885188341140747, -0.4176956117153168, -0.34687238931655884, -0.2760488986968994, -0.20522566139698029, -0.13440242409706116, -0.06357918679714203, 0.0072440505027771, 0.07806730270385742, 0.14889052510261536, 0.2197137475013733, 0.2905369997024536, 0.36136025190353394, 0.43218347430229187, 0.5030066967010498, 0.5738299489021301, 0.6446532011032104, 0.715476393699646, 0.7862996459007263, 0.8571228981018066, 0.927946150302887, 0.9987694025039673, 1.0695925951004028, 1.140415906906128, 1.2112390995025635, 1.282062292098999, 1.3528854846954346, 1.4237087965011597, 1.4945319890975952, 1.5653553009033203, 1.6361784934997559, 1.7070016860961914, 1.7778249979019165, 1.848648190498352, 1.9194715023040771, 1.9902946949005127]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 8.0, 9.0, 16.0, 18.0, 28.0, 47.0, 60.0, 70.0, 99.0, 167.0, 238.0, 374.0, 594.0, 1148.0, 2502.0, 7198.0, 28234.0, 510631.0, 3585873.0, 40956.0, 9626.0, 3231.0, 1310.0, 742.0, 375.0, 269.0, 130.0, 117.0, 60.0, 39.0, 23.0, 26.0, 18.0, 14.0, 3.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8349609375, -0.8041534423828125, -0.773345947265625, -0.7425384521484375, -0.71173095703125, -0.6809234619140625, -0.650115966796875, -0.6193084716796875, -0.5885009765625, -0.5576934814453125, -0.526885986328125, -0.4960784912109375, -0.46527099609375, -0.4344635009765625, -0.403656005859375, -0.3728485107421875, -0.342041015625, -0.3112335205078125, -0.280426025390625, -0.2496185302734375, -0.21881103515625, -0.1880035400390625, -0.157196044921875, -0.1263885498046875, -0.0955810546875, -0.0647735595703125, -0.033966064453125, -0.0031585693359375, 0.02764892578125, 0.0584564208984375, 0.089263916015625, 0.1200714111328125, 0.15087890625, 0.1816864013671875, 0.212493896484375, 0.2433013916015625, 0.27410888671875, 0.3049163818359375, 0.335723876953125, 0.3665313720703125, 0.3973388671875, 0.4281463623046875, 0.458953857421875, 0.4897613525390625, 0.52056884765625, 0.5513763427734375, 0.582183837890625, 0.6129913330078125, 0.643798828125, 0.6746063232421875, 0.705413818359375, 0.7362213134765625, 0.76702880859375, 0.7978363037109375, 0.828643798828125, 0.8594512939453125, 0.8902587890625, 0.9210662841796875, 0.951873779296875, 0.9826812744140625, 1.01348876953125, 1.0442962646484375, 1.075103759765625, 1.1059112548828125, 1.13671875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 9.0, 19.0, 34.0, 46.0, 70.0, 78.0, 96.0, 121.0, 116.0, 92.0, 94.0, 66.0, 50.0, 48.0, 15.0, 11.0, 9.0, 6.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2777442932128906, -0.26935577392578125, -0.2609672546386719, -0.2525787353515625, -0.24419021606445312, -0.23580169677734375, -0.22741317749023438, -0.219024658203125, -0.21063613891601562, -0.20224761962890625, -0.19385910034179688, -0.1854705810546875, -0.17708206176757812, -0.16869354248046875, -0.16030502319335938, -0.15191650390625, -0.14352798461914062, -0.13513946533203125, -0.12675094604492188, -0.1183624267578125, -0.10997390747070312, -0.10158538818359375, -0.09319686889648438, -0.084808349609375, -0.07641983032226562, -0.06803131103515625, -0.059642791748046875, -0.0512542724609375, -0.042865753173828125, -0.03447723388671875, -0.026088714599609375, -0.0177001953125, -0.009311676025390625, -0.00092315673828125, 0.007465362548828125, 0.0158538818359375, 0.024242401123046875, 0.03263092041015625, 0.041019439697265625, 0.049407958984375, 0.057796478271484375, 0.06618499755859375, 0.07457351684570312, 0.0829620361328125, 0.09135055541992188, 0.09973907470703125, 0.10812759399414062, 0.11651611328125, 0.12490463256835938, 0.13329315185546875, 0.14168167114257812, 0.1500701904296875, 0.15845870971679688, 0.16684722900390625, 0.17523574829101562, 0.183624267578125, 0.19201278686523438, 0.20040130615234375, 0.20878982543945312, 0.2171783447265625, 0.22556686401367188, 0.23395538330078125, 0.24234390258789062, 0.250732421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 5.0, 9.0, 19.0, 11.0, 12.0, 39.0, 33.0, 38.0, 64.0, 96.0, 108.0, 151.0, 221.0, 527.0, 2729.0, 57911.0, 4111878.0, 17726.0, 1455.0, 381.0, 225.0, 158.0, 113.0, 79.0, 78.0, 39.0, 32.0, 35.0, 28.0, 26.0, 20.0, 5.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7666015625, -1.6909637451171875, -1.615325927734375, -1.5396881103515625, -1.46405029296875, -1.3884124755859375, -1.312774658203125, -1.2371368408203125, -1.1614990234375, -1.0858612060546875, -1.010223388671875, -0.9345855712890625, -0.85894775390625, -0.7833099365234375, -0.707672119140625, -0.6320343017578125, -0.556396484375, -0.4807586669921875, -0.405120849609375, -0.3294830322265625, -0.25384521484375, -0.1782073974609375, -0.102569580078125, -0.0269317626953125, 0.0487060546875, 0.1243438720703125, 0.199981689453125, 0.2756195068359375, 0.35125732421875, 0.4268951416015625, 0.502532958984375, 0.5781707763671875, 0.65380859375, 0.7294464111328125, 0.805084228515625, 0.8807220458984375, 0.95635986328125, 1.0319976806640625, 1.107635498046875, 1.1832733154296875, 1.2589111328125, 1.3345489501953125, 1.410186767578125, 1.4858245849609375, 1.56146240234375, 1.6371002197265625, 1.712738037109375, 1.7883758544921875, 1.864013671875, 1.9396514892578125, 2.015289306640625, 2.0909271240234375, 2.16656494140625, 2.2422027587890625, 2.317840576171875, 2.3934783935546875, 2.4691162109375, 2.5447540283203125, 2.620391845703125, 2.6960296630859375, 2.77166748046875, 2.8473052978515625, 2.922943115234375, 2.9985809326171875, 3.07421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 20.0, 37.0, 96.0, 416.0, 3233.0, 182.0, 48.0, 19.0, 10.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26611328125, -0.24033355712890625, -0.2145538330078125, -0.18877410888671875, -0.162994384765625, -0.13721466064453125, -0.1114349365234375, -0.08565521240234375, -0.05987548828125, -0.03409576416015625, -0.0083160400390625, 0.01746368408203125, 0.043243408203125, 0.06902313232421875, 0.0948028564453125, 0.12058258056640625, 0.1463623046875, 0.17214202880859375, 0.1979217529296875, 0.22370147705078125, 0.249481201171875, 0.27526092529296875, 0.3010406494140625, 0.32682037353515625, 0.35260009765625, 0.37837982177734375, 0.4041595458984375, 0.42993927001953125, 0.455718994140625, 0.48149871826171875, 0.5072784423828125, 0.5330581665039062, 0.558837890625, 0.5846176147460938, 0.6103973388671875, 0.6361770629882812, 0.661956787109375, 0.6877365112304688, 0.7135162353515625, 0.7392959594726562, 0.76507568359375, 0.7908554077148438, 0.8166351318359375, 0.8424148559570312, 0.868194580078125, 0.8939743041992188, 0.9197540283203125, 0.9455337524414062, 0.9713134765625, 0.9970932006835938, 1.0228729248046875, 1.0486526489257812, 1.074432373046875, 1.1002120971679688, 1.1259918212890625, 1.1517715454101562, 1.17755126953125, 1.2033309936523438, 1.2291107177734375, 1.2548904418945312, 1.280670166015625, 1.3064498901367188, 1.3322296142578125, 1.3580093383789062, 1.3837890625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 35.0, 93.0, 480.0, 314.0, 50.0, 9.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.217049598693848, -9.024659156799316, -8.832267761230469, -8.639877319335938, -8.447486877441406, -8.255096435546875, -8.062705039978027, -7.870314598083496, -7.677923679351807, -7.485532760620117, -7.293142318725586, -7.1007513999938965, -6.908360958099365, -6.715970039367676, -6.5235795974731445, -6.331188678741455, -6.138797760009766, -5.946406841278076, -5.754016399383545, -5.5616254806518555, -5.369235038757324, -5.176844120025635, -4.984453201293945, -4.792062759399414, -4.599672317504883, -4.407281398773193, -4.214890956878662, -4.022500038146973, -3.8301093578338623, -3.637718677520752, -3.4453279972076416, -3.2529373168945312, -3.060546398162842, -2.8681557178497314, -2.675765037536621, -2.4833741188049316, -2.2909834384918213, -2.098592758178711, -1.9062020778656006, -1.7138112783432007, -1.5214205980300903, -1.32902991771698, -1.13663911819458, -0.9442484378814697, -0.7518576979637146, -0.5594669580459595, -0.3670762777328491, -0.17468547821044922, 0.017705202102661133, 0.21009592711925507, 0.402486652135849, 0.5948773622512817, 0.7872681021690369, 0.979658842086792, 1.1720495223999023, 1.3644403219223022, 1.5568310022354126, 1.749221682548523, 1.9416124820709229, 2.134003162384033, 2.3263938426971436, 2.518784523010254, 2.7111754417419434, 2.9035661220550537, 3.095956802368164]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 5.0, 6.0, 12.0, 25.0, 30.0, 45.0, 63.0, 71.0, 102.0, 95.0, 111.0, 103.0, 82.0, 83.0, 52.0, 43.0, 23.0, 12.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.7313365936279297, -2.6597084999084473, -2.588080406188965, -2.5164523124694824, -2.44482421875, -2.3731958866119385, -2.301567792892456, -2.2299396991729736, -2.158311605453491, -2.086683511734009, -2.0150554180145264, -1.9434272050857544, -1.871799111366272, -1.8001710176467896, -1.7285428047180176, -1.6569147109985352, -1.5852866172790527, -1.5136585235595703, -1.442030429840088, -1.370402216911316, -1.2987741231918335, -1.227146029472351, -1.155517816543579, -1.0838897228240967, -1.0122616291046143, -0.9406335353851318, -0.8690053820610046, -0.7973772287368774, -0.725749135017395, -0.6541210412979126, -0.5824928879737854, -0.5108647346496582, -0.43923652172088623, -0.3676083981990814, -0.2959802746772766, -0.2243521511554718, -0.152724027633667, -0.08109590411186218, -0.009467780590057373, 0.062160372734069824, 0.13378846645355225, 0.20541658997535706, 0.27704471349716187, 0.3486728370189667, 0.4203009605407715, 0.4919290840625763, 0.5635572075843811, 0.6351853609085083, 0.7068134546279907, 0.7784415483474731, 0.8500697016716003, 0.9216978549957275, 0.99332594871521, 1.0649540424346924, 1.1365821361541748, 1.2082103490829468, 1.2798384428024292, 1.3514665365219116, 1.4230947494506836, 1.494722843170166, 1.5663509368896484, 1.6379790306091309, 1.7096071243286133, 1.7812353372573853, 1.8528634309768677]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 8.0, 7.0, 10.0, 30.0, 42.0, 80.0, 179.0, 377.0, 926.0, 2734.0, 11834.0, 127020.0, 801689.0, 90394.0, 9367.0, 2351.0, 856.0, 340.0, 152.0, 81.0, 41.0, 18.0, 11.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4521484375, -1.408721923828125, -1.36529541015625, -1.321868896484375, -1.2784423828125, -1.235015869140625, -1.19158935546875, -1.148162841796875, -1.104736328125, -1.061309814453125, -1.01788330078125, -0.974456787109375, -0.9310302734375, -0.887603759765625, -0.84417724609375, -0.800750732421875, -0.75732421875, -0.713897705078125, -0.67047119140625, -0.627044677734375, -0.5836181640625, -0.540191650390625, -0.49676513671875, -0.453338623046875, -0.409912109375, -0.366485595703125, -0.32305908203125, -0.279632568359375, -0.2362060546875, -0.192779541015625, -0.14935302734375, -0.105926513671875, -0.0625, -0.019073486328125, 0.02435302734375, 0.067779541015625, 0.1112060546875, 0.154632568359375, 0.19805908203125, 0.241485595703125, 0.284912109375, 0.328338623046875, 0.37176513671875, 0.415191650390625, 0.4586181640625, 0.502044677734375, 0.54547119140625, 0.588897705078125, 0.63232421875, 0.675750732421875, 0.71917724609375, 0.762603759765625, 0.8060302734375, 0.849456787109375, 0.89288330078125, 0.936309814453125, 0.979736328125, 1.023162841796875, 1.06658935546875, 1.110015869140625, 1.1534423828125, 1.196868896484375, 1.24029541015625, 1.283721923828125, 1.3271484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 1.0, 6.0, 10.0, 33.0, 24.0, 64.0, 81.0, 76.0, 118.0, 122.0, 105.0, 100.0, 84.0, 55.0, 47.0, 22.0, 20.0, 12.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.321044921875, -0.3115119934082031, -0.30197906494140625, -0.2924461364746094, -0.2829132080078125, -0.2733802795410156, -0.26384735107421875, -0.2543144226074219, -0.244781494140625, -0.23524856567382812, -0.22571563720703125, -0.21618270874023438, -0.2066497802734375, -0.19711685180664062, -0.18758392333984375, -0.17805099487304688, -0.16851806640625, -0.15898513793945312, -0.14945220947265625, -0.13991928100585938, -0.1303863525390625, -0.12085342407226562, -0.11132049560546875, -0.10178756713867188, -0.092254638671875, -0.08272171020507812, -0.07318878173828125, -0.06365585327148438, -0.0541229248046875, -0.044589996337890625, -0.03505706787109375, -0.025524139404296875, -0.0159912109375, -0.006458282470703125, 0.00307464599609375, 0.012607574462890625, 0.0221405029296875, 0.031673431396484375, 0.04120635986328125, 0.050739288330078125, 0.060272216796875, 0.06980514526367188, 0.07933807373046875, 0.08887100219726562, 0.0984039306640625, 0.10793685913085938, 0.11746978759765625, 0.12700271606445312, 0.13653564453125, 0.14606857299804688, 0.15560150146484375, 0.16513442993164062, 0.1746673583984375, 0.18420028686523438, 0.19373321533203125, 0.20326614379882812, 0.212799072265625, 0.22233200073242188, 0.23186492919921875, 0.24139785766601562, 0.2509307861328125, 0.2604637145996094, 0.26999664306640625, 0.2795295715332031, 0.2890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 10.0, 7.0, 12.0, 22.0, 36.0, 44.0, 58.0, 96.0, 173.0, 273.0, 532.0, 1318.0, 3694.0, 12156.0, 49471.0, 246758.0, 550338.0, 141330.0, 29811.0, 7858.0, 2537.0, 960.0, 431.0, 224.0, 118.0, 81.0, 68.0, 44.0, 25.0, 22.0, 17.0, 5.0, 7.0, 4.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.6115798950195312, -0.5937652587890625, -0.5759506225585938, -0.558135986328125, -0.5403213500976562, -0.5225067138671875, -0.5046920776367188, -0.48687744140625, -0.46906280517578125, -0.4512481689453125, -0.43343353271484375, -0.415618896484375, -0.39780426025390625, -0.3799896240234375, -0.36217498779296875, -0.3443603515625, -0.32654571533203125, -0.3087310791015625, -0.29091644287109375, -0.273101806640625, -0.25528717041015625, -0.2374725341796875, -0.21965789794921875, -0.20184326171875, -0.18402862548828125, -0.1662139892578125, -0.14839935302734375, -0.130584716796875, -0.11277008056640625, -0.0949554443359375, -0.07714080810546875, -0.059326171875, -0.04151153564453125, -0.0236968994140625, -0.00588226318359375, 0.011932373046875, 0.02974700927734375, 0.0475616455078125, 0.06537628173828125, 0.08319091796875, 0.10100555419921875, 0.1188201904296875, 0.13663482666015625, 0.154449462890625, 0.17226409912109375, 0.1900787353515625, 0.20789337158203125, 0.2257080078125, 0.24352264404296875, 0.2613372802734375, 0.27915191650390625, 0.296966552734375, 0.31478118896484375, 0.3325958251953125, 0.35041046142578125, 0.36822509765625, 0.38603973388671875, 0.4038543701171875, 0.42166900634765625, 0.439483642578125, 0.45729827880859375, 0.4751129150390625, 0.49292755126953125, 0.5107421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 14.0, 13.0, 9.0, 14.0, 24.0, 31.0, 21.0, 36.0, 41.0, 26.0, 43.0, 43.0, 40.0, 39.0, 51.0, 42.0, 52.0, 43.0, 44.0, 53.0, 36.0, 27.0, 30.0, 34.0, 29.0, 29.0, 25.0, 20.0, 16.0, 15.0, 14.0, 8.0, 7.0, 9.0, 6.0, 3.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.484222412109375, -0.46917724609375, -0.454132080078125, -0.4390869140625, -0.424041748046875, -0.40899658203125, -0.393951416015625, -0.37890625, -0.363861083984375, -0.34881591796875, -0.333770751953125, -0.3187255859375, -0.303680419921875, -0.28863525390625, -0.273590087890625, -0.258544921875, -0.243499755859375, -0.22845458984375, -0.213409423828125, -0.1983642578125, -0.183319091796875, -0.16827392578125, -0.153228759765625, -0.13818359375, -0.123138427734375, -0.10809326171875, -0.093048095703125, -0.0780029296875, -0.062957763671875, -0.04791259765625, -0.032867431640625, -0.017822265625, -0.002777099609375, 0.01226806640625, 0.027313232421875, 0.0423583984375, 0.057403564453125, 0.07244873046875, 0.087493896484375, 0.1025390625, 0.117584228515625, 0.13262939453125, 0.147674560546875, 0.1627197265625, 0.177764892578125, 0.19281005859375, 0.207855224609375, 0.222900390625, 0.237945556640625, 0.25299072265625, 0.268035888671875, 0.2830810546875, 0.298126220703125, 0.31317138671875, 0.328216552734375, 0.34326171875, 0.358306884765625, 0.37335205078125, 0.388397216796875, 0.4034423828125, 0.418487548828125, 0.43353271484375, 0.448577880859375, 0.463623046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 17.0, 18.0, 30.0, 79.0, 129.0, 268.0, 608.0, 1773.0, 5763.0, 30109.0, 266830.0, 643936.0, 81997.0, 12207.0, 2951.0, 1008.0, 400.0, 184.0, 95.0, 55.0, 25.0, 18.0, 13.0, 8.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.17286109924316406, -0.16542434692382812, -0.1579875946044922, -0.15055084228515625, -0.1431140899658203, -0.13567733764648438, -0.12824058532714844, -0.1208038330078125, -0.11336708068847656, -0.10593032836914062, -0.09849357604980469, -0.09105682373046875, -0.08362007141113281, -0.07618331909179688, -0.06874656677246094, -0.061309814453125, -0.05387306213378906, -0.046436309814453125, -0.03899955749511719, -0.03156280517578125, -0.024126052856445312, -0.016689300537109375, -0.009252548217773438, -0.0018157958984375, 0.0056209564208984375, 0.013057708740234375, 0.020494461059570312, 0.02793121337890625, 0.03536796569824219, 0.042804718017578125, 0.05024147033691406, 0.05767822265625, 0.06511497497558594, 0.07255172729492188, 0.07998847961425781, 0.08742523193359375, 0.09486198425292969, 0.10229873657226562, 0.10973548889160156, 0.1171722412109375, 0.12460899353027344, 0.13204574584960938, 0.1394824981689453, 0.14691925048828125, 0.1543560028076172, 0.16179275512695312, 0.16922950744628906, 0.176666259765625, 0.18410301208496094, 0.19153976440429688, 0.1989765167236328, 0.20641326904296875, 0.2138500213623047, 0.22128677368164062, 0.22872352600097656, 0.2361602783203125, 0.24359703063964844, 0.2510337829589844, 0.2584705352783203, 0.26590728759765625, 0.2733440399169922, 0.2807807922363281, 0.28821754455566406, 0.295654296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 0.0, 10.0, 13.0, 13.0, 28.0, 33.0, 52.0, 98.0, 177.0, 189.0, 151.0, 83.0, 50.0, 30.0, 17.0, 14.0, 9.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010573863983154297, -0.00010226946324110031, -9.880028665065765e-05, -9.5331110060215e-05, -9.186193346977234e-05, -8.839275687932968e-05, -8.492358028888702e-05, -8.145440369844437e-05, -7.798522710800171e-05, -7.451605051755905e-05, -7.10468739271164e-05, -6.757769733667374e-05, -6.410852074623108e-05, -6.063934415578842e-05, -5.7170167565345764e-05, -5.370099097490311e-05, -5.023181438446045e-05, -4.676263779401779e-05, -4.3293461203575134e-05, -3.982428461313248e-05, -3.635510802268982e-05, -3.288593143224716e-05, -2.9416754841804504e-05, -2.5947578251361847e-05, -2.247840166091919e-05, -1.9009225070476532e-05, -1.5540048480033875e-05, -1.2070871889591217e-05, -8.60169529914856e-06, -5.132518708705902e-06, -1.6633421182632446e-06, 1.8058344721794128e-06, 5.27501106262207e-06, 8.744187653064728e-06, 1.2213364243507385e-05, 1.5682540833950043e-05, 1.91517174243927e-05, 2.2620894014835358e-05, 2.6090070605278015e-05, 2.9559247195720673e-05, 3.302842378616333e-05, 3.649760037660599e-05, 3.9966776967048645e-05, 4.34359535574913e-05, 4.690513014793396e-05, 5.037430673837662e-05, 5.3843483328819275e-05, 5.731265991926193e-05, 6.078183650970459e-05, 6.425101310014725e-05, 6.77201896905899e-05, 7.118936628103256e-05, 7.465854287147522e-05, 7.812771946191788e-05, 8.159689605236053e-05, 8.506607264280319e-05, 8.853524923324585e-05, 9.200442582368851e-05, 9.547360241413116e-05, 9.894277900457382e-05, 0.00010241195559501648, 0.00010588113218545914, 0.0001093503087759018, 0.00011281948536634445, 0.00011628866195678711]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 10.0, 10.0, 12.0, 12.0, 27.0, 40.0, 50.0, 84.0, 148.0, 216.0, 377.0, 657.0, 1121.0, 2381.0, 6229.0, 21410.0, 114416.0, 637456.0, 214248.0, 34253.0, 8807.0, 3239.0, 1462.0, 754.0, 423.0, 257.0, 146.0, 93.0, 66.0, 46.0, 30.0, 14.0, 21.0, 11.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2191162109375, -0.21279335021972656, -0.20647048950195312, -0.2001476287841797, -0.19382476806640625, -0.1875019073486328, -0.18117904663085938, -0.17485618591308594, -0.1685333251953125, -0.16221046447753906, -0.15588760375976562, -0.1495647430419922, -0.14324188232421875, -0.1369190216064453, -0.13059616088867188, -0.12427330017089844, -0.117950439453125, -0.11162757873535156, -0.10530471801757812, -0.09898185729980469, -0.09265899658203125, -0.08633613586425781, -0.08001327514648438, -0.07369041442871094, -0.0673675537109375, -0.06104469299316406, -0.054721832275390625, -0.04839897155761719, -0.04207611083984375, -0.03575325012207031, -0.029430389404296875, -0.023107528686523438, -0.01678466796875, -0.010461807250976562, -0.004138946533203125, 0.0021839141845703125, 0.00850677490234375, 0.014829635620117188, 0.021152496337890625, 0.027475357055664062, 0.0337982177734375, 0.04012107849121094, 0.046443939208984375, 0.05276679992675781, 0.05908966064453125, 0.06541252136230469, 0.07173538208007812, 0.07805824279785156, 0.084381103515625, 0.09070396423339844, 0.09702682495117188, 0.10334968566894531, 0.10967254638671875, 0.11599540710449219, 0.12231826782226562, 0.12864112854003906, 0.1349639892578125, 0.14128684997558594, 0.14760971069335938, 0.1539325714111328, 0.16025543212890625, 0.1665782928466797, 0.17290115356445312, 0.17922401428222656, 0.185546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 10.0, 5.0, 16.0, 25.0, 41.0, 63.0, 76.0, 129.0, 161.0, 145.0, 105.0, 77.0, 52.0, 40.0, 18.0, 8.0, 10.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2989997863769531, -0.29111480712890625, -0.2832298278808594, -0.2753448486328125, -0.2674598693847656, -0.25957489013671875, -0.2516899108886719, -0.243804931640625, -0.23591995239257812, -0.22803497314453125, -0.22014999389648438, -0.2122650146484375, -0.20438003540039062, -0.19649505615234375, -0.18861007690429688, -0.18072509765625, -0.17284011840820312, -0.16495513916015625, -0.15707015991210938, -0.1491851806640625, -0.14130020141601562, -0.13341522216796875, -0.12553024291992188, -0.117645263671875, -0.10976028442382812, -0.10187530517578125, -0.09399032592773438, -0.0861053466796875, -0.07822036743164062, -0.07033538818359375, -0.062450408935546875, -0.0545654296875, -0.046680450439453125, -0.03879547119140625, -0.030910491943359375, -0.0230255126953125, -0.015140533447265625, -0.00725555419921875, 0.000629425048828125, 0.008514404296875, 0.016399383544921875, 0.02428436279296875, 0.032169342041015625, 0.0400543212890625, 0.047939300537109375, 0.05582427978515625, 0.06370925903320312, 0.07159423828125, 0.07947921752929688, 0.08736419677734375, 0.09524917602539062, 0.1031341552734375, 0.11101913452148438, 0.11890411376953125, 0.12678909301757812, 0.134674072265625, 0.14255905151367188, 0.15044403076171875, 0.15832901000976562, 0.1662139892578125, 0.17409896850585938, 0.18198394775390625, 0.18986892700195312, 0.19775390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 19.0, 58.0, 280.0, 413.0, 171.0, 54.0, 10.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-17.599308013916016, -17.281082153320312, -16.962854385375977, -16.644628524780273, -16.326400756835938, -16.008174896240234, -15.689948081970215, -15.371721267700195, -15.053495407104492, -14.735268592834473, -14.417041778564453, -14.09881591796875, -13.78058910369873, -13.462362289428711, -13.144135475158691, -12.825908660888672, -12.507682800292969, -12.18945598602295, -11.87122917175293, -11.553003311157227, -11.234776496887207, -10.916549682617188, -10.598322868347168, -10.280096054077148, -9.961869239807129, -9.64364242553711, -9.32541561126709, -9.007189750671387, -8.688962936401367, -8.370736122131348, -8.052509307861328, -7.734282970428467, -7.416055679321289, -7.0978288650512695, -6.779602527618408, -6.461375713348389, -6.143149375915527, -5.824922561645508, -5.506695747375488, -5.188469409942627, -4.870243072509766, -4.552016258239746, -4.233789920806885, -3.9155631065368652, -3.597336769104004, -3.2791099548339844, -2.960883378982544, -2.6426568031311035, -2.324430227279663, -2.0062036514282227, -1.6879770755767822, -1.3697503805160522, -1.0515238046646118, -0.7332972288131714, -0.4150705337524414, -0.09684395790100098, 0.22138261795043945, 0.5396091938018799, 0.8578358292579651, 1.1760624647140503, 1.4942890405654907, 1.8125156164169312, 2.130742311477661, 2.4489688873291016, 2.767195463180542]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 10.0, 7.0, 9.0, 11.0, 13.0, 19.0, 28.0, 19.0, 19.0, 21.0, 30.0, 26.0, 34.0, 31.0, 45.0, 47.0, 46.0, 35.0, 46.0, 35.0, 32.0, 39.0, 43.0, 46.0, 33.0, 36.0, 36.0, 25.0, 23.0, 30.0, 17.0, 17.0, 20.0, 11.0, 11.0, 9.0, 8.0, 5.0, 7.0, 2.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.072415828704834, -2.0087406635284424, -1.9450654983520508, -1.8813903331756592, -1.8177151679992676, -1.754040002822876, -1.6903648376464844, -1.6266896724700928, -1.5630145072937012, -1.4993393421173096, -1.435664176940918, -1.3719890117645264, -1.3083138465881348, -1.2446386814117432, -1.1809635162353516, -1.11728835105896, -1.0536130666732788, -0.9899379014968872, -0.9262627363204956, -0.862587571144104, -0.7989124059677124, -0.7352372407913208, -0.6715620160102844, -0.6078868508338928, -0.5442116856575012, -0.4805365204811096, -0.416861355304718, -0.35318616032600403, -0.2895109951496124, -0.22583582997322083, -0.16216063499450684, -0.09848546981811523, -0.03481030464172363, 0.028864867985248566, 0.09254004061222076, 0.15621522068977356, 0.21989038586616516, 0.28356555104255676, 0.34724074602127075, 0.41091591119766235, 0.47459107637405396, 0.5382662415504456, 0.6019414067268372, 0.6656166315078735, 0.7292917966842651, 0.7929669618606567, 0.8566421270370483, 0.9203172922134399, 0.9839924573898315, 1.0476676225662231, 1.1113427877426147, 1.1750179529190063, 1.238693118095398, 1.3023682832717896, 1.3660435676574707, 1.4297187328338623, 1.493393898010254, 1.5570690631866455, 1.620744228363037, 1.6844193935394287, 1.7480945587158203, 1.811769723892212, 1.8754448890686035, 1.9391200542449951, 2.0027952194213867]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 5.0, 8.0, 15.0, 15.0, 19.0, 37.0, 34.0, 57.0, 105.0, 122.0, 165.0, 271.0, 441.0, 732.0, 1423.0, 3144.0, 8770.0, 38735.0, 3704456.0, 394783.0, 28051.0, 7286.0, 2646.0, 1267.0, 630.0, 388.0, 201.0, 141.0, 102.0, 63.0, 46.0, 24.0, 27.0, 15.0, 13.0, 10.0, 9.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3828125, -1.3349609375, -1.287109375, -1.2392578125, -1.19140625, -1.1435546875, -1.095703125, -1.0478515625, -1.0, -0.9521484375, -0.904296875, -0.8564453125, -0.80859375, -0.7607421875, -0.712890625, -0.6650390625, -0.6171875, -0.5693359375, -0.521484375, -0.4736328125, -0.42578125, -0.3779296875, -0.330078125, -0.2822265625, -0.234375, -0.1865234375, -0.138671875, -0.0908203125, -0.04296875, 0.0048828125, 0.052734375, 0.1005859375, 0.1484375, 0.1962890625, 0.244140625, 0.2919921875, 0.33984375, 0.3876953125, 0.435546875, 0.4833984375, 0.53125, 0.5791015625, 0.626953125, 0.6748046875, 0.72265625, 0.7705078125, 0.818359375, 0.8662109375, 0.9140625, 0.9619140625, 1.009765625, 1.0576171875, 1.10546875, 1.1533203125, 1.201171875, 1.2490234375, 1.296875, 1.3447265625, 1.392578125, 1.4404296875, 1.48828125, 1.5361328125, 1.583984375, 1.6318359375, 1.6796875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 17.0, 21.0, 36.0, 43.0, 72.0, 95.0, 95.0, 108.0, 89.0, 107.0, 88.0, 69.0, 57.0, 31.0, 22.0, 15.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.30707550048828125, -0.2975006103515625, -0.28792572021484375, -0.278350830078125, -0.26877593994140625, -0.2592010498046875, -0.24962615966796875, -0.24005126953125, -0.23047637939453125, -0.2209014892578125, -0.21132659912109375, -0.201751708984375, -0.19217681884765625, -0.1826019287109375, -0.17302703857421875, -0.1634521484375, -0.15387725830078125, -0.1443023681640625, -0.13472747802734375, -0.125152587890625, -0.11557769775390625, -0.1060028076171875, -0.09642791748046875, -0.08685302734375, -0.07727813720703125, -0.0677032470703125, -0.05812835693359375, -0.048553466796875, -0.03897857666015625, -0.0294036865234375, -0.01982879638671875, -0.01025390625, -0.00067901611328125, 0.0088958740234375, 0.01847076416015625, 0.028045654296875, 0.03762054443359375, 0.0471954345703125, 0.05677032470703125, 0.06634521484375, 0.07592010498046875, 0.0854949951171875, 0.09506988525390625, 0.104644775390625, 0.11421966552734375, 0.1237945556640625, 0.13336944580078125, 0.1429443359375, 0.15251922607421875, 0.1620941162109375, 0.17166900634765625, 0.181243896484375, 0.19081878662109375, 0.2003936767578125, 0.20996856689453125, 0.21954345703125, 0.22911834716796875, 0.2386932373046875, 0.24826812744140625, 0.257843017578125, 0.26741790771484375, 0.2769927978515625, 0.28656768798828125, 0.296142578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 4.0, 3.0, 9.0, 16.0, 13.0, 11.0, 32.0, 29.0, 42.0, 49.0, 52.0, 85.0, 108.0, 188.0, 343.0, 624.0, 1337.0, 3063.0, 8976.0, 35117.0, 314446.0, 3737059.0, 69186.0, 14884.0, 4636.0, 1907.0, 859.0, 427.0, 257.0, 144.0, 86.0, 65.0, 52.0, 45.0, 30.0, 18.0, 16.0, 12.0, 18.0, 5.0, 4.0, 6.0, 10.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9659423828125, -0.932861328125, -0.8997802734375, -0.86669921875, -0.8336181640625, -0.800537109375, -0.7674560546875, -0.734375, -0.7012939453125, -0.668212890625, -0.6351318359375, -0.60205078125, -0.5689697265625, -0.535888671875, -0.5028076171875, -0.4697265625, -0.4366455078125, -0.403564453125, -0.3704833984375, -0.33740234375, -0.3043212890625, -0.271240234375, -0.2381591796875, -0.205078125, -0.1719970703125, -0.138916015625, -0.1058349609375, -0.07275390625, -0.0396728515625, -0.006591796875, 0.0264892578125, 0.0595703125, 0.0926513671875, 0.125732421875, 0.1588134765625, 0.19189453125, 0.2249755859375, 0.258056640625, 0.2911376953125, 0.32421875, 0.3572998046875, 0.390380859375, 0.4234619140625, 0.45654296875, 0.4896240234375, 0.522705078125, 0.5557861328125, 0.5888671875, 0.6219482421875, 0.655029296875, 0.6881103515625, 0.72119140625, 0.7542724609375, 0.787353515625, 0.8204345703125, 0.853515625, 0.8865966796875, 0.919677734375, 0.9527587890625, 0.98583984375, 1.0189208984375, 1.052001953125, 1.0850830078125, 1.1181640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 9.0, 10.0, 25.0, 49.0, 83.0, 273.0, 3137.0, 285.0, 83.0, 45.0, 28.0, 12.0, 10.0, 5.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73486328125, -0.7135543823242188, -0.6922454833984375, -0.6709365844726562, -0.649627685546875, -0.6283187866210938, -0.6070098876953125, -0.5857009887695312, -0.56439208984375, -0.5430831909179688, -0.5217742919921875, -0.5004653930664062, -0.479156494140625, -0.45784759521484375, -0.4365386962890625, -0.41522979736328125, -0.3939208984375, -0.37261199951171875, -0.3513031005859375, -0.32999420166015625, -0.308685302734375, -0.28737640380859375, -0.2660675048828125, -0.24475860595703125, -0.22344970703125, -0.20214080810546875, -0.1808319091796875, -0.15952301025390625, -0.138214111328125, -0.11690521240234375, -0.0955963134765625, -0.07428741455078125, -0.052978515625, -0.03166961669921875, -0.0103607177734375, 0.01094818115234375, 0.032257080078125, 0.05356597900390625, 0.0748748779296875, 0.09618377685546875, 0.11749267578125, 0.13880157470703125, 0.1601104736328125, 0.18141937255859375, 0.202728271484375, 0.22403717041015625, 0.2453460693359375, 0.26665496826171875, 0.2879638671875, 0.30927276611328125, 0.3305816650390625, 0.35189056396484375, 0.373199462890625, 0.39450836181640625, 0.4158172607421875, 0.43712615966796875, 0.45843505859375, 0.47974395751953125, 0.5010528564453125, 0.5223617553710938, 0.543670654296875, 0.5649795532226562, 0.5862884521484375, 0.6075973510742188, 0.62890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 18.0, 36.0, 112.0, 282.0, 310.0, 126.0, 61.0, 22.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.302706718444824, -4.185956001281738, -4.069204807281494, -3.952453851699829, -3.835702896118164, -3.718951940536499, -3.602200984954834, -3.485450029373169, -3.368699073791504, -3.251948118209839, -3.135197162628174, -3.018446207046509, -2.9016952514648438, -2.7849442958831787, -2.6681933403015137, -2.5514423847198486, -2.4346914291381836, -2.3179404735565186, -2.2011895179748535, -2.0844385623931885, -1.9676876068115234, -1.8509366512298584, -1.7341856956481934, -1.6174347400665283, -1.5006837844848633, -1.3839328289031982, -1.2671818733215332, -1.1504309177398682, -1.0336799621582031, -0.9169290065765381, -0.800178050994873, -0.683427095413208, -0.566676139831543, -0.44992518424987793, -0.3331742286682129, -0.21642327308654785, -0.09967231750488281, 0.017078638076782227, 0.13382959365844727, 0.2505805492401123, 0.36733150482177734, 0.4840824604034424, 0.6008334159851074, 0.7175843715667725, 0.8343353271484375, 0.9510862827301025, 1.0678372383117676, 1.1845881938934326, 1.3013391494750977, 1.4180901050567627, 1.5348410606384277, 1.6515920162200928, 1.7683429718017578, 1.8850939273834229, 2.001844882965088, 2.118595838546753, 2.235346794128418, 2.352097749710083, 2.468848705291748, 2.585599660873413, 2.702350616455078, 2.819101572036743, 2.935852527618408, 3.0526034832000732, 3.1693544387817383]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 7.0, 2.0, 9.0, 6.0, 9.0, 22.0, 27.0, 39.0, 30.0, 39.0, 55.0, 77.0, 74.0, 76.0, 65.0, 76.0, 72.0, 64.0, 53.0, 48.0, 33.0, 35.0, 25.0, 20.0, 16.0, 11.0, 5.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9575942754745483, -1.9025774002075195, -1.8475606441497803, -1.7925437688827515, -1.7375268936157227, -1.6825101375579834, -1.6274932622909546, -1.5724763870239258, -1.5174596309661865, -1.4624427556991577, -1.4074259996414185, -1.3524091243743896, -1.2973922491073608, -1.242375373840332, -1.1873586177825928, -1.132341742515564, -1.0773248672485352, -1.0223079919815063, -0.9672911763191223, -0.9122743606567383, -0.8572574853897095, -0.8022406697273254, -0.7472238540649414, -0.6922069787979126, -0.6371901631355286, -0.5821733474731445, -0.5271564722061157, -0.4721396565437317, -0.41712281107902527, -0.36210596561431885, -0.3070891499519348, -0.2520723044872284, -0.19705533981323242, -0.142038494348526, -0.08702166378498077, -0.03200483322143555, 0.023012012243270874, 0.0780288577079773, 0.13304567337036133, 0.18806251883506775, 0.24307936429977417, 0.2980962097644806, 0.353113055229187, 0.40812987089157104, 0.46314671635627747, 0.5181635618209839, 0.5731803774833679, 0.628197193145752, 0.6832140684127808, 0.7382308840751648, 0.7932477593421936, 0.8482645750045776, 0.9032814502716064, 0.9582982659339905, 1.0133150815963745, 1.0683319568634033, 1.1233487129211426, 1.1783655881881714, 1.2333823442459106, 1.2883992195129395, 1.3434160947799683, 1.398432970046997, 1.4534497261047363, 1.5084666013717651, 1.563483476638794]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 13.0, 11.0, 13.0, 23.0, 24.0, 30.0, 64.0, 125.0, 255.0, 416.0, 752.0, 1689.0, 3970.0, 12467.0, 62390.0, 452704.0, 434590.0, 59696.0, 12071.0, 3858.0, 1632.0, 840.0, 360.0, 237.0, 116.0, 75.0, 39.0, 26.0, 18.0, 13.0, 10.0, 12.0, 7.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.10699462890625, -1.0723876953125, -1.03778076171875, -1.003173828125, -0.96856689453125, -0.9339599609375, -0.89935302734375, -0.86474609375, -0.83013916015625, -0.7955322265625, -0.76092529296875, -0.726318359375, -0.69171142578125, -0.6571044921875, -0.62249755859375, -0.587890625, -0.55328369140625, -0.5186767578125, -0.48406982421875, -0.449462890625, -0.41485595703125, -0.3802490234375, -0.34564208984375, -0.31103515625, -0.27642822265625, -0.2418212890625, -0.20721435546875, -0.172607421875, -0.13800048828125, -0.1033935546875, -0.06878662109375, -0.0341796875, 0.00042724609375, 0.0350341796875, 0.06964111328125, 0.104248046875, 0.13885498046875, 0.1734619140625, 0.20806884765625, 0.24267578125, 0.27728271484375, 0.3118896484375, 0.34649658203125, 0.381103515625, 0.41571044921875, 0.4503173828125, 0.48492431640625, 0.51953125, 0.55413818359375, 0.5887451171875, 0.62335205078125, 0.657958984375, 0.69256591796875, 0.7271728515625, 0.76177978515625, 0.79638671875, 0.83099365234375, 0.8656005859375, 0.90020751953125, 0.934814453125, 0.96942138671875, 1.0040283203125, 1.03863525390625, 1.0732421875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 10.0, 21.0, 33.0, 50.0, 68.0, 74.0, 90.0, 119.0, 95.0, 107.0, 77.0, 63.0, 49.0, 40.0, 29.0, 27.0, 14.0, 7.0, 9.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343994140625, -0.3333625793457031, -0.32273101806640625, -0.3120994567871094, -0.3014678955078125, -0.2908363342285156, -0.28020477294921875, -0.2695732116699219, -0.258941650390625, -0.24831008911132812, -0.23767852783203125, -0.22704696655273438, -0.2164154052734375, -0.20578384399414062, -0.19515228271484375, -0.18452072143554688, -0.17388916015625, -0.16325759887695312, -0.15262603759765625, -0.14199447631835938, -0.1313629150390625, -0.12073135375976562, -0.11009979248046875, -0.09946823120117188, -0.088836669921875, -0.07820510864257812, -0.06757354736328125, -0.056941986083984375, -0.0463104248046875, -0.035678863525390625, -0.02504730224609375, -0.014415740966796875, -0.0037841796875, 0.006847381591796875, 0.01747894287109375, 0.028110504150390625, 0.0387420654296875, 0.049373626708984375, 0.06000518798828125, 0.07063674926757812, 0.081268310546875, 0.09189987182617188, 0.10253143310546875, 0.11316299438476562, 0.1237945556640625, 0.13442611694335938, 0.14505767822265625, 0.15568923950195312, 0.16632080078125, 0.17695236206054688, 0.18758392333984375, 0.19821548461914062, 0.2088470458984375, 0.21947860717773438, 0.23011016845703125, 0.24074172973632812, 0.251373291015625, 0.2620048522949219, 0.27263641357421875, 0.2832679748535156, 0.2938995361328125, 0.3045310974121094, 0.31516265869140625, 0.3257942199707031, 0.33642578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 10.0, 10.0, 5.0, 11.0, 14.0, 18.0, 19.0, 26.0, 56.0, 58.0, 90.0, 126.0, 165.0, 287.0, 543.0, 1046.0, 2764.0, 8936.0, 39362.0, 227995.0, 580688.0, 148498.0, 26886.0, 6693.0, 2105.0, 864.0, 453.0, 250.0, 166.0, 114.0, 72.0, 57.0, 40.0, 30.0, 23.0, 16.0, 22.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6722259521484375, -0.647674560546875, -0.6231231689453125, -0.59857177734375, -0.5740203857421875, -0.549468994140625, -0.5249176025390625, -0.5003662109375, -0.4758148193359375, -0.451263427734375, -0.4267120361328125, -0.40216064453125, -0.3776092529296875, -0.353057861328125, -0.3285064697265625, -0.303955078125, -0.2794036865234375, -0.254852294921875, -0.2303009033203125, -0.20574951171875, -0.1811981201171875, -0.156646728515625, -0.1320953369140625, -0.1075439453125, -0.0829925537109375, -0.058441162109375, -0.0338897705078125, -0.00933837890625, 0.0152130126953125, 0.039764404296875, 0.0643157958984375, 0.0888671875, 0.1134185791015625, 0.137969970703125, 0.1625213623046875, 0.18707275390625, 0.2116241455078125, 0.236175537109375, 0.2607269287109375, 0.2852783203125, 0.3098297119140625, 0.334381103515625, 0.3589324951171875, 0.38348388671875, 0.4080352783203125, 0.432586669921875, 0.4571380615234375, 0.481689453125, 0.5062408447265625, 0.530792236328125, 0.5553436279296875, 0.57989501953125, 0.6044464111328125, 0.628997802734375, 0.6535491943359375, 0.6781005859375, 0.7026519775390625, 0.727203369140625, 0.7517547607421875, 0.77630615234375, 0.8008575439453125, 0.825408935546875, 0.8499603271484375, 0.87451171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 7.0, 5.0, 8.0, 13.0, 28.0, 27.0, 36.0, 34.0, 54.0, 58.0, 49.0, 69.0, 85.0, 69.0, 65.0, 69.0, 64.0, 59.0, 49.0, 37.0, 40.0, 22.0, 16.0, 5.0, 13.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1572265625, -1.1213836669921875, -1.085540771484375, -1.0496978759765625, -1.01385498046875, -0.9780120849609375, -0.942169189453125, -0.9063262939453125, -0.8704833984375, -0.8346405029296875, -0.798797607421875, -0.7629547119140625, -0.72711181640625, -0.6912689208984375, -0.655426025390625, -0.6195831298828125, -0.583740234375, -0.5478973388671875, -0.512054443359375, -0.4762115478515625, -0.44036865234375, -0.4045257568359375, -0.368682861328125, -0.3328399658203125, -0.2969970703125, -0.2611541748046875, -0.225311279296875, -0.1894683837890625, -0.15362548828125, -0.1177825927734375, -0.081939697265625, -0.0460968017578125, -0.01025390625, 0.0255889892578125, 0.061431884765625, 0.0972747802734375, 0.13311767578125, 0.1689605712890625, 0.204803466796875, 0.2406463623046875, 0.2764892578125, 0.3123321533203125, 0.348175048828125, 0.3840179443359375, 0.41986083984375, 0.4557037353515625, 0.491546630859375, 0.5273895263671875, 0.563232421875, 0.5990753173828125, 0.634918212890625, 0.6707611083984375, 0.70660400390625, 0.7424468994140625, 0.778289794921875, 0.8141326904296875, 0.8499755859375, 0.8858184814453125, 0.921661376953125, 0.9575042724609375, 0.99334716796875, 1.0291900634765625, 1.065032958984375, 1.1008758544921875, 1.13671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 17.0, 34.0, 47.0, 71.0, 162.0, 329.0, 730.0, 2036.0, 7248.0, 38267.0, 475714.0, 474842.0, 38407.0, 7248.0, 2009.0, 739.0, 292.0, 151.0, 83.0, 46.0, 17.0, 19.0, 8.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.421142578125, -0.4066200256347656, -0.39209747314453125, -0.3775749206542969, -0.3630523681640625, -0.3485298156738281, -0.33400726318359375, -0.3194847106933594, -0.304962158203125, -0.2904396057128906, -0.27591705322265625, -0.2613945007324219, -0.2468719482421875, -0.23234939575195312, -0.21782684326171875, -0.20330429077148438, -0.18878173828125, -0.17425918579101562, -0.15973663330078125, -0.14521408081054688, -0.1306915283203125, -0.11616897583007812, -0.10164642333984375, -0.08712387084960938, -0.072601318359375, -0.058078765869140625, -0.04355621337890625, -0.029033660888671875, -0.0145111083984375, 1.1444091796875e-05, 0.01453399658203125, 0.029056549072265625, 0.0435791015625, 0.058101654052734375, 0.07262420654296875, 0.08714675903320312, 0.1016693115234375, 0.11619186401367188, 0.13071441650390625, 0.14523696899414062, 0.159759521484375, 0.17428207397460938, 0.18880462646484375, 0.20332717895507812, 0.2178497314453125, 0.23237228393554688, 0.24689483642578125, 0.2614173889160156, 0.27593994140625, 0.2904624938964844, 0.30498504638671875, 0.3195075988769531, 0.3340301513671875, 0.3485527038574219, 0.36307525634765625, 0.3775978088378906, 0.392120361328125, 0.4066429138183594, 0.42116546630859375, 0.4356880187988281, 0.4502105712890625, 0.4647331237792969, 0.47925567626953125, 0.4937782287597656, 0.50830078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 4.0, 9.0, 9.0, 9.0, 11.0, 9.0, 21.0, 24.0, 36.0, 39.0, 54.0, 67.0, 81.0, 80.0, 99.0, 84.0, 72.0, 46.0, 39.0, 34.0, 25.0, 41.0, 17.0, 17.0, 11.0, 10.0, 15.0, 6.0, 5.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-7.50422477722168e-05, -7.307622581720352e-05, -7.111020386219025e-05, -6.914418190717697e-05, -6.71781599521637e-05, -6.521213799715042e-05, -6.324611604213715e-05, -6.128009408712387e-05, -5.9314072132110596e-05, -5.734805017709732e-05, -5.5382028222084045e-05, -5.341600626707077e-05, -5.1449984312057495e-05, -4.948396235704422e-05, -4.7517940402030945e-05, -4.555191844701767e-05, -4.3585896492004395e-05, -4.161987453699112e-05, -3.9653852581977844e-05, -3.768783062696457e-05, -3.5721808671951294e-05, -3.375578671693802e-05, -3.1789764761924744e-05, -2.982374280691147e-05, -2.7857720851898193e-05, -2.5891698896884918e-05, -2.3925676941871643e-05, -2.1959654986858368e-05, -1.9993633031845093e-05, -1.8027611076831818e-05, -1.6061589121818542e-05, -1.4095567166805267e-05, -1.2129545211791992e-05, -1.0163523256778717e-05, -8.197501301765442e-06, -6.231479346752167e-06, -4.265457391738892e-06, -2.2994354367256165e-06, -3.334134817123413e-07, 1.6326084733009338e-06, 3.598630428314209e-06, 5.564652383327484e-06, 7.530674338340759e-06, 9.496696293354034e-06, 1.146271824836731e-05, 1.3428740203380585e-05, 1.539476215839386e-05, 1.7360784113407135e-05, 1.932680606842041e-05, 2.1292828023433685e-05, 2.325884997844696e-05, 2.5224871933460236e-05, 2.719089388847351e-05, 2.9156915843486786e-05, 3.112293779850006e-05, 3.3088959753513336e-05, 3.505498170852661e-05, 3.7021003663539886e-05, 3.898702561855316e-05, 4.095304757356644e-05, 4.291906952857971e-05, 4.488509148359299e-05, 4.685111343860626e-05, 4.881713539361954e-05, 5.078315734863281e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 12.0, 11.0, 20.0, 28.0, 38.0, 58.0, 101.0, 222.0, 424.0, 1064.0, 3316.0, 17384.0, 208123.0, 751823.0, 55464.0, 7359.0, 1722.0, 674.0, 298.0, 162.0, 79.0, 57.0, 45.0, 26.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51708984375, -0.50054931640625, -0.4840087890625, -0.46746826171875, -0.450927734375, -0.43438720703125, -0.4178466796875, -0.40130615234375, -0.384765625, -0.36822509765625, -0.3516845703125, -0.33514404296875, -0.318603515625, -0.30206298828125, -0.2855224609375, -0.26898193359375, -0.25244140625, -0.23590087890625, -0.2193603515625, -0.20281982421875, -0.186279296875, -0.16973876953125, -0.1531982421875, -0.13665771484375, -0.1201171875, -0.10357666015625, -0.0870361328125, -0.07049560546875, -0.053955078125, -0.03741455078125, -0.0208740234375, -0.00433349609375, 0.01220703125, 0.02874755859375, 0.0452880859375, 0.06182861328125, 0.078369140625, 0.09490966796875, 0.1114501953125, 0.12799072265625, 0.14453125, 0.16107177734375, 0.1776123046875, 0.19415283203125, 0.210693359375, 0.22723388671875, 0.2437744140625, 0.26031494140625, 0.27685546875, 0.29339599609375, 0.3099365234375, 0.32647705078125, 0.343017578125, 0.35955810546875, 0.3760986328125, 0.39263916015625, 0.4091796875, 0.42572021484375, 0.4422607421875, 0.45880126953125, 0.475341796875, 0.49188232421875, 0.5084228515625, 0.52496337890625, 0.54150390625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 9.0, 10.0, 8.0, 18.0, 18.0, 36.0, 46.0, 72.0, 111.0, 139.0, 141.0, 111.0, 84.0, 59.0, 46.0, 21.0, 11.0, 13.0, 10.0, 4.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40283203125, -0.3898963928222656, -0.37696075439453125, -0.3640251159667969, -0.3510894775390625, -0.3381538391113281, -0.32521820068359375, -0.3122825622558594, -0.299346923828125, -0.2864112854003906, -0.27347564697265625, -0.2605400085449219, -0.2476043701171875, -0.23466873168945312, -0.22173309326171875, -0.20879745483398438, -0.19586181640625, -0.18292617797851562, -0.16999053955078125, -0.15705490112304688, -0.1441192626953125, -0.13118362426757812, -0.11824798583984375, -0.10531234741210938, -0.092376708984375, -0.07944107055664062, -0.06650543212890625, -0.053569793701171875, -0.0406341552734375, -0.027698516845703125, -0.01476287841796875, -0.001827239990234375, 0.0111083984375, 0.024044036865234375, 0.03697967529296875, 0.049915313720703125, 0.0628509521484375, 0.07578659057617188, 0.08872222900390625, 0.10165786743164062, 0.114593505859375, 0.12752914428710938, 0.14046478271484375, 0.15340042114257812, 0.1663360595703125, 0.17927169799804688, 0.19220733642578125, 0.20514297485351562, 0.21807861328125, 0.23101425170898438, 0.24394989013671875, 0.2568855285644531, 0.2698211669921875, 0.2827568054199219, 0.29569244384765625, 0.3086280822753906, 0.321563720703125, 0.3344993591308594, 0.34743499755859375, 0.3603706359863281, 0.3733062744140625, 0.3862419128417969, 0.39917755126953125, 0.4121131896972656, 0.425048828125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 28.0, 83.0, 220.0, 315.0, 228.0, 77.0, 29.0, 10.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.811117172241211, -12.45047664642334, -12.089836120605469, -11.729194641113281, -11.36855411529541, -11.007913589477539, -10.647273063659668, -10.286632537841797, -9.925992012023926, -9.565351486206055, -9.204710960388184, -8.844070434570312, -8.483428955078125, -8.122788429260254, -7.762147903442383, -7.401507377624512, -7.040866374969482, -6.680225849151611, -6.319584846496582, -5.958944320678711, -5.59830379486084, -5.237663269042969, -4.8770222663879395, -4.516381740570068, -4.155740737915039, -3.795099973678589, -3.4344594478607178, -3.0738186836242676, -2.7131781578063965, -2.3525373935699463, -1.991896629333496, -1.631256103515625, -1.270615577697754, -0.9099749326705933, -0.5493342280387878, -0.18869352340698242, 0.17194712162017822, 0.5325877666473389, 0.8932285308837891, 1.2538690567016602, 1.6145098209381104, 1.975150465965271, 2.3357911109924316, 2.696431875228882, 3.057072639465332, 3.417713165283203, 3.7783539295196533, 4.138994216918945, 4.499635219573975, 4.860275745391846, 5.220916748046875, 5.581557273864746, 5.942197799682617, 6.302838325500488, 6.663479328155518, 7.024119853973389, 7.384760856628418, 7.745401382446289, 8.10604190826416, 8.466682434082031, 8.827323913574219, 9.18796443939209, 9.548604965209961, 9.909245491027832, 10.269886016845703]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 3.0, 10.0, 13.0, 9.0, 8.0, 16.0, 22.0, 20.0, 26.0, 29.0, 28.0, 36.0, 27.0, 44.0, 43.0, 44.0, 32.0, 39.0, 56.0, 47.0, 40.0, 39.0, 48.0, 45.0, 40.0, 34.0, 28.0, 30.0, 24.0, 14.0, 21.0, 20.0, 8.0, 12.0, 9.0, 10.0, 6.0, 1.0, 5.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0], "bins": [-4.976199150085449, -4.836032390594482, -4.695866107940674, -4.555699348449707, -4.415533065795898, -4.275366306304932, -4.135200023651123, -3.9950332641601562, -3.8548667430877686, -3.714700222015381, -3.574533700942993, -3.4343671798706055, -3.2942004203796387, -3.15403413772583, -3.0138673782348633, -2.8737008571624756, -2.733534336090088, -2.5933678150177, -2.4532012939453125, -2.313034772872925, -2.172868251800537, -2.0327014923095703, -1.8925349712371826, -1.752368450164795, -1.6122019290924072, -1.4720354080200195, -1.3318688869476318, -1.1917022466659546, -1.051535725593567, -0.9113692045211792, -0.7712026238441467, -0.6310360431671143, -0.49086976051330566, -0.3507032096385956, -0.2105366587638855, -0.07037010788917542, 0.06979644298553467, 0.20996296405792236, 0.35012954473495483, 0.4902961254119873, 0.630462646484375, 0.7706291675567627, 0.9107957482337952, 1.0509623289108276, 1.1911288499832153, 1.331295371055603, 1.4714620113372803, 1.611628532409668, 1.7517950534820557, 1.8919615745544434, 2.032128095626831, 2.1722946166992188, 2.3124613761901855, 2.452627658843994, 2.592794418334961, 2.7329609394073486, 2.8731274604797363, 3.013293981552124, 3.1534605026245117, 3.2936270236968994, 3.433793544769287, 3.573960304260254, 3.7141268253326416, 3.8542933464050293, 3.994459867477417]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 10.0, 5.0, 13.0, 17.0, 28.0, 47.0, 69.0, 84.0, 146.0, 214.0, 331.0, 688.0, 1304.0, 3074.0, 9290.0, 48389.0, 3886556.0, 214688.0, 19877.0, 5331.0, 2027.0, 861.0, 466.0, 259.0, 153.0, 101.0, 73.0, 52.0, 33.0, 32.0, 18.0, 13.0, 5.0, 7.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2998046875, -1.251220703125, -1.20263671875, -1.154052734375, -1.10546875, -1.056884765625, -1.00830078125, -0.959716796875, -0.9111328125, -0.862548828125, -0.81396484375, -0.765380859375, -0.716796875, -0.668212890625, -0.61962890625, -0.571044921875, -0.5224609375, -0.473876953125, -0.42529296875, -0.376708984375, -0.328125, -0.279541015625, -0.23095703125, -0.182373046875, -0.1337890625, -0.085205078125, -0.03662109375, 0.011962890625, 0.060546875, 0.109130859375, 0.15771484375, 0.206298828125, 0.2548828125, 0.303466796875, 0.35205078125, 0.400634765625, 0.44921875, 0.497802734375, 0.54638671875, 0.594970703125, 0.6435546875, 0.692138671875, 0.74072265625, 0.789306640625, 0.837890625, 0.886474609375, 0.93505859375, 0.983642578125, 1.0322265625, 1.080810546875, 1.12939453125, 1.177978515625, 1.2265625, 1.275146484375, 1.32373046875, 1.372314453125, 1.4208984375, 1.469482421875, 1.51806640625, 1.566650390625, 1.615234375, 1.663818359375, 1.71240234375, 1.760986328125, 1.8095703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 4.0, 10.0, 14.0, 23.0, 30.0, 52.0, 52.0, 54.0, 75.0, 100.0, 96.0, 72.0, 84.0, 82.0, 52.0, 43.0, 34.0, 26.0, 31.0, 16.0, 14.0, 12.0, 7.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3450355529785156, -0.33386993408203125, -0.3227043151855469, -0.3115386962890625, -0.3003730773925781, -0.28920745849609375, -0.2780418395996094, -0.266876220703125, -0.2557106018066406, -0.24454498291015625, -0.23337936401367188, -0.2222137451171875, -0.21104812622070312, -0.19988250732421875, -0.18871688842773438, -0.17755126953125, -0.16638565063476562, -0.15522003173828125, -0.14405441284179688, -0.1328887939453125, -0.12172317504882812, -0.11055755615234375, -0.09939193725585938, -0.088226318359375, -0.07706069946289062, -0.06589508056640625, -0.054729461669921875, -0.0435638427734375, -0.032398223876953125, -0.02123260498046875, -0.010066986083984375, 0.0010986328125, 0.012264251708984375, 0.02342987060546875, 0.034595489501953125, 0.0457611083984375, 0.056926727294921875, 0.06809234619140625, 0.07925796508789062, 0.090423583984375, 0.10158920288085938, 0.11275482177734375, 0.12392044067382812, 0.1350860595703125, 0.14625167846679688, 0.15741729736328125, 0.16858291625976562, 0.17974853515625, 0.19091415405273438, 0.20207977294921875, 0.21324539184570312, 0.2244110107421875, 0.23557662963867188, 0.24674224853515625, 0.2579078674316406, 0.269073486328125, 0.2802391052246094, 0.29140472412109375, 0.3025703430175781, 0.3137359619140625, 0.3249015808105469, 0.33606719970703125, 0.3472328186035156, 0.3583984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 11.0, 29.0, 61.0, 118.0, 236.0, 508.0, 1203.0, 3353.0, 13054.0, 90786.0, 3918735.0, 143077.0, 16596.0, 4032.0, 1395.0, 531.0, 278.0, 116.0, 72.0, 39.0, 14.0, 9.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.546875, -1.5008087158203125, -1.454742431640625, -1.4086761474609375, -1.36260986328125, -1.3165435791015625, -1.270477294921875, -1.2244110107421875, -1.1783447265625, -1.1322784423828125, -1.086212158203125, -1.0401458740234375, -0.99407958984375, -0.9480133056640625, -0.901947021484375, -0.8558807373046875, -0.809814453125, -0.7637481689453125, -0.717681884765625, -0.6716156005859375, -0.62554931640625, -0.5794830322265625, -0.533416748046875, -0.4873504638671875, -0.4412841796875, -0.3952178955078125, -0.349151611328125, -0.3030853271484375, -0.25701904296875, -0.2109527587890625, -0.164886474609375, -0.1188201904296875, -0.07275390625, -0.0266876220703125, 0.019378662109375, 0.0654449462890625, 0.11151123046875, 0.1575775146484375, 0.203643798828125, 0.2497100830078125, 0.2957763671875, 0.3418426513671875, 0.387908935546875, 0.4339752197265625, 0.48004150390625, 0.5261077880859375, 0.572174072265625, 0.6182403564453125, 0.664306640625, 0.7103729248046875, 0.756439208984375, 0.8025054931640625, 0.84857177734375, 0.8946380615234375, 0.940704345703125, 0.9867706298828125, 1.0328369140625, 1.0789031982421875, 1.124969482421875, 1.1710357666015625, 1.21710205078125, 1.2631683349609375, 1.309234619140625, 1.3553009033203125, 1.4013671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 8.0, 4.0, 17.0, 12.0, 20.0, 43.0, 80.0, 180.0, 613.0, 2564.0, 266.0, 93.0, 60.0, 32.0, 18.0, 23.0, 9.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7412109375, -0.7195892333984375, -0.697967529296875, -0.6763458251953125, -0.65472412109375, -0.6331024169921875, -0.611480712890625, -0.5898590087890625, -0.5682373046875, -0.5466156005859375, -0.524993896484375, -0.5033721923828125, -0.48175048828125, -0.4601287841796875, -0.438507080078125, -0.4168853759765625, -0.395263671875, -0.3736419677734375, -0.352020263671875, -0.3303985595703125, -0.30877685546875, -0.2871551513671875, -0.265533447265625, -0.2439117431640625, -0.2222900390625, -0.2006683349609375, -0.179046630859375, -0.1574249267578125, -0.13580322265625, -0.1141815185546875, -0.092559814453125, -0.0709381103515625, -0.04931640625, -0.0276947021484375, -0.006072998046875, 0.0155487060546875, 0.03717041015625, 0.0587921142578125, 0.080413818359375, 0.1020355224609375, 0.1236572265625, 0.1452789306640625, 0.166900634765625, 0.1885223388671875, 0.21014404296875, 0.2317657470703125, 0.253387451171875, 0.2750091552734375, 0.296630859375, 0.3182525634765625, 0.339874267578125, 0.3614959716796875, 0.38311767578125, 0.4047393798828125, 0.426361083984375, 0.4479827880859375, 0.4696044921875, 0.4912261962890625, 0.512847900390625, 0.5344696044921875, 0.55609130859375, 0.5777130126953125, 0.599334716796875, 0.6209564208984375, 0.642578125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 12.0, 28.0, 108.0, 377.0, 322.0, 109.0, 36.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.398108959197998, -3.1711981296539307, -2.9442873001098633, -2.717376708984375, -2.4904658794403076, -2.2635550498962402, -2.036644458770752, -1.8097336292266846, -1.5828227996826172, -1.3559119701385498, -1.129001259803772, -0.9020904898643494, -0.6751797199249268, -0.4482688903808594, -0.22135818004608154, 0.005552530288696289, 0.23246335983276367, 0.4593741297721863, 0.6862848997116089, 0.9131956696510315, 1.140106439590454, 1.3670172691345215, 1.5939279794692993, 1.8208386898040771, 2.0477495193481445, 2.274660348892212, 2.5015711784362793, 2.7284817695617676, 2.955392599105835, 3.1823034286499023, 3.4092140197753906, 3.636124849319458, 3.863035202026367, 4.0899457931518555, 4.316856861114502, 4.54376745223999, 4.770678520202637, 4.997589111328125, 5.224499702453613, 5.451410293579102, 5.678321361541748, 5.905231952667236, 6.132143020629883, 6.359053611755371, 6.585964202880859, 6.812875270843506, 7.039785861968994, 7.266696929931641, 7.493607521057129, 7.720518112182617, 7.947429180145264, 8.17434024810791, 8.401250839233398, 8.628161430358887, 8.855072021484375, 9.081982612609863, 9.308893203735352, 9.53580379486084, 9.762714385986328, 9.989625930786133, 10.216536521911621, 10.44344711303711, 10.670357704162598, 10.897268295288086, 11.12417984008789]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 7.0, 8.0, 8.0, 15.0, 23.0, 22.0, 15.0, 28.0, 22.0, 30.0, 45.0, 32.0, 39.0, 41.0, 43.0, 49.0, 50.0, 58.0, 55.0, 45.0, 42.0, 40.0, 45.0, 28.0, 24.0, 34.0, 25.0, 17.0, 21.0, 18.0, 11.0, 11.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6619577407836914, -1.6124058961868286, -1.5628540515899658, -1.5133020877838135, -1.4637502431869507, -1.414198398590088, -1.364646553993225, -1.3150947093963623, -1.2655428647994995, -1.2159910202026367, -1.166439175605774, -1.1168873310089111, -1.0673353672027588, -1.017783522605896, -0.9682316780090332, -0.9186798334121704, -0.8691279292106628, -0.8195760846138, -0.7700241804122925, -0.7204723358154297, -0.6709204912185669, -0.6213686466217041, -0.5718167424201965, -0.5222648978233337, -0.47271302342414856, -0.4231611490249634, -0.3736093044281006, -0.3240574300289154, -0.2745055556297302, -0.22495371103286743, -0.17540183663368225, -0.12584999203681946, -0.07629811763763428, -0.026746254414319992, 0.022805608808994293, 0.07235747575759888, 0.12190933525562286, 0.17146119475364685, 0.22101306915283203, 0.2705649137496948, 0.32011678814888, 0.3696686625480652, 0.419220507144928, 0.46877238154411316, 0.5183242559432983, 0.5678761005401611, 0.6174279451370239, 0.6669797897338867, 0.7165316939353943, 0.7660835385322571, 0.8156354427337646, 0.8651872873306274, 0.9147391319274902, 0.964290976524353, 1.0138428211212158, 1.0633947849273682, 1.112946629524231, 1.1624984741210938, 1.2120503187179565, 1.2616021633148193, 1.3111541271209717, 1.3607059717178345, 1.4102578163146973, 1.45980966091156, 1.5093615055084229]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 12.0, 13.0, 24.0, 41.0, 48.0, 102.0, 122.0, 224.0, 399.0, 687.0, 1162.0, 2311.0, 5095.0, 12152.0, 34633.0, 109519.0, 325699.0, 361120.0, 129551.0, 40238.0, 14045.0, 5655.0, 2623.0, 1339.0, 703.0, 399.0, 225.0, 157.0, 93.0, 47.0, 33.0, 24.0, 24.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.80029296875, -0.776092529296875, -0.75189208984375, -0.727691650390625, -0.7034912109375, -0.679290771484375, -0.65509033203125, -0.630889892578125, -0.606689453125, -0.582489013671875, -0.55828857421875, -0.534088134765625, -0.5098876953125, -0.485687255859375, -0.46148681640625, -0.437286376953125, -0.4130859375, -0.388885498046875, -0.36468505859375, -0.340484619140625, -0.3162841796875, -0.292083740234375, -0.26788330078125, -0.243682861328125, -0.219482421875, -0.195281982421875, -0.17108154296875, -0.146881103515625, -0.1226806640625, -0.098480224609375, -0.07427978515625, -0.050079345703125, -0.02587890625, -0.001678466796875, 0.02252197265625, 0.046722412109375, 0.0709228515625, 0.095123291015625, 0.11932373046875, 0.143524169921875, 0.167724609375, 0.191925048828125, 0.21612548828125, 0.240325927734375, 0.2645263671875, 0.288726806640625, 0.31292724609375, 0.337127685546875, 0.361328125, 0.385528564453125, 0.40972900390625, 0.433929443359375, 0.4581298828125, 0.482330322265625, 0.50653076171875, 0.530731201171875, 0.554931640625, 0.579132080078125, 0.60333251953125, 0.627532958984375, 0.6517333984375, 0.675933837890625, 0.70013427734375, 0.724334716796875, 0.74853515625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 6.0, 6.0, 3.0, 11.0, 13.0, 27.0, 18.0, 34.0, 40.0, 59.0, 63.0, 69.0, 78.0, 84.0, 74.0, 72.0, 79.0, 59.0, 47.0, 35.0, 36.0, 25.0, 19.0, 13.0, 11.0, 9.0, 5.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.3504638671875, -0.339111328125, -0.3277587890625, -0.31640625, -0.3050537109375, -0.293701171875, -0.2823486328125, -0.27099609375, -0.2596435546875, -0.248291015625, -0.2369384765625, -0.2255859375, -0.2142333984375, -0.202880859375, -0.1915283203125, -0.18017578125, -0.1688232421875, -0.157470703125, -0.1461181640625, -0.134765625, -0.1234130859375, -0.112060546875, -0.1007080078125, -0.08935546875, -0.0780029296875, -0.066650390625, -0.0552978515625, -0.0439453125, -0.0325927734375, -0.021240234375, -0.0098876953125, 0.00146484375, 0.0128173828125, 0.024169921875, 0.0355224609375, 0.046875, 0.0582275390625, 0.069580078125, 0.0809326171875, 0.09228515625, 0.1036376953125, 0.114990234375, 0.1263427734375, 0.1376953125, 0.1490478515625, 0.160400390625, 0.1717529296875, 0.18310546875, 0.1944580078125, 0.205810546875, 0.2171630859375, 0.228515625, 0.2398681640625, 0.251220703125, 0.2625732421875, 0.27392578125, 0.2852783203125, 0.296630859375, 0.3079833984375, 0.3193359375, 0.3306884765625, 0.342041015625, 0.3533935546875, 0.36474609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 3.0, 9.0, 16.0, 13.0, 15.0, 28.0, 51.0, 39.0, 76.0, 111.0, 163.0, 289.0, 524.0, 937.0, 2397.0, 7165.0, 28366.0, 152170.0, 574612.0, 225972.0, 40619.0, 9514.0, 2877.0, 1077.0, 543.0, 297.0, 213.0, 130.0, 83.0, 74.0, 54.0, 34.0, 25.0, 12.0, 9.0, 8.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0], "bins": [-1.2734375, -1.2386550903320312, -1.2038726806640625, -1.1690902709960938, -1.134307861328125, -1.0995254516601562, -1.0647430419921875, -1.0299606323242188, -0.99517822265625, -0.9603958129882812, -0.9256134033203125, -0.8908309936523438, -0.856048583984375, -0.8212661743164062, -0.7864837646484375, -0.7517013549804688, -0.7169189453125, -0.6821365356445312, -0.6473541259765625, -0.6125717163085938, -0.577789306640625, -0.5430068969726562, -0.5082244873046875, -0.47344207763671875, -0.43865966796875, -0.40387725830078125, -0.3690948486328125, -0.33431243896484375, -0.299530029296875, -0.26474761962890625, -0.2299652099609375, -0.19518280029296875, -0.160400390625, -0.12561798095703125, -0.0908355712890625, -0.05605316162109375, -0.021270751953125, 0.01351165771484375, 0.0482940673828125, 0.08307647705078125, 0.11785888671875, 0.15264129638671875, 0.1874237060546875, 0.22220611572265625, 0.256988525390625, 0.29177093505859375, 0.3265533447265625, 0.36133575439453125, 0.3961181640625, 0.43090057373046875, 0.4656829833984375, 0.5004653930664062, 0.535247802734375, 0.5700302124023438, 0.6048126220703125, 0.6395950317382812, 0.67437744140625, 0.7091598510742188, 0.7439422607421875, 0.7787246704101562, 0.813507080078125, 0.8482894897460938, 0.8830718994140625, 0.9178543090820312, 0.95263671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 1.0, 10.0, 8.0, 13.0, 15.0, 16.0, 17.0, 18.0, 26.0, 37.0, 32.0, 39.0, 33.0, 46.0, 40.0, 47.0, 42.0, 45.0, 41.0, 52.0, 46.0, 38.0, 29.0, 37.0, 33.0, 29.0, 32.0, 31.0, 19.0, 15.0, 21.0, 15.0, 14.0, 12.0, 10.0, 8.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.3134765625, -1.2726593017578125, -1.231842041015625, -1.1910247802734375, -1.15020751953125, -1.1093902587890625, -1.068572998046875, -1.0277557373046875, -0.9869384765625, -0.9461212158203125, -0.905303955078125, -0.8644866943359375, -0.82366943359375, -0.7828521728515625, -0.742034912109375, -0.7012176513671875, -0.660400390625, -0.6195831298828125, -0.578765869140625, -0.5379486083984375, -0.49713134765625, -0.4563140869140625, -0.415496826171875, -0.3746795654296875, -0.3338623046875, -0.2930450439453125, -0.252227783203125, -0.2114105224609375, -0.17059326171875, -0.1297760009765625, -0.088958740234375, -0.0481414794921875, -0.00732421875, 0.0334930419921875, 0.074310302734375, 0.1151275634765625, 0.15594482421875, 0.1967620849609375, 0.237579345703125, 0.2783966064453125, 0.3192138671875, 0.3600311279296875, 0.400848388671875, 0.4416656494140625, 0.48248291015625, 0.5233001708984375, 0.564117431640625, 0.6049346923828125, 0.645751953125, 0.6865692138671875, 0.727386474609375, 0.7682037353515625, 0.80902099609375, 0.8498382568359375, 0.890655517578125, 0.9314727783203125, 0.9722900390625, 1.0131072998046875, 1.053924560546875, 1.0947418212890625, 1.13555908203125, 1.1763763427734375, 1.217193603515625, 1.2580108642578125, 1.298828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 14.0, 20.0, 27.0, 48.0, 81.0, 160.0, 410.0, 1258.0, 7709.0, 188516.0, 826559.0, 20253.0, 2372.0, 631.0, 242.0, 95.0, 57.0, 34.0, 12.0, 6.0, 9.0, 8.0, 9.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.50921630859375, -1.4637451171875, -1.41827392578125, -1.372802734375, -1.32733154296875, -1.2818603515625, -1.23638916015625, -1.19091796875, -1.14544677734375, -1.0999755859375, -1.05450439453125, -1.009033203125, -0.96356201171875, -0.9180908203125, -0.87261962890625, -0.8271484375, -0.78167724609375, -0.7362060546875, -0.69073486328125, -0.645263671875, -0.59979248046875, -0.5543212890625, -0.50885009765625, -0.46337890625, -0.41790771484375, -0.3724365234375, -0.32696533203125, -0.281494140625, -0.23602294921875, -0.1905517578125, -0.14508056640625, -0.099609375, -0.05413818359375, -0.0086669921875, 0.03680419921875, 0.082275390625, 0.12774658203125, 0.1732177734375, 0.21868896484375, 0.26416015625, 0.30963134765625, 0.3551025390625, 0.40057373046875, 0.446044921875, 0.49151611328125, 0.5369873046875, 0.58245849609375, 0.6279296875, 0.67340087890625, 0.7188720703125, 0.76434326171875, 0.809814453125, 0.85528564453125, 0.9007568359375, 0.94622802734375, 0.99169921875, 1.03717041015625, 1.0826416015625, 1.12811279296875, 1.173583984375, 1.21905517578125, 1.2645263671875, 1.30999755859375, 1.35546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 11.0, 14.0, 21.0, 28.0, 79.0, 117.0, 186.0, 223.0, 156.0, 76.0, 36.0, 18.0, 16.0, 6.0, 9.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026226043701171875, -0.00025477074086666107, -0.0002472810447216034, -0.00023979134857654572, -0.00023230165243148804, -0.00022481195628643036, -0.00021732226014137268, -0.000209832563996315, -0.00020234286785125732, -0.00019485317170619965, -0.00018736347556114197, -0.0001798737794160843, -0.0001723840832710266, -0.00016489438712596893, -0.00015740469098091125, -0.00014991499483585358, -0.0001424252986907959, -0.00013493560254573822, -0.00012744590640068054, -0.00011995621025562286, -0.00011246651411056519, -0.00010497681796550751, -9.748712182044983e-05, -8.999742567539215e-05, -8.250772953033447e-05, -7.50180333852768e-05, -6.752833724021912e-05, -6.003864109516144e-05, -5.254894495010376e-05, -4.505924880504608e-05, -3.75695526599884e-05, -3.0079856514930725e-05, -2.2590160369873047e-05, -1.5100464224815369e-05, -7.6107680797576904e-06, -1.210719347000122e-07, 7.368624210357666e-06, 1.4858320355415344e-05, 2.2348016500473022e-05, 2.98377126455307e-05, 3.732740879058838e-05, 4.481710493564606e-05, 5.2306801080703735e-05, 5.9796497225761414e-05, 6.728619337081909e-05, 7.477588951587677e-05, 8.226558566093445e-05, 8.975528180599213e-05, 9.72449779510498e-05, 0.00010473467409610748, 0.00011222437024116516, 0.00011971406638622284, 0.00012720376253128052, 0.0001346934586763382, 0.00014218315482139587, 0.00014967285096645355, 0.00015716254711151123, 0.0001646522432565689, 0.0001721419394016266, 0.00017963163554668427, 0.00018712133169174194, 0.00019461102783679962, 0.0002021007239818573, 0.00020959042012691498, 0.00021708011627197266]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 6.0, 8.0, 25.0, 40.0, 65.0, 127.0, 280.0, 819.0, 4590.0, 146880.0, 880701.0, 12794.0, 1527.0, 362.0, 154.0, 77.0, 38.0, 25.0, 11.0, 6.0, 7.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9775390625, -1.921356201171875, -1.86517333984375, -1.808990478515625, -1.7528076171875, -1.696624755859375, -1.64044189453125, -1.584259033203125, -1.528076171875, -1.471893310546875, -1.41571044921875, -1.359527587890625, -1.3033447265625, -1.247161865234375, -1.19097900390625, -1.134796142578125, -1.07861328125, -1.022430419921875, -0.96624755859375, -0.910064697265625, -0.8538818359375, -0.797698974609375, -0.74151611328125, -0.685333251953125, -0.629150390625, -0.572967529296875, -0.51678466796875, -0.460601806640625, -0.4044189453125, -0.348236083984375, -0.29205322265625, -0.235870361328125, -0.1796875, -0.123504638671875, -0.06732177734375, -0.011138916015625, 0.0450439453125, 0.101226806640625, 0.15740966796875, 0.213592529296875, 0.269775390625, 0.325958251953125, 0.38214111328125, 0.438323974609375, 0.4945068359375, 0.550689697265625, 0.60687255859375, 0.663055419921875, 0.71923828125, 0.775421142578125, 0.83160400390625, 0.887786865234375, 0.9439697265625, 1.000152587890625, 1.05633544921875, 1.112518310546875, 1.168701171875, 1.224884033203125, 1.28106689453125, 1.337249755859375, 1.3934326171875, 1.449615478515625, 1.50579833984375, 1.561981201171875, 1.6181640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 14.0, 23.0, 35.0, 61.0, 118.0, 190.0, 218.0, 138.0, 77.0, 36.0, 19.0, 18.0, 11.0, 5.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.603515625, -1.5653915405273438, -1.5272674560546875, -1.4891433715820312, -1.451019287109375, -1.4128952026367188, -1.3747711181640625, -1.3366470336914062, -1.29852294921875, -1.2603988647460938, -1.2222747802734375, -1.1841506958007812, -1.146026611328125, -1.1079025268554688, -1.0697784423828125, -1.0316543579101562, -0.9935302734375, -0.9554061889648438, -0.9172821044921875, -0.8791580200195312, -0.841033935546875, -0.8029098510742188, -0.7647857666015625, -0.7266616821289062, -0.68853759765625, -0.6504135131835938, -0.6122894287109375, -0.5741653442382812, -0.536041259765625, -0.49791717529296875, -0.4597930908203125, -0.42166900634765625, -0.383544921875, -0.34542083740234375, -0.3072967529296875, -0.26917266845703125, -0.231048583984375, -0.19292449951171875, -0.1548004150390625, -0.11667633056640625, -0.07855224609375, -0.04042816162109375, -0.0023040771484375, 0.03582000732421875, 0.073944091796875, 0.11206817626953125, 0.1501922607421875, 0.18831634521484375, 0.2264404296875, 0.26456451416015625, 0.3026885986328125, 0.34081268310546875, 0.378936767578125, 0.41706085205078125, 0.4551849365234375, 0.49330902099609375, 0.53143310546875, 0.5695571899414062, 0.6076812744140625, 0.6458053588867188, 0.683929443359375, 0.7220535278320312, 0.7601776123046875, 0.7983016967773438, 0.83642578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 51.0, 290.0, 529.0, 121.0, 13.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.90468978881836, -49.825355529785156, -48.74602127075195, -47.66668701171875, -46.58735656738281, -45.50802230834961, -44.428688049316406, -43.3493537902832, -42.27001953125, -41.1906852722168, -40.111351013183594, -39.03201675415039, -37.95268249511719, -36.87335205078125, -35.79401779174805, -34.714683532714844, -33.63534927368164, -32.55601501464844, -31.476680755615234, -30.397348403930664, -29.31801414489746, -28.238679885864258, -27.159347534179688, -26.080013275146484, -25.00067901611328, -23.921344757080078, -22.842010498046875, -21.762678146362305, -20.6833438873291, -19.6040096282959, -18.524677276611328, -17.445343017578125, -16.366012573242188, -15.286678314208984, -14.207345008850098, -13.128011703491211, -12.048677444458008, -10.969343185424805, -9.890009880065918, -8.810676574707031, -7.731342315673828, -6.652008533477783, -5.572674751281738, -4.493340969085693, -3.4140071868896484, -2.3346734046936035, -1.2553396224975586, -0.17600584030151367, 0.9033279418945312, 1.9826617240905762, 3.061995506286621, 4.141329288482666, 5.220663070678711, 6.299996852874756, 7.379330635070801, 8.458663940429688, 9.53799819946289, 10.617332458496094, 11.69666576385498, 12.775999069213867, 13.85533332824707, 14.934667587280273, 16.013999938964844, 17.093334197998047, 18.17266845703125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 4.0, 9.0, 7.0, 7.0, 15.0, 19.0, 20.0, 23.0, 22.0, 21.0, 27.0, 31.0, 38.0, 41.0, 40.0, 47.0, 43.0, 44.0, 55.0, 48.0, 48.0, 32.0, 35.0, 44.0, 36.0, 25.0, 35.0, 29.0, 28.0, 21.0, 17.0, 15.0, 16.0, 20.0, 6.0, 4.0, 9.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.251477241516113, -7.036263942718506, -6.821050643920898, -6.605837345123291, -6.390624046325684, -6.175411224365234, -5.960197448730469, -5.7449846267700195, -5.529771327972412, -5.314558029174805, -5.099344730377197, -4.88413143157959, -4.668918132781982, -4.453704833984375, -4.238492012023926, -4.023278713226318, -3.808065176010132, -3.5928518772125244, -3.377638578414917, -3.1624255180358887, -2.9472122192382812, -2.731998920440674, -2.5167856216430664, -2.301572322845459, -2.0863590240478516, -1.8711457252502441, -1.6559325456619263, -1.4407192468643188, -1.225506067276001, -1.0102927684783936, -0.7950794696807861, -0.5798662900924683, -0.3646531105041504, -0.14943985641002655, 0.06577339768409729, 0.2809866666793823, 0.49619990587234497, 0.7114131450653076, 0.926626443862915, 1.141839623451233, 1.3570529222488403, 1.5722662210464478, 1.7874794006347656, 2.002692699432373, 2.2179059982299805, 2.433119297027588, 2.6483325958251953, 2.8635456562042236, 3.078758955001831, 3.2939722537994385, 3.509185552597046, 3.724398612976074, 3.9396119117736816, 4.154825210571289, 4.3700385093688965, 4.585251808166504, 4.800465106964111, 5.015678405761719, 5.230891704559326, 5.446105003356934, 5.661318302154541, 5.876531600952148, 6.091744422912598, 6.306957721710205, 6.5221710205078125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 9.0, 11.0, 17.0, 21.0, 23.0, 41.0, 50.0, 95.0, 106.0, 164.0, 296.0, 496.0, 951.0, 2008.0, 5371.0, 23045.0, 3914794.0, 223786.0, 15130.0, 4207.0, 1701.0, 814.0, 397.0, 263.0, 135.0, 92.0, 75.0, 52.0, 30.0, 23.0, 18.0, 16.0, 9.0, 6.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.2890625, -1.252105712890625, -1.21514892578125, -1.178192138671875, -1.1412353515625, -1.104278564453125, -1.06732177734375, -1.030364990234375, -0.993408203125, -0.956451416015625, -0.91949462890625, -0.882537841796875, -0.8455810546875, -0.808624267578125, -0.77166748046875, -0.734710693359375, -0.69775390625, -0.660797119140625, -0.62384033203125, -0.586883544921875, -0.5499267578125, -0.512969970703125, -0.47601318359375, -0.439056396484375, -0.402099609375, -0.365142822265625, -0.32818603515625, -0.291229248046875, -0.2542724609375, -0.217315673828125, -0.18035888671875, -0.143402099609375, -0.1064453125, -0.069488525390625, -0.03253173828125, 0.004425048828125, 0.0413818359375, 0.078338623046875, 0.11529541015625, 0.152252197265625, 0.189208984375, 0.226165771484375, 0.26312255859375, 0.300079345703125, 0.3370361328125, 0.373992919921875, 0.41094970703125, 0.447906494140625, 0.48486328125, 0.521820068359375, 0.55877685546875, 0.595733642578125, 0.6326904296875, 0.669647216796875, 0.70660400390625, 0.743560791015625, 0.780517578125, 0.817474365234375, 0.85443115234375, 0.891387939453125, 0.9283447265625, 0.965301513671875, 1.00225830078125, 1.039215087890625, 1.076171875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 4.0, 6.0, 5.0, 6.0, 7.0, 14.0, 18.0, 16.0, 17.0, 36.0, 45.0, 51.0, 47.0, 68.0, 61.0, 68.0, 66.0, 59.0, 70.0, 59.0, 58.0, 25.0, 41.0, 31.0, 22.0, 16.0, 14.0, 24.0, 15.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37744140625, -0.36418914794921875, -0.3509368896484375, -0.33768463134765625, -0.324432373046875, -0.31118011474609375, -0.2979278564453125, -0.28467559814453125, -0.27142333984375, -0.25817108154296875, -0.2449188232421875, -0.23166656494140625, -0.218414306640625, -0.20516204833984375, -0.1919097900390625, -0.17865753173828125, -0.1654052734375, -0.15215301513671875, -0.1389007568359375, -0.12564849853515625, -0.112396240234375, -0.09914398193359375, -0.0858917236328125, -0.07263946533203125, -0.05938720703125, -0.04613494873046875, -0.0328826904296875, -0.01963043212890625, -0.006378173828125, 0.00687408447265625, 0.0201263427734375, 0.03337860107421875, 0.046630859375, 0.05988311767578125, 0.0731353759765625, 0.08638763427734375, 0.099639892578125, 0.11289215087890625, 0.1261444091796875, 0.13939666748046875, 0.15264892578125, 0.16590118408203125, 0.1791534423828125, 0.19240570068359375, 0.205657958984375, 0.21891021728515625, 0.2321624755859375, 0.24541473388671875, 0.2586669921875, 0.27191925048828125, 0.2851715087890625, 0.29842376708984375, 0.311676025390625, 0.32492828369140625, 0.3381805419921875, 0.35143280029296875, 0.36468505859375, 0.37793731689453125, 0.3911895751953125, 0.40444183349609375, 0.417694091796875, 0.43094635009765625, 0.4441986083984375, 0.45745086669921875, 0.470703125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 11.0, 16.0, 15.0, 16.0, 22.0, 34.0, 36.0, 56.0, 86.0, 123.0, 195.0, 366.0, 693.0, 1773.0, 6449.0, 51682.0, 4096239.0, 28807.0, 4520.0, 1425.0, 638.0, 347.0, 231.0, 147.0, 98.0, 56.0, 50.0, 26.0, 29.0, 20.0, 15.0, 16.0, 14.0, 6.0, 9.0, 3.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.529296875, -2.461669921875, -2.39404296875, -2.326416015625, -2.2587890625, -2.191162109375, -2.12353515625, -2.055908203125, -1.98828125, -1.920654296875, -1.85302734375, -1.785400390625, -1.7177734375, -1.650146484375, -1.58251953125, -1.514892578125, -1.447265625, -1.379638671875, -1.31201171875, -1.244384765625, -1.1767578125, -1.109130859375, -1.04150390625, -0.973876953125, -0.90625, -0.838623046875, -0.77099609375, -0.703369140625, -0.6357421875, -0.568115234375, -0.50048828125, -0.432861328125, -0.365234375, -0.297607421875, -0.22998046875, -0.162353515625, -0.0947265625, -0.027099609375, 0.04052734375, 0.108154296875, 0.17578125, 0.243408203125, 0.31103515625, 0.378662109375, 0.4462890625, 0.513916015625, 0.58154296875, 0.649169921875, 0.716796875, 0.784423828125, 0.85205078125, 0.919677734375, 0.9873046875, 1.054931640625, 1.12255859375, 1.190185546875, 1.2578125, 1.325439453125, 1.39306640625, 1.460693359375, 1.5283203125, 1.595947265625, 1.66357421875, 1.731201171875, 1.798828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 13.0, 11.0, 24.0, 66.0, 364.0, 3479.0, 66.0, 21.0, 16.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2083740234375, -0.1925525665283203, -0.17673110961914062, -0.16090965270996094, -0.14508819580078125, -0.12926673889160156, -0.11344528198242188, -0.09762382507324219, -0.0818023681640625, -0.06598091125488281, -0.050159454345703125, -0.03433799743652344, -0.01851654052734375, -0.0026950836181640625, 0.013126373291015625, 0.028947830200195312, 0.044769287109375, 0.06059074401855469, 0.07641220092773438, 0.09223365783691406, 0.10805511474609375, 0.12387657165527344, 0.13969802856445312, 0.1555194854736328, 0.1713409423828125, 0.1871623992919922, 0.20298385620117188, 0.21880531311035156, 0.23462677001953125, 0.25044822692871094, 0.2662696838378906, 0.2820911407470703, 0.29791259765625, 0.3137340545654297, 0.3295555114746094, 0.34537696838378906, 0.36119842529296875, 0.37701988220214844, 0.3928413391113281, 0.4086627960205078, 0.4244842529296875, 0.4403057098388672, 0.4561271667480469, 0.47194862365722656, 0.48777008056640625, 0.5035915374755859, 0.5194129943847656, 0.5352344512939453, 0.551055908203125, 0.5668773651123047, 0.5826988220214844, 0.5985202789306641, 0.6143417358398438, 0.6301631927490234, 0.6459846496582031, 0.6618061065673828, 0.6776275634765625, 0.6934490203857422, 0.7092704772949219, 0.7250919342041016, 0.7409133911132812, 0.7567348480224609, 0.7725563049316406, 0.7883777618408203, 0.80419921875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 13.0, 43.0, 159.0, 326.0, 270.0, 134.0, 34.0, 18.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7480933666229248, -1.646098017692566, -1.544102668762207, -1.4421074390411377, -1.3401119709014893, -1.23811674118042, -1.136121392250061, -1.0341260433197021, -0.9321306943893433, -0.8301353454589844, -0.7281399965286255, -0.6261447072029114, -0.5241493582725525, -0.4221540093421936, -0.3201587200164795, -0.2181633710861206, -0.11616802215576172, -0.014172688126564026, 0.08782264590263367, 0.18981796503067017, 0.29181331396102905, 0.39380866289138794, 0.49580395221710205, 0.5977993011474609, 0.6997946500778198, 0.8017899990081787, 0.9037853479385376, 1.0057806968688965, 1.1077759265899658, 1.2097713947296143, 1.3117666244506836, 1.4137619733810425, 1.5157570838928223, 1.6177524328231812, 1.71974778175354, 1.8217430114746094, 1.9237384796142578, 2.025733709335327, 2.1277289390563965, 2.229724407196045, 2.3317198753356934, 2.4337151050567627, 2.535710573196411, 2.6377058029174805, 2.739701271057129, 2.8416965007781982, 2.9436917304992676, 3.045687198638916, 3.1476824283599854, 3.2496776580810547, 3.351673126220703, 3.4536683559417725, 3.555663824081421, 3.6576590538024902, 3.7596545219421387, 3.861649751663208, 3.9636449813842773, 4.065640449523926, 4.167635440826416, 4.2696309089660645, 4.371626377105713, 4.473621845245361, 4.575616836547852, 4.6776123046875, 4.779607772827148]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 10.0, 6.0, 17.0, 18.0, 15.0, 22.0, 22.0, 21.0, 35.0, 38.0, 45.0, 46.0, 48.0, 56.0, 62.0, 44.0, 61.0, 61.0, 42.0, 42.0, 51.0, 44.0, 30.0, 25.0, 31.0, 29.0, 19.0, 19.0, 9.0, 7.0, 9.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.3548306226730347, -1.3214133977890015, -1.2879961729049683, -1.254578948020935, -1.2211617231369019, -1.1877444982528687, -1.1543272733688354, -1.1209100484848022, -1.087492823600769, -1.0540755987167358, -1.0206583738327026, -0.9872411489486694, -0.9538239240646362, -0.920406699180603, -0.8869894742965698, -0.8535722494125366, -0.8201550245285034, -0.7867377996444702, -0.753320574760437, -0.7199033498764038, -0.6864861249923706, -0.6530689001083374, -0.6196516752243042, -0.586234450340271, -0.5528172254562378, -0.5194000005722046, -0.4859827756881714, -0.4525655508041382, -0.419148325920105, -0.3857311010360718, -0.3523138761520386, -0.31889665126800537, -0.28547942638397217, -0.25206220149993896, -0.21864497661590576, -0.18522775173187256, -0.15181052684783936, -0.11839330196380615, -0.08497607707977295, -0.051558852195739746, -0.018141627311706543, 0.01527559757232666, 0.04869282245635986, 0.08211004734039307, 0.11552727222442627, 0.14894449710845947, 0.18236172199249268, 0.21577894687652588, 0.24919617176055908, 0.2826133966445923, 0.3160306215286255, 0.3494478464126587, 0.3828650712966919, 0.4162822961807251, 0.4496995210647583, 0.4831167459487915, 0.5165339708328247, 0.5499511957168579, 0.5833684206008911, 0.6167856454849243, 0.6502028703689575, 0.6836200952529907, 0.7170373201370239, 0.7504545450210571, 0.7838717699050903]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 17.0, 16.0, 23.0, 34.0, 50.0, 73.0, 132.0, 238.0, 582.0, 1372.0, 3962.0, 14039.0, 55747.0, 236986.0, 479460.0, 193560.0, 45185.0, 11593.0, 3305.0, 1154.0, 498.0, 208.0, 107.0, 74.0, 48.0, 34.0, 19.0, 17.0, 11.0, 5.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3330078125, -1.295379638671875, -1.25775146484375, -1.220123291015625, -1.1824951171875, -1.144866943359375, -1.10723876953125, -1.069610595703125, -1.031982421875, -0.994354248046875, -0.95672607421875, -0.919097900390625, -0.8814697265625, -0.843841552734375, -0.80621337890625, -0.768585205078125, -0.73095703125, -0.693328857421875, -0.65570068359375, -0.618072509765625, -0.5804443359375, -0.542816162109375, -0.50518798828125, -0.467559814453125, -0.429931640625, -0.392303466796875, -0.35467529296875, -0.317047119140625, -0.2794189453125, -0.241790771484375, -0.20416259765625, -0.166534423828125, -0.12890625, -0.091278076171875, -0.05364990234375, -0.016021728515625, 0.0216064453125, 0.059234619140625, 0.09686279296875, 0.134490966796875, 0.172119140625, 0.209747314453125, 0.24737548828125, 0.285003662109375, 0.3226318359375, 0.360260009765625, 0.39788818359375, 0.435516357421875, 0.47314453125, 0.510772705078125, 0.54840087890625, 0.586029052734375, 0.6236572265625, 0.661285400390625, 0.69891357421875, 0.736541748046875, 0.774169921875, 0.811798095703125, 0.84942626953125, 0.887054443359375, 0.9246826171875, 0.962310791015625, 0.99993896484375, 1.037567138671875, 1.0751953125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 17.0, 16.0, 16.0, 15.0, 18.0, 41.0, 31.0, 51.0, 60.0, 74.0, 59.0, 75.0, 71.0, 61.0, 49.0, 60.0, 73.0, 44.0, 37.0, 29.0, 24.0, 15.0, 24.0, 12.0, 7.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56884765625, -0.551727294921875, -0.53460693359375, -0.517486572265625, -0.5003662109375, -0.483245849609375, -0.46612548828125, -0.449005126953125, -0.431884765625, -0.414764404296875, -0.39764404296875, -0.380523681640625, -0.3634033203125, -0.346282958984375, -0.32916259765625, -0.312042236328125, -0.294921875, -0.277801513671875, -0.26068115234375, -0.243560791015625, -0.2264404296875, -0.209320068359375, -0.19219970703125, -0.175079345703125, -0.157958984375, -0.140838623046875, -0.12371826171875, -0.106597900390625, -0.0894775390625, -0.072357177734375, -0.05523681640625, -0.038116455078125, -0.02099609375, -0.003875732421875, 0.01324462890625, 0.030364990234375, 0.0474853515625, 0.064605712890625, 0.08172607421875, 0.098846435546875, 0.115966796875, 0.133087158203125, 0.15020751953125, 0.167327880859375, 0.1844482421875, 0.201568603515625, 0.21868896484375, 0.235809326171875, 0.2529296875, 0.270050048828125, 0.28717041015625, 0.304290771484375, 0.3214111328125, 0.338531494140625, 0.35565185546875, 0.372772216796875, 0.389892578125, 0.407012939453125, 0.42413330078125, 0.441253662109375, 0.4583740234375, 0.475494384765625, 0.49261474609375, 0.509735107421875, 0.52685546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 5.0, 14.0, 9.0, 19.0, 23.0, 28.0, 41.0, 50.0, 66.0, 104.0, 150.0, 211.0, 302.0, 467.0, 852.0, 1734.0, 4388.0, 12889.0, 53707.0, 310449.0, 532149.0, 98714.0, 20817.0, 6127.0, 2352.0, 1071.0, 582.0, 349.0, 242.0, 151.0, 130.0, 90.0, 55.0, 52.0, 35.0, 33.0, 21.0, 21.0, 5.0, 11.0, 11.0, 10.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5654296875, -1.5135650634765625, -1.461700439453125, -1.4098358154296875, -1.35797119140625, -1.3061065673828125, -1.254241943359375, -1.2023773193359375, -1.1505126953125, -1.0986480712890625, -1.046783447265625, -0.9949188232421875, -0.94305419921875, -0.8911895751953125, -0.839324951171875, -0.7874603271484375, -0.735595703125, -0.6837310791015625, -0.631866455078125, -0.5800018310546875, -0.52813720703125, -0.4762725830078125, -0.424407958984375, -0.3725433349609375, -0.3206787109375, -0.2688140869140625, -0.216949462890625, -0.1650848388671875, -0.11322021484375, -0.0613555908203125, -0.009490966796875, 0.0423736572265625, 0.09423828125, 0.1461029052734375, 0.197967529296875, 0.2498321533203125, 0.30169677734375, 0.3535614013671875, 0.405426025390625, 0.4572906494140625, 0.5091552734375, 0.5610198974609375, 0.612884521484375, 0.6647491455078125, 0.71661376953125, 0.7684783935546875, 0.820343017578125, 0.8722076416015625, 0.924072265625, 0.9759368896484375, 1.027801513671875, 1.0796661376953125, 1.13153076171875, 1.1833953857421875, 1.235260009765625, 1.2871246337890625, 1.3389892578125, 1.3908538818359375, 1.442718505859375, 1.4945831298828125, 1.54644775390625, 1.5983123779296875, 1.650177001953125, 1.7020416259765625, 1.75390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 7.0, 14.0, 13.0, 12.0, 13.0, 30.0, 27.0, 23.0, 39.0, 58.0, 42.0, 63.0, 54.0, 58.0, 58.0, 50.0, 68.0, 54.0, 35.0, 39.0, 42.0, 47.0, 30.0, 23.0, 20.0, 15.0, 9.0, 7.0, 5.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.80078125, -2.70947265625, -2.6181640625, -2.52685546875, -2.435546875, -2.34423828125, -2.2529296875, -2.16162109375, -2.0703125, -1.97900390625, -1.8876953125, -1.79638671875, -1.705078125, -1.61376953125, -1.5224609375, -1.43115234375, -1.33984375, -1.24853515625, -1.1572265625, -1.06591796875, -0.974609375, -0.88330078125, -0.7919921875, -0.70068359375, -0.609375, -0.51806640625, -0.4267578125, -0.33544921875, -0.244140625, -0.15283203125, -0.0615234375, 0.02978515625, 0.12109375, 0.21240234375, 0.3037109375, 0.39501953125, 0.486328125, 0.57763671875, 0.6689453125, 0.76025390625, 0.8515625, 0.94287109375, 1.0341796875, 1.12548828125, 1.216796875, 1.30810546875, 1.3994140625, 1.49072265625, 1.58203125, 1.67333984375, 1.7646484375, 1.85595703125, 1.947265625, 2.03857421875, 2.1298828125, 2.22119140625, 2.3125, 2.40380859375, 2.4951171875, 2.58642578125, 2.677734375, 2.76904296875, 2.8603515625, 2.95166015625, 3.04296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 6.0, 12.0, 49.0, 112.0, 341.0, 1871.0, 389321.0, 653964.0, 2332.0, 341.0, 111.0, 45.0, 16.0, 8.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.14691162109375, -3.0516357421875, -2.95635986328125, -2.861083984375, -2.76580810546875, -2.6705322265625, -2.57525634765625, -2.47998046875, -2.38470458984375, -2.2894287109375, -2.19415283203125, -2.098876953125, -2.00360107421875, -1.9083251953125, -1.81304931640625, -1.7177734375, -1.62249755859375, -1.5272216796875, -1.43194580078125, -1.336669921875, -1.24139404296875, -1.1461181640625, -1.05084228515625, -0.95556640625, -0.86029052734375, -0.7650146484375, -0.66973876953125, -0.574462890625, -0.47918701171875, -0.3839111328125, -0.28863525390625, -0.193359375, -0.09808349609375, -0.0028076171875, 0.09246826171875, 0.187744140625, 0.28302001953125, 0.3782958984375, 0.47357177734375, 0.56884765625, 0.66412353515625, 0.7593994140625, 0.85467529296875, 0.949951171875, 1.04522705078125, 1.1405029296875, 1.23577880859375, 1.3310546875, 1.42633056640625, 1.5216064453125, 1.61688232421875, 1.712158203125, 1.80743408203125, 1.9027099609375, 1.99798583984375, 2.09326171875, 2.18853759765625, 2.2838134765625, 2.37908935546875, 2.474365234375, 2.56964111328125, 2.6649169921875, 2.76019287109375, 2.85546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 17.0, 11.0, 16.0, 22.0, 19.0, 33.0, 38.0, 52.0, 57.0, 71.0, 74.0, 90.0, 88.0, 70.0, 66.0, 66.0, 35.0, 40.0, 19.0, 25.0, 19.0, 13.0, 12.0, 10.0, 5.0, 6.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00010478496551513672, -0.00010221172124147415, -9.963847696781158e-05, -9.706523269414902e-05, -9.449198842048645e-05, -9.191874414682388e-05, -8.934549987316132e-05, -8.677225559949875e-05, -8.419901132583618e-05, -8.162576705217361e-05, -7.905252277851105e-05, -7.647927850484848e-05, -7.390603423118591e-05, -7.133278995752335e-05, -6.875954568386078e-05, -6.618630141019821e-05, -6.361305713653564e-05, -6.103981286287308e-05, -5.846656858921051e-05, -5.589332431554794e-05, -5.3320080041885376e-05, -5.074683576822281e-05, -4.817359149456024e-05, -4.5600347220897675e-05, -4.302710294723511e-05, -4.045385867357254e-05, -3.788061439990997e-05, -3.5307370126247406e-05, -3.273412585258484e-05, -3.0160881578922272e-05, -2.7587637305259705e-05, -2.5014393031597137e-05, -2.244114875793457e-05, -1.9867904484272003e-05, -1.7294660210609436e-05, -1.4721415936946869e-05, -1.2148171663284302e-05, -9.574927389621735e-06, -7.0016831159591675e-06, -4.4284388422966e-06, -1.8551945686340332e-06, 7.180497050285339e-07, 3.291293978691101e-06, 5.864538252353668e-06, 8.437782526016235e-06, 1.1011026799678802e-05, 1.358427107334137e-05, 1.6157515347003937e-05, 1.8730759620666504e-05, 2.130400389432907e-05, 2.3877248167991638e-05, 2.6450492441654205e-05, 2.9023736715316772e-05, 3.159698098897934e-05, 3.417022526264191e-05, 3.6743469536304474e-05, 3.931671380996704e-05, 4.188995808362961e-05, 4.4463202357292175e-05, 4.703644663095474e-05, 4.960969090461731e-05, 5.218293517827988e-05, 5.4756179451942444e-05, 5.732942372560501e-05, 5.990266799926758e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 12.0, 11.0, 9.0, 16.0, 44.0, 70.0, 130.0, 348.0, 748.0, 2549.0, 25461.0, 936338.0, 77229.0, 3835.0, 1005.0, 387.0, 155.0, 75.0, 45.0, 25.0, 14.0, 8.0, 10.0, 8.0, 7.0, 4.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.087677001953125, -1.04351806640625, -0.999359130859375, -0.9552001953125, -0.911041259765625, -0.86688232421875, -0.822723388671875, -0.778564453125, -0.734405517578125, -0.69024658203125, -0.646087646484375, -0.6019287109375, -0.557769775390625, -0.51361083984375, -0.469451904296875, -0.42529296875, -0.381134033203125, -0.33697509765625, -0.292816162109375, -0.2486572265625, -0.204498291015625, -0.16033935546875, -0.116180419921875, -0.072021484375, -0.027862548828125, 0.01629638671875, 0.060455322265625, 0.1046142578125, 0.148773193359375, 0.19293212890625, 0.237091064453125, 0.28125, 0.325408935546875, 0.36956787109375, 0.413726806640625, 0.4578857421875, 0.502044677734375, 0.54620361328125, 0.590362548828125, 0.634521484375, 0.678680419921875, 0.72283935546875, 0.766998291015625, 0.8111572265625, 0.855316162109375, 0.89947509765625, 0.943634033203125, 0.98779296875, 1.031951904296875, 1.07611083984375, 1.120269775390625, 1.1644287109375, 1.208587646484375, 1.25274658203125, 1.296905517578125, 1.341064453125, 1.385223388671875, 1.42938232421875, 1.473541259765625, 1.5177001953125, 1.561859130859375, 1.60601806640625, 1.650177001953125, 1.6943359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 9.0, 19.0, 24.0, 71.0, 90.0, 145.0, 176.0, 181.0, 118.0, 70.0, 25.0, 31.0, 11.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.07421875, -1.0306243896484375, -0.987030029296875, -0.9434356689453125, -0.89984130859375, -0.8562469482421875, -0.812652587890625, -0.7690582275390625, -0.7254638671875, -0.6818695068359375, -0.638275146484375, -0.5946807861328125, -0.55108642578125, -0.5074920654296875, -0.463897705078125, -0.4203033447265625, -0.376708984375, -0.3331146240234375, -0.289520263671875, -0.2459259033203125, -0.20233154296875, -0.1587371826171875, -0.115142822265625, -0.0715484619140625, -0.0279541015625, 0.0156402587890625, 0.059234619140625, 0.1028289794921875, 0.14642333984375, 0.1900177001953125, 0.233612060546875, 0.2772064208984375, 0.32080078125, 0.3643951416015625, 0.407989501953125, 0.4515838623046875, 0.49517822265625, 0.5387725830078125, 0.582366943359375, 0.6259613037109375, 0.6695556640625, 0.7131500244140625, 0.756744384765625, 0.8003387451171875, 0.84393310546875, 0.8875274658203125, 0.931121826171875, 0.9747161865234375, 1.018310546875, 1.0619049072265625, 1.105499267578125, 1.1490936279296875, 1.19268798828125, 1.2362823486328125, 1.279876708984375, 1.3234710693359375, 1.3670654296875, 1.4106597900390625, 1.454254150390625, 1.4978485107421875, 1.54144287109375, 1.5850372314453125, 1.628631591796875, 1.6722259521484375, 1.7158203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 25.0, 58.0, 196.0, 285.0, 272.0, 104.0, 40.0, 14.0, 9.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.416728973388672, -15.627541542053223, -14.83835506439209, -14.04916763305664, -13.259981155395508, -12.470793724060059, -11.68160629272461, -10.892419815063477, -10.103232383728027, -9.314044952392578, -8.524858474731445, -7.735671043395996, -6.946484088897705, -6.157297134399414, -5.368109703063965, -4.578922748565674, -3.789735794067383, -3.000548839569092, -2.2113616466522217, -1.4221744537353516, -0.6329874992370605, 0.15619945526123047, 0.9453868865966797, 1.7345738410949707, 2.5237607955932617, 3.3129477500915527, 4.102134704589844, 4.891322135925293, 5.680509090423584, 6.469696044921875, 7.258883476257324, 8.048070907592773, 8.837257385253906, 9.626444816589355, 10.415631294250488, 11.204818725585938, 11.99400520324707, 12.78319263458252, 13.572380065917969, 14.361566543579102, 15.15075397491455, 15.93994140625, 16.729127883911133, 17.518314361572266, 18.30750274658203, 19.096689224243164, 19.885875701904297, 20.675064086914062, 21.464250564575195, 22.253437042236328, 23.042625427246094, 23.831811904907227, 24.62099838256836, 25.410186767578125, 26.199373245239258, 26.98855972290039, 27.777748107910156, 28.56693458557129, 29.356122970581055, 30.145309448242188, 30.93449592590332, 31.723682403564453, 32.51287078857422, 33.302059173583984, 34.091243743896484]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 5.0, 5.0, 7.0, 6.0, 8.0, 9.0, 11.0, 14.0, 14.0, 13.0, 21.0, 23.0, 22.0, 23.0, 39.0, 42.0, 37.0, 44.0, 49.0, 49.0, 36.0, 42.0, 38.0, 42.0, 49.0, 35.0, 37.0, 38.0, 33.0, 21.0, 22.0, 26.0, 20.0, 15.0, 17.0, 9.0, 12.0, 14.0, 6.0, 6.0, 10.0, 9.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-9.822504043579102, -9.513459205627441, -9.204414367675781, -8.895368576049805, -8.586323738098145, -8.277278900146484, -7.968234062194824, -7.659189224243164, -7.350143909454346, -7.0410990715026855, -6.732053756713867, -6.423008918762207, -6.113964080810547, -5.8049187660217285, -5.495873928070068, -5.18682861328125, -4.87778377532959, -4.56873893737793, -4.259693622589111, -3.950648784637451, -3.641603708267212, -3.3325586318969727, -3.0235137939453125, -2.7144687175750732, -2.405423641204834, -2.0963785648345947, -1.787333607673645, -1.4782886505126953, -1.169243574142456, -0.8601984977722168, -0.5511535406112671, -0.24210858345031738, 0.06693649291992188, 0.37598150968551636, 0.6850265264511108, 0.9940715432167053, 1.3031165599822998, 1.612161636352539, 1.9212065935134888, 2.2302515506744385, 2.5392966270446777, 2.848341703414917, 3.1573867797851562, 3.4664316177368164, 3.7754766941070557, 4.084521770477295, 4.393566608428955, 4.702611923217773, 5.011656761169434, 5.320701599121094, 5.629746913909912, 5.938791751861572, 6.247837066650391, 6.556881904602051, 6.865926742553711, 7.174971580505371, 7.4840168952941895, 7.79306173324585, 8.102107048034668, 8.411151885986328, 8.720196723937988, 9.029241561889648, 9.338287353515625, 9.647332191467285, 9.956377029418945]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 2.0, 4.0, 15.0, 16.0, 37.0, 51.0, 82.0, 143.0, 303.0, 682.0, 1938.0, 7495.0, 56502.0, 4066841.0, 49790.0, 7100.0, 1969.0, 641.0, 318.0, 147.0, 74.0, 46.0, 25.0, 23.0, 17.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.00390625, -0.9571685791015625, -0.910430908203125, -0.8636932373046875, -0.81695556640625, -0.7702178955078125, -0.723480224609375, -0.6767425537109375, -0.6300048828125, -0.5832672119140625, -0.536529541015625, -0.4897918701171875, -0.44305419921875, -0.3963165283203125, -0.349578857421875, -0.3028411865234375, -0.256103515625, -0.2093658447265625, -0.162628173828125, -0.1158905029296875, -0.06915283203125, -0.0224151611328125, 0.024322509765625, 0.0710601806640625, 0.1177978515625, 0.1645355224609375, 0.211273193359375, 0.2580108642578125, 0.30474853515625, 0.3514862060546875, 0.398223876953125, 0.4449615478515625, 0.49169921875, 0.5384368896484375, 0.585174560546875, 0.6319122314453125, 0.67864990234375, 0.7253875732421875, 0.772125244140625, 0.8188629150390625, 0.8656005859375, 0.9123382568359375, 0.959075927734375, 1.0058135986328125, 1.05255126953125, 1.0992889404296875, 1.146026611328125, 1.1927642822265625, 1.239501953125, 1.2862396240234375, 1.332977294921875, 1.3797149658203125, 1.42645263671875, 1.4731903076171875, 1.519927978515625, 1.5666656494140625, 1.6134033203125, 1.6601409912109375, 1.706878662109375, 1.7536163330078125, 1.80035400390625, 1.8470916748046875, 1.893829345703125, 1.9405670166015625, 1.9873046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 3.0, 3.0, 6.0, 4.0, 16.0, 15.0, 13.0, 19.0, 26.0, 27.0, 43.0, 52.0, 55.0, 55.0, 75.0, 74.0, 75.0, 74.0, 55.0, 47.0, 49.0, 37.0, 37.0, 28.0, 24.0, 21.0, 18.0, 14.0, 5.0, 5.0, 6.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5517578125, -0.5328216552734375, -0.513885498046875, -0.4949493408203125, -0.47601318359375, -0.4570770263671875, -0.438140869140625, -0.4192047119140625, -0.4002685546875, -0.3813323974609375, -0.362396240234375, -0.3434600830078125, -0.32452392578125, -0.3055877685546875, -0.286651611328125, -0.2677154541015625, -0.248779296875, -0.2298431396484375, -0.210906982421875, -0.1919708251953125, -0.17303466796875, -0.1540985107421875, -0.135162353515625, -0.1162261962890625, -0.0972900390625, -0.0783538818359375, -0.059417724609375, -0.0404815673828125, -0.02154541015625, -0.0026092529296875, 0.016326904296875, 0.0352630615234375, 0.05419921875, 0.0731353759765625, 0.092071533203125, 0.1110076904296875, 0.12994384765625, 0.1488800048828125, 0.167816162109375, 0.1867523193359375, 0.2056884765625, 0.2246246337890625, 0.243560791015625, 0.2624969482421875, 0.28143310546875, 0.3003692626953125, 0.319305419921875, 0.3382415771484375, 0.357177734375, 0.3761138916015625, 0.395050048828125, 0.4139862060546875, 0.43292236328125, 0.4518585205078125, 0.470794677734375, 0.4897308349609375, 0.5086669921875, 0.5276031494140625, 0.546539306640625, 0.5654754638671875, 0.58441162109375, 0.6033477783203125, 0.622283935546875, 0.6412200927734375, 0.66015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 6.0, 10.0, 16.0, 12.0, 13.0, 23.0, 31.0, 37.0, 39.0, 46.0, 49.0, 92.0, 124.0, 274.0, 870.0, 3410.0, 23026.0, 4082474.0, 74914.0, 6374.0, 1405.0, 398.0, 173.0, 114.0, 71.0, 53.0, 50.0, 48.0, 37.0, 21.0, 15.0, 11.0, 4.0, 11.0, 5.0, 11.0, 1.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.087890625, -2.998870849609375, -2.90985107421875, -2.820831298828125, -2.7318115234375, -2.642791748046875, -2.55377197265625, -2.464752197265625, -2.375732421875, -2.286712646484375, -2.19769287109375, -2.108673095703125, -2.0196533203125, -1.930633544921875, -1.84161376953125, -1.752593994140625, -1.66357421875, -1.574554443359375, -1.48553466796875, -1.396514892578125, -1.3074951171875, -1.218475341796875, -1.12945556640625, -1.040435791015625, -0.951416015625, -0.862396240234375, -0.77337646484375, -0.684356689453125, -0.5953369140625, -0.506317138671875, -0.41729736328125, -0.328277587890625, -0.2392578125, -0.150238037109375, -0.06121826171875, 0.027801513671875, 0.1168212890625, 0.205841064453125, 0.29486083984375, 0.383880615234375, 0.472900390625, 0.561920166015625, 0.65093994140625, 0.739959716796875, 0.8289794921875, 0.917999267578125, 1.00701904296875, 1.096038818359375, 1.18505859375, 1.274078369140625, 1.36309814453125, 1.452117919921875, 1.5411376953125, 1.630157470703125, 1.71917724609375, 1.808197021484375, 1.897216796875, 1.986236572265625, 2.07525634765625, 2.164276123046875, 2.2532958984375, 2.342315673828125, 2.43133544921875, 2.520355224609375, 2.609375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 11.0, 22.0, 49.0, 159.0, 3502.0, 203.0, 57.0, 28.0, 17.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.239013671875, -0.21838760375976562, -0.19776153564453125, -0.17713546752929688, -0.1565093994140625, -0.13588333129882812, -0.11525726318359375, -0.09463119506835938, -0.074005126953125, -0.053379058837890625, -0.03275299072265625, -0.012126922607421875, 0.0084991455078125, 0.029125213623046875, 0.04975128173828125, 0.07037734985351562, 0.09100341796875, 0.11162948608398438, 0.13225555419921875, 0.15288162231445312, 0.1735076904296875, 0.19413375854492188, 0.21475982666015625, 0.23538589477539062, 0.256011962890625, 0.2766380310058594, 0.29726409912109375, 0.3178901672363281, 0.3385162353515625, 0.3591423034667969, 0.37976837158203125, 0.4003944396972656, 0.4210205078125, 0.4416465759277344, 0.46227264404296875, 0.4828987121582031, 0.5035247802734375, 0.5241508483886719, 0.5447769165039062, 0.5654029846191406, 0.586029052734375, 0.6066551208496094, 0.6272811889648438, 0.6479072570800781, 0.6685333251953125, 0.6891593933105469, 0.7097854614257812, 0.7304115295410156, 0.75103759765625, 0.7716636657714844, 0.7922897338867188, 0.8129158020019531, 0.8335418701171875, 0.8541679382324219, 0.8747940063476562, 0.8954200744628906, 0.916046142578125, 0.9366722106933594, 0.9572982788085938, 0.9779243469238281, 0.9985504150390625, 1.0191764831542969, 1.0398025512695312, 1.0604286193847656, 1.0810546875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 12.0, 19.0, 26.0, 91.0, 123.0, 186.0, 172.0, 151.0, 72.0, 48.0, 46.0, 15.0, 14.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.157376766204834, -2.0742225646972656, -1.9910684823989868, -1.907914400100708, -1.8247601985931396, -1.7416061162948608, -1.658452033996582, -1.5752978324890137, -1.4921437501907349, -1.408989667892456, -1.3258354663848877, -1.2426813840866089, -1.15952730178833, -1.0763731002807617, -0.9932190179824829, -0.9100648760795593, -0.8269107341766357, -0.7437565922737122, -0.6606024503707886, -0.5774483680725098, -0.4942942261695862, -0.4111400842666626, -0.3279859721660614, -0.2448318600654602, -0.16167771816253662, -0.07852359116077423, 0.004630535840988159, 0.08778466284275055, 0.17093878984451294, 0.2540929317474365, 0.3372470438480377, 0.4204011559486389, 0.5035550594329834, 0.586709201335907, 0.6698633432388306, 0.7530174255371094, 0.836171567440033, 0.9193257093429565, 1.0024797916412354, 1.0856339931488037, 1.1687880754470825, 1.2519421577453613, 1.3350963592529297, 1.4182504415512085, 1.5014045238494873, 1.5845587253570557, 1.6677128076553345, 1.7508668899536133, 1.8340210914611816, 1.9171751737594604, 2.0003292560577393, 2.0834834575653076, 2.166637659072876, 2.2497916221618652, 2.3329458236694336, 2.416100025177002, 2.4992542266845703, 2.5824084281921387, 2.665562391281128, 2.7487165927886963, 2.8318707942962646, 2.915024757385254, 2.9981789588928223, 3.0813331604003906, 3.16448712348938]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 9.0, 4.0, 14.0, 11.0, 10.0, 21.0, 23.0, 19.0, 11.0, 12.0, 22.0, 26.0, 24.0, 32.0, 37.0, 40.0, 31.0, 38.0, 42.0, 39.0, 45.0, 44.0, 31.0, 37.0, 36.0, 41.0, 39.0, 45.0, 19.0, 26.0, 31.0, 19.0, 19.0, 22.0, 16.0, 9.0, 10.0, 8.0, 8.0, 6.0, 2.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0084989070892334, -0.9751836657524109, -0.9418684244155884, -0.9085532426834106, -0.8752380013465881, -0.8419227600097656, -0.8086075782775879, -0.7752923369407654, -0.7419770956039429, -0.7086618542671204, -0.6753466129302979, -0.6420314311981201, -0.6087161898612976, -0.5754009485244751, -0.5420857667922974, -0.5087705254554749, -0.47545528411865234, -0.44214004278182983, -0.4088248312473297, -0.3755096197128296, -0.3421943783760071, -0.30887913703918457, -0.27556392550468445, -0.24224869906902313, -0.20893347263336182, -0.1756182461977005, -0.14230301976203918, -0.10898779332637787, -0.07567256689071655, -0.04235734045505524, -0.009042114019393921, 0.024273112416267395, 0.05758833885192871, 0.09090356528759003, 0.12421879172325134, 0.15753401815891266, 0.19084924459457397, 0.2241644710302353, 0.2574796974658966, 0.29079490900039673, 0.32411015033721924, 0.35742539167404175, 0.39074060320854187, 0.424055814743042, 0.4573710560798645, 0.490686297416687, 0.5240014791488647, 0.5573167204856873, 0.5906319618225098, 0.6239472031593323, 0.6572624444961548, 0.6905776262283325, 0.723892867565155, 0.7572081089019775, 0.7905232906341553, 0.8238385319709778, 0.8571537733078003, 0.8904690146446228, 0.9237842559814453, 0.957099437713623, 0.9904146790504456, 1.023729920387268, 1.0570451021194458, 1.090360403060913, 1.1236755847930908]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 4.0, 6.0, 12.0, 16.0, 25.0, 33.0, 46.0, 64.0, 84.0, 144.0, 241.0, 439.0, 783.0, 1604.0, 3273.0, 7951.0, 20609.0, 57729.0, 171547.0, 374991.0, 263556.0, 92403.0, 31746.0, 11881.0, 4837.0, 2084.0, 1076.0, 502.0, 330.0, 166.0, 133.0, 76.0, 58.0, 21.0, 25.0, 15.0, 14.0, 8.0, 8.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97998046875, -0.9490814208984375, -0.918182373046875, -0.8872833251953125, -0.85638427734375, -0.8254852294921875, -0.794586181640625, -0.7636871337890625, -0.7327880859375, -0.7018890380859375, -0.670989990234375, -0.6400909423828125, -0.60919189453125, -0.5782928466796875, -0.547393798828125, -0.5164947509765625, -0.485595703125, -0.4546966552734375, -0.423797607421875, -0.3928985595703125, -0.36199951171875, -0.3311004638671875, -0.300201416015625, -0.2693023681640625, -0.2384033203125, -0.2075042724609375, -0.176605224609375, -0.1457061767578125, -0.11480712890625, -0.0839080810546875, -0.053009033203125, -0.0221099853515625, 0.0087890625, 0.0396881103515625, 0.070587158203125, 0.1014862060546875, 0.13238525390625, 0.1632843017578125, 0.194183349609375, 0.2250823974609375, 0.2559814453125, 0.2868804931640625, 0.317779541015625, 0.3486785888671875, 0.37957763671875, 0.4104766845703125, 0.441375732421875, 0.4722747802734375, 0.503173828125, 0.5340728759765625, 0.564971923828125, 0.5958709716796875, 0.62677001953125, 0.6576690673828125, 0.688568115234375, 0.7194671630859375, 0.7503662109375, 0.7812652587890625, 0.812164306640625, 0.8430633544921875, 0.87396240234375, 0.9048614501953125, 0.935760498046875, 0.9666595458984375, 0.99755859375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 7.0, 1.0, 2.0, 4.0, 7.0, 5.0, 11.0, 17.0, 21.0, 24.0, 29.0, 38.0, 38.0, 57.0, 55.0, 71.0, 63.0, 74.0, 74.0, 56.0, 54.0, 59.0, 47.0, 36.0, 42.0, 22.0, 29.0, 18.0, 14.0, 11.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53515625, -0.51361083984375, -0.4920654296875, -0.47052001953125, -0.448974609375, -0.42742919921875, -0.4058837890625, -0.38433837890625, -0.36279296875, -0.34124755859375, -0.3197021484375, -0.29815673828125, -0.276611328125, -0.25506591796875, -0.2335205078125, -0.21197509765625, -0.1904296875, -0.16888427734375, -0.1473388671875, -0.12579345703125, -0.104248046875, -0.08270263671875, -0.0611572265625, -0.03961181640625, -0.01806640625, 0.00347900390625, 0.0250244140625, 0.04656982421875, 0.068115234375, 0.08966064453125, 0.1112060546875, 0.13275146484375, 0.154296875, 0.17584228515625, 0.1973876953125, 0.21893310546875, 0.240478515625, 0.26202392578125, 0.2835693359375, 0.30511474609375, 0.32666015625, 0.34820556640625, 0.3697509765625, 0.39129638671875, 0.412841796875, 0.43438720703125, 0.4559326171875, 0.47747802734375, 0.4990234375, 0.52056884765625, 0.5421142578125, 0.56365966796875, 0.585205078125, 0.60675048828125, 0.6282958984375, 0.64984130859375, 0.67138671875, 0.69293212890625, 0.7144775390625, 0.73602294921875, 0.757568359375, 0.77911376953125, 0.8006591796875, 0.82220458984375, 0.84375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 14.0, 8.0, 17.0, 23.0, 57.0, 110.0, 200.0, 319.0, 635.0, 1494.0, 6865.0, 137816.0, 861666.0, 33901.0, 3357.0, 1017.0, 461.0, 252.0, 147.0, 64.0, 35.0, 30.0, 22.0, 14.0, 10.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.875, -3.73809814453125, -3.6011962890625, -3.46429443359375, -3.327392578125, -3.19049072265625, -3.0535888671875, -2.91668701171875, -2.77978515625, -2.64288330078125, -2.5059814453125, -2.36907958984375, -2.232177734375, -2.09527587890625, -1.9583740234375, -1.82147216796875, -1.6845703125, -1.54766845703125, -1.4107666015625, -1.27386474609375, -1.136962890625, -1.00006103515625, -0.8631591796875, -0.72625732421875, -0.58935546875, -0.45245361328125, -0.3155517578125, -0.17864990234375, -0.041748046875, 0.09515380859375, 0.2320556640625, 0.36895751953125, 0.505859375, 0.64276123046875, 0.7796630859375, 0.91656494140625, 1.053466796875, 1.19036865234375, 1.3272705078125, 1.46417236328125, 1.60107421875, 1.73797607421875, 1.8748779296875, 2.01177978515625, 2.148681640625, 2.28558349609375, 2.4224853515625, 2.55938720703125, 2.6962890625, 2.83319091796875, 2.9700927734375, 3.10699462890625, 3.243896484375, 3.38079833984375, 3.5177001953125, 3.65460205078125, 3.79150390625, 3.92840576171875, 4.0653076171875, 4.20220947265625, 4.339111328125, 4.47601318359375, 4.6129150390625, 4.74981689453125, 4.88671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 9.0, 13.0, 14.0, 18.0, 22.0, 21.0, 25.0, 41.0, 37.0, 51.0, 54.0, 58.0, 52.0, 44.0, 63.0, 55.0, 69.0, 45.0, 45.0, 47.0, 35.0, 41.0, 26.0, 13.0, 14.0, 12.0, 18.0, 9.0, 6.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.64453125, -3.54345703125, -3.4423828125, -3.34130859375, -3.240234375, -3.13916015625, -3.0380859375, -2.93701171875, -2.8359375, -2.73486328125, -2.6337890625, -2.53271484375, -2.431640625, -2.33056640625, -2.2294921875, -2.12841796875, -2.02734375, -1.92626953125, -1.8251953125, -1.72412109375, -1.623046875, -1.52197265625, -1.4208984375, -1.31982421875, -1.21875, -1.11767578125, -1.0166015625, -0.91552734375, -0.814453125, -0.71337890625, -0.6123046875, -0.51123046875, -0.41015625, -0.30908203125, -0.2080078125, -0.10693359375, -0.005859375, 0.09521484375, 0.1962890625, 0.29736328125, 0.3984375, 0.49951171875, 0.6005859375, 0.70166015625, 0.802734375, 0.90380859375, 1.0048828125, 1.10595703125, 1.20703125, 1.30810546875, 1.4091796875, 1.51025390625, 1.611328125, 1.71240234375, 1.8134765625, 1.91455078125, 2.015625, 2.11669921875, 2.2177734375, 2.31884765625, 2.419921875, 2.52099609375, 2.6220703125, 2.72314453125, 2.82421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 10.0, 6.0, 12.0, 20.0, 34.0, 56.0, 116.0, 252.0, 658.0, 2723.0, 45465.0, 965389.0, 30502.0, 2265.0, 599.0, 232.0, 100.0, 47.0, 29.0, 14.0, 10.0, 9.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.7421875, -2.6804962158203125, -2.618804931640625, -2.5571136474609375, -2.49542236328125, -2.4337310791015625, -2.372039794921875, -2.3103485107421875, -2.2486572265625, -2.1869659423828125, -2.125274658203125, -2.0635833740234375, -2.00189208984375, -1.9402008056640625, -1.878509521484375, -1.8168182373046875, -1.755126953125, -1.6934356689453125, -1.631744384765625, -1.5700531005859375, -1.50836181640625, -1.4466705322265625, -1.384979248046875, -1.3232879638671875, -1.2615966796875, -1.1999053955078125, -1.138214111328125, -1.0765228271484375, -1.01483154296875, -0.9531402587890625, -0.891448974609375, -0.8297576904296875, -0.76806640625, -0.7063751220703125, -0.644683837890625, -0.5829925537109375, -0.52130126953125, -0.4596099853515625, -0.397918701171875, -0.3362274169921875, -0.2745361328125, -0.2128448486328125, -0.151153564453125, -0.0894622802734375, -0.02777099609375, 0.0339202880859375, 0.095611572265625, 0.1573028564453125, 0.218994140625, 0.2806854248046875, 0.342376708984375, 0.4040679931640625, 0.46575927734375, 0.5274505615234375, 0.589141845703125, 0.6508331298828125, 0.7125244140625, 0.7742156982421875, 0.835906982421875, 0.8975982666015625, 0.95928955078125, 1.0209808349609375, 1.082672119140625, 1.1443634033203125, 1.2060546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 7.0, 15.0, 23.0, 19.0, 22.0, 34.0, 59.0, 48.0, 71.0, 87.0, 94.0, 90.0, 81.0, 72.0, 61.0, 58.0, 40.0, 30.0, 21.0, 11.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00011938810348510742, -0.0001163482666015625, -0.00011330842971801758, -0.00011026859283447266, -0.00010722875595092773, -0.00010418891906738281, -0.00010114908218383789, -9.810924530029297e-05, -9.506940841674805e-05, -9.202957153320312e-05, -8.89897346496582e-05, -8.594989776611328e-05, -8.291006088256836e-05, -7.987022399902344e-05, -7.683038711547852e-05, -7.37905502319336e-05, -7.075071334838867e-05, -6.771087646484375e-05, -6.467103958129883e-05, -6.16312026977539e-05, -5.8591365814208984e-05, -5.555152893066406e-05, -5.251169204711914e-05, -4.947185516357422e-05, -4.64320182800293e-05, -4.3392181396484375e-05, -4.035234451293945e-05, -3.731250762939453e-05, -3.427267074584961e-05, -3.123283386230469e-05, -2.8192996978759766e-05, -2.5153160095214844e-05, -2.2113323211669922e-05, -1.9073486328125e-05, -1.6033649444580078e-05, -1.2993812561035156e-05, -9.953975677490234e-06, -6.9141387939453125e-06, -3.874301910400391e-06, -8.344650268554688e-07, 2.205371856689453e-06, 5.245208740234375e-06, 8.285045623779297e-06, 1.1324882507324219e-05, 1.436471939086914e-05, 1.7404556274414062e-05, 2.0444393157958984e-05, 2.3484230041503906e-05, 2.6524066925048828e-05, 2.956390380859375e-05, 3.260374069213867e-05, 3.5643577575683594e-05, 3.8683414459228516e-05, 4.172325134277344e-05, 4.476308822631836e-05, 4.780292510986328e-05, 5.08427619934082e-05, 5.3882598876953125e-05, 5.692243576049805e-05, 5.996227264404297e-05, 6.300210952758789e-05, 6.604194641113281e-05, 6.908178329467773e-05, 7.212162017822266e-05, 7.516145706176758e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 11.0, 18.0, 32.0, 32.0, 81.0, 198.0, 390.0, 1028.0, 3564.0, 52889.0, 957295.0, 28620.0, 2799.0, 839.0, 347.0, 165.0, 80.0, 53.0, 24.0, 20.0, 15.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4833984375, -1.4272613525390625, -1.371124267578125, -1.3149871826171875, -1.25885009765625, -1.2027130126953125, -1.146575927734375, -1.0904388427734375, -1.0343017578125, -0.9781646728515625, -0.922027587890625, -0.8658905029296875, -0.80975341796875, -0.7536163330078125, -0.697479248046875, -0.6413421630859375, -0.585205078125, -0.5290679931640625, -0.472930908203125, -0.4167938232421875, -0.36065673828125, -0.3045196533203125, -0.248382568359375, -0.1922454833984375, -0.1361083984375, -0.0799713134765625, -0.023834228515625, 0.0323028564453125, 0.08843994140625, 0.1445770263671875, 0.200714111328125, 0.2568511962890625, 0.31298828125, 0.3691253662109375, 0.425262451171875, 0.4813995361328125, 0.53753662109375, 0.5936737060546875, 0.649810791015625, 0.7059478759765625, 0.7620849609375, 0.8182220458984375, 0.874359130859375, 0.9304962158203125, 0.98663330078125, 1.0427703857421875, 1.098907470703125, 1.1550445556640625, 1.211181640625, 1.2673187255859375, 1.323455810546875, 1.3795928955078125, 1.43572998046875, 1.4918670654296875, 1.548004150390625, 1.6041412353515625, 1.6602783203125, 1.7164154052734375, 1.772552490234375, 1.8286895751953125, 1.88482666015625, 1.9409637451171875, 1.997100830078125, 2.0532379150390625, 2.109375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 10.0, 15.0, 41.0, 111.0, 225.0, 287.0, 173.0, 79.0, 37.0, 10.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1630859375, -1.0917816162109375, -1.020477294921875, -0.9491729736328125, -0.87786865234375, -0.8065643310546875, -0.735260009765625, -0.6639556884765625, -0.5926513671875, -0.5213470458984375, -0.450042724609375, -0.3787384033203125, -0.30743408203125, -0.2361297607421875, -0.164825439453125, -0.0935211181640625, -0.022216796875, 0.0490875244140625, 0.120391845703125, 0.1916961669921875, 0.26300048828125, 0.3343048095703125, 0.405609130859375, 0.4769134521484375, 0.5482177734375, 0.6195220947265625, 0.690826416015625, 0.7621307373046875, 0.83343505859375, 0.9047393798828125, 0.976043701171875, 1.0473480224609375, 1.11865234375, 1.1899566650390625, 1.261260986328125, 1.3325653076171875, 1.40386962890625, 1.4751739501953125, 1.546478271484375, 1.6177825927734375, 1.6890869140625, 1.7603912353515625, 1.831695556640625, 1.9029998779296875, 1.97430419921875, 2.0456085205078125, 2.116912841796875, 2.1882171630859375, 2.259521484375, 2.3308258056640625, 2.402130126953125, 2.4734344482421875, 2.54473876953125, 2.6160430908203125, 2.687347412109375, 2.7586517333984375, 2.8299560546875, 2.9012603759765625, 2.972564697265625, 3.0438690185546875, 3.11517333984375, 3.1864776611328125, 3.257781982421875, 3.3290863037109375, 3.400390625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 15.0, 36.0, 116.0, 286.0, 285.0, 167.0, 53.0, 26.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.66199493408203, -47.604583740234375, -46.54716873168945, -45.48975372314453, -44.432342529296875, -43.37493133544922, -42.3175163269043, -41.260101318359375, -40.20269012451172, -39.14527893066406, -38.08786392211914, -37.03044891357422, -35.97303771972656, -34.915626525878906, -33.858211517333984, -32.80079650878906, -31.743385314941406, -30.685972213745117, -29.628559112548828, -28.57114601135254, -27.51373291015625, -26.45631980895996, -25.398906707763672, -24.341493606567383, -23.284080505371094, -22.226667404174805, -21.169254302978516, -20.111841201782227, -19.054428100585938, -17.99701499938965, -16.93960189819336, -15.88218879699707, -14.824775695800781, -13.767362594604492, -12.709949493408203, -11.652536392211914, -10.595123291015625, -9.537710189819336, -8.480297088623047, -7.422883987426758, -6.365470886230469, -5.30805778503418, -4.250644683837891, -3.1932315826416016, -2.1358184814453125, -1.0784053802490234, -0.020992279052734375, 1.0364208221435547, 2.0938339233398438, 3.151247024536133, 4.208660125732422, 5.266073226928711, 6.323486328125, 7.380899429321289, 8.438312530517578, 9.495725631713867, 10.553138732910156, 11.610551834106445, 12.667964935302734, 13.725378036499023, 14.782791137695312, 15.840204238891602, 16.89761734008789, 17.95503044128418, 19.01244354248047]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 8.0, 10.0, 11.0, 17.0, 28.0, 15.0, 27.0, 28.0, 34.0, 29.0, 36.0, 55.0, 48.0, 37.0, 52.0, 59.0, 50.0, 60.0, 53.0, 30.0, 47.0, 27.0, 34.0, 29.0, 26.0, 18.0, 19.0, 25.0, 7.0, 16.0, 14.0, 12.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.751487731933594, -11.368470191955566, -10.985453605651855, -10.602436065673828, -10.219419479370117, -9.83640193939209, -9.453385353088379, -9.070367813110352, -8.68735122680664, -8.304333686828613, -7.921317100524902, -7.538300037384033, -7.155282974243164, -6.772265911102295, -6.389248847961426, -6.006231307983398, -5.623214244842529, -5.24019718170166, -4.857180118560791, -4.474163055419922, -4.091145992279053, -3.7081289291381836, -3.3251116275787354, -2.942094564437866, -2.559077501296997, -2.176060438156128, -1.7930433750152588, -1.4100261926651, -1.027009129524231, -0.6439920663833618, -0.2609748840332031, 0.12204217910766602, 0.5050592422485352, 0.8880763053894043, 1.2710933685302734, 1.6541105508804321, 2.0371274948120117, 2.420144557952881, 2.803161859512329, 3.1861789226531982, 3.5691959857940674, 3.9522130489349365, 4.335230350494385, 4.718247413635254, 5.101264476776123, 5.484281539916992, 5.867298603057861, 6.2503156661987305, 6.6333327293396, 7.016349792480469, 7.399366855621338, 7.782383918762207, 8.165401458740234, 8.548418045043945, 8.931435585021973, 9.314452171325684, 9.697469711303711, 10.080487251281738, 10.46350383758545, 10.846521377563477, 11.229537963867188, 11.612555503845215, 11.995572090148926, 12.378589630126953, 12.761606216430664]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 6.0, 14.0, 15.0, 21.0, 29.0, 50.0, 79.0, 110.0, 205.0, 366.0, 757.0, 1668.0, 5640.0, 41848.0, 4115561.0, 21144.0, 3968.0, 1382.0, 583.0, 320.0, 178.0, 113.0, 63.0, 56.0, 31.0, 24.0, 15.0, 7.0, 9.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3984375, -1.341064453125, -1.28369140625, -1.226318359375, -1.1689453125, -1.111572265625, -1.05419921875, -0.996826171875, -0.939453125, -0.882080078125, -0.82470703125, -0.767333984375, -0.7099609375, -0.652587890625, -0.59521484375, -0.537841796875, -0.48046875, -0.423095703125, -0.36572265625, -0.308349609375, -0.2509765625, -0.193603515625, -0.13623046875, -0.078857421875, -0.021484375, 0.035888671875, 0.09326171875, 0.150634765625, 0.2080078125, 0.265380859375, 0.32275390625, 0.380126953125, 0.4375, 0.494873046875, 0.55224609375, 0.609619140625, 0.6669921875, 0.724365234375, 0.78173828125, 0.839111328125, 0.896484375, 0.953857421875, 1.01123046875, 1.068603515625, 1.1259765625, 1.183349609375, 1.24072265625, 1.298095703125, 1.35546875, 1.412841796875, 1.47021484375, 1.527587890625, 1.5849609375, 1.642333984375, 1.69970703125, 1.757080078125, 1.814453125, 1.871826171875, 1.92919921875, 1.986572265625, 2.0439453125, 2.101318359375, 2.15869140625, 2.216064453125, 2.2734375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 7.0, 9.0, 13.0, 7.0, 24.0, 18.0, 28.0, 32.0, 32.0, 42.0, 52.0, 46.0, 62.0, 69.0, 62.0, 59.0, 69.0, 54.0, 47.0, 33.0, 30.0, 30.0, 37.0, 26.0, 26.0, 16.0, 11.0, 5.0, 12.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0], "bins": [-0.7314453125, -0.7130622863769531, -0.6946792602539062, -0.6762962341308594, -0.6579132080078125, -0.6395301818847656, -0.6211471557617188, -0.6027641296386719, -0.584381103515625, -0.5659980773925781, -0.5476150512695312, -0.5292320251464844, -0.5108489990234375, -0.4924659729003906, -0.47408294677734375, -0.4556999206542969, -0.43731689453125, -0.4189338684082031, -0.40055084228515625, -0.3821678161621094, -0.3637847900390625, -0.3454017639160156, -0.32701873779296875, -0.3086357116699219, -0.290252685546875, -0.2718696594238281, -0.25348663330078125, -0.23510360717773438, -0.2167205810546875, -0.19833755493164062, -0.17995452880859375, -0.16157150268554688, -0.1431884765625, -0.12480545043945312, -0.10642242431640625, -0.08803939819335938, -0.0696563720703125, -0.051273345947265625, -0.03289031982421875, -0.014507293701171875, 0.003875732421875, 0.022258758544921875, 0.04064178466796875, 0.059024810791015625, 0.0774078369140625, 0.09579086303710938, 0.11417388916015625, 0.13255691528320312, 0.15093994140625, 0.16932296752929688, 0.18770599365234375, 0.20608901977539062, 0.2244720458984375, 0.24285507202148438, 0.26123809814453125, 0.2796211242675781, 0.298004150390625, 0.3163871765136719, 0.33477020263671875, 0.3531532287597656, 0.3715362548828125, 0.3899192810058594, 0.40830230712890625, 0.4266853332519531, 0.445068359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 6.0, 7.0, 8.0, 15.0, 12.0, 20.0, 29.0, 34.0, 38.0, 65.0, 84.0, 125.0, 170.0, 261.0, 448.0, 709.0, 1284.0, 2527.0, 5580.0, 15515.0, 101414.0, 4015701.0, 33288.0, 9029.0, 3614.0, 1799.0, 994.0, 491.0, 326.0, 192.0, 149.0, 103.0, 65.0, 52.0, 25.0, 30.0, 21.0, 13.0, 17.0, 9.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.158203125, -1.117218017578125, -1.07623291015625, -1.035247802734375, -0.9942626953125, -0.953277587890625, -0.91229248046875, -0.871307373046875, -0.830322265625, -0.789337158203125, -0.74835205078125, -0.707366943359375, -0.6663818359375, -0.625396728515625, -0.58441162109375, -0.543426513671875, -0.50244140625, -0.461456298828125, -0.42047119140625, -0.379486083984375, -0.3385009765625, -0.297515869140625, -0.25653076171875, -0.215545654296875, -0.174560546875, -0.133575439453125, -0.09259033203125, -0.051605224609375, -0.0106201171875, 0.030364990234375, 0.07135009765625, 0.112335205078125, 0.1533203125, 0.194305419921875, 0.23529052734375, 0.276275634765625, 0.3172607421875, 0.358245849609375, 0.39923095703125, 0.440216064453125, 0.481201171875, 0.522186279296875, 0.56317138671875, 0.604156494140625, 0.6451416015625, 0.686126708984375, 0.72711181640625, 0.768096923828125, 0.80908203125, 0.850067138671875, 0.89105224609375, 0.932037353515625, 0.9730224609375, 1.014007568359375, 1.05499267578125, 1.095977783203125, 1.136962890625, 1.177947998046875, 1.21893310546875, 1.259918212890625, 1.3009033203125, 1.341888427734375, 1.38287353515625, 1.423858642578125, 1.46484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 14.0, 8.0, 17.0, 40.0, 106.0, 3574.0, 165.0, 55.0, 28.0, 16.0, 7.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395751953125, -0.3852348327636719, -0.37471771240234375, -0.3642005920410156, -0.3536834716796875, -0.3431663513183594, -0.33264923095703125, -0.3221321105957031, -0.311614990234375, -0.3010978698730469, -0.29058074951171875, -0.2800636291503906, -0.2695465087890625, -0.2590293884277344, -0.24851226806640625, -0.23799514770507812, -0.22747802734375, -0.21696090698242188, -0.20644378662109375, -0.19592666625976562, -0.1854095458984375, -0.17489242553710938, -0.16437530517578125, -0.15385818481445312, -0.143341064453125, -0.13282394409179688, -0.12230682373046875, -0.11178970336914062, -0.1012725830078125, -0.09075546264648438, -0.08023834228515625, -0.06972122192382812, -0.0592041015625, -0.048686981201171875, -0.03816986083984375, -0.027652740478515625, -0.0171356201171875, -0.006618499755859375, 0.00389862060546875, 0.014415740966796875, 0.024932861328125, 0.035449981689453125, 0.04596710205078125, 0.056484222412109375, 0.0670013427734375, 0.07751846313476562, 0.08803558349609375, 0.09855270385742188, 0.10906982421875, 0.11958694458007812, 0.13010406494140625, 0.14062118530273438, 0.1511383056640625, 0.16165542602539062, 0.17217254638671875, 0.18268966674804688, 0.193206787109375, 0.20372390747070312, 0.21424102783203125, 0.22475814819335938, 0.2352752685546875, 0.24579238891601562, 0.25630950927734375, 0.2668266296386719, 0.27734375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 17.0, 49.0, 83.0, 133.0, 177.0, 182.0, 152.0, 108.0, 50.0, 21.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3476784229278564, -1.296535849571228, -1.2453932762145996, -1.1942508220672607, -1.1431082487106323, -1.091965675354004, -1.040823221206665, -0.9896806478500366, -0.9385380744934082, -0.8873955011367798, -0.8362529873847961, -0.7851104736328125, -0.7339679002761841, -0.6828253269195557, -0.631682813167572, -0.5805402994155884, -0.52939772605896, -0.47825518250465393, -0.4271126389503479, -0.37597009539604187, -0.32482755184173584, -0.2736850082874298, -0.22254246473312378, -0.17139992117881775, -0.12025737762451172, -0.06911483407020569, -0.017972290515899658, 0.03317025303840637, 0.0843127965927124, 0.13545534014701843, 0.18659788370132446, 0.2377404272556305, 0.2888830900192261, 0.3400256335735321, 0.39116817712783813, 0.44231072068214417, 0.4934532642364502, 0.5445958375930786, 0.5957383513450623, 0.6468808650970459, 0.6980234384536743, 0.7491660118103027, 0.8003085255622864, 0.85145103931427, 0.9025936126708984, 0.9537361860275269, 1.0048787593841553, 1.0560212135314941, 1.1071637868881226, 1.158306360244751, 1.2094488143920898, 1.2605913877487183, 1.3117339611053467, 1.362876534461975, 1.4140191078186035, 1.4651615619659424, 1.5163041353225708, 1.5674467086791992, 1.618589162826538, 1.6697317361831665, 1.720874309539795, 1.7720168828964233, 1.8231594562530518, 1.8743019104003906, 1.925444483757019]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 12.0, 10.0, 21.0, 26.0, 27.0, 32.0, 22.0, 37.0, 22.0, 48.0, 58.0, 55.0, 52.0, 54.0, 49.0, 65.0, 39.0, 50.0, 39.0, 38.0, 41.0, 41.0, 25.0, 24.0, 24.0, 22.0, 16.0, 11.0, 5.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8112097382545471, -0.7889202833175659, -0.7666308283805847, -0.7443413734436035, -0.7220519781112671, -0.6997625231742859, -0.6774730682373047, -0.6551836133003235, -0.6328941583633423, -0.6106047034263611, -0.5883152484893799, -0.5660258531570435, -0.5437363982200623, -0.521446943283081, -0.49915748834609985, -0.47686803340911865, -0.4545786380767822, -0.432289183139801, -0.4099997580051422, -0.387710303068161, -0.3654208779335022, -0.343131422996521, -0.3208419680595398, -0.2985525131225586, -0.2762630879878998, -0.2539736330509186, -0.23168420791625977, -0.20939475297927856, -0.18710531294345856, -0.16481587290763855, -0.14252641797065735, -0.12023697793483734, -0.09794747829437256, -0.07565803825855255, -0.05336859077215195, -0.031079143285751343, -0.008789703249931335, 0.013499736785888672, 0.03578919172286987, 0.05807863175868988, 0.08036807179450989, 0.1026575118303299, 0.1249469593167305, 0.1472364068031311, 0.1695258468389511, 0.19181528687477112, 0.21410474181175232, 0.23639418184757233, 0.25868362188339233, 0.28097307682037354, 0.30326250195503235, 0.32555195689201355, 0.34784138202667236, 0.37013083696365356, 0.39242029190063477, 0.41470974683761597, 0.4369991719722748, 0.459288626909256, 0.4815780520439148, 0.503867506980896, 0.5261569619178772, 0.5484464168548584, 0.5707358121871948, 0.593025267124176, 0.6153147220611572]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 9.0, 7.0, 15.0, 16.0, 29.0, 22.0, 40.0, 63.0, 107.0, 138.0, 209.0, 292.0, 558.0, 947.0, 1573.0, 2800.0, 5037.0, 9575.0, 19173.0, 40986.0, 90164.0, 199665.0, 304360.0, 199790.0, 90982.0, 41049.0, 19463.0, 9636.0, 5102.0, 2715.0, 1557.0, 919.0, 555.0, 352.0, 209.0, 149.0, 83.0, 59.0, 54.0, 34.0, 18.0, 11.0, 8.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.677734375, -0.6547622680664062, -0.6317901611328125, -0.6088180541992188, -0.585845947265625, -0.5628738403320312, -0.5399017333984375, -0.5169296264648438, -0.49395751953125, -0.47098541259765625, -0.4480133056640625, -0.42504119873046875, -0.402069091796875, -0.37909698486328125, -0.3561248779296875, -0.33315277099609375, -0.3101806640625, -0.28720855712890625, -0.2642364501953125, -0.24126434326171875, -0.218292236328125, -0.19532012939453125, -0.1723480224609375, -0.14937591552734375, -0.12640380859375, -0.10343170166015625, -0.0804595947265625, -0.05748748779296875, -0.034515380859375, -0.01154327392578125, 0.0114288330078125, 0.03440093994140625, 0.057373046875, 0.08034515380859375, 0.1033172607421875, 0.12628936767578125, 0.149261474609375, 0.17223358154296875, 0.1952056884765625, 0.21817779541015625, 0.24114990234375, 0.26412200927734375, 0.2870941162109375, 0.31006622314453125, 0.333038330078125, 0.35601043701171875, 0.3789825439453125, 0.40195465087890625, 0.4249267578125, 0.44789886474609375, 0.4708709716796875, 0.49384307861328125, 0.516815185546875, 0.5397872924804688, 0.5627593994140625, 0.5857315063476562, 0.60870361328125, 0.6316757202148438, 0.6546478271484375, 0.6776199340820312, 0.700592041015625, 0.7235641479492188, 0.7465362548828125, 0.7695083618164062, 0.79248046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 5.0, 8.0, 11.0, 14.0, 19.0, 25.0, 27.0, 29.0, 38.0, 40.0, 37.0, 48.0, 62.0, 59.0, 60.0, 63.0, 72.0, 56.0, 46.0, 40.0, 32.0, 39.0, 31.0, 20.0, 31.0, 14.0, 13.0, 10.0, 8.0, 6.0, 8.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.7197265625, -0.7012672424316406, -0.6828079223632812, -0.6643486022949219, -0.6458892822265625, -0.6274299621582031, -0.6089706420898438, -0.5905113220214844, -0.572052001953125, -0.5535926818847656, -0.5351333618164062, -0.5166740417480469, -0.4982147216796875, -0.4797554016113281, -0.46129608154296875, -0.4428367614746094, -0.42437744140625, -0.4059181213378906, -0.38745880126953125, -0.3689994812011719, -0.3505401611328125, -0.3320808410644531, -0.31362152099609375, -0.2951622009277344, -0.276702880859375, -0.2582435607910156, -0.23978424072265625, -0.22132492065429688, -0.2028656005859375, -0.18440628051757812, -0.16594696044921875, -0.14748764038085938, -0.1290283203125, -0.11056900024414062, -0.09210968017578125, -0.07365036010742188, -0.0551910400390625, -0.036731719970703125, -0.01827239990234375, 0.000186920166015625, 0.018646240234375, 0.037105560302734375, 0.05556488037109375, 0.07402420043945312, 0.0924835205078125, 0.11094284057617188, 0.12940216064453125, 0.14786148071289062, 0.16632080078125, 0.18478012084960938, 0.20323944091796875, 0.22169876098632812, 0.2401580810546875, 0.2586174011230469, 0.27707672119140625, 0.2955360412597656, 0.313995361328125, 0.3324546813964844, 0.35091400146484375, 0.3693733215332031, 0.3878326416015625, 0.4062919616699219, 0.42475128173828125, 0.4432106018066406, 0.461669921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 6.0, 10.0, 13.0, 16.0, 16.0, 27.0, 36.0, 42.0, 66.0, 107.0, 128.0, 156.0, 245.0, 298.0, 437.0, 799.0, 1614.0, 5027.0, 25102.0, 188968.0, 663299.0, 135657.0, 18798.0, 4107.0, 1379.0, 688.0, 426.0, 269.0, 219.0, 164.0, 126.0, 74.0, 50.0, 46.0, 42.0, 24.0, 28.0, 17.0, 9.0, 7.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.798309326171875, -1.73919677734375, -1.680084228515625, -1.6209716796875, -1.561859130859375, -1.50274658203125, -1.443634033203125, -1.384521484375, -1.325408935546875, -1.26629638671875, -1.207183837890625, -1.1480712890625, -1.088958740234375, -1.02984619140625, -0.970733642578125, -0.91162109375, -0.852508544921875, -0.79339599609375, -0.734283447265625, -0.6751708984375, -0.616058349609375, -0.55694580078125, -0.497833251953125, -0.438720703125, -0.379608154296875, -0.32049560546875, -0.261383056640625, -0.2022705078125, -0.143157958984375, -0.08404541015625, -0.024932861328125, 0.0341796875, 0.093292236328125, 0.15240478515625, 0.211517333984375, 0.2706298828125, 0.329742431640625, 0.38885498046875, 0.447967529296875, 0.507080078125, 0.566192626953125, 0.62530517578125, 0.684417724609375, 0.7435302734375, 0.802642822265625, 0.86175537109375, 0.920867919921875, 0.97998046875, 1.039093017578125, 1.09820556640625, 1.157318115234375, 1.2164306640625, 1.275543212890625, 1.33465576171875, 1.393768310546875, 1.452880859375, 1.511993408203125, 1.57110595703125, 1.630218505859375, 1.6893310546875, 1.748443603515625, 1.80755615234375, 1.866668701171875, 1.92578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 0.0, 1.0, 9.0, 9.0, 4.0, 8.0, 12.0, 12.0, 9.0, 16.0, 18.0, 22.0, 19.0, 26.0, 17.0, 37.0, 38.0, 32.0, 45.0, 35.0, 28.0, 31.0, 41.0, 34.0, 24.0, 42.0, 36.0, 26.0, 46.0, 32.0, 34.0, 27.0, 20.0, 22.0, 21.0, 32.0, 26.0, 17.0, 16.0, 13.0, 6.0, 20.0, 6.0, 7.0, 5.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.0390625, -1.9803009033203125, -1.921539306640625, -1.8627777099609375, -1.80401611328125, -1.7452545166015625, -1.686492919921875, -1.6277313232421875, -1.5689697265625, -1.5102081298828125, -1.451446533203125, -1.3926849365234375, -1.33392333984375, -1.2751617431640625, -1.216400146484375, -1.1576385498046875, -1.098876953125, -1.0401153564453125, -0.981353759765625, -0.9225921630859375, -0.86383056640625, -0.8050689697265625, -0.746307373046875, -0.6875457763671875, -0.6287841796875, -0.5700225830078125, -0.511260986328125, -0.4524993896484375, -0.39373779296875, -0.3349761962890625, -0.276214599609375, -0.2174530029296875, -0.15869140625, -0.0999298095703125, -0.041168212890625, 0.0175933837890625, 0.07635498046875, 0.1351165771484375, 0.193878173828125, 0.2526397705078125, 0.3114013671875, 0.3701629638671875, 0.428924560546875, 0.4876861572265625, 0.54644775390625, 0.6052093505859375, 0.663970947265625, 0.7227325439453125, 0.781494140625, 0.8402557373046875, 0.899017333984375, 0.9577789306640625, 1.01654052734375, 1.0753021240234375, 1.134063720703125, 1.1928253173828125, 1.2515869140625, 1.3103485107421875, 1.369110107421875, 1.4278717041015625, 1.48663330078125, 1.5453948974609375, 1.604156494140625, 1.6629180908203125, 1.7216796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 12.0, 19.0, 39.0, 74.0, 207.0, 672.0, 3949.0, 348695.0, 688651.0, 5040.0, 773.0, 219.0, 88.0, 45.0, 24.0, 10.0, 8.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.86328125, -2.7917938232421875, -2.720306396484375, -2.6488189697265625, -2.57733154296875, -2.5058441162109375, -2.434356689453125, -2.3628692626953125, -2.2913818359375, -2.2198944091796875, -2.148406982421875, -2.0769195556640625, -2.00543212890625, -1.9339447021484375, -1.862457275390625, -1.7909698486328125, -1.719482421875, -1.6479949951171875, -1.576507568359375, -1.5050201416015625, -1.43353271484375, -1.3620452880859375, -1.290557861328125, -1.2190704345703125, -1.1475830078125, -1.0760955810546875, -1.004608154296875, -0.9331207275390625, -0.86163330078125, -0.7901458740234375, -0.718658447265625, -0.6471710205078125, -0.57568359375, -0.5041961669921875, -0.432708740234375, -0.3612213134765625, -0.28973388671875, -0.2182464599609375, -0.146759033203125, -0.0752716064453125, -0.0037841796875, 0.0677032470703125, 0.139190673828125, 0.2106781005859375, 0.28216552734375, 0.3536529541015625, 0.425140380859375, 0.4966278076171875, 0.568115234375, 0.6396026611328125, 0.711090087890625, 0.7825775146484375, 0.85406494140625, 0.9255523681640625, 0.997039794921875, 1.0685272216796875, 1.1400146484375, 1.2115020751953125, 1.282989501953125, 1.3544769287109375, 1.42596435546875, 1.4974517822265625, 1.568939208984375, 1.6404266357421875, 1.7119140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 13.0, 19.0, 19.0, 33.0, 57.0, 81.0, 89.0, 126.0, 141.0, 101.0, 78.0, 64.0, 53.0, 39.0, 27.0, 18.0, 7.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.33272933959961e-05, -7.992424070835114e-05, -7.652118802070618e-05, -7.311813533306122e-05, -6.971508264541626e-05, -6.63120299577713e-05, -6.290897727012634e-05, -5.9505924582481384e-05, -5.6102871894836426e-05, -5.269981920719147e-05, -4.929676651954651e-05, -4.589371383190155e-05, -4.249066114425659e-05, -3.908760845661163e-05, -3.5684555768966675e-05, -3.2281503081321716e-05, -2.8878450393676758e-05, -2.54753977060318e-05, -2.207234501838684e-05, -1.8669292330741882e-05, -1.5266239643096924e-05, -1.1863186955451965e-05, -8.460134267807007e-06, -5.057081580162048e-06, -1.6540288925170898e-06, 1.7490237951278687e-06, 5.152076482772827e-06, 8.555129170417786e-06, 1.1958181858062744e-05, 1.5361234545707703e-05, 1.876428723335266e-05, 2.216733992099762e-05, 2.5570392608642578e-05, 2.8973445296287537e-05, 3.2376497983932495e-05, 3.5779550671577454e-05, 3.918260335922241e-05, 4.258565604686737e-05, 4.598870873451233e-05, 4.939176142215729e-05, 5.2794814109802246e-05, 5.6197866797447205e-05, 5.960091948509216e-05, 6.300397217273712e-05, 6.640702486038208e-05, 6.981007754802704e-05, 7.3213130235672e-05, 7.661618292331696e-05, 8.001923561096191e-05, 8.342228829860687e-05, 8.682534098625183e-05, 9.022839367389679e-05, 9.363144636154175e-05, 9.70344990491867e-05, 0.00010043755173683167, 0.00010384060442447662, 0.00010724365711212158, 0.00011064670979976654, 0.0001140497624874115, 0.00011745281517505646, 0.00012085586786270142, 0.00012425892055034637, 0.00012766197323799133, 0.0001310650259256363, 0.00013446807861328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 0.0, 3.0, 7.0, 6.0, 6.0, 10.0, 5.0, 13.0, 14.0, 15.0, 28.0, 39.0, 51.0, 71.0, 109.0, 247.0, 583.0, 1464.0, 4884.0, 38880.0, 886479.0, 104539.0, 7623.0, 2007.0, 687.0, 301.0, 173.0, 90.0, 59.0, 39.0, 32.0, 22.0, 17.0, 14.0, 5.0, 4.0, 4.0, 5.0, 4.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.197265625, -1.1581878662109375, -1.119110107421875, -1.0800323486328125, -1.04095458984375, -1.0018768310546875, -0.962799072265625, -0.9237213134765625, -0.8846435546875, -0.8455657958984375, -0.806488037109375, -0.7674102783203125, -0.72833251953125, -0.6892547607421875, -0.650177001953125, -0.6110992431640625, -0.572021484375, -0.5329437255859375, -0.493865966796875, -0.4547882080078125, -0.41571044921875, -0.3766326904296875, -0.337554931640625, -0.2984771728515625, -0.2593994140625, -0.2203216552734375, -0.181243896484375, -0.1421661376953125, -0.10308837890625, -0.0640106201171875, -0.024932861328125, 0.0141448974609375, 0.05322265625, 0.0923004150390625, 0.131378173828125, 0.1704559326171875, 0.20953369140625, 0.2486114501953125, 0.287689208984375, 0.3267669677734375, 0.3658447265625, 0.4049224853515625, 0.444000244140625, 0.4830780029296875, 0.52215576171875, 0.5612335205078125, 0.600311279296875, 0.6393890380859375, 0.678466796875, 0.7175445556640625, 0.756622314453125, 0.7957000732421875, 0.83477783203125, 0.8738555908203125, 0.912933349609375, 0.9520111083984375, 0.9910888671875, 1.0301666259765625, 1.069244384765625, 1.1083221435546875, 1.14739990234375, 1.1864776611328125, 1.225555419921875, 1.2646331787109375, 1.3037109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 17.0, 25.0, 41.0, 86.0, 127.0, 188.0, 186.0, 130.0, 97.0, 52.0, 10.0, 9.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4072265625, -1.3589324951171875, -1.310638427734375, -1.2623443603515625, -1.21405029296875, -1.1657562255859375, -1.117462158203125, -1.0691680908203125, -1.0208740234375, -0.9725799560546875, -0.924285888671875, -0.8759918212890625, -0.82769775390625, -0.7794036865234375, -0.731109619140625, -0.6828155517578125, -0.634521484375, -0.5862274169921875, -0.537933349609375, -0.4896392822265625, -0.44134521484375, -0.3930511474609375, -0.344757080078125, -0.2964630126953125, -0.2481689453125, -0.1998748779296875, -0.151580810546875, -0.1032867431640625, -0.05499267578125, -0.0066986083984375, 0.041595458984375, 0.0898895263671875, 0.13818359375, 0.1864776611328125, 0.234771728515625, 0.2830657958984375, 0.33135986328125, 0.3796539306640625, 0.427947998046875, 0.4762420654296875, 0.5245361328125, 0.5728302001953125, 0.621124267578125, 0.6694183349609375, 0.71771240234375, 0.7660064697265625, 0.814300537109375, 0.8625946044921875, 0.910888671875, 0.9591827392578125, 1.007476806640625, 1.0557708740234375, 1.10406494140625, 1.1523590087890625, 1.200653076171875, 1.2489471435546875, 1.2972412109375, 1.3455352783203125, 1.393829345703125, 1.4421234130859375, 1.49041748046875, 1.5387115478515625, 1.587005615234375, 1.6352996826171875, 1.68359375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 11.0, 12.0, 21.0, 63.0, 93.0, 155.0, 187.0, 189.0, 134.0, 71.0, 26.0, 17.0, 11.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.43998146057129, -24.940895080566406, -24.44180679321289, -23.942720413208008, -23.443632125854492, -22.94454574584961, -22.445459365844727, -21.94637107849121, -21.447284698486328, -20.948198318481445, -20.44911003112793, -19.950023651123047, -19.45093536376953, -18.95184898376465, -18.452762603759766, -17.95367431640625, -17.454587936401367, -16.955501556396484, -16.45641326904297, -15.957326889038086, -15.458239555358887, -14.959152221679688, -14.460064888000488, -13.960977554321289, -13.46189022064209, -12.96280288696289, -12.463715553283691, -11.964629173278809, -11.46554183959961, -10.96645450592041, -10.467367172241211, -9.968280792236328, -9.469193458557129, -8.97010612487793, -8.47101879119873, -7.9719319343566895, -7.472845077514648, -6.973757743835449, -6.47467041015625, -5.975583553314209, -5.476496696472168, -4.977409362792969, -4.478322505950928, -3.9792351722717285, -3.4801483154296875, -2.9810609817504883, -2.481973886489868, -1.982886791229248, -1.4837994575500488, -0.9847123622894287, -0.4856252074241638, 0.013461947441101074, 0.5125490427017212, 1.0116362571716309, 1.510723352432251, 2.009810447692871, 2.508897542953491, 3.0079846382141113, 3.5070717334747314, 4.006158828735352, 4.505246162414551, 5.00433349609375, 5.503420352935791, 6.002507209777832, 6.501594543457031]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 10.0, 8.0, 9.0, 8.0, 15.0, 17.0, 23.0, 25.0, 24.0, 30.0, 40.0, 36.0, 30.0, 36.0, 53.0, 54.0, 54.0, 54.0, 35.0, 56.0, 46.0, 39.0, 37.0, 41.0, 28.0, 24.0, 19.0, 22.0, 23.0, 10.0, 24.0, 7.0, 12.0, 5.0, 10.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-10.5196533203125, -10.20052719116211, -9.881400108337402, -9.562273979187012, -9.243146896362305, -8.924020767211914, -8.604894638061523, -8.285768508911133, -7.966641426086426, -7.647514820098877, -7.328388214111328, -7.0092620849609375, -6.690135478973389, -6.37100887298584, -6.051882743835449, -5.7327561378479, -5.413629531860352, -5.094502925872803, -4.775376319885254, -4.456250190734863, -4.1371235847473145, -3.8179969787597656, -3.498870611190796, -3.179744243621826, -2.8606176376342773, -2.5414910316467285, -2.222364664077759, -1.9032381772994995, -1.5841116905212402, -1.264985203742981, -0.9458587169647217, -0.626732349395752, -0.3076057434082031, 0.011520743370056152, 0.33064723014831543, 0.6497737169265747, 0.968900203704834, 1.2880266904830933, 1.6071531772613525, 1.9262795448303223, 2.245406150817871, 2.56453275680542, 2.8836591243743896, 3.2027854919433594, 3.521912097930908, 3.841038703918457, 4.160164833068848, 4.4792914390563965, 4.798418045043945, 5.117544651031494, 5.436671257019043, 5.755797386169434, 6.074923992156982, 6.394050598144531, 6.713176727294922, 7.032303333282471, 7.3514299392700195, 7.670556545257568, 7.989683151245117, 8.308809280395508, 8.627935409545898, 8.947062492370605, 9.266188621520996, 9.585315704345703, 9.904441833496094]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 7.0, 8.0, 10.0, 12.0, 19.0, 15.0, 38.0, 48.0, 65.0, 96.0, 141.0, 213.0, 407.0, 712.0, 1368.0, 2977.0, 7335.0, 23751.0, 178255.0, 3903273.0, 53792.0, 12604.0, 4715.0, 1986.0, 981.0, 523.0, 315.0, 187.0, 123.0, 82.0, 46.0, 47.0, 25.0, 20.0, 20.0, 18.0, 5.0, 9.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85400390625, -0.825775146484375, -0.79754638671875, -0.769317626953125, -0.7410888671875, -0.712860107421875, -0.68463134765625, -0.656402587890625, -0.628173828125, -0.599945068359375, -0.57171630859375, -0.543487548828125, -0.5152587890625, -0.487030029296875, -0.45880126953125, -0.430572509765625, -0.40234375, -0.374114990234375, -0.34588623046875, -0.317657470703125, -0.2894287109375, -0.261199951171875, -0.23297119140625, -0.204742431640625, -0.176513671875, -0.148284912109375, -0.12005615234375, -0.091827392578125, -0.0635986328125, -0.035369873046875, -0.00714111328125, 0.021087646484375, 0.04931640625, 0.077545166015625, 0.10577392578125, 0.134002685546875, 0.1622314453125, 0.190460205078125, 0.21868896484375, 0.246917724609375, 0.275146484375, 0.303375244140625, 0.33160400390625, 0.359832763671875, 0.3880615234375, 0.416290283203125, 0.44451904296875, 0.472747802734375, 0.5009765625, 0.529205322265625, 0.55743408203125, 0.585662841796875, 0.6138916015625, 0.642120361328125, 0.67034912109375, 0.698577880859375, 0.726806640625, 0.755035400390625, 0.78326416015625, 0.811492919921875, 0.8397216796875, 0.867950439453125, 0.89617919921875, 0.924407958984375, 0.95263671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 11.0, 12.0, 14.0, 22.0, 31.0, 48.0, 47.0, 57.0, 81.0, 96.0, 100.0, 104.0, 81.0, 64.0, 52.0, 43.0, 45.0, 34.0, 15.0, 13.0, 14.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.673583984375, -0.6474609375, -0.621337890625, -0.59521484375, -0.569091796875, -0.54296875, -0.516845703125, -0.49072265625, -0.464599609375, -0.4384765625, -0.412353515625, -0.38623046875, -0.360107421875, -0.333984375, -0.307861328125, -0.28173828125, -0.255615234375, -0.2294921875, -0.203369140625, -0.17724609375, -0.151123046875, -0.125, -0.098876953125, -0.07275390625, -0.046630859375, -0.0205078125, 0.005615234375, 0.03173828125, 0.057861328125, 0.083984375, 0.110107421875, 0.13623046875, 0.162353515625, 0.1884765625, 0.214599609375, 0.24072265625, 0.266845703125, 0.29296875, 0.319091796875, 0.34521484375, 0.371337890625, 0.3974609375, 0.423583984375, 0.44970703125, 0.475830078125, 0.501953125, 0.528076171875, 0.55419921875, 0.580322265625, 0.6064453125, 0.632568359375, 0.65869140625, 0.684814453125, 0.7109375, 0.737060546875, 0.76318359375, 0.789306640625, 0.8154296875, 0.841552734375, 0.86767578125, 0.893798828125, 0.919921875, 0.946044921875, 0.97216796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 6.0, 6.0, 12.0, 17.0, 19.0, 15.0, 30.0, 27.0, 45.0, 71.0, 94.0, 123.0, 160.0, 231.0, 434.0, 876.0, 2038.0, 5577.0, 22464.0, 244949.0, 3861036.0, 42030.0, 8464.0, 2843.0, 1133.0, 563.0, 302.0, 188.0, 134.0, 84.0, 73.0, 47.0, 46.0, 31.0, 26.0, 18.0, 13.0, 10.0, 17.0, 6.0, 3.0, 1.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.1354827880859375, -1.095184326171875, -1.0548858642578125, -1.01458740234375, -0.9742889404296875, -0.933990478515625, -0.8936920166015625, -0.8533935546875, -0.8130950927734375, -0.772796630859375, -0.7324981689453125, -0.69219970703125, -0.6519012451171875, -0.611602783203125, -0.5713043212890625, -0.531005859375, -0.4907073974609375, -0.450408935546875, -0.4101104736328125, -0.36981201171875, -0.3295135498046875, -0.289215087890625, -0.2489166259765625, -0.2086181640625, -0.1683197021484375, -0.128021240234375, -0.0877227783203125, -0.04742431640625, -0.0071258544921875, 0.033172607421875, 0.0734710693359375, 0.11376953125, 0.1540679931640625, 0.194366455078125, 0.2346649169921875, 0.27496337890625, 0.3152618408203125, 0.355560302734375, 0.3958587646484375, 0.4361572265625, 0.4764556884765625, 0.516754150390625, 0.5570526123046875, 0.59735107421875, 0.6376495361328125, 0.677947998046875, 0.7182464599609375, 0.758544921875, 0.7988433837890625, 0.839141845703125, 0.8794403076171875, 0.91973876953125, 0.9600372314453125, 1.000335693359375, 1.0406341552734375, 1.0809326171875, 1.1212310791015625, 1.161529541015625, 1.2018280029296875, 1.24212646484375, 1.2824249267578125, 1.322723388671875, 1.3630218505859375, 1.4033203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 6.0, 13.0, 13.0, 27.0, 71.0, 166.0, 3389.0, 251.0, 81.0, 27.0, 16.0, 10.0, 4.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81787109375, -0.7902297973632812, -0.7625885009765625, -0.7349472045898438, -0.707305908203125, -0.6796646118164062, -0.6520233154296875, -0.6243820190429688, -0.59674072265625, -0.5690994262695312, -0.5414581298828125, -0.5138168334960938, -0.486175537109375, -0.45853424072265625, -0.4308929443359375, -0.40325164794921875, -0.3756103515625, -0.34796905517578125, -0.3203277587890625, -0.29268646240234375, -0.265045166015625, -0.23740386962890625, -0.2097625732421875, -0.18212127685546875, -0.15447998046875, -0.12683868408203125, -0.0991973876953125, -0.07155609130859375, -0.043914794921875, -0.01627349853515625, 0.0113677978515625, 0.03900909423828125, 0.066650390625, 0.09429168701171875, 0.1219329833984375, 0.14957427978515625, 0.177215576171875, 0.20485687255859375, 0.2324981689453125, 0.26013946533203125, 0.28778076171875, 0.31542205810546875, 0.3430633544921875, 0.37070465087890625, 0.398345947265625, 0.42598724365234375, 0.4536285400390625, 0.48126983642578125, 0.5089111328125, 0.5365524291992188, 0.5641937255859375, 0.5918350219726562, 0.619476318359375, 0.6471176147460938, 0.6747589111328125, 0.7024002075195312, 0.73004150390625, 0.7576828002929688, 0.7853240966796875, 0.8129653930664062, 0.840606689453125, 0.8682479858398438, 0.8958892822265625, 0.9235305786132812, 0.951171875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 11.0, 9.0, 20.0, 32.0, 60.0, 100.0, 161.0, 160.0, 159.0, 103.0, 82.0, 44.0, 22.0, 14.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623303174972534, -2.545696258544922, -2.4680893421173096, -2.390482187271118, -2.312875270843506, -2.2352683544158936, -2.1576614379882812, -2.080054521560669, -2.0024476051330566, -1.9248406887054443, -1.8472336530685425, -1.7696267366409302, -1.6920197010040283, -1.614412784576416, -1.5368058681488037, -1.4591989517211914, -1.381591796875, -1.3039848804473877, -1.2263778448104858, -1.1487709283828735, -1.0711638927459717, -0.9935569763183594, -0.9159500598907471, -0.83834308385849, -0.7607361078262329, -0.6831291317939758, -0.6055221557617188, -0.5279152393341064, -0.45030826330184937, -0.3727012872695923, -0.2950943410396576, -0.2174873948097229, -0.13988041877746582, -0.062273457646369934, 0.015333503484725952, 0.09294046461582184, 0.17054742574691772, 0.2481544017791748, 0.3257613480091095, 0.4033682942390442, 0.48097527027130127, 0.5585822463035583, 0.6361892223358154, 0.7137961387634277, 0.7914031147956848, 0.8690100908279419, 0.9466170072555542, 1.024224042892456, 1.1018309593200684, 1.1794378757476807, 1.2570449113845825, 1.3346518278121948, 1.4122588634490967, 1.489865779876709, 1.5674726963043213, 1.6450796127319336, 1.7226866483688354, 1.8002935647964478, 1.8779006004333496, 1.955507516860962, 2.033114433288574, 2.1107215881347656, 2.188328504562378, 2.2659354209899902, 2.3435423374176025]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 8.0, 6.0, 11.0, 11.0, 6.0, 7.0, 16.0, 14.0, 14.0, 19.0, 9.0, 20.0, 18.0, 18.0, 28.0, 41.0, 31.0, 32.0, 34.0, 51.0, 47.0, 40.0, 32.0, 37.0, 28.0, 37.0, 33.0, 49.0, 29.0, 24.0, 24.0, 31.0, 23.0, 21.0, 21.0, 24.0, 20.0, 8.0, 13.0, 10.0, 11.0, 9.0, 6.0, 2.0, 5.0, 3.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.9943637251853943, -0.9639459848403931, -0.9335281848907471, -0.9031103849411011, -0.8726926445960999, -0.8422749042510986, -0.8118571043014526, -0.7814393043518066, -0.7510215640068054, -0.7206038236618042, -0.6901860237121582, -0.6597682237625122, -0.629350483417511, -0.5989327430725098, -0.5685149431228638, -0.5380971431732178, -0.5076794028282166, -0.47726163268089294, -0.44684386253356934, -0.4164260923862457, -0.3860083222389221, -0.3555905520915985, -0.3251727819442749, -0.2947550117969513, -0.2643372416496277, -0.23391947150230408, -0.20350170135498047, -0.17308393120765686, -0.14266616106033325, -0.11224839091300964, -0.08183062076568604, -0.05141285061836243, -0.020995140075683594, 0.009422630071640015, 0.03984040021896362, 0.07025817036628723, 0.10067594051361084, 0.13109371066093445, 0.16151148080825806, 0.19192925095558167, 0.22234702110290527, 0.2527647912502289, 0.2831825613975525, 0.3136003315448761, 0.3440181016921997, 0.3744358718395233, 0.4048536419868469, 0.43527141213417053, 0.46568918228149414, 0.49610695242881775, 0.5265247225761414, 0.5569424629211426, 0.5873602628707886, 0.6177780628204346, 0.6481958031654358, 0.678613543510437, 0.709031343460083, 0.739449143409729, 0.7698668837547302, 0.8002846240997314, 0.8307024240493774, 0.8611202239990234, 0.8915379643440247, 0.9219557046890259, 0.9523735046386719]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 9.0, 6.0, 9.0, 29.0, 17.0, 37.0, 63.0, 111.0, 147.0, 322.0, 582.0, 1233.0, 2850.0, 8828.0, 36461.0, 214402.0, 582502.0, 160400.0, 28433.0, 7297.0, 2473.0, 1080.0, 520.0, 281.0, 158.0, 104.0, 60.0, 34.0, 19.0, 13.0, 17.0, 11.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.6416015625, -1.5924835205078125, -1.543365478515625, -1.4942474365234375, -1.44512939453125, -1.3960113525390625, -1.346893310546875, -1.2977752685546875, -1.2486572265625, -1.1995391845703125, -1.150421142578125, -1.1013031005859375, -1.05218505859375, -1.0030670166015625, -0.953948974609375, -0.9048309326171875, -0.855712890625, -0.8065948486328125, -0.757476806640625, -0.7083587646484375, -0.65924072265625, -0.6101226806640625, -0.561004638671875, -0.5118865966796875, -0.4627685546875, -0.4136505126953125, -0.364532470703125, -0.3154144287109375, -0.26629638671875, -0.2171783447265625, -0.168060302734375, -0.1189422607421875, -0.06982421875, -0.0207061767578125, 0.028411865234375, 0.0775299072265625, 0.12664794921875, 0.1757659912109375, 0.224884033203125, 0.2740020751953125, 0.3231201171875, 0.3722381591796875, 0.421356201171875, 0.4704742431640625, 0.51959228515625, 0.5687103271484375, 0.617828369140625, 0.6669464111328125, 0.716064453125, 0.7651824951171875, 0.814300537109375, 0.8634185791015625, 0.91253662109375, 0.9616546630859375, 1.010772705078125, 1.0598907470703125, 1.1090087890625, 1.1581268310546875, 1.207244873046875, 1.2563629150390625, 1.30548095703125, 1.3545989990234375, 1.403717041015625, 1.4528350830078125, 1.501953125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 9.0, 11.0, 14.0, 18.0, 25.0, 35.0, 52.0, 60.0, 63.0, 85.0, 89.0, 92.0, 77.0, 94.0, 56.0, 49.0, 49.0, 42.0, 22.0, 22.0, 9.0, 8.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6497344970703125, -0.624176025390625, -0.5986175537109375, -0.57305908203125, -0.5475006103515625, -0.521942138671875, -0.4963836669921875, -0.4708251953125, -0.4452667236328125, -0.419708251953125, -0.3941497802734375, -0.36859130859375, -0.3430328369140625, -0.317474365234375, -0.2919158935546875, -0.266357421875, -0.2407989501953125, -0.215240478515625, -0.1896820068359375, -0.16412353515625, -0.1385650634765625, -0.113006591796875, -0.0874481201171875, -0.0618896484375, -0.0363311767578125, -0.010772705078125, 0.0147857666015625, 0.04034423828125, 0.0659027099609375, 0.091461181640625, 0.1170196533203125, 0.142578125, 0.1681365966796875, 0.193695068359375, 0.2192535400390625, 0.24481201171875, 0.2703704833984375, 0.295928955078125, 0.3214874267578125, 0.3470458984375, 0.3726043701171875, 0.398162841796875, 0.4237213134765625, 0.44927978515625, 0.4748382568359375, 0.500396728515625, 0.5259552001953125, 0.551513671875, 0.5770721435546875, 0.602630615234375, 0.6281890869140625, 0.65374755859375, 0.6793060302734375, 0.704864501953125, 0.7304229736328125, 0.7559814453125, 0.7815399169921875, 0.807098388671875, 0.8326568603515625, 0.85821533203125, 0.8837738037109375, 0.909332275390625, 0.9348907470703125, 0.96044921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 4.0, 12.0, 13.0, 8.0, 22.0, 31.0, 41.0, 37.0, 48.0, 111.0, 152.0, 220.0, 395.0, 768.0, 1806.0, 5749.0, 28573.0, 292724.0, 635094.0, 67610.0, 9957.0, 2708.0, 1105.0, 517.0, 311.0, 154.0, 101.0, 69.0, 61.0, 33.0, 32.0, 23.0, 14.0, 18.0, 9.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.968170166015625, -1.90509033203125, -1.842010498046875, -1.7789306640625, -1.715850830078125, -1.65277099609375, -1.589691162109375, -1.526611328125, -1.463531494140625, -1.40045166015625, -1.337371826171875, -1.2742919921875, -1.211212158203125, -1.14813232421875, -1.085052490234375, -1.02197265625, -0.958892822265625, -0.89581298828125, -0.832733154296875, -0.7696533203125, -0.706573486328125, -0.64349365234375, -0.580413818359375, -0.517333984375, -0.454254150390625, -0.39117431640625, -0.328094482421875, -0.2650146484375, -0.201934814453125, -0.13885498046875, -0.075775146484375, -0.0126953125, 0.050384521484375, 0.11346435546875, 0.176544189453125, 0.2396240234375, 0.302703857421875, 0.36578369140625, 0.428863525390625, 0.491943359375, 0.555023193359375, 0.61810302734375, 0.681182861328125, 0.7442626953125, 0.807342529296875, 0.87042236328125, 0.933502197265625, 0.99658203125, 1.059661865234375, 1.12274169921875, 1.185821533203125, 1.2489013671875, 1.311981201171875, 1.37506103515625, 1.438140869140625, 1.501220703125, 1.564300537109375, 1.62738037109375, 1.690460205078125, 1.7535400390625, 1.816619873046875, 1.87969970703125, 1.942779541015625, 2.005859375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 11.0, 10.0, 15.0, 15.0, 13.0, 28.0, 28.0, 30.0, 36.0, 44.0, 41.0, 41.0, 59.0, 61.0, 57.0, 49.0, 56.0, 56.0, 44.0, 57.0, 50.0, 37.0, 37.0, 22.0, 22.0, 21.0, 16.0, 12.0, 1.0, 5.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.391998291015625, -2.31915283203125, -2.246307373046875, -2.1734619140625, -2.100616455078125, -2.02777099609375, -1.954925537109375, -1.882080078125, -1.809234619140625, -1.73638916015625, -1.663543701171875, -1.5906982421875, -1.517852783203125, -1.44500732421875, -1.372161865234375, -1.29931640625, -1.226470947265625, -1.15362548828125, -1.080780029296875, -1.0079345703125, -0.935089111328125, -0.86224365234375, -0.789398193359375, -0.716552734375, -0.643707275390625, -0.57086181640625, -0.498016357421875, -0.4251708984375, -0.352325439453125, -0.27947998046875, -0.206634521484375, -0.1337890625, -0.060943603515625, 0.01190185546875, 0.084747314453125, 0.1575927734375, 0.230438232421875, 0.30328369140625, 0.376129150390625, 0.448974609375, 0.521820068359375, 0.59466552734375, 0.667510986328125, 0.7403564453125, 0.813201904296875, 0.88604736328125, 0.958892822265625, 1.03173828125, 1.104583740234375, 1.17742919921875, 1.250274658203125, 1.3231201171875, 1.395965576171875, 1.46881103515625, 1.541656494140625, 1.614501953125, 1.687347412109375, 1.76019287109375, 1.833038330078125, 1.9058837890625, 1.978729248046875, 2.05157470703125, 2.124420166015625, 2.197265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 11.0, 19.0, 17.0, 35.0, 42.0, 99.0, 142.0, 284.0, 604.0, 1401.0, 4762.0, 36000.0, 708524.0, 275783.0, 15865.0, 2942.0, 1034.0, 401.0, 256.0, 114.0, 76.0, 48.0, 26.0, 19.0, 13.0, 6.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.806640625, -0.783477783203125, -0.76031494140625, -0.737152099609375, -0.7139892578125, -0.690826416015625, -0.66766357421875, -0.644500732421875, -0.621337890625, -0.598175048828125, -0.57501220703125, -0.551849365234375, -0.5286865234375, -0.505523681640625, -0.48236083984375, -0.459197998046875, -0.43603515625, -0.412872314453125, -0.38970947265625, -0.366546630859375, -0.3433837890625, -0.320220947265625, -0.29705810546875, -0.273895263671875, -0.250732421875, -0.227569580078125, -0.20440673828125, -0.181243896484375, -0.1580810546875, -0.134918212890625, -0.11175537109375, -0.088592529296875, -0.0654296875, -0.042266845703125, -0.01910400390625, 0.004058837890625, 0.0272216796875, 0.050384521484375, 0.07354736328125, 0.096710205078125, 0.119873046875, 0.143035888671875, 0.16619873046875, 0.189361572265625, 0.2125244140625, 0.235687255859375, 0.25885009765625, 0.282012939453125, 0.30517578125, 0.328338623046875, 0.35150146484375, 0.374664306640625, 0.3978271484375, 0.420989990234375, 0.44415283203125, 0.467315673828125, 0.490478515625, 0.513641357421875, 0.53680419921875, 0.559967041015625, 0.5831298828125, 0.606292724609375, 0.62945556640625, 0.652618408203125, 0.67578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 4.0, 10.0, 8.0, 10.0, 20.0, 25.0, 22.0, 20.0, 42.0, 54.0, 58.0, 65.0, 80.0, 90.0, 79.0, 80.0, 79.0, 47.0, 44.0, 32.0, 21.0, 22.0, 15.0, 22.0, 16.0, 5.0, 5.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.577108383178711e-05, -8.344557136297226e-05, -8.112005889415741e-05, -7.879454642534256e-05, -7.646903395652771e-05, -7.414352148771286e-05, -7.181800901889801e-05, -6.949249655008316e-05, -6.716698408126831e-05, -6.484147161245346e-05, -6.251595914363861e-05, -6.019044667482376e-05, -5.786493420600891e-05, -5.553942173719406e-05, -5.321390926837921e-05, -5.088839679956436e-05, -4.856288433074951e-05, -4.623737186193466e-05, -4.391185939311981e-05, -4.158634692430496e-05, -3.926083445549011e-05, -3.693532198667526e-05, -3.460980951786041e-05, -3.228429704904556e-05, -2.9958784580230713e-05, -2.7633272111415863e-05, -2.5307759642601013e-05, -2.2982247173786163e-05, -2.0656734704971313e-05, -1.8331222236156464e-05, -1.6005709767341614e-05, -1.3680197298526764e-05, -1.1354684829711914e-05, -9.029172360897064e-06, -6.703659892082214e-06, -4.3781474232673645e-06, -2.0526349544525146e-06, 2.728775143623352e-07, 2.598389983177185e-06, 4.923902451992035e-06, 7.249414920806885e-06, 9.574927389621735e-06, 1.1900439858436584e-05, 1.4225952327251434e-05, 1.6551464796066284e-05, 1.8876977264881134e-05, 2.1202489733695984e-05, 2.3528002202510834e-05, 2.5853514671325684e-05, 2.8179027140140533e-05, 3.0504539608955383e-05, 3.283005207777023e-05, 3.515556454658508e-05, 3.748107701539993e-05, 3.980658948421478e-05, 4.213210195302963e-05, 4.445761442184448e-05, 4.678312689065933e-05, 4.910863935947418e-05, 5.143415182828903e-05, 5.375966429710388e-05, 5.608517676591873e-05, 5.841068923473358e-05, 6.073620170354843e-05, 6.306171417236328e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 17.0, 17.0, 23.0, 34.0, 68.0, 152.0, 314.0, 781.0, 2696.0, 19631.0, 642307.0, 366499.0, 12659.0, 2094.0, 647.0, 277.0, 140.0, 67.0, 43.0, 29.0, 17.0, 11.0, 8.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7205886840820312, -0.6916656494140625, -0.6627426147460938, -0.633819580078125, -0.6048965454101562, -0.5759735107421875, -0.5470504760742188, -0.51812744140625, -0.48920440673828125, -0.4602813720703125, -0.43135833740234375, -0.402435302734375, -0.37351226806640625, -0.3445892333984375, -0.31566619873046875, -0.2867431640625, -0.25782012939453125, -0.2288970947265625, -0.19997406005859375, -0.171051025390625, -0.14212799072265625, -0.1132049560546875, -0.08428192138671875, -0.05535888671875, -0.02643585205078125, 0.0024871826171875, 0.03141021728515625, 0.060333251953125, 0.08925628662109375, 0.1181793212890625, 0.14710235595703125, 0.176025390625, 0.20494842529296875, 0.2338714599609375, 0.26279449462890625, 0.291717529296875, 0.32064056396484375, 0.3495635986328125, 0.37848663330078125, 0.40740966796875, 0.43633270263671875, 0.4652557373046875, 0.49417877197265625, 0.523101806640625, 0.5520248413085938, 0.5809478759765625, 0.6098709106445312, 0.6387939453125, 0.6677169799804688, 0.6966400146484375, 0.7255630493164062, 0.754486083984375, 0.7834091186523438, 0.8123321533203125, 0.8412551879882812, 0.87017822265625, 0.8991012573242188, 0.9280242919921875, 0.9569473266601562, 0.985870361328125, 1.0147933959960938, 1.0437164306640625, 1.0726394653320312, 1.1015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 0.0, 2.0, 9.0, 7.0, 11.0, 14.0, 23.0, 30.0, 39.0, 51.0, 58.0, 56.0, 81.0, 110.0, 100.0, 95.0, 80.0, 63.0, 44.0, 27.0, 22.0, 18.0, 17.0, 11.0, 7.0, 6.0, 7.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4180488586425781, -0.39884185791015625, -0.3796348571777344, -0.3604278564453125, -0.3412208557128906, -0.32201385498046875, -0.3028068542480469, -0.283599853515625, -0.2643928527832031, -0.24518585205078125, -0.22597885131835938, -0.2067718505859375, -0.18756484985351562, -0.16835784912109375, -0.14915084838867188, -0.12994384765625, -0.11073684692382812, -0.09152984619140625, -0.07232284545898438, -0.0531158447265625, -0.033908843994140625, -0.01470184326171875, 0.004505157470703125, 0.023712158203125, 0.042919158935546875, 0.06212615966796875, 0.08133316040039062, 0.1005401611328125, 0.11974716186523438, 0.13895416259765625, 0.15816116333007812, 0.1773681640625, 0.19657516479492188, 0.21578216552734375, 0.23498916625976562, 0.2541961669921875, 0.2734031677246094, 0.29261016845703125, 0.3118171691894531, 0.331024169921875, 0.3502311706542969, 0.36943817138671875, 0.3886451721191406, 0.4078521728515625, 0.4270591735839844, 0.44626617431640625, 0.4654731750488281, 0.48468017578125, 0.5038871765136719, 0.5230941772460938, 0.5423011779785156, 0.5615081787109375, 0.5807151794433594, 0.5999221801757812, 0.6191291809082031, 0.638336181640625, 0.6575431823730469, 0.6767501831054688, 0.6959571838378906, 0.7151641845703125, 0.7343711853027344, 0.7535781860351562, 0.7727851867675781, 0.7919921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 13.0, 18.0, 23.0, 42.0, 86.0, 94.0, 132.0, 147.0, 141.0, 123.0, 79.0, 42.0, 29.0, 10.0, 12.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.766450881958008, -12.386005401611328, -12.005559921264648, -11.625114440917969, -11.244668006896973, -10.864222526550293, -10.483777046203613, -10.103331565856934, -9.722885131835938, -9.342439651489258, -8.961994171142578, -8.581548690795898, -8.201102256774902, -7.820656776428223, -7.440211296081543, -7.059765815734863, -6.679320335388184, -6.298874855041504, -5.918428897857666, -5.537983417510986, -5.157537460327148, -4.777091979980469, -4.396646499633789, -4.016201019287109, -3.6357550621032715, -3.2553093433380127, -2.874863624572754, -2.494418144226074, -2.1139724254608154, -1.7335267066955566, -1.353081226348877, -0.9726355075836182, -0.5921897888183594, -0.21174412965774536, 0.16870152950286865, 0.5491471290588379, 0.9295928478240967, 1.3100385665893555, 1.6904840469360352, 2.070929765701294, 2.4513754844665527, 2.8318212032318115, 3.2122669219970703, 3.59271240234375, 3.973158121109009, 4.353603839874268, 4.734049320220947, 5.114495277404785, 5.494940757751465, 5.8753862380981445, 6.255832195281982, 6.636277675628662, 7.0167236328125, 7.39716911315918, 7.777614593505859, 8.158060073852539, 8.538505554199219, 8.918951034545898, 9.299396514892578, 9.679841995239258, 10.060288429260254, 10.440733909606934, 10.821179389953613, 11.201624870300293, 11.582071304321289]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 0.0, 3.0, 6.0, 11.0, 8.0, 19.0, 20.0, 25.0, 27.0, 44.0, 66.0, 54.0, 63.0, 70.0, 69.0, 65.0, 64.0, 67.0, 51.0, 53.0, 37.0, 37.0, 27.0, 30.0, 20.0, 12.0, 15.0, 6.0, 11.0, 5.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.205841064453125, -13.823945045471191, -13.442049026489258, -13.06015396118164, -12.678257942199707, -12.296361923217773, -11.91446590423584, -11.532569885253906, -11.150674819946289, -10.768778800964355, -10.386882781982422, -10.004987716674805, -9.623091697692871, -9.241195678710938, -8.859299659729004, -8.47740364074707, -8.095507621765137, -7.713611602783203, -7.331716060638428, -6.949820041656494, -6.567924499511719, -6.186028480529785, -5.804132461547852, -5.422236442565918, -5.040340900421143, -4.658444881439209, -4.276549339294434, -3.8946533203125, -3.5127575397491455, -3.130861759185791, -2.7489657402038574, -2.367069959640503, -1.9851751327514648, -1.6032793521881104, -1.2213834524154663, -0.8394875526428223, -0.4575917720794678, -0.07569599151611328, 0.3062000274658203, 0.6880958080291748, 1.0699915885925293, 1.4518873691558838, 1.8337832689285278, 2.215679168701172, 2.5975749492645264, 2.979470729827881, 3.3613667488098145, 3.743262529373169, 4.125158309936523, 4.507054328918457, 4.888949871063232, 5.270845890045166, 5.652741432189941, 6.034637451171875, 6.416533470153809, 6.798429489135742, 7.180325031280518, 7.562221050262451, 7.944116592407227, 8.32601261138916, 8.707908630371094, 9.089803695678711, 9.471700668334961, 9.853595733642578, 10.235491752624512]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 7.0, 11.0, 11.0, 17.0, 18.0, 21.0, 38.0, 69.0, 96.0, 183.0, 427.0, 1098.0, 3735.0, 18700.0, 400397.0, 3699672.0, 59432.0, 7446.0, 1771.0, 530.0, 239.0, 107.0, 87.0, 40.0, 29.0, 24.0, 20.0, 11.0, 10.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.904296875, -1.8531646728515625, -1.802032470703125, -1.7509002685546875, -1.69976806640625, -1.6486358642578125, -1.597503662109375, -1.5463714599609375, -1.4952392578125, -1.4441070556640625, -1.392974853515625, -1.3418426513671875, -1.29071044921875, -1.2395782470703125, -1.188446044921875, -1.1373138427734375, -1.086181640625, -1.0350494384765625, -0.983917236328125, -0.9327850341796875, -0.88165283203125, -0.8305206298828125, -0.779388427734375, -0.7282562255859375, -0.6771240234375, -0.6259918212890625, -0.574859619140625, -0.5237274169921875, -0.47259521484375, -0.4214630126953125, -0.370330810546875, -0.3191986083984375, -0.26806640625, -0.2169342041015625, -0.165802001953125, -0.1146697998046875, -0.06353759765625, -0.0124053955078125, 0.038726806640625, 0.0898590087890625, 0.1409912109375, 0.1921234130859375, 0.243255615234375, 0.2943878173828125, 0.34552001953125, 0.3966522216796875, 0.447784423828125, 0.4989166259765625, 0.550048828125, 0.6011810302734375, 0.652313232421875, 0.7034454345703125, 0.75457763671875, 0.8057098388671875, 0.856842041015625, 0.9079742431640625, 0.9591064453125, 1.0102386474609375, 1.061370849609375, 1.1125030517578125, 1.16363525390625, 1.2147674560546875, 1.265899658203125, 1.3170318603515625, 1.3681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 7.0, 6.0, 16.0, 15.0, 19.0, 23.0, 23.0, 29.0, 36.0, 42.0, 42.0, 44.0, 55.0, 57.0, 62.0, 73.0, 49.0, 68.0, 42.0, 48.0, 59.0, 40.0, 38.0, 21.0, 15.0, 22.0, 12.0, 12.0, 8.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49267578125, -0.47628021240234375, -0.4598846435546875, -0.44348907470703125, -0.427093505859375, -0.41069793701171875, -0.3943023681640625, -0.37790679931640625, -0.36151123046875, -0.34511566162109375, -0.3287200927734375, -0.31232452392578125, -0.295928955078125, -0.27953338623046875, -0.2631378173828125, -0.24674224853515625, -0.2303466796875, -0.21395111083984375, -0.1975555419921875, -0.18115997314453125, -0.164764404296875, -0.14836883544921875, -0.1319732666015625, -0.11557769775390625, -0.09918212890625, -0.08278656005859375, -0.0663909912109375, -0.04999542236328125, -0.033599853515625, -0.01720428466796875, -0.0008087158203125, 0.01558685302734375, 0.031982421875, 0.04837799072265625, 0.0647735595703125, 0.08116912841796875, 0.097564697265625, 0.11396026611328125, 0.1303558349609375, 0.14675140380859375, 0.16314697265625, 0.17954254150390625, 0.1959381103515625, 0.21233367919921875, 0.228729248046875, 0.24512481689453125, 0.2615203857421875, 0.27791595458984375, 0.2943115234375, 0.31070709228515625, 0.3271026611328125, 0.34349822998046875, 0.359893798828125, 0.37628936767578125, 0.3926849365234375, 0.40908050537109375, 0.42547607421875, 0.44187164306640625, 0.4582672119140625, 0.47466278076171875, 0.491058349609375, 0.5074539184570312, 0.5238494873046875, 0.5402450561523438, 0.556640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 9.0, 25.0, 20.0, 32.0, 76.0, 150.0, 376.0, 1869.0, 14956.0, 1293940.0, 2861273.0, 18560.0, 2238.0, 457.0, 125.0, 61.0, 39.0, 23.0, 18.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.251953125, -2.171630859375, -2.09130859375, -2.010986328125, -1.9306640625, -1.850341796875, -1.77001953125, -1.689697265625, -1.609375, -1.529052734375, -1.44873046875, -1.368408203125, -1.2880859375, -1.207763671875, -1.12744140625, -1.047119140625, -0.966796875, -0.886474609375, -0.80615234375, -0.725830078125, -0.6455078125, -0.565185546875, -0.48486328125, -0.404541015625, -0.32421875, -0.243896484375, -0.16357421875, -0.083251953125, -0.0029296875, 0.077392578125, 0.15771484375, 0.238037109375, 0.318359375, 0.398681640625, 0.47900390625, 0.559326171875, 0.6396484375, 0.719970703125, 0.80029296875, 0.880615234375, 0.9609375, 1.041259765625, 1.12158203125, 1.201904296875, 1.2822265625, 1.362548828125, 1.44287109375, 1.523193359375, 1.603515625, 1.683837890625, 1.76416015625, 1.844482421875, 1.9248046875, 2.005126953125, 2.08544921875, 2.165771484375, 2.24609375, 2.326416015625, 2.40673828125, 2.487060546875, 2.5673828125, 2.647705078125, 2.72802734375, 2.808349609375, 2.888671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 13.0, 11.0, 8.0, 10.0, 18.0, 26.0, 37.0, 70.0, 141.0, 323.0, 850.0, 1229.0, 623.0, 257.0, 142.0, 80.0, 57.0, 34.0, 28.0, 24.0, 17.0, 13.0, 8.0, 8.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.2490234375, -1.2127227783203125, -1.176422119140625, -1.1401214599609375, -1.10382080078125, -1.0675201416015625, -1.031219482421875, -0.9949188232421875, -0.9586181640625, -0.9223175048828125, -0.886016845703125, -0.8497161865234375, -0.81341552734375, -0.7771148681640625, -0.740814208984375, -0.7045135498046875, -0.668212890625, -0.6319122314453125, -0.595611572265625, -0.5593109130859375, -0.52301025390625, -0.4867095947265625, -0.450408935546875, -0.4141082763671875, -0.3778076171875, -0.3415069580078125, -0.305206298828125, -0.2689056396484375, -0.23260498046875, -0.1963043212890625, -0.160003662109375, -0.1237030029296875, -0.08740234375, -0.0511016845703125, -0.014801025390625, 0.0214996337890625, 0.05780029296875, 0.0941009521484375, 0.130401611328125, 0.1667022705078125, 0.2030029296875, 0.2393035888671875, 0.275604248046875, 0.3119049072265625, 0.34820556640625, 0.3845062255859375, 0.420806884765625, 0.4571075439453125, 0.493408203125, 0.5297088623046875, 0.566009521484375, 0.6023101806640625, 0.63861083984375, 0.6749114990234375, 0.711212158203125, 0.7475128173828125, 0.7838134765625, 0.8201141357421875, 0.856414794921875, 0.8927154541015625, 0.92901611328125, 0.9653167724609375, 1.001617431640625, 1.0379180908203125, 1.07421875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 7.0, 14.0, 26.0, 37.0, 49.0, 104.0, 153.0, 166.0, 127.0, 119.0, 69.0, 41.0, 17.0, 21.0, 14.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.436581611633301, -5.194671154022217, -4.952760219573975, -4.710849761962891, -4.468938827514648, -4.2270283699035645, -3.9851179122924805, -3.7432072162628174, -3.5012965202331543, -3.259385824203491, -3.017475128173828, -2.775564670562744, -2.533653974533081, -2.291743278503418, -2.049832820892334, -1.807922124862671, -1.5660114288330078, -1.3241007328033447, -1.0821901559829712, -0.8402795195579529, -0.5983688831329346, -0.3564581871032715, -0.11454761028289795, 0.12736296653747559, 0.36927366256713867, 0.611184298992157, 0.8530949354171753, 1.0950055122375488, 1.336916208267212, 1.578826904296875, 1.8207374811172485, 2.062648057937622, 2.304558753967285, 2.5464694499969482, 2.7883801460266113, 3.0302906036376953, 3.2722012996673584, 3.5141119956970215, 3.7560224533081055, 3.9979331493377686, 4.239843845367432, 4.481754302978516, 4.723665237426758, 4.965575695037842, 5.207486152648926, 5.449397087097168, 5.691307544708252, 5.933218002319336, 6.175128936767578, 6.417039394378662, 6.658950328826904, 6.900860786437988, 7.1427717208862305, 7.3846821784973145, 7.626592636108398, 7.868503570556641, 8.110414505004883, 8.352325439453125, 8.59423542022705, 8.836146354675293, 9.078057289123535, 9.319967269897461, 9.561878204345703, 9.803789138793945, 10.045699119567871]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 6.0, 8.0, 4.0, 6.0, 6.0, 8.0, 11.0, 16.0, 15.0, 24.0, 22.0, 17.0, 35.0, 37.0, 35.0, 36.0, 46.0, 35.0, 55.0, 50.0, 59.0, 56.0, 39.0, 51.0, 48.0, 47.0, 27.0, 46.0, 29.0, 24.0, 13.0, 18.0, 15.0, 17.0, 17.0, 10.0, 0.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.054336071014404, -4.8941826820373535, -4.734029293060303, -4.57387638092041, -4.413722991943359, -4.253569602966309, -4.093416213989258, -3.933262825012207, -3.7731096744537354, -3.6129562854766846, -3.452803134918213, -3.292649745941162, -3.1324963569641113, -2.9723432064056396, -2.812189817428589, -2.652036666870117, -2.4918832778930664, -2.3317298889160156, -2.171576738357544, -2.011423349380493, -1.851270079612732, -1.6911168098449707, -1.53096342086792, -1.3708101511001587, -1.2106568813323975, -1.0505036115646362, -0.8903502821922302, -0.7301969528198242, -0.570043683052063, -0.40989041328430176, -0.24973708391189575, -0.08958375453948975, 0.07056951522827148, 0.2307228147983551, 0.3908761143684387, 0.5510294437408447, 0.711182713508606, 0.8713359832763672, 1.031489372253418, 1.1916426420211792, 1.3517959117889404, 1.5119491815567017, 1.672102451324463, 1.8322558403015137, 1.992409110069275, 2.152562379837036, 2.312715768814087, 2.4728689193725586, 2.6330223083496094, 2.79317569732666, 2.953328847885132, 3.1134822368621826, 3.2736353874206543, 3.433788776397705, 3.593942165374756, 3.7540955543518066, 3.9142487049102783, 4.07440185546875, 4.234555244445801, 4.394708633422852, 4.554862022399902, 4.715015411376953, 4.875168323516846, 5.0353217124938965, 5.195475101470947]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 18.0, 36.0, 43.0, 60.0, 117.0, 189.0, 359.0, 644.0, 1299.0, 2778.0, 6281.0, 15842.0, 42752.0, 122893.0, 326856.0, 331217.0, 125572.0, 43379.0, 15980.0, 6479.0, 2808.0, 1384.0, 708.0, 365.0, 196.0, 108.0, 72.0, 36.0, 33.0, 12.0, 11.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.783203125, -0.7587356567382812, -0.7342681884765625, -0.7098007202148438, -0.685333251953125, -0.6608657836914062, -0.6363983154296875, -0.6119308471679688, -0.58746337890625, -0.5629959106445312, -0.5385284423828125, -0.5140609741210938, -0.489593505859375, -0.46512603759765625, -0.4406585693359375, -0.41619110107421875, -0.3917236328125, -0.36725616455078125, -0.3427886962890625, -0.31832122802734375, -0.293853759765625, -0.26938629150390625, -0.2449188232421875, -0.22045135498046875, -0.19598388671875, -0.17151641845703125, -0.1470489501953125, -0.12258148193359375, -0.098114013671875, -0.07364654541015625, -0.0491790771484375, -0.02471160888671875, -0.000244140625, 0.02422332763671875, 0.0486907958984375, 0.07315826416015625, 0.097625732421875, 0.12209320068359375, 0.1465606689453125, 0.17102813720703125, 0.19549560546875, 0.21996307373046875, 0.2444305419921875, 0.26889801025390625, 0.293365478515625, 0.31783294677734375, 0.3423004150390625, 0.36676788330078125, 0.3912353515625, 0.41570281982421875, 0.4401702880859375, 0.46463775634765625, 0.489105224609375, 0.5135726928710938, 0.5380401611328125, 0.5625076293945312, 0.58697509765625, 0.6114425659179688, 0.6359100341796875, 0.6603775024414062, 0.684844970703125, 0.7093124389648438, 0.7337799072265625, 0.7582473754882812, 0.78271484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 2.0, 12.0, 7.0, 20.0, 15.0, 29.0, 28.0, 30.0, 32.0, 36.0, 40.0, 50.0, 60.0, 56.0, 58.0, 76.0, 60.0, 58.0, 52.0, 49.0, 38.0, 33.0, 44.0, 27.0, 18.0, 12.0, 18.0, 11.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.402099609375, -0.3860588073730469, -0.37001800537109375, -0.3539772033691406, -0.3379364013671875, -0.3218955993652344, -0.30585479736328125, -0.2898139953613281, -0.273773193359375, -0.2577323913574219, -0.24169158935546875, -0.22565078735351562, -0.2096099853515625, -0.19356918334960938, -0.17752838134765625, -0.16148757934570312, -0.14544677734375, -0.12940597534179688, -0.11336517333984375, -0.09732437133789062, -0.0812835693359375, -0.06524276733398438, -0.04920196533203125, -0.033161163330078125, -0.017120361328125, -0.001079559326171875, 0.01496124267578125, 0.031002044677734375, 0.0470428466796875, 0.06308364868164062, 0.07912445068359375, 0.09516525268554688, 0.1112060546875, 0.12724685668945312, 0.14328765869140625, 0.15932846069335938, 0.1753692626953125, 0.19141006469726562, 0.20745086669921875, 0.22349166870117188, 0.239532470703125, 0.2555732727050781, 0.27161407470703125, 0.2876548767089844, 0.3036956787109375, 0.3197364807128906, 0.33577728271484375, 0.3518180847167969, 0.36785888671875, 0.3838996887207031, 0.39994049072265625, 0.4159812927246094, 0.4320220947265625, 0.4480628967285156, 0.46410369873046875, 0.4801445007324219, 0.496185302734375, 0.5122261047363281, 0.5282669067382812, 0.5443077087402344, 0.5603485107421875, 0.5763893127441406, 0.5924301147460938, 0.6084709167480469, 0.62451171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 15.0, 14.0, 32.0, 56.0, 83.0, 192.0, 432.0, 1286.0, 5336.0, 83530.0, 906973.0, 44845.0, 3962.0, 1043.0, 385.0, 169.0, 65.0, 57.0, 26.0, 23.0, 12.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.927276611328125, -2.83697509765625, -2.746673583984375, -2.6563720703125, -2.566070556640625, -2.47576904296875, -2.385467529296875, -2.295166015625, -2.204864501953125, -2.11456298828125, -2.024261474609375, -1.9339599609375, -1.843658447265625, -1.75335693359375, -1.663055419921875, -1.57275390625, -1.482452392578125, -1.39215087890625, -1.301849365234375, -1.2115478515625, -1.121246337890625, -1.03094482421875, -0.940643310546875, -0.850341796875, -0.760040283203125, -0.66973876953125, -0.579437255859375, -0.4891357421875, -0.398834228515625, -0.30853271484375, -0.218231201171875, -0.1279296875, -0.037628173828125, 0.05267333984375, 0.142974853515625, 0.2332763671875, 0.323577880859375, 0.41387939453125, 0.504180908203125, 0.594482421875, 0.684783935546875, 0.77508544921875, 0.865386962890625, 0.9556884765625, 1.045989990234375, 1.13629150390625, 1.226593017578125, 1.31689453125, 1.407196044921875, 1.49749755859375, 1.587799072265625, 1.6781005859375, 1.768402099609375, 1.85870361328125, 1.949005126953125, 2.039306640625, 2.129608154296875, 2.21990966796875, 2.310211181640625, 2.4005126953125, 2.490814208984375, 2.58111572265625, 2.671417236328125, 2.76171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 14.0, 20.0, 14.0, 16.0, 23.0, 29.0, 25.0, 27.0, 32.0, 36.0, 39.0, 45.0, 43.0, 37.0, 56.0, 60.0, 49.0, 55.0, 46.0, 38.0, 33.0, 43.0, 32.0, 28.0, 31.0, 23.0, 22.0, 12.0, 4.0, 5.0, 10.0, 7.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.65234375, -1.59686279296875, -1.5413818359375, -1.48590087890625, -1.430419921875, -1.37493896484375, -1.3194580078125, -1.26397705078125, -1.20849609375, -1.15301513671875, -1.0975341796875, -1.04205322265625, -0.986572265625, -0.93109130859375, -0.8756103515625, -0.82012939453125, -0.7646484375, -0.70916748046875, -0.6536865234375, -0.59820556640625, -0.542724609375, -0.48724365234375, -0.4317626953125, -0.37628173828125, -0.32080078125, -0.26531982421875, -0.2098388671875, -0.15435791015625, -0.098876953125, -0.04339599609375, 0.0120849609375, 0.06756591796875, 0.123046875, 0.17852783203125, 0.2340087890625, 0.28948974609375, 0.344970703125, 0.40045166015625, 0.4559326171875, 0.51141357421875, 0.56689453125, 0.62237548828125, 0.6778564453125, 0.73333740234375, 0.788818359375, 0.84429931640625, 0.8997802734375, 0.95526123046875, 1.0107421875, 1.06622314453125, 1.1217041015625, 1.17718505859375, 1.232666015625, 1.28814697265625, 1.3436279296875, 1.39910888671875, 1.45458984375, 1.51007080078125, 1.5655517578125, 1.62103271484375, 1.676513671875, 1.73199462890625, 1.7874755859375, 1.84295654296875, 1.8984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 15.0, 24.0, 33.0, 56.0, 92.0, 167.0, 482.0, 2213.0, 32988.0, 976941.0, 32326.0, 2292.0, 492.0, 181.0, 89.0, 57.0, 30.0, 19.0, 11.0, 7.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.033966064453125, -0.99176025390625, -0.949554443359375, -0.9073486328125, -0.865142822265625, -0.82293701171875, -0.780731201171875, -0.738525390625, -0.696319580078125, -0.65411376953125, -0.611907958984375, -0.5697021484375, -0.527496337890625, -0.48529052734375, -0.443084716796875, -0.40087890625, -0.358673095703125, -0.31646728515625, -0.274261474609375, -0.2320556640625, -0.189849853515625, -0.14764404296875, -0.105438232421875, -0.063232421875, -0.021026611328125, 0.02117919921875, 0.063385009765625, 0.1055908203125, 0.147796630859375, 0.19000244140625, 0.232208251953125, 0.2744140625, 0.316619873046875, 0.35882568359375, 0.401031494140625, 0.4432373046875, 0.485443115234375, 0.52764892578125, 0.569854736328125, 0.612060546875, 0.654266357421875, 0.69647216796875, 0.738677978515625, 0.7808837890625, 0.823089599609375, 0.86529541015625, 0.907501220703125, 0.94970703125, 0.991912841796875, 1.03411865234375, 1.076324462890625, 1.1185302734375, 1.160736083984375, 1.20294189453125, 1.245147705078125, 1.287353515625, 1.329559326171875, 1.37176513671875, 1.413970947265625, 1.4561767578125, 1.498382568359375, 1.54058837890625, 1.582794189453125, 1.625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 6.0, 12.0, 13.0, 21.0, 25.0, 39.0, 41.0, 72.0, 70.0, 111.0, 140.0, 132.0, 78.0, 59.0, 46.0, 29.0, 18.0, 14.0, 9.0, 6.0, 15.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.255243301391602e-05, -7.983110845088959e-05, -7.710978388786316e-05, -7.438845932483673e-05, -7.16671347618103e-05, -6.894581019878387e-05, -6.622448563575745e-05, -6.350316107273102e-05, -6.078183650970459e-05, -5.806051194667816e-05, -5.5339187383651733e-05, -5.2617862820625305e-05, -4.989653825759888e-05, -4.717521369457245e-05, -4.445388913154602e-05, -4.173256456851959e-05, -3.9011240005493164e-05, -3.6289915442466736e-05, -3.356859087944031e-05, -3.084726631641388e-05, -2.812594175338745e-05, -2.5404617190361023e-05, -2.2683292627334595e-05, -1.9961968064308167e-05, -1.7240643501281738e-05, -1.451931893825531e-05, -1.1797994375228882e-05, -9.076669812202454e-06, -6.355345249176025e-06, -3.634020686149597e-06, -9.126961231231689e-07, 1.8086284399032593e-06, 4.5299530029296875e-06, 7.251277565956116e-06, 9.972602128982544e-06, 1.2693926692008972e-05, 1.54152512550354e-05, 1.813657581806183e-05, 2.0857900381088257e-05, 2.3579224944114685e-05, 2.6300549507141113e-05, 2.902187407016754e-05, 3.174319863319397e-05, 3.44645231962204e-05, 3.7185847759246826e-05, 3.9907172322273254e-05, 4.262849688529968e-05, 4.534982144832611e-05, 4.807114601135254e-05, 5.079247057437897e-05, 5.3513795137405396e-05, 5.6235119700431824e-05, 5.895644426345825e-05, 6.167776882648468e-05, 6.439909338951111e-05, 6.712041795253754e-05, 6.984174251556396e-05, 7.256306707859039e-05, 7.528439164161682e-05, 7.800571620464325e-05, 8.072704076766968e-05, 8.34483653306961e-05, 8.616968989372253e-05, 8.889101445674896e-05, 9.161233901977539e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 7.0, 3.0, 5.0, 7.0, 15.0, 35.0, 52.0, 126.0, 396.0, 1372.0, 13101.0, 966863.0, 63007.0, 2612.0, 585.0, 214.0, 65.0, 39.0, 21.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7587890625, -1.710845947265625, -1.66290283203125, -1.614959716796875, -1.5670166015625, -1.519073486328125, -1.47113037109375, -1.423187255859375, -1.375244140625, -1.327301025390625, -1.27935791015625, -1.231414794921875, -1.1834716796875, -1.135528564453125, -1.08758544921875, -1.039642333984375, -0.99169921875, -0.943756103515625, -0.89581298828125, -0.847869873046875, -0.7999267578125, -0.751983642578125, -0.70404052734375, -0.656097412109375, -0.608154296875, -0.560211181640625, -0.51226806640625, -0.464324951171875, -0.4163818359375, -0.368438720703125, -0.32049560546875, -0.272552490234375, -0.224609375, -0.176666259765625, -0.12872314453125, -0.080780029296875, -0.0328369140625, 0.015106201171875, 0.06304931640625, 0.110992431640625, 0.158935546875, 0.206878662109375, 0.25482177734375, 0.302764892578125, 0.3507080078125, 0.398651123046875, 0.44659423828125, 0.494537353515625, 0.54248046875, 0.590423583984375, 0.63836669921875, 0.686309814453125, 0.7342529296875, 0.782196044921875, 0.83013916015625, 0.878082275390625, 0.926025390625, 0.973968505859375, 1.02191162109375, 1.069854736328125, 1.1177978515625, 1.165740966796875, 1.21368408203125, 1.261627197265625, 1.3095703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 7.0, 11.0, 18.0, 29.0, 26.0, 37.0, 51.0, 74.0, 117.0, 120.0, 128.0, 94.0, 79.0, 51.0, 42.0, 26.0, 22.0, 16.0, 12.0, 14.0, 7.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.5563583374023438, -0.5350799560546875, -0.5138015747070312, -0.492523193359375, -0.47124481201171875, -0.4499664306640625, -0.42868804931640625, -0.40740966796875, -0.38613128662109375, -0.3648529052734375, -0.34357452392578125, -0.322296142578125, -0.30101776123046875, -0.2797393798828125, -0.25846099853515625, -0.2371826171875, -0.21590423583984375, -0.1946258544921875, -0.17334747314453125, -0.152069091796875, -0.13079071044921875, -0.1095123291015625, -0.08823394775390625, -0.06695556640625, -0.04567718505859375, -0.0243988037109375, -0.00312042236328125, 0.018157958984375, 0.03943634033203125, 0.0607147216796875, 0.08199310302734375, 0.103271484375, 0.12454986572265625, 0.1458282470703125, 0.16710662841796875, 0.188385009765625, 0.20966339111328125, 0.2309417724609375, 0.25222015380859375, 0.27349853515625, 0.29477691650390625, 0.3160552978515625, 0.33733367919921875, 0.358612060546875, 0.37989044189453125, 0.4011688232421875, 0.42244720458984375, 0.4437255859375, 0.46500396728515625, 0.4862823486328125, 0.5075607299804688, 0.528839111328125, 0.5501174926757812, 0.5713958740234375, 0.5926742553710938, 0.61395263671875, 0.6352310180664062, 0.6565093994140625, 0.6777877807617188, 0.699066162109375, 0.7203445434570312, 0.7416229248046875, 0.7629013061523438, 0.7841796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 36.0, 174.0, 353.0, 281.0, 95.0, 38.0, 15.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5160493850708, -7.850541591644287, -7.185033798217773, -6.519525527954102, -5.854017734527588, -5.188509941101074, -4.523001670837402, -3.8574938774108887, -3.191986083984375, -2.5264782905578613, -1.8609702587127686, -1.1954623460769653, -0.5299544334411621, 0.13555335998535156, 0.8010613918304443, 1.466569423675537, 2.132077217102051, 2.7975850105285645, 3.4630930423736572, 4.12860107421875, 4.794108867645264, 5.459616661071777, 6.125124931335449, 6.790632724761963, 7.456140518188477, 8.121648788452148, 8.787156105041504, 9.452664375305176, 10.118171691894531, 10.783679962158203, 11.449188232421875, 12.114696502685547, 12.780204772949219, 13.44571304321289, 14.111220359802246, 14.776728630065918, 15.442235946655273, 16.107744216918945, 16.773252487182617, 17.43876075744629, 18.104267120361328, 18.769775390625, 19.435283660888672, 20.10079002380371, 20.766298294067383, 21.431806564331055, 22.097314834594727, 22.7628231048584, 23.42833137512207, 24.093839645385742, 24.759347915649414, 25.424854278564453, 26.090362548828125, 26.755870819091797, 27.42137908935547, 28.08688735961914, 28.752395629882812, 29.417903900146484, 30.083412170410156, 30.748918533325195, 31.414426803588867, 32.079933166503906, 32.74544143676758, 33.41094970703125, 34.07645797729492]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 9.0, 6.0, 14.0, 20.0, 16.0, 22.0, 31.0, 30.0, 40.0, 49.0, 54.0, 44.0, 61.0, 74.0, 68.0, 74.0, 71.0, 42.0, 55.0, 40.0, 32.0, 29.0, 26.0, 20.0, 15.0, 11.0, 16.0, 6.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.755620956420898, -9.486498832702637, -9.217377662658691, -8.94825553894043, -8.679133415222168, -8.410011291503906, -8.140890121459961, -7.871767997741699, -7.602646350860596, -7.333524703979492, -7.0644025802612305, -6.795280933380127, -6.526159286499023, -6.257037162780762, -5.987915515899658, -5.718793869018555, -5.449671745300293, -5.1805500984191895, -4.911427974700928, -4.642306327819824, -4.3731842041015625, -4.104062557220459, -3.8349409103393555, -3.565819025039673, -3.2966971397399902, -3.0275752544403076, -2.758453369140625, -2.4893317222595215, -2.220209836959839, -1.9510879516601562, -1.6819661855697632, -1.4128444194793701, -1.1437225341796875, -0.8746007084846497, -0.6054788827896118, -0.336357057094574, -0.06723523139953613, 0.20188665390014648, 0.47100841999053955, 0.7401301860809326, 1.0092520713806152, 1.2783739566802979, 1.547495722770691, 1.816617488861084, 2.0857393741607666, 2.354861259460449, 2.6239829063415527, 2.8931047916412354, 3.162226676940918, 3.4313485622406006, 3.700470447540283, 3.9695920944213867, 4.238714218139648, 4.507835865020752, 4.7769575119018555, 5.046079635620117, 5.315201282501221, 5.584322929382324, 5.853445053100586, 6.1225666999816895, 6.391688346862793, 6.660810470581055, 6.929932117462158, 7.199053764343262, 7.468175888061523]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 14.0, 19.0, 13.0, 30.0, 31.0, 61.0, 125.0, 253.0, 611.0, 1849.0, 10007.0, 254150.0, 3887113.0, 34383.0, 3945.0, 982.0, 305.0, 148.0, 96.0, 44.0, 25.0, 16.0, 17.0, 6.0, 13.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.2214813232421875, -1.166595458984375, -1.1117095947265625, -1.05682373046875, -1.0019378662109375, -0.947052001953125, -0.8921661376953125, -0.8372802734375, -0.7823944091796875, -0.727508544921875, -0.6726226806640625, -0.61773681640625, -0.5628509521484375, -0.507965087890625, -0.4530792236328125, -0.398193359375, -0.3433074951171875, -0.288421630859375, -0.2335357666015625, -0.17864990234375, -0.1237640380859375, -0.068878173828125, -0.0139923095703125, 0.0408935546875, 0.0957794189453125, 0.150665283203125, 0.2055511474609375, 0.26043701171875, 0.3153228759765625, 0.370208740234375, 0.4250946044921875, 0.47998046875, 0.5348663330078125, 0.589752197265625, 0.6446380615234375, 0.69952392578125, 0.7544097900390625, 0.809295654296875, 0.8641815185546875, 0.9190673828125, 0.9739532470703125, 1.028839111328125, 1.0837249755859375, 1.13861083984375, 1.1934967041015625, 1.248382568359375, 1.3032684326171875, 1.358154296875, 1.4130401611328125, 1.467926025390625, 1.5228118896484375, 1.57769775390625, 1.6325836181640625, 1.687469482421875, 1.7423553466796875, 1.7972412109375, 1.8521270751953125, 1.907012939453125, 1.9618988037109375, 2.01678466796875, 2.0716705322265625, 2.126556396484375, 2.1814422607421875, 2.236328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 7.0, 12.0, 4.0, 7.0, 13.0, 19.0, 32.0, 31.0, 31.0, 35.0, 51.0, 37.0, 49.0, 51.0, 67.0, 56.0, 61.0, 67.0, 45.0, 40.0, 43.0, 34.0, 33.0, 26.0, 31.0, 22.0, 20.0, 22.0, 13.0, 8.0, 10.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3716468811035156, -0.35730743408203125, -0.3429679870605469, -0.3286285400390625, -0.3142890930175781, -0.29994964599609375, -0.2856101989746094, -0.271270751953125, -0.2569313049316406, -0.24259185791015625, -0.22825241088867188, -0.2139129638671875, -0.19957351684570312, -0.18523406982421875, -0.17089462280273438, -0.15655517578125, -0.14221572875976562, -0.12787628173828125, -0.11353683471679688, -0.0991973876953125, -0.08485794067382812, -0.07051849365234375, -0.056179046630859375, -0.041839599609375, -0.027500152587890625, -0.01316070556640625, 0.001178741455078125, 0.0155181884765625, 0.029857635498046875, 0.04419708251953125, 0.058536529541015625, 0.0728759765625, 0.08721542358398438, 0.10155487060546875, 0.11589431762695312, 0.1302337646484375, 0.14457321166992188, 0.15891265869140625, 0.17325210571289062, 0.187591552734375, 0.20193099975585938, 0.21627044677734375, 0.23060989379882812, 0.2449493408203125, 0.2592887878417969, 0.27362823486328125, 0.2879676818847656, 0.30230712890625, 0.3166465759277344, 0.33098602294921875, 0.3453254699707031, 0.3596649169921875, 0.3740043640136719, 0.38834381103515625, 0.4026832580566406, 0.417022705078125, 0.4313621520996094, 0.44570159912109375, 0.4600410461425781, 0.4743804931640625, 0.4887199401855469, 0.5030593872070312, 0.5173988342285156, 0.53173828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 10.0, 19.0, 21.0, 37.0, 55.0, 90.0, 126.0, 237.0, 395.0, 915.0, 3320.0, 21215.0, 910249.0, 3219293.0, 32014.0, 4271.0, 1081.0, 404.0, 208.0, 113.0, 72.0, 54.0, 30.0, 16.0, 23.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5859375, -1.533233642578125, -1.48052978515625, -1.427825927734375, -1.3751220703125, -1.322418212890625, -1.26971435546875, -1.217010498046875, -1.164306640625, -1.111602783203125, -1.05889892578125, -1.006195068359375, -0.9534912109375, -0.900787353515625, -0.84808349609375, -0.795379638671875, -0.74267578125, -0.689971923828125, -0.63726806640625, -0.584564208984375, -0.5318603515625, -0.479156494140625, -0.42645263671875, -0.373748779296875, -0.321044921875, -0.268341064453125, -0.21563720703125, -0.162933349609375, -0.1102294921875, -0.057525634765625, -0.00482177734375, 0.047882080078125, 0.1005859375, 0.153289794921875, 0.20599365234375, 0.258697509765625, 0.3114013671875, 0.364105224609375, 0.41680908203125, 0.469512939453125, 0.522216796875, 0.574920654296875, 0.62762451171875, 0.680328369140625, 0.7330322265625, 0.785736083984375, 0.83843994140625, 0.891143798828125, 0.94384765625, 0.996551513671875, 1.04925537109375, 1.101959228515625, 1.1546630859375, 1.207366943359375, 1.26007080078125, 1.312774658203125, 1.365478515625, 1.418182373046875, 1.47088623046875, 1.523590087890625, 1.5762939453125, 1.628997802734375, 1.68170166015625, 1.734405517578125, 1.787109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 21.0, 16.0, 22.0, 34.0, 64.0, 168.0, 371.0, 1097.0, 1390.0, 478.0, 185.0, 99.0, 52.0, 20.0, 18.0, 5.0, 9.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.517578125, -1.4787750244140625, -1.439971923828125, -1.4011688232421875, -1.36236572265625, -1.3235626220703125, -1.284759521484375, -1.2459564208984375, -1.2071533203125, -1.1683502197265625, -1.129547119140625, -1.0907440185546875, -1.05194091796875, -1.0131378173828125, -0.974334716796875, -0.9355316162109375, -0.896728515625, -0.8579254150390625, -0.819122314453125, -0.7803192138671875, -0.74151611328125, -0.7027130126953125, -0.663909912109375, -0.6251068115234375, -0.5863037109375, -0.5475006103515625, -0.508697509765625, -0.4698944091796875, -0.43109130859375, -0.3922882080078125, -0.353485107421875, -0.3146820068359375, -0.27587890625, -0.2370758056640625, -0.198272705078125, -0.1594696044921875, -0.12066650390625, -0.0818634033203125, -0.043060302734375, -0.0042572021484375, 0.0345458984375, 0.0733489990234375, 0.112152099609375, 0.1509552001953125, 0.18975830078125, 0.2285614013671875, 0.267364501953125, 0.3061676025390625, 0.344970703125, 0.3837738037109375, 0.422576904296875, 0.4613800048828125, 0.50018310546875, 0.5389862060546875, 0.577789306640625, 0.6165924072265625, 0.6553955078125, 0.6941986083984375, 0.733001708984375, 0.7718048095703125, 0.81060791015625, 0.8494110107421875, 0.888214111328125, 0.9270172119140625, 0.9658203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 17.0, 25.0, 59.0, 114.0, 210.0, 243.0, 172.0, 84.0, 34.0, 17.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.057815551757812, -11.742238998413086, -11.426661491394043, -11.111084938049316, -10.795507431030273, -10.479930877685547, -10.164353370666504, -9.848776817321777, -9.533199310302734, -9.217622756958008, -8.902045249938965, -8.586468696594238, -8.270891189575195, -7.955314636230469, -7.639737606048584, -7.324160575866699, -7.008584022521973, -6.693006992340088, -6.377429962158203, -6.061852931976318, -5.746275901794434, -5.430699348449707, -5.115122318267822, -4.7995452880859375, -4.483968257904053, -4.168391227722168, -3.852814197540283, -3.5372374057769775, -3.2216603755950928, -2.906083345413208, -2.5905065536499023, -2.2749295234680176, -1.9593524932861328, -1.643775463104248, -1.3281985521316528, -1.0126216411590576, -0.6970446109771729, -0.3814675807952881, -0.06589066982269287, 0.24968624114990234, 0.5652632713317871, 0.8808402419090271, 1.196417212486267, 1.5119941234588623, 1.827571153640747, 2.143148183822632, 2.4587249755859375, 2.7743020057678223, 3.089879035949707, 3.405456066131592, 3.7210330963134766, 4.036610126495361, 4.352187156677246, 4.667763710021973, 4.983340740203857, 5.298917770385742, 5.614494800567627, 5.930071830749512, 6.2456488609313965, 6.561225891113281, 6.876802444458008, 7.192379951477051, 7.507956504821777, 7.823533535003662, 8.139110565185547]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 4.0, 7.0, 15.0, 11.0, 7.0, 14.0, 15.0, 11.0, 24.0, 29.0, 23.0, 20.0, 37.0, 43.0, 36.0, 40.0, 52.0, 53.0, 49.0, 50.0, 47.0, 47.0, 33.0, 29.0, 38.0, 34.0, 34.0, 24.0, 28.0, 20.0, 16.0, 16.0, 14.0, 10.0, 13.0, 9.0, 5.0, 9.0, 10.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.42110013961792, -3.3187904357910156, -3.2164807319641113, -3.114171028137207, -3.0118613243103027, -2.9095516204833984, -2.807241678237915, -2.7049319744110107, -2.6026222705841064, -2.500312566757202, -2.398002862930298, -2.2956931591033936, -2.19338321685791, -2.091073513031006, -1.9887638092041016, -1.8864541053771973, -1.784144401550293, -1.6818346977233887, -1.5795249938964844, -1.4772151708602905, -1.3749054670333862, -1.272595763206482, -1.170285940170288, -1.0679762363433838, -0.9656665325164795, -0.8633568286895752, -0.7610470652580261, -0.658737301826477, -0.5564275979995728, -0.45411789417266846, -0.3518081307411194, -0.2494983673095703, -0.14718866348266602, -0.04487892985343933, 0.057430803775787354, 0.15974053740501404, 0.2620502710342407, 0.364359974861145, 0.4666697382926941, 0.5689795017242432, 0.6712892055511475, 0.7735989093780518, 0.8759086728096008, 0.9782184362411499, 1.0805281400680542, 1.1828378438949585, 1.2851476669311523, 1.3874573707580566, 1.489767074584961, 1.5920767784118652, 1.6943864822387695, 1.7966963052749634, 1.8990060091018677, 2.0013155937194824, 2.103625535964966, 2.20593523979187, 2.3082449436187744, 2.4105546474456787, 2.512864351272583, 2.6151740550994873, 2.7174839973449707, 2.819793701171875, 2.9221034049987793, 3.0244131088256836, 3.126722812652588]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 9.0, 10.0, 22.0, 32.0, 48.0, 74.0, 154.0, 266.0, 496.0, 1116.0, 2665.0, 6809.0, 19191.0, 58872.0, 204845.0, 468182.0, 198716.0, 56892.0, 18758.0, 6588.0, 2639.0, 1058.0, 545.0, 217.0, 117.0, 91.0, 48.0, 31.0, 16.0, 14.0, 10.0, 3.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7407455444335938, -0.7104949951171875, -0.6802444458007812, -0.649993896484375, -0.6197433471679688, -0.5894927978515625, -0.5592422485351562, -0.52899169921875, -0.49874114990234375, -0.4684906005859375, -0.43824005126953125, -0.407989501953125, -0.37773895263671875, -0.3474884033203125, -0.31723785400390625, -0.2869873046875, -0.25673675537109375, -0.2264862060546875, -0.19623565673828125, -0.165985107421875, -0.13573455810546875, -0.1054840087890625, -0.07523345947265625, -0.04498291015625, -0.01473236083984375, 0.0155181884765625, 0.04576873779296875, 0.076019287109375, 0.10626983642578125, 0.1365203857421875, 0.16677093505859375, 0.197021484375, 0.22727203369140625, 0.2575225830078125, 0.28777313232421875, 0.318023681640625, 0.34827423095703125, 0.3785247802734375, 0.40877532958984375, 0.43902587890625, 0.46927642822265625, 0.4995269775390625, 0.5297775268554688, 0.560028076171875, 0.5902786254882812, 0.6205291748046875, 0.6507797241210938, 0.6810302734375, 0.7112808227539062, 0.7415313720703125, 0.7717819213867188, 0.802032470703125, 0.8322830200195312, 0.8625335693359375, 0.8927841186523438, 0.92303466796875, 0.9532852172851562, 0.9835357666015625, 1.0137863159179688, 1.044036865234375, 1.0742874145507812, 1.1045379638671875, 1.1347885131835938, 1.1650390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 7.0, 3.0, 9.0, 16.0, 12.0, 17.0, 28.0, 12.0, 31.0, 41.0, 33.0, 41.0, 35.0, 41.0, 45.0, 54.0, 47.0, 53.0, 56.0, 57.0, 44.0, 42.0, 51.0, 31.0, 28.0, 29.0, 25.0, 21.0, 12.0, 21.0, 17.0, 11.0, 9.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.394287109375, -0.3812408447265625, -0.368194580078125, -0.3551483154296875, -0.34210205078125, -0.3290557861328125, -0.316009521484375, -0.3029632568359375, -0.2899169921875, -0.2768707275390625, -0.263824462890625, -0.2507781982421875, -0.23773193359375, -0.2246856689453125, -0.211639404296875, -0.1985931396484375, -0.185546875, -0.1725006103515625, -0.159454345703125, -0.1464080810546875, -0.13336181640625, -0.1203155517578125, -0.107269287109375, -0.0942230224609375, -0.0811767578125, -0.0681304931640625, -0.055084228515625, -0.0420379638671875, -0.02899169921875, -0.0159454345703125, -0.002899169921875, 0.0101470947265625, 0.023193359375, 0.0362396240234375, 0.049285888671875, 0.0623321533203125, 0.07537841796875, 0.0884246826171875, 0.101470947265625, 0.1145172119140625, 0.1275634765625, 0.1406097412109375, 0.153656005859375, 0.1667022705078125, 0.17974853515625, 0.1927947998046875, 0.205841064453125, 0.2188873291015625, 0.23193359375, 0.2449798583984375, 0.258026123046875, 0.2710723876953125, 0.28411865234375, 0.2971649169921875, 0.310211181640625, 0.3232574462890625, 0.3363037109375, 0.3493499755859375, 0.362396240234375, 0.3754425048828125, 0.38848876953125, 0.4015350341796875, 0.414581298828125, 0.4276275634765625, 0.440673828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 9.0, 1.0, 3.0, 8.0, 12.0, 15.0, 21.0, 31.0, 62.0, 80.0, 210.0, 451.0, 1264.0, 5083.0, 32209.0, 418737.0, 545315.0, 37234.0, 5477.0, 1387.0, 489.0, 215.0, 90.0, 47.0, 37.0, 16.0, 14.0, 18.0, 7.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.599609375, -1.540435791015625, -1.48126220703125, -1.422088623046875, -1.3629150390625, -1.303741455078125, -1.24456787109375, -1.185394287109375, -1.126220703125, -1.067047119140625, -1.00787353515625, -0.948699951171875, -0.8895263671875, -0.830352783203125, -0.77117919921875, -0.712005615234375, -0.65283203125, -0.593658447265625, -0.53448486328125, -0.475311279296875, -0.4161376953125, -0.356964111328125, -0.29779052734375, -0.238616943359375, -0.179443359375, -0.120269775390625, -0.06109619140625, -0.001922607421875, 0.0572509765625, 0.116424560546875, 0.17559814453125, 0.234771728515625, 0.2939453125, 0.353118896484375, 0.41229248046875, 0.471466064453125, 0.5306396484375, 0.589813232421875, 0.64898681640625, 0.708160400390625, 0.767333984375, 0.826507568359375, 0.88568115234375, 0.944854736328125, 1.0040283203125, 1.063201904296875, 1.12237548828125, 1.181549072265625, 1.24072265625, 1.299896240234375, 1.35906982421875, 1.418243408203125, 1.4774169921875, 1.536590576171875, 1.59576416015625, 1.654937744140625, 1.714111328125, 1.773284912109375, 1.83245849609375, 1.891632080078125, 1.9508056640625, 2.009979248046875, 2.06915283203125, 2.128326416015625, 2.1875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 12.0, 9.0, 5.0, 9.0, 17.0, 16.0, 14.0, 24.0, 16.0, 32.0, 28.0, 42.0, 52.0, 50.0, 47.0, 53.0, 58.0, 53.0, 51.0, 47.0, 47.0, 56.0, 25.0, 48.0, 29.0, 27.0, 22.0, 29.0, 23.0, 18.0, 14.0, 6.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3675384521484375, -1.319061279296875, -1.2705841064453125, -1.22210693359375, -1.1736297607421875, -1.125152587890625, -1.0766754150390625, -1.0281982421875, -0.9797210693359375, -0.931243896484375, -0.8827667236328125, -0.83428955078125, -0.7858123779296875, -0.737335205078125, -0.6888580322265625, -0.640380859375, -0.5919036865234375, -0.543426513671875, -0.4949493408203125, -0.44647216796875, -0.3979949951171875, -0.349517822265625, -0.3010406494140625, -0.2525634765625, -0.2040863037109375, -0.155609130859375, -0.1071319580078125, -0.05865478515625, -0.0101776123046875, 0.038299560546875, 0.0867767333984375, 0.13525390625, 0.1837310791015625, 0.232208251953125, 0.2806854248046875, 0.32916259765625, 0.3776397705078125, 0.426116943359375, 0.4745941162109375, 0.5230712890625, 0.5715484619140625, 0.620025634765625, 0.6685028076171875, 0.71697998046875, 0.7654571533203125, 0.813934326171875, 0.8624114990234375, 0.910888671875, 0.9593658447265625, 1.007843017578125, 1.0563201904296875, 1.10479736328125, 1.1532745361328125, 1.201751708984375, 1.2502288818359375, 1.2987060546875, 1.3471832275390625, 1.395660400390625, 1.4441375732421875, 1.49261474609375, 1.5410919189453125, 1.589569091796875, 1.6380462646484375, 1.6865234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 3.0, 8.0, 17.0, 19.0, 40.0, 67.0, 172.0, 445.0, 1498.0, 8096.0, 349877.0, 675328.0, 10378.0, 1803.0, 452.0, 158.0, 80.0, 46.0, 23.0, 18.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8837890625, -0.8498687744140625, -0.815948486328125, -0.7820281982421875, -0.74810791015625, -0.7141876220703125, -0.680267333984375, -0.6463470458984375, -0.6124267578125, -0.5785064697265625, -0.544586181640625, -0.5106658935546875, -0.47674560546875, -0.4428253173828125, -0.408905029296875, -0.3749847412109375, -0.341064453125, -0.3071441650390625, -0.273223876953125, -0.2393035888671875, -0.20538330078125, -0.1714630126953125, -0.137542724609375, -0.1036224365234375, -0.0697021484375, -0.0357818603515625, -0.001861572265625, 0.0320587158203125, 0.06597900390625, 0.0998992919921875, 0.133819580078125, 0.1677398681640625, 0.20166015625, 0.2355804443359375, 0.269500732421875, 0.3034210205078125, 0.33734130859375, 0.3712615966796875, 0.405181884765625, 0.4391021728515625, 0.4730224609375, 0.5069427490234375, 0.540863037109375, 0.5747833251953125, 0.60870361328125, 0.6426239013671875, 0.676544189453125, 0.7104644775390625, 0.744384765625, 0.7783050537109375, 0.812225341796875, 0.8461456298828125, 0.88006591796875, 0.9139862060546875, 0.947906494140625, 0.9818267822265625, 1.0157470703125, 1.0496673583984375, 1.083587646484375, 1.1175079345703125, 1.15142822265625, 1.1853485107421875, 1.219268798828125, 1.2531890869140625, 1.287109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 8.0, 12.0, 18.0, 32.0, 35.0, 69.0, 71.0, 120.0, 154.0, 161.0, 90.0, 70.0, 38.0, 35.0, 18.0, 14.0, 14.0, 6.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.082389831542969e-05, -7.741153240203857e-05, -7.399916648864746e-05, -7.058680057525635e-05, -6.717443466186523e-05, -6.376206874847412e-05, -6.034970283508301e-05, -5.6937336921691895e-05, -5.352497100830078e-05, -5.011260509490967e-05, -4.6700239181518555e-05, -4.328787326812744e-05, -3.987550735473633e-05, -3.6463141441345215e-05, -3.30507755279541e-05, -2.9638409614562988e-05, -2.6226043701171875e-05, -2.2813677787780762e-05, -1.940131187438965e-05, -1.5988945960998535e-05, -1.2576580047607422e-05, -9.164214134216309e-06, -5.751848220825195e-06, -2.339482307434082e-06, 1.0728836059570312e-06, 4.4852495193481445e-06, 7.897615432739258e-06, 1.1309981346130371e-05, 1.4722347259521484e-05, 1.8134713172912598e-05, 2.154707908630371e-05, 2.4959444999694824e-05, 2.8371810913085938e-05, 3.178417682647705e-05, 3.5196542739868164e-05, 3.860890865325928e-05, 4.202127456665039e-05, 4.5433640480041504e-05, 4.884600639343262e-05, 5.225837230682373e-05, 5.5670738220214844e-05, 5.908310413360596e-05, 6.249547004699707e-05, 6.590783596038818e-05, 6.93202018737793e-05, 7.273256778717041e-05, 7.614493370056152e-05, 7.955729961395264e-05, 8.296966552734375e-05, 8.638203144073486e-05, 8.979439735412598e-05, 9.320676326751709e-05, 9.66191291809082e-05, 0.00010003149509429932, 0.00010344386100769043, 0.00010685622692108154, 0.00011026859283447266, 0.00011368095874786377, 0.00011709332466125488, 0.000120505690574646, 0.0001239180564880371, 0.00012733042240142822, 0.00013074278831481934, 0.00013415515422821045, 0.00013756752014160156]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 14.0, 17.0, 36.0, 58.0, 114.0, 232.0, 601.0, 2061.0, 13336.0, 607960.0, 409540.0, 11669.0, 1936.0, 528.0, 215.0, 113.0, 53.0, 21.0, 17.0, 12.0, 4.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7350845336914062, -0.7030792236328125, -0.6710739135742188, -0.639068603515625, -0.6070632934570312, -0.5750579833984375, -0.5430526733398438, -0.51104736328125, -0.47904205322265625, -0.4470367431640625, -0.41503143310546875, -0.383026123046875, -0.35102081298828125, -0.3190155029296875, -0.28701019287109375, -0.2550048828125, -0.22299957275390625, -0.1909942626953125, -0.15898895263671875, -0.126983642578125, -0.09497833251953125, -0.0629730224609375, -0.03096771240234375, 0.00103759765625, 0.03304290771484375, 0.0650482177734375, 0.09705352783203125, 0.129058837890625, 0.16106414794921875, 0.1930694580078125, 0.22507476806640625, 0.257080078125, 0.28908538818359375, 0.3210906982421875, 0.35309600830078125, 0.385101318359375, 0.41710662841796875, 0.4491119384765625, 0.48111724853515625, 0.51312255859375, 0.5451278686523438, 0.5771331787109375, 0.6091384887695312, 0.641143798828125, 0.6731491088867188, 0.7051544189453125, 0.7371597290039062, 0.7691650390625, 0.8011703491210938, 0.8331756591796875, 0.8651809692382812, 0.897186279296875, 0.9291915893554688, 0.9611968994140625, 0.9932022094726562, 1.02520751953125, 1.0572128295898438, 1.0892181396484375, 1.1212234497070312, 1.153228759765625, 1.1852340698242188, 1.2172393798828125, 1.2492446899414062, 1.28125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 8.0, 15.0, 16.0, 33.0, 51.0, 60.0, 93.0, 96.0, 105.0, 118.0, 113.0, 89.0, 65.0, 38.0, 25.0, 19.0, 10.0, 11.0, 6.0, 8.0, 6.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7431640625, -0.725494384765625, -0.70782470703125, -0.690155029296875, -0.6724853515625, -0.654815673828125, -0.63714599609375, -0.619476318359375, -0.601806640625, -0.584136962890625, -0.56646728515625, -0.548797607421875, -0.5311279296875, -0.513458251953125, -0.49578857421875, -0.478118896484375, -0.46044921875, -0.442779541015625, -0.42510986328125, -0.407440185546875, -0.3897705078125, -0.372100830078125, -0.35443115234375, -0.336761474609375, -0.319091796875, -0.301422119140625, -0.28375244140625, -0.266082763671875, -0.2484130859375, -0.230743408203125, -0.21307373046875, -0.195404052734375, -0.177734375, -0.160064697265625, -0.14239501953125, -0.124725341796875, -0.1070556640625, -0.089385986328125, -0.07171630859375, -0.054046630859375, -0.036376953125, -0.018707275390625, -0.00103759765625, 0.016632080078125, 0.0343017578125, 0.051971435546875, 0.06964111328125, 0.087310791015625, 0.10498046875, 0.122650146484375, 0.14031982421875, 0.157989501953125, 0.1756591796875, 0.193328857421875, 0.21099853515625, 0.228668212890625, 0.246337890625, 0.264007568359375, 0.28167724609375, 0.299346923828125, 0.3170166015625, 0.334686279296875, 0.35235595703125, 0.370025634765625, 0.3876953125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 9.0, 6.0, 18.0, 43.0, 112.0, 227.0, 265.0, 159.0, 97.0, 26.0, 15.0, 6.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0981035232543945, -5.669137477874756, -5.240171432495117, -4.81120491027832, -4.382238864898682, -3.953272819519043, -3.524306535720825, -3.0953402519226074, -2.6663742065429688, -2.23740816116333, -1.8084418773651123, -1.379475712776184, -0.9505095481872559, -0.5215435028076172, -0.09257721900939941, 0.33638906478881836, 0.765355110168457, 1.1943212747573853, 1.6232874393463135, 2.0522537231445312, 2.48121976852417, 2.9101858139038086, 3.3391520977020264, 3.768118381500244, 4.197084426879883, 4.6260504722595215, 5.05501651763916, 5.483983039855957, 5.912949085235596, 6.341915130615234, 6.770881652832031, 7.19984769821167, 7.628814697265625, 8.057781219482422, 8.486746788024902, 8.9157133102417, 9.34467887878418, 9.773645401000977, 10.202611923217773, 10.63157844543457, 11.06054401397705, 11.489510536193848, 11.918476104736328, 12.347442626953125, 12.776409149169922, 13.205374717712402, 13.6343412399292, 14.06330680847168, 14.492273330688477, 14.921239852905273, 15.350205421447754, 15.77917194366455, 16.20813751220703, 16.637104034423828, 17.066070556640625, 17.495037078857422, 17.92400360107422, 18.352970123291016, 18.781936645507812, 19.210901260375977, 19.639867782592773, 20.06883430480957, 20.497800827026367, 20.926767349243164, 21.355731964111328]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 13.0, 19.0, 14.0, 14.0, 25.0, 26.0, 46.0, 33.0, 39.0, 43.0, 43.0, 64.0, 69.0, 86.0, 70.0, 63.0, 45.0, 43.0, 42.0, 31.0, 35.0, 34.0, 12.0, 19.0, 16.0, 15.0, 8.0, 7.0, 6.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.819536209106445, -9.577393531799316, -9.335250854492188, -9.093109130859375, -8.850966453552246, -8.608823776245117, -8.366681098937988, -8.12453842163086, -7.882396221160889, -7.64025354385376, -7.398111343383789, -7.15596866607666, -6.913825988769531, -6.6716837882995605, -6.429541110992432, -6.187398910522461, -5.945256233215332, -5.703113555908203, -5.460971355438232, -5.2188286781311035, -4.976686477661133, -4.734543800354004, -4.492401123046875, -4.250258445739746, -4.008116245269775, -3.7659738063812256, -3.523831367492676, -3.281688690185547, -3.039546251296997, -2.7974038124084473, -2.5552611351013184, -2.3131186962127686, -2.0709762573242188, -1.828833818435669, -1.5866912603378296, -1.3445487022399902, -1.1024062633514404, -0.8602638244628906, -0.6181212663650513, -0.3759787082672119, -0.1338362693786621, 0.10830622911453247, 0.35044872760772705, 0.5925912261009216, 0.8347337245941162, 1.076876163482666, 1.3190187215805054, 1.5611612796783447, 1.8033037185668945, 2.0454461574554443, 2.287588596343994, 2.529731273651123, 2.771873712539673, 3.0140161514282227, 3.2561588287353516, 3.4983012676239014, 3.740443706512451, 3.982586145401001, 4.224728584289551, 4.46687126159668, 4.709013938903809, 4.951156139373779, 5.193298816680908, 5.435441017150879, 5.677583694458008]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 11.0, 4.0, 15.0, 18.0, 26.0, 33.0, 44.0, 78.0, 130.0, 154.0, 269.0, 410.0, 705.0, 1235.0, 2233.0, 4747.0, 11479.0, 36479.0, 289872.0, 3278335.0, 491786.0, 50153.0, 14529.0, 5703.0, 2620.0, 1346.0, 707.0, 429.0, 255.0, 172.0, 99.0, 57.0, 47.0, 30.0, 17.0, 12.0, 11.0, 9.0, 4.0, 6.0, 1.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.77294921875, -0.7518234252929688, -0.7306976318359375, -0.7095718383789062, -0.688446044921875, -0.6673202514648438, -0.6461944580078125, -0.6250686645507812, -0.60394287109375, -0.5828170776367188, -0.5616912841796875, -0.5405654907226562, -0.519439697265625, -0.49831390380859375, -0.4771881103515625, -0.45606231689453125, -0.4349365234375, -0.41381072998046875, -0.3926849365234375, -0.37155914306640625, -0.350433349609375, -0.32930755615234375, -0.3081817626953125, -0.28705596923828125, -0.26593017578125, -0.24480438232421875, -0.2236785888671875, -0.20255279541015625, -0.181427001953125, -0.16030120849609375, -0.1391754150390625, -0.11804962158203125, -0.096923828125, -0.07579803466796875, -0.0546722412109375, -0.03354644775390625, -0.012420654296875, 0.00870513916015625, 0.0298309326171875, 0.05095672607421875, 0.07208251953125, 0.09320831298828125, 0.1143341064453125, 0.13545989990234375, 0.156585693359375, 0.17771148681640625, 0.1988372802734375, 0.21996307373046875, 0.2410888671875, 0.26221466064453125, 0.2833404541015625, 0.30446624755859375, 0.325592041015625, 0.34671783447265625, 0.3678436279296875, 0.38896942138671875, 0.41009521484375, 0.43122100830078125, 0.4523468017578125, 0.47347259521484375, 0.494598388671875, 0.5157241821289062, 0.5368499755859375, 0.5579757690429688, 0.5791015625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 19.0, 19.0, 36.0, 55.0, 50.0, 58.0, 72.0, 75.0, 72.0, 82.0, 84.0, 77.0, 65.0, 72.0, 37.0, 38.0, 26.0, 22.0, 9.0, 9.0, 10.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.7684860229492188, -0.7493743896484375, -0.7302627563476562, -0.711151123046875, -0.6920394897460938, -0.6729278564453125, -0.6538162231445312, -0.63470458984375, -0.6155929565429688, -0.5964813232421875, -0.5773696899414062, -0.558258056640625, -0.5391464233398438, -0.5200347900390625, -0.5009231567382812, -0.4818115234375, -0.46269989013671875, -0.4435882568359375, -0.42447662353515625, -0.405364990234375, -0.38625335693359375, -0.3671417236328125, -0.34803009033203125, -0.32891845703125, -0.30980682373046875, -0.2906951904296875, -0.27158355712890625, -0.252471923828125, -0.23336029052734375, -0.2142486572265625, -0.19513702392578125, -0.176025390625, -0.15691375732421875, -0.1378021240234375, -0.11869049072265625, -0.099578857421875, -0.08046722412109375, -0.0613555908203125, -0.04224395751953125, -0.02313232421875, -0.00402069091796875, 0.0150909423828125, 0.03420257568359375, 0.053314208984375, 0.07242584228515625, 0.0915374755859375, 0.11064910888671875, 0.1297607421875, 0.14887237548828125, 0.1679840087890625, 0.18709564208984375, 0.206207275390625, 0.22531890869140625, 0.2444305419921875, 0.26354217529296875, 0.28265380859375, 0.30176544189453125, 0.3208770751953125, 0.33998870849609375, 0.359100341796875, 0.37821197509765625, 0.3973236083984375, 0.41643524169921875, 0.435546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 7.0, 12.0, 12.0, 20.0, 19.0, 24.0, 45.0, 49.0, 71.0, 126.0, 259.0, 502.0, 1046.0, 2944.0, 10228.0, 71769.0, 3724284.0, 351227.0, 23549.0, 5153.0, 1601.0, 635.0, 281.0, 142.0, 74.0, 49.0, 31.0, 30.0, 22.0, 17.0, 12.0, 10.0, 9.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5478515625, -1.5019683837890625, -1.456085205078125, -1.4102020263671875, -1.36431884765625, -1.3184356689453125, -1.272552490234375, -1.2266693115234375, -1.1807861328125, -1.1349029541015625, -1.089019775390625, -1.0431365966796875, -0.99725341796875, -0.9513702392578125, -0.905487060546875, -0.8596038818359375, -0.813720703125, -0.7678375244140625, -0.721954345703125, -0.6760711669921875, -0.63018798828125, -0.5843048095703125, -0.538421630859375, -0.4925384521484375, -0.4466552734375, -0.4007720947265625, -0.354888916015625, -0.3090057373046875, -0.26312255859375, -0.2172393798828125, -0.171356201171875, -0.1254730224609375, -0.07958984375, -0.0337066650390625, 0.012176513671875, 0.0580596923828125, 0.10394287109375, 0.1498260498046875, 0.195709228515625, 0.2415924072265625, 0.2874755859375, 0.3333587646484375, 0.379241943359375, 0.4251251220703125, 0.47100830078125, 0.5168914794921875, 0.562774658203125, 0.6086578369140625, 0.654541015625, 0.7004241943359375, 0.746307373046875, 0.7921905517578125, 0.83807373046875, 0.8839569091796875, 0.929840087890625, 0.9757232666015625, 1.0216064453125, 1.0674896240234375, 1.113372802734375, 1.1592559814453125, 1.20513916015625, 1.2510223388671875, 1.296905517578125, 1.3427886962890625, 1.388671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 3.0, 4.0, 4.0, 7.0, 4.0, 11.0, 23.0, 17.0, 37.0, 44.0, 60.0, 143.0, 221.0, 503.0, 994.0, 937.0, 447.0, 242.0, 97.0, 78.0, 41.0, 37.0, 22.0, 17.0, 22.0, 10.0, 10.0, 5.0, 5.0, 3.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0771484375, -1.0472259521484375, -1.017303466796875, -0.9873809814453125, -0.95745849609375, -0.9275360107421875, -0.897613525390625, -0.8676910400390625, -0.8377685546875, -0.8078460693359375, -0.777923583984375, -0.7480010986328125, -0.71807861328125, -0.6881561279296875, -0.658233642578125, -0.6283111572265625, -0.598388671875, -0.5684661865234375, -0.538543701171875, -0.5086212158203125, -0.47869873046875, -0.4487762451171875, -0.418853759765625, -0.3889312744140625, -0.3590087890625, -0.3290863037109375, -0.299163818359375, -0.2692413330078125, -0.23931884765625, -0.2093963623046875, -0.179473876953125, -0.1495513916015625, -0.11962890625, -0.0897064208984375, -0.059783935546875, -0.0298614501953125, 6.103515625e-05, 0.0299835205078125, 0.059906005859375, 0.0898284912109375, 0.1197509765625, 0.1496734619140625, 0.179595947265625, 0.2095184326171875, 0.23944091796875, 0.2693634033203125, 0.299285888671875, 0.3292083740234375, 0.359130859375, 0.3890533447265625, 0.418975830078125, 0.4488983154296875, 0.47882080078125, 0.5087432861328125, 0.538665771484375, 0.5685882568359375, 0.5985107421875, 0.6284332275390625, 0.658355712890625, 0.6882781982421875, 0.71820068359375, 0.7481231689453125, 0.778045654296875, 0.8079681396484375, 0.837890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 8.0, 7.0, 3.0, 5.0, 20.0, 29.0, 48.0, 72.0, 94.0, 136.0, 171.0, 141.0, 100.0, 55.0, 40.0, 20.0, 15.0, 14.0, 12.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.387801170349121, -8.15819263458252, -7.928584575653076, -7.698976039886475, -7.469367980957031, -7.23975944519043, -7.010150909423828, -6.780542373657227, -6.550934314727783, -6.321325778961182, -6.091717720031738, -5.862109184265137, -5.632500648498535, -5.402892589569092, -5.17328405380249, -4.943675994873047, -4.714067459106445, -4.484458923339844, -4.2548508644104, -4.025242328643799, -3.7956340312957764, -3.566025733947754, -3.3364171981811523, -3.10680890083313, -2.8772006034851074, -2.647592306137085, -2.4179840087890625, -2.188375473022461, -1.9587671756744385, -1.729158878326416, -1.499550461769104, -1.269942045211792, -1.0403342247009277, -0.8107258677482605, -0.5811175107955933, -0.351509153842926, -0.12190079689025879, 0.10770750045776367, 0.3373159170150757, 0.5669243335723877, 0.7965326309204102, 1.0261409282684326, 1.2557493448257446, 1.4853577613830566, 1.714966058731079, 1.9445743560791016, 2.174182891845703, 2.4037911891937256, 2.633399486541748, 2.8630077838897705, 3.092616081237793, 3.3222246170043945, 3.551832914352417, 3.7814412117004395, 4.011049747467041, 4.240657806396484, 4.470266342163086, 4.6998748779296875, 4.929482936859131, 5.159091472625732, 5.388699531555176, 5.618308067321777, 5.847916603088379, 6.0775251388549805, 6.307133197784424]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 2.0, 5.0, 4.0, 7.0, 8.0, 12.0, 18.0, 19.0, 21.0, 29.0, 29.0, 43.0, 45.0, 46.0, 66.0, 49.0, 70.0, 50.0, 36.0, 55.0, 55.0, 47.0, 45.0, 38.0, 29.0, 40.0, 37.0, 25.0, 20.0, 6.0, 9.0, 14.0, 9.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.767602443695068, -4.622891426086426, -4.478179931640625, -4.333468437194824, -4.188757419586182, -4.044046401977539, -3.8993349075317383, -3.7546236515045166, -3.609912395477295, -3.4652011394500732, -3.3204898834228516, -3.17577862739563, -3.031067371368408, -2.8863561153411865, -2.741644859313965, -2.596933603286743, -2.4522223472595215, -2.3075110912323, -2.162799835205078, -2.0180885791778564, -1.8733773231506348, -1.728666067123413, -1.5839548110961914, -1.4392435550689697, -1.294532299041748, -1.1498210430145264, -1.0051097869873047, -0.860398530960083, -0.7156872749328613, -0.5709760189056396, -0.42626476287841797, -0.2815535068511963, -0.1368427276611328, 0.007868528366088867, 0.15257978439331055, 0.2972910404205322, 0.4420022964477539, 0.5867135524749756, 0.7314248085021973, 0.876136064529419, 1.0208473205566406, 1.1655585765838623, 1.310269832611084, 1.4549810886383057, 1.5996923446655273, 1.744403600692749, 1.8891148567199707, 2.0338261127471924, 2.178537368774414, 2.3232486248016357, 2.4679598808288574, 2.612671136856079, 2.757382392883301, 2.9020936489105225, 3.046804904937744, 3.191516160964966, 3.3362274169921875, 3.480938673019409, 3.625649929046631, 3.7703611850738525, 3.915072441101074, 4.059783935546875, 4.204494953155518, 4.34920597076416, 4.493917465209961]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 6.0, 8.0, 17.0, 24.0, 43.0, 48.0, 97.0, 130.0, 236.0, 346.0, 603.0, 1068.0, 1985.0, 3701.0, 6956.0, 13960.0, 27959.0, 57732.0, 118948.0, 223376.0, 265488.0, 164389.0, 81892.0, 39552.0, 19119.0, 9691.0, 5086.0, 2630.0, 1438.0, 810.0, 461.0, 255.0, 170.0, 98.0, 73.0, 56.0, 30.0, 25.0, 19.0, 12.0, 5.0, 5.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.486297607421875, -0.46966552734375, -0.453033447265625, -0.4364013671875, -0.419769287109375, -0.40313720703125, -0.386505126953125, -0.369873046875, -0.353240966796875, -0.33660888671875, -0.319976806640625, -0.3033447265625, -0.286712646484375, -0.27008056640625, -0.253448486328125, -0.23681640625, -0.220184326171875, -0.20355224609375, -0.186920166015625, -0.1702880859375, -0.153656005859375, -0.13702392578125, -0.120391845703125, -0.103759765625, -0.087127685546875, -0.07049560546875, -0.053863525390625, -0.0372314453125, -0.020599365234375, -0.00396728515625, 0.012664794921875, 0.029296875, 0.045928955078125, 0.06256103515625, 0.079193115234375, 0.0958251953125, 0.112457275390625, 0.12908935546875, 0.145721435546875, 0.162353515625, 0.178985595703125, 0.19561767578125, 0.212249755859375, 0.2288818359375, 0.245513916015625, 0.26214599609375, 0.278778076171875, 0.29541015625, 0.312042236328125, 0.32867431640625, 0.345306396484375, 0.3619384765625, 0.378570556640625, 0.39520263671875, 0.411834716796875, 0.428466796875, 0.445098876953125, 0.46173095703125, 0.478363037109375, 0.4949951171875, 0.511627197265625, 0.52825927734375, 0.544891357421875, 0.5615234375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 11.0, 6.0, 16.0, 25.0, 24.0, 31.0, 38.0, 31.0, 41.0, 45.0, 65.0, 43.0, 52.0, 66.0, 51.0, 72.0, 61.0, 53.0, 40.0, 46.0, 39.0, 23.0, 26.0, 22.0, 19.0, 14.0, 6.0, 8.0, 5.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4150390625, -0.4020271301269531, -0.38901519775390625, -0.3760032653808594, -0.3629913330078125, -0.3499794006347656, -0.33696746826171875, -0.3239555358886719, -0.310943603515625, -0.2979316711425781, -0.28491973876953125, -0.2719078063964844, -0.2588958740234375, -0.24588394165039062, -0.23287200927734375, -0.21986007690429688, -0.20684814453125, -0.19383621215820312, -0.18082427978515625, -0.16781234741210938, -0.1548004150390625, -0.14178848266601562, -0.12877655029296875, -0.11576461791992188, -0.102752685546875, -0.08974075317382812, -0.07672882080078125, -0.06371688842773438, -0.0507049560546875, -0.037693023681640625, -0.02468109130859375, -0.011669158935546875, 0.0013427734375, 0.014354705810546875, 0.02736663818359375, 0.040378570556640625, 0.0533905029296875, 0.06640243530273438, 0.07941436767578125, 0.09242630004882812, 0.105438232421875, 0.11845016479492188, 0.13146209716796875, 0.14447402954101562, 0.1574859619140625, 0.17049789428710938, 0.18350982666015625, 0.19652175903320312, 0.20953369140625, 0.22254562377929688, 0.23555755615234375, 0.24856948852539062, 0.2615814208984375, 0.2745933532714844, 0.28760528564453125, 0.3006172180175781, 0.313629150390625, 0.3266410827636719, 0.33965301513671875, 0.3526649475097656, 0.3656768798828125, 0.3786888122558594, 0.39170074462890625, 0.4047126770019531, 0.417724609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 12.0, 16.0, 29.0, 41.0, 41.0, 107.0, 175.0, 214.0, 384.0, 577.0, 1092.0, 2079.0, 4677.0, 13554.0, 53247.0, 287779.0, 564821.0, 87189.0, 20186.0, 6488.0, 2594.0, 1291.0, 711.0, 400.0, 284.0, 166.0, 119.0, 102.0, 58.0, 32.0, 24.0, 17.0, 11.0, 14.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.9951629638671875, -0.961029052734375, -0.9268951416015625, -0.89276123046875, -0.8586273193359375, -0.824493408203125, -0.7903594970703125, -0.7562255859375, -0.7220916748046875, -0.687957763671875, -0.6538238525390625, -0.61968994140625, -0.5855560302734375, -0.551422119140625, -0.5172882080078125, -0.483154296875, -0.4490203857421875, -0.414886474609375, -0.3807525634765625, -0.34661865234375, -0.3124847412109375, -0.278350830078125, -0.2442169189453125, -0.2100830078125, -0.1759490966796875, -0.141815185546875, -0.1076812744140625, -0.07354736328125, -0.0394134521484375, -0.005279541015625, 0.0288543701171875, 0.06298828125, 0.0971221923828125, 0.131256103515625, 0.1653900146484375, 0.19952392578125, 0.2336578369140625, 0.267791748046875, 0.3019256591796875, 0.3360595703125, 0.3701934814453125, 0.404327392578125, 0.4384613037109375, 0.47259521484375, 0.5067291259765625, 0.540863037109375, 0.5749969482421875, 0.609130859375, 0.6432647705078125, 0.677398681640625, 0.7115325927734375, 0.74566650390625, 0.7798004150390625, 0.813934326171875, 0.8480682373046875, 0.8822021484375, 0.9163360595703125, 0.950469970703125, 0.9846038818359375, 1.01873779296875, 1.0528717041015625, 1.087005615234375, 1.1211395263671875, 1.1552734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 7.0, 5.0, 8.0, 8.0, 4.0, 3.0, 6.0, 3.0, 12.0, 7.0, 11.0, 13.0, 8.0, 21.0, 21.0, 19.0, 28.0, 19.0, 36.0, 28.0, 28.0, 32.0, 37.0, 43.0, 44.0, 41.0, 41.0, 42.0, 37.0, 33.0, 33.0, 31.0, 33.0, 39.0, 32.0, 31.0, 19.0, 14.0, 20.0, 19.0, 8.0, 18.0, 7.0, 6.0, 11.0, 4.0, 8.0, 8.0, 4.0, 6.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0], "bins": [-0.9970703125, -0.9640045166015625, -0.930938720703125, -0.8978729248046875, -0.86480712890625, -0.8317413330078125, -0.798675537109375, -0.7656097412109375, -0.7325439453125, -0.6994781494140625, -0.666412353515625, -0.6333465576171875, -0.60028076171875, -0.5672149658203125, -0.534149169921875, -0.5010833740234375, -0.468017578125, -0.4349517822265625, -0.401885986328125, -0.3688201904296875, -0.33575439453125, -0.3026885986328125, -0.269622802734375, -0.2365570068359375, -0.2034912109375, -0.1704254150390625, -0.137359619140625, -0.1042938232421875, -0.07122802734375, -0.0381622314453125, -0.005096435546875, 0.0279693603515625, 0.06103515625, 0.0941009521484375, 0.127166748046875, 0.1602325439453125, 0.19329833984375, 0.2263641357421875, 0.259429931640625, 0.2924957275390625, 0.3255615234375, 0.3586273193359375, 0.391693115234375, 0.4247589111328125, 0.45782470703125, 0.4908905029296875, 0.523956298828125, 0.5570220947265625, 0.590087890625, 0.6231536865234375, 0.656219482421875, 0.6892852783203125, 0.72235107421875, 0.7554168701171875, 0.788482666015625, 0.8215484619140625, 0.8546142578125, 0.8876800537109375, 0.920745849609375, 0.9538116455078125, 0.98687744140625, 1.0199432373046875, 1.053009033203125, 1.0860748291015625, 1.119140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 6.0, 9.0, 5.0, 15.0, 12.0, 20.0, 26.0, 35.0, 44.0, 69.0, 76.0, 113.0, 171.0, 286.0, 398.0, 656.0, 1203.0, 2344.0, 5142.0, 12914.0, 43020.0, 200103.0, 611143.0, 123892.0, 28902.0, 9510.0, 3962.0, 1844.0, 964.0, 550.0, 366.0, 190.0, 142.0, 105.0, 78.0, 52.0, 47.0, 26.0, 29.0, 13.0, 13.0, 9.0, 11.0, 3.0, 8.0, 0.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.268798828125, -0.26049041748046875, -0.2521820068359375, -0.24387359619140625, -0.235565185546875, -0.22725677490234375, -0.2189483642578125, -0.21063995361328125, -0.20233154296875, -0.19402313232421875, -0.1857147216796875, -0.17740631103515625, -0.169097900390625, -0.16078948974609375, -0.1524810791015625, -0.14417266845703125, -0.1358642578125, -0.12755584716796875, -0.1192474365234375, -0.11093902587890625, -0.102630615234375, -0.09432220458984375, -0.0860137939453125, -0.07770538330078125, -0.06939697265625, -0.06108856201171875, -0.0527801513671875, -0.04447174072265625, -0.036163330078125, -0.02785491943359375, -0.0195465087890625, -0.01123809814453125, -0.0029296875, 0.00537872314453125, 0.0136871337890625, 0.02199554443359375, 0.030303955078125, 0.03861236572265625, 0.0469207763671875, 0.05522918701171875, 0.06353759765625, 0.07184600830078125, 0.0801544189453125, 0.08846282958984375, 0.096771240234375, 0.10507965087890625, 0.1133880615234375, 0.12169647216796875, 0.1300048828125, 0.13831329345703125, 0.1466217041015625, 0.15493011474609375, 0.163238525390625, 0.17154693603515625, 0.1798553466796875, 0.18816375732421875, 0.19647216796875, 0.20478057861328125, 0.2130889892578125, 0.22139739990234375, 0.229705810546875, 0.23801422119140625, 0.2463226318359375, 0.25463104248046875, 0.262939453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 11.0, 20.0, 28.0, 36.0, 60.0, 81.0, 126.0, 128.0, 158.0, 89.0, 72.0, 53.0, 37.0, 24.0, 27.0, 13.0, 4.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010001659393310547, -9.644590318202972e-05, -9.287521243095398e-05, -8.930452167987823e-05, -8.573383092880249e-05, -8.216314017772675e-05, -7.8592449426651e-05, -7.502175867557526e-05, -7.145106792449951e-05, -6.788037717342377e-05, -6.430968642234802e-05, -6.073899567127228e-05, -5.716830492019653e-05, -5.359761416912079e-05, -5.0026923418045044e-05, -4.64562326669693e-05, -4.2885541915893555e-05, -3.931485116481781e-05, -3.5744160413742065e-05, -3.217346966266632e-05, -2.8602778911590576e-05, -2.503208816051483e-05, -2.1461397409439087e-05, -1.7890706658363342e-05, -1.4320015907287598e-05, -1.0749325156211853e-05, -7.178634405136108e-06, -3.6079436540603638e-06, -3.725290298461914e-08, 3.5334378480911255e-06, 7.10412859916687e-06, 1.0674819350242615e-05, 1.424551010131836e-05, 1.7816200852394104e-05, 2.138689160346985e-05, 2.4957582354545593e-05, 2.8528273105621338e-05, 3.209896385669708e-05, 3.566965460777283e-05, 3.924034535884857e-05, 4.2811036109924316e-05, 4.638172686100006e-05, 4.9952417612075806e-05, 5.352310836315155e-05, 5.7093799114227295e-05, 6.066448986530304e-05, 6.423518061637878e-05, 6.780587136745453e-05, 7.137656211853027e-05, 7.494725286960602e-05, 7.851794362068176e-05, 8.208863437175751e-05, 8.565932512283325e-05, 8.9230015873909e-05, 9.280070662498474e-05, 9.637139737606049e-05, 9.994208812713623e-05, 0.00010351277887821198, 0.00010708346962928772, 0.00011065416038036346, 0.00011422485113143921, 0.00011779554188251495, 0.0001213662326335907, 0.00012493692338466644, 0.0001285076141357422]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 9.0, 5.0, 6.0, 11.0, 11.0, 13.0, 23.0, 30.0, 51.0, 65.0, 108.0, 176.0, 304.0, 545.0, 1171.0, 2610.0, 7182.0, 24952.0, 144600.0, 708690.0, 124236.0, 22342.0, 6551.0, 2458.0, 1052.0, 550.0, 289.0, 180.0, 113.0, 61.0, 46.0, 26.0, 20.0, 18.0, 16.0, 12.0, 6.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.337890625, -0.326019287109375, -0.31414794921875, -0.302276611328125, -0.2904052734375, -0.278533935546875, -0.26666259765625, -0.254791259765625, -0.242919921875, -0.231048583984375, -0.21917724609375, -0.207305908203125, -0.1954345703125, -0.183563232421875, -0.17169189453125, -0.159820556640625, -0.14794921875, -0.136077880859375, -0.12420654296875, -0.112335205078125, -0.1004638671875, -0.088592529296875, -0.07672119140625, -0.064849853515625, -0.052978515625, -0.041107177734375, -0.02923583984375, -0.017364501953125, -0.0054931640625, 0.006378173828125, 0.01824951171875, 0.030120849609375, 0.0419921875, 0.053863525390625, 0.06573486328125, 0.077606201171875, 0.0894775390625, 0.101348876953125, 0.11322021484375, 0.125091552734375, 0.136962890625, 0.148834228515625, 0.16070556640625, 0.172576904296875, 0.1844482421875, 0.196319580078125, 0.20819091796875, 0.220062255859375, 0.23193359375, 0.243804931640625, 0.25567626953125, 0.267547607421875, 0.2794189453125, 0.291290283203125, 0.30316162109375, 0.315032958984375, 0.326904296875, 0.338775634765625, 0.35064697265625, 0.362518310546875, 0.3743896484375, 0.386260986328125, 0.39813232421875, 0.410003662109375, 0.421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 6.0, 17.0, 8.0, 8.0, 13.0, 24.0, 19.0, 25.0, 39.0, 46.0, 43.0, 68.0, 68.0, 64.0, 67.0, 71.0, 62.0, 52.0, 61.0, 38.0, 39.0, 36.0, 28.0, 20.0, 6.0, 8.0, 7.0, 11.0, 3.0, 8.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.295654296875, -0.2868232727050781, -0.27799224853515625, -0.2691612243652344, -0.2603302001953125, -0.2514991760253906, -0.24266815185546875, -0.23383712768554688, -0.225006103515625, -0.21617507934570312, -0.20734405517578125, -0.19851303100585938, -0.1896820068359375, -0.18085098266601562, -0.17201995849609375, -0.16318893432617188, -0.15435791015625, -0.14552688598632812, -0.13669586181640625, -0.12786483764648438, -0.1190338134765625, -0.11020278930664062, -0.10137176513671875, -0.09254074096679688, -0.083709716796875, -0.07487869262695312, -0.06604766845703125, -0.057216644287109375, -0.0483856201171875, -0.039554595947265625, -0.03072357177734375, -0.021892547607421875, -0.0130615234375, -0.004230499267578125, 0.00460052490234375, 0.013431549072265625, 0.0222625732421875, 0.031093597412109375, 0.03992462158203125, 0.048755645751953125, 0.057586669921875, 0.06641769409179688, 0.07524871826171875, 0.08407974243164062, 0.0929107666015625, 0.10174179077148438, 0.11057281494140625, 0.11940383911132812, 0.12823486328125, 0.13706588745117188, 0.14589691162109375, 0.15472793579101562, 0.1635589599609375, 0.17238998413085938, 0.18122100830078125, 0.19005203247070312, 0.198883056640625, 0.20771408081054688, 0.21654510498046875, 0.22537612915039062, 0.2342071533203125, 0.24303817749023438, 0.25186920166015625, 0.2607002258300781, 0.26953125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 11.0, 17.0, 27.0, 72.0, 157.0, 226.0, 221.0, 125.0, 55.0, 35.0, 15.0, 9.0, 12.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.688709259033203, -8.36483383178711, -8.0409574508667, -7.7170820236206055, -7.3932061195373535, -7.069330215454102, -6.745454788208008, -6.421578884124756, -6.097702980041504, -5.773827075958252, -5.449951171875, -5.126075744628906, -4.802199840545654, -4.478323936462402, -4.154448509216309, -3.8305726051330566, -3.5066967010498047, -3.1828207969665527, -2.85894513130188, -2.535069465637207, -2.211193561553955, -1.8873177766799927, -1.5634419918060303, -1.2395663261413574, -0.9156904220581055, -0.5918146371841431, -0.26793885231018066, 0.05593693256378174, 0.37981271743774414, 0.7036885023117065, 1.027564287185669, 1.3514399528503418, 1.6753149032592773, 1.9991906881332397, 2.323066473007202, 2.646942138671875, 2.970818042755127, 3.294693946838379, 3.6185696125030518, 3.9424452781677246, 4.266321182250977, 4.5901970863342285, 4.9140729904174805, 5.237948417663574, 5.561824321746826, 5.885700225830078, 6.209575653076172, 6.533451557159424, 6.857327461242676, 7.181203365325928, 7.50507926940918, 7.828954696655273, 8.152830123901367, 8.476706504821777, 8.800581932067871, 9.124458312988281, 9.448333740234375, 9.772209167480469, 10.096085548400879, 10.419960975646973, 10.743837356567383, 11.067712783813477, 11.39158821105957, 11.715463638305664, 12.039340019226074]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 7.0, 7.0, 8.0, 8.0, 13.0, 12.0, 11.0, 15.0, 18.0, 31.0, 31.0, 33.0, 23.0, 36.0, 27.0, 40.0, 50.0, 70.0, 74.0, 75.0, 51.0, 52.0, 29.0, 39.0, 32.0, 41.0, 28.0, 23.0, 18.0, 21.0, 12.0, 11.0, 9.0, 8.0, 9.0, 8.0, 3.0, 8.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.121819496154785, -4.968884468078613, -4.815949440002441, -4.663013935089111, -4.5100789070129395, -4.357143878936768, -4.204208850860596, -4.051273345947266, -3.8983383178710938, -3.745403289794922, -3.592468023300171, -3.439532995223999, -3.286597728729248, -3.133662700653076, -2.9807276725769043, -2.8277924060821533, -2.6748573780059814, -2.5219223499298096, -2.3689870834350586, -2.2160520553588867, -2.0631167888641357, -1.9101817607879639, -1.7572466135025024, -1.604311466217041, -1.4513763189315796, -1.2984411716461182, -1.1455060243606567, -0.9925709366798401, -0.8396357893943787, -0.6867006421089172, -0.5337655544281006, -0.38083040714263916, -0.22789525985717773, -0.0749601274728775, 0.07797500491142273, 0.23091012239456177, 0.3838452696800232, 0.5367804169654846, 0.6897155046463013, 0.8426506519317627, 0.9955857992172241, 1.1485209465026855, 1.301456093788147, 1.4543912410736084, 1.6073262691497803, 1.7602615356445312, 1.9131965637207031, 2.066131591796875, 2.219066858291626, 2.372001886367798, 2.524937152862549, 2.6778721809387207, 2.8308074474334717, 2.9837424755096436, 3.1366777420043945, 3.2896127700805664, 3.4425477981567383, 3.59548282623291, 3.748418092727661, 3.901353120803833, 4.054288387298584, 4.207223415374756, 4.360158443450928, 4.513093948364258, 4.66602897644043]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 1.0, 8.0, 10.0, 14.0, 30.0, 44.0, 42.0, 82.0, 117.0, 278.0, 378.0, 608.0, 1068.0, 2094.0, 3975.0, 9208.0, 27472.0, 157642.0, 2654060.0, 1218941.0, 84135.0, 19486.0, 7378.0, 3237.0, 1726.0, 940.0, 524.0, 291.0, 194.0, 117.0, 73.0, 39.0, 32.0, 14.0, 11.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5016555786132812, -0.4842681884765625, -0.46688079833984375, -0.449493408203125, -0.43210601806640625, -0.4147186279296875, -0.39733123779296875, -0.37994384765625, -0.36255645751953125, -0.3451690673828125, -0.32778167724609375, -0.310394287109375, -0.29300689697265625, -0.2756195068359375, -0.25823211669921875, -0.2408447265625, -0.22345733642578125, -0.2060699462890625, -0.18868255615234375, -0.171295166015625, -0.15390777587890625, -0.1365203857421875, -0.11913299560546875, -0.10174560546875, -0.08435821533203125, -0.0669708251953125, -0.04958343505859375, -0.032196044921875, -0.01480865478515625, 0.0025787353515625, 0.01996612548828125, 0.037353515625, 0.05474090576171875, 0.0721282958984375, 0.08951568603515625, 0.106903076171875, 0.12429046630859375, 0.1416778564453125, 0.15906524658203125, 0.17645263671875, 0.19384002685546875, 0.2112274169921875, 0.22861480712890625, 0.246002197265625, 0.26338958740234375, 0.2807769775390625, 0.29816436767578125, 0.3155517578125, 0.33293914794921875, 0.3503265380859375, 0.36771392822265625, 0.385101318359375, 0.40248870849609375, 0.4198760986328125, 0.43726348876953125, 0.45465087890625, 0.47203826904296875, 0.4894256591796875, 0.5068130493164062, 0.524200439453125, 0.5415878295898438, 0.5589752197265625, 0.5763626098632812, 0.59375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 16.0, 19.0, 23.0, 27.0, 31.0, 36.0, 45.0, 55.0, 64.0, 60.0, 42.0, 57.0, 59.0, 80.0, 66.0, 52.0, 44.0, 46.0, 38.0, 27.0, 25.0, 22.0, 11.0, 13.0, 6.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3923454284667969, -0.37917327880859375, -0.3660011291503906, -0.3528289794921875, -0.3396568298339844, -0.32648468017578125, -0.3133125305175781, -0.300140380859375, -0.2869682312011719, -0.27379608154296875, -0.2606239318847656, -0.2474517822265625, -0.23427963256835938, -0.22110748291015625, -0.20793533325195312, -0.19476318359375, -0.18159103393554688, -0.16841888427734375, -0.15524673461914062, -0.1420745849609375, -0.12890243530273438, -0.11573028564453125, -0.10255813598632812, -0.089385986328125, -0.07621383666992188, -0.06304168701171875, -0.049869537353515625, -0.0366973876953125, -0.023525238037109375, -0.01035308837890625, 0.002819061279296875, 0.0159912109375, 0.029163360595703125, 0.04233551025390625, 0.055507659912109375, 0.0686798095703125, 0.08185195922851562, 0.09502410888671875, 0.10819625854492188, 0.121368408203125, 0.13454055786132812, 0.14771270751953125, 0.16088485717773438, 0.1740570068359375, 0.18722915649414062, 0.20040130615234375, 0.21357345581054688, 0.22674560546875, 0.23991775512695312, 0.25308990478515625, 0.2662620544433594, 0.2794342041015625, 0.2926063537597656, 0.30577850341796875, 0.3189506530761719, 0.332122802734375, 0.3452949523925781, 0.35846710205078125, 0.3716392517089844, 0.3848114013671875, 0.3979835510253906, 0.41115570068359375, 0.4243278503417969, 0.4375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 9.0, 8.0, 15.0, 18.0, 31.0, 34.0, 53.0, 72.0, 128.0, 160.0, 303.0, 472.0, 880.0, 1570.0, 3246.0, 8236.0, 30177.0, 204948.0, 3611317.0, 279273.0, 36311.0, 10164.0, 3600.0, 1547.0, 749.0, 403.0, 219.0, 129.0, 64.0, 58.0, 21.0, 18.0, 16.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78466796875, -0.7589874267578125, -0.733306884765625, -0.7076263427734375, -0.68194580078125, -0.6562652587890625, -0.630584716796875, -0.6049041748046875, -0.5792236328125, -0.5535430908203125, -0.527862548828125, -0.5021820068359375, -0.47650146484375, -0.4508209228515625, -0.425140380859375, -0.3994598388671875, -0.373779296875, -0.3480987548828125, -0.322418212890625, -0.2967376708984375, -0.27105712890625, -0.2453765869140625, -0.219696044921875, -0.1940155029296875, -0.1683349609375, -0.1426544189453125, -0.116973876953125, -0.0912933349609375, -0.06561279296875, -0.0399322509765625, -0.014251708984375, 0.0114288330078125, 0.037109375, 0.0627899169921875, 0.088470458984375, 0.1141510009765625, 0.13983154296875, 0.1655120849609375, 0.191192626953125, 0.2168731689453125, 0.2425537109375, 0.2682342529296875, 0.293914794921875, 0.3195953369140625, 0.34527587890625, 0.3709564208984375, 0.396636962890625, 0.4223175048828125, 0.447998046875, 0.4736785888671875, 0.499359130859375, 0.5250396728515625, 0.55072021484375, 0.5764007568359375, 0.602081298828125, 0.6277618408203125, 0.6534423828125, 0.6791229248046875, 0.704803466796875, 0.7304840087890625, 0.75616455078125, 0.7818450927734375, 0.807525634765625, 0.8332061767578125, 0.85888671875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 10.0, 8.0, 11.0, 11.0, 35.0, 55.0, 79.0, 156.0, 316.0, 854.0, 1311.0, 646.0, 267.0, 100.0, 67.0, 35.0, 34.0, 26.0, 10.0, 11.0, 8.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0576171875, -1.0268478393554688, -0.9960784912109375, -0.9653091430664062, -0.934539794921875, -0.9037704467773438, -0.8730010986328125, -0.8422317504882812, -0.81146240234375, -0.7806930541992188, -0.7499237060546875, -0.7191543579101562, -0.688385009765625, -0.6576156616210938, -0.6268463134765625, -0.5960769653320312, -0.5653076171875, -0.5345382690429688, -0.5037689208984375, -0.47299957275390625, -0.442230224609375, -0.41146087646484375, -0.3806915283203125, -0.34992218017578125, -0.31915283203125, -0.28838348388671875, -0.2576141357421875, -0.22684478759765625, -0.196075439453125, -0.16530609130859375, -0.1345367431640625, -0.10376739501953125, -0.072998046875, -0.04222869873046875, -0.0114593505859375, 0.01930999755859375, 0.050079345703125, 0.08084869384765625, 0.1116180419921875, 0.14238739013671875, 0.17315673828125, 0.20392608642578125, 0.2346954345703125, 0.26546478271484375, 0.296234130859375, 0.32700347900390625, 0.3577728271484375, 0.38854217529296875, 0.4193115234375, 0.45008087158203125, 0.4808502197265625, 0.5116195678710938, 0.542388916015625, 0.5731582641601562, 0.6039276123046875, 0.6346969604492188, 0.66546630859375, 0.6962356567382812, 0.7270050048828125, 0.7577743530273438, 0.788543701171875, 0.8193130493164062, 0.8500823974609375, 0.8808517456054688, 0.91162109375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 3.0, 10.0, 17.0, 16.0, 47.0, 90.0, 132.0, 174.0, 188.0, 141.0, 78.0, 37.0, 25.0, 12.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.493501663208008, -7.279058456420898, -7.064615726470947, -6.850172519683838, -6.6357293128967285, -6.421286582946777, -6.206843376159668, -5.992400169372559, -5.777956962585449, -5.56351375579834, -5.349071025848389, -5.134627819061279, -4.92018461227417, -4.705741882324219, -4.491298675537109, -4.27685546875, -4.062412261962891, -3.8479692935943604, -3.633526086807251, -3.4190831184387207, -3.2046399116516113, -2.990196943283081, -2.775753974914551, -2.5613107681274414, -2.3468680381774902, -2.13242506980896, -1.9179818630218506, -1.7035388946533203, -1.489095687866211, -1.2746527194976807, -1.0602096319198608, -0.845766544342041, -0.6313233375549316, -0.4168802499771118, -0.20243719220161438, 0.012005865573883057, 0.22644895315170288, 0.44089198112487793, 0.6553350687026978, 0.8697781562805176, 1.0842212438583374, 1.2986643314361572, 1.513107419013977, 1.7275505065917969, 1.9419934749603271, 2.1564364433288574, 2.370879650115967, 2.585322856903076, 2.7997658252716064, 3.0142087936401367, 3.228652000427246, 3.4430949687957764, 3.6575381755828857, 3.871981143951416, 4.086424350738525, 4.300867080688477, 4.515310287475586, 4.729753494262695, 4.9441962242126465, 5.158639430999756, 5.373082637786865, 5.587525367736816, 5.801968574523926, 6.016411781311035, 6.2308549880981445]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 10.0, 12.0, 11.0, 27.0, 29.0, 37.0, 41.0, 56.0, 57.0, 69.0, 68.0, 72.0, 77.0, 71.0, 68.0, 57.0, 50.0, 52.0, 42.0, 22.0, 26.0, 13.0, 15.0, 5.0, 10.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2524070739746094, -3.106252431869507, -2.960097551345825, -2.8139429092407227, -2.667788028717041, -2.5216333866119385, -2.375478744506836, -2.2293238639831543, -2.0831689834594727, -1.9370142221450806, -1.7908594608306885, -1.644704818725586, -1.4985499382019043, -1.3523952960968018, -1.2062405347824097, -1.0600857734680176, -0.913931131362915, -0.767776370048523, -0.6216216087341309, -0.47546690702438354, -0.32931214570999146, -0.18315738439559937, -0.03700268268585205, 0.10915207862854004, 0.25530683994293213, 0.4014616012573242, 0.5476163625717163, 0.6937710642814636, 0.8399258255958557, 0.9860805869102478, 1.1322352886199951, 1.2783900499343872, 1.4245448112487793, 1.5706995725631714, 1.7168543338775635, 1.863008975982666, 2.0091638565063477, 2.15531849861145, 2.3014731407165527, 2.4476280212402344, 2.593782901763916, 2.7399375438690186, 2.8860924243927, 3.0322470664978027, 3.1784019470214844, 3.324556589126587, 3.4707112312316895, 3.616866111755371, 3.7630207538604736, 3.909175395965576, 4.055330276489258, 4.2014851570129395, 4.347639560699463, 4.4937944412231445, 4.639949321746826, 4.786104202270508, 4.932258605957031, 5.078413486480713, 5.224567890167236, 5.370722770690918, 5.5168776512146, 5.663032531738281, 5.809186935424805, 5.955341815948486, 6.101496696472168]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 7.0, 9.0, 9.0, 16.0, 16.0, 27.0, 31.0, 62.0, 76.0, 104.0, 128.0, 255.0, 382.0, 597.0, 1004.0, 1803.0, 3241.0, 6463.0, 12998.0, 29751.0, 71678.0, 185008.0, 372428.0, 214466.0, 83086.0, 34179.0, 14911.0, 7357.0, 3613.0, 1925.0, 1112.0, 662.0, 379.0, 250.0, 167.0, 103.0, 82.0, 47.0, 32.0, 21.0, 16.0, 14.0, 20.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.701171875, -0.6774673461914062, -0.6537628173828125, -0.6300582885742188, -0.606353759765625, -0.5826492309570312, -0.5589447021484375, -0.5352401733398438, -0.51153564453125, -0.48783111572265625, -0.4641265869140625, -0.44042205810546875, -0.416717529296875, -0.39301300048828125, -0.3693084716796875, -0.34560394287109375, -0.3218994140625, -0.29819488525390625, -0.2744903564453125, -0.25078582763671875, -0.227081298828125, -0.20337677001953125, -0.1796722412109375, -0.15596771240234375, -0.13226318359375, -0.10855865478515625, -0.0848541259765625, -0.06114959716796875, -0.037445068359375, -0.01374053955078125, 0.0099639892578125, 0.03366851806640625, 0.057373046875, 0.08107757568359375, 0.1047821044921875, 0.12848663330078125, 0.152191162109375, 0.17589569091796875, 0.1996002197265625, 0.22330474853515625, 0.24700927734375, 0.27071380615234375, 0.2944183349609375, 0.31812286376953125, 0.341827392578125, 0.36553192138671875, 0.3892364501953125, 0.41294097900390625, 0.4366455078125, 0.46035003662109375, 0.4840545654296875, 0.5077590942382812, 0.531463623046875, 0.5551681518554688, 0.5788726806640625, 0.6025772094726562, 0.62628173828125, 0.6499862670898438, 0.6736907958984375, 0.6973953247070312, 0.721099853515625, 0.7448043823242188, 0.7685089111328125, 0.7922134399414062, 0.81591796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 7.0, 12.0, 11.0, 21.0, 20.0, 20.0, 24.0, 34.0, 42.0, 35.0, 41.0, 55.0, 39.0, 41.0, 66.0, 72.0, 64.0, 55.0, 54.0, 45.0, 45.0, 36.0, 35.0, 24.0, 21.0, 20.0, 10.0, 15.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35986328125, -0.3478584289550781, -0.33585357666015625, -0.3238487243652344, -0.3118438720703125, -0.2998390197753906, -0.28783416748046875, -0.2758293151855469, -0.263824462890625, -0.2518196105957031, -0.23981475830078125, -0.22780990600585938, -0.2158050537109375, -0.20380020141601562, -0.19179534912109375, -0.17979049682617188, -0.16778564453125, -0.15578079223632812, -0.14377593994140625, -0.13177108764648438, -0.1197662353515625, -0.10776138305664062, -0.09575653076171875, -0.08375167846679688, -0.071746826171875, -0.059741973876953125, -0.04773712158203125, -0.035732269287109375, -0.0237274169921875, -0.011722564697265625, 0.00028228759765625, 0.012287139892578125, 0.0242919921875, 0.036296844482421875, 0.04830169677734375, 0.060306549072265625, 0.0723114013671875, 0.08431625366210938, 0.09632110595703125, 0.10832595825195312, 0.120330810546875, 0.13233566284179688, 0.14434051513671875, 0.15634536743164062, 0.1683502197265625, 0.18035507202148438, 0.19235992431640625, 0.20436477661132812, 0.21636962890625, 0.22837448120117188, 0.24037933349609375, 0.2523841857910156, 0.2643890380859375, 0.2763938903808594, 0.28839874267578125, 0.3004035949707031, 0.312408447265625, 0.3244132995605469, 0.33641815185546875, 0.3484230041503906, 0.3604278564453125, 0.3724327087402344, 0.38443756103515625, 0.3964424133300781, 0.408447265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 14.0, 14.0, 23.0, 32.0, 61.0, 78.0, 147.0, 258.0, 511.0, 1092.0, 2563.0, 6373.0, 18882.0, 66045.0, 313933.0, 523422.0, 80305.0, 22012.0, 7499.0, 2843.0, 1243.0, 549.0, 275.0, 148.0, 81.0, 55.0, 32.0, 19.0, 16.0, 9.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8855743408203125, -0.850250244140625, -0.8149261474609375, -0.77960205078125, -0.7442779541015625, -0.708953857421875, -0.6736297607421875, -0.6383056640625, -0.6029815673828125, -0.567657470703125, -0.5323333740234375, -0.49700927734375, -0.4616851806640625, -0.426361083984375, -0.3910369873046875, -0.355712890625, -0.3203887939453125, -0.285064697265625, -0.2497406005859375, -0.21441650390625, -0.1790924072265625, -0.143768310546875, -0.1084442138671875, -0.0731201171875, -0.0377960205078125, -0.002471923828125, 0.0328521728515625, 0.06817626953125, 0.1035003662109375, 0.138824462890625, 0.1741485595703125, 0.20947265625, 0.2447967529296875, 0.280120849609375, 0.3154449462890625, 0.35076904296875, 0.3860931396484375, 0.421417236328125, 0.4567413330078125, 0.4920654296875, 0.5273895263671875, 0.562713623046875, 0.5980377197265625, 0.63336181640625, 0.6686859130859375, 0.704010009765625, 0.7393341064453125, 0.774658203125, 0.8099822998046875, 0.845306396484375, 0.8806304931640625, 0.91595458984375, 0.9512786865234375, 0.986602783203125, 1.0219268798828125, 1.0572509765625, 1.0925750732421875, 1.127899169921875, 1.1632232666015625, 1.19854736328125, 1.2338714599609375, 1.269195556640625, 1.3045196533203125, 1.33984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 0.0, 7.0, 4.0, 6.0, 7.0, 10.0, 12.0, 12.0, 13.0, 15.0, 14.0, 24.0, 24.0, 25.0, 25.0, 26.0, 32.0, 33.0, 42.0, 46.0, 40.0, 43.0, 46.0, 51.0, 50.0, 44.0, 34.0, 51.0, 30.0, 32.0, 20.0, 32.0, 17.0, 17.0, 24.0, 21.0, 15.0, 8.0, 11.0, 8.0, 8.0, 3.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.046875, -1.0137481689453125, -0.980621337890625, -0.9474945068359375, -0.91436767578125, -0.8812408447265625, -0.848114013671875, -0.8149871826171875, -0.7818603515625, -0.7487335205078125, -0.715606689453125, -0.6824798583984375, -0.64935302734375, -0.6162261962890625, -0.583099365234375, -0.5499725341796875, -0.516845703125, -0.4837188720703125, -0.450592041015625, -0.4174652099609375, -0.38433837890625, -0.3512115478515625, -0.318084716796875, -0.2849578857421875, -0.2518310546875, -0.2187042236328125, -0.185577392578125, -0.1524505615234375, -0.11932373046875, -0.0861968994140625, -0.053070068359375, -0.0199432373046875, 0.01318359375, 0.0463104248046875, 0.079437255859375, 0.1125640869140625, 0.14569091796875, 0.1788177490234375, 0.211944580078125, 0.2450714111328125, 0.2781982421875, 0.3113250732421875, 0.344451904296875, 0.3775787353515625, 0.41070556640625, 0.4438323974609375, 0.476959228515625, 0.5100860595703125, 0.543212890625, 0.5763397216796875, 0.609466552734375, 0.6425933837890625, 0.67572021484375, 0.7088470458984375, 0.741973876953125, 0.7751007080078125, 0.8082275390625, 0.8413543701171875, 0.874481201171875, 0.9076080322265625, 0.94073486328125, 0.9738616943359375, 1.006988525390625, 1.0401153564453125, 1.0732421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 11.0, 12.0, 18.0, 24.0, 40.0, 63.0, 109.0, 287.0, 631.0, 2014.0, 8497.0, 74806.0, 849545.0, 98672.0, 10029.0, 2395.0, 750.0, 301.0, 111.0, 79.0, 46.0, 26.0, 16.0, 8.0, 10.0, 6.0, 7.0, 12.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5087890625, -0.49213409423828125, -0.4754791259765625, -0.45882415771484375, -0.442169189453125, -0.42551422119140625, -0.4088592529296875, -0.39220428466796875, -0.37554931640625, -0.35889434814453125, -0.3422393798828125, -0.32558441162109375, -0.308929443359375, -0.29227447509765625, -0.2756195068359375, -0.25896453857421875, -0.2423095703125, -0.22565460205078125, -0.2089996337890625, -0.19234466552734375, -0.175689697265625, -0.15903472900390625, -0.1423797607421875, -0.12572479248046875, -0.10906982421875, -0.09241485595703125, -0.0757598876953125, -0.05910491943359375, -0.042449951171875, -0.02579498291015625, -0.0091400146484375, 0.00751495361328125, 0.024169921875, 0.04082489013671875, 0.0574798583984375, 0.07413482666015625, 0.090789794921875, 0.10744476318359375, 0.1240997314453125, 0.14075469970703125, 0.15740966796875, 0.17406463623046875, 0.1907196044921875, 0.20737457275390625, 0.224029541015625, 0.24068450927734375, 0.2573394775390625, 0.27399444580078125, 0.2906494140625, 0.30730438232421875, 0.3239593505859375, 0.34061431884765625, 0.357269287109375, 0.37392425537109375, 0.3905792236328125, 0.40723419189453125, 0.42388916015625, 0.44054412841796875, 0.4571990966796875, 0.47385406494140625, 0.490509033203125, 0.5071640014648438, 0.5238189697265625, 0.5404739379882812, 0.55712890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 4.0, 8.0, 10.0, 4.0, 12.0, 14.0, 23.0, 19.0, 28.0, 42.0, 79.0, 121.0, 145.0, 146.0, 107.0, 51.0, 57.0, 27.0, 20.0, 14.0, 12.0, 11.0, 8.0, 10.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010776519775390625, -0.00010438170284032822, -0.00010099820792675018, -9.761471301317215e-05, -9.423121809959412e-05, -9.084772318601608e-05, -8.746422827243805e-05, -8.408073335886002e-05, -8.069723844528198e-05, -7.731374353170395e-05, -7.393024861812592e-05, -7.054675370454788e-05, -6.716325879096985e-05, -6.377976387739182e-05, -6.039626896381378e-05, -5.701277405023575e-05, -5.3629279136657715e-05, -5.024578422307968e-05, -4.686228930950165e-05, -4.3478794395923615e-05, -4.009529948234558e-05, -3.671180456876755e-05, -3.3328309655189514e-05, -2.994481474161148e-05, -2.6561319828033447e-05, -2.3177824914455414e-05, -1.979433000087738e-05, -1.6410835087299347e-05, -1.3027340173721313e-05, -9.64384526014328e-06, -6.260350346565247e-06, -2.876855432987213e-06, 5.066394805908203e-07, 3.890134394168854e-06, 7.273629307746887e-06, 1.065712422132492e-05, 1.4040619134902954e-05, 1.7424114048480988e-05, 2.080760896205902e-05, 2.4191103875637054e-05, 2.7574598789215088e-05, 3.095809370279312e-05, 3.4341588616371155e-05, 3.772508352994919e-05, 4.110857844352722e-05, 4.4492073357105255e-05, 4.787556827068329e-05, 5.125906318426132e-05, 5.4642558097839355e-05, 5.802605301141739e-05, 6.140954792499542e-05, 6.479304283857346e-05, 6.817653775215149e-05, 7.156003266572952e-05, 7.494352757930756e-05, 7.832702249288559e-05, 8.171051740646362e-05, 8.509401232004166e-05, 8.847750723361969e-05, 9.186100214719772e-05, 9.524449706077576e-05, 9.862799197435379e-05, 0.00010201148688793182, 0.00010539498180150986, 0.00010877847671508789]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 1.0, 7.0, 5.0, 6.0, 9.0, 17.0, 24.0, 32.0, 49.0, 74.0, 146.0, 187.0, 358.0, 589.0, 1173.0, 2392.0, 5471.0, 14793.0, 51012.0, 257192.0, 588715.0, 89330.0, 22548.0, 7709.0, 3338.0, 1525.0, 732.0, 447.0, 259.0, 139.0, 86.0, 57.0, 42.0, 22.0, 25.0, 9.0, 18.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.266357421875, -0.2575340270996094, -0.24871063232421875, -0.23988723754882812, -0.2310638427734375, -0.22224044799804688, -0.21341705322265625, -0.20459365844726562, -0.195770263671875, -0.18694686889648438, -0.17812347412109375, -0.16930007934570312, -0.1604766845703125, -0.15165328979492188, -0.14282989501953125, -0.13400650024414062, -0.12518310546875, -0.11635971069335938, -0.10753631591796875, -0.09871292114257812, -0.0898895263671875, -0.08106613159179688, -0.07224273681640625, -0.06341934204101562, -0.054595947265625, -0.045772552490234375, -0.03694915771484375, -0.028125762939453125, -0.0193023681640625, -0.010478973388671875, -0.00165557861328125, 0.007167816162109375, 0.0159912109375, 0.024814605712890625, 0.03363800048828125, 0.042461395263671875, 0.0512847900390625, 0.060108184814453125, 0.06893157958984375, 0.07775497436523438, 0.086578369140625, 0.09540176391601562, 0.10422515869140625, 0.11304855346679688, 0.1218719482421875, 0.13069534301757812, 0.13951873779296875, 0.14834213256835938, 0.15716552734375, 0.16598892211914062, 0.17481231689453125, 0.18363571166992188, 0.1924591064453125, 0.20128250122070312, 0.21010589599609375, 0.21892929077148438, 0.227752685546875, 0.23657608032226562, 0.24539947509765625, 0.2542228698730469, 0.2630462646484375, 0.2718696594238281, 0.28069305419921875, 0.2895164489746094, 0.29833984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 6.0, 7.0, 8.0, 11.0, 9.0, 16.0, 24.0, 38.0, 36.0, 51.0, 76.0, 79.0, 90.0, 95.0, 100.0, 80.0, 62.0, 53.0, 30.0, 27.0, 25.0, 23.0, 10.0, 6.0, 10.0, 6.0, 7.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255126953125, -0.24578857421875, -0.2364501953125, -0.22711181640625, -0.2177734375, -0.20843505859375, -0.1990966796875, -0.18975830078125, -0.180419921875, -0.17108154296875, -0.1617431640625, -0.15240478515625, -0.14306640625, -0.13372802734375, -0.1243896484375, -0.11505126953125, -0.105712890625, -0.09637451171875, -0.0870361328125, -0.07769775390625, -0.068359375, -0.05902099609375, -0.0496826171875, -0.04034423828125, -0.031005859375, -0.02166748046875, -0.0123291015625, -0.00299072265625, 0.00634765625, 0.01568603515625, 0.0250244140625, 0.03436279296875, 0.043701171875, 0.05303955078125, 0.0623779296875, 0.07171630859375, 0.0810546875, 0.09039306640625, 0.0997314453125, 0.10906982421875, 0.118408203125, 0.12774658203125, 0.1370849609375, 0.14642333984375, 0.15576171875, 0.16510009765625, 0.1744384765625, 0.18377685546875, 0.193115234375, 0.20245361328125, 0.2117919921875, 0.22113037109375, 0.23046875, 0.23980712890625, 0.2491455078125, 0.25848388671875, 0.267822265625, 0.27716064453125, 0.2864990234375, 0.29583740234375, 0.30517578125, 0.31451416015625, 0.3238525390625, 0.33319091796875, 0.342529296875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 7.0, 15.0, 33.0, 82.0, 138.0, 322.0, 195.0, 90.0, 58.0, 26.0, 8.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.334053039550781, -7.981848239898682, -7.629642963409424, -7.277438163757324, -6.925232887268066, -6.573028087615967, -6.220823287963867, -5.868618011474609, -5.51641321182251, -5.16420841217041, -4.812003135681152, -4.459798336029053, -4.107593536376953, -3.7553882598876953, -3.4031834602355957, -3.050978422164917, -2.6987733840942383, -2.3465683460235596, -1.9943634271621704, -1.6421585083007812, -1.2899534702301025, -0.9377484321594238, -0.5855436325073242, -0.2333385944366455, 0.1188664436340332, 0.47107142210006714, 0.8232764005661011, 1.1754813194274902, 1.527686357498169, 1.8798913955688477, 2.2320961952209473, 2.584301233291626, 2.9365062713623047, 3.2887113094329834, 3.640916347503662, 3.9931211471557617, 4.3453264236450195, 4.697531223297119, 5.049736022949219, 5.401941299438477, 5.754146099090576, 6.106350898742676, 6.458556175231934, 6.810760974884033, 7.162965774536133, 7.515171051025391, 7.86737585067749, 8.21958065032959, 8.571785926818848, 8.923991203308105, 9.276195526123047, 9.628400802612305, 9.980606079101562, 10.33281135559082, 10.685015678405762, 11.03722095489502, 11.389425277709961, 11.741630554199219, 12.09383487701416, 12.446040153503418, 12.798245429992676, 13.150449752807617, 13.502655029296875, 13.854860305786133, 14.20706558227539]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 10.0, 10.0, 4.0, 11.0, 8.0, 10.0, 9.0, 12.0, 24.0, 17.0, 23.0, 12.0, 24.0, 28.0, 25.0, 32.0, 29.0, 39.0, 57.0, 59.0, 75.0, 59.0, 56.0, 40.0, 34.0, 40.0, 34.0, 37.0, 28.0, 14.0, 19.0, 23.0, 17.0, 12.0, 12.0, 12.0, 8.0, 4.0, 8.0, 4.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-5.045686721801758, -4.908112049102783, -4.770537376403809, -4.632962226867676, -4.495387554168701, -4.357812881469727, -4.220238208770752, -4.082663536071777, -3.9450886249542236, -3.807513952255249, -3.6699390411376953, -3.5323643684387207, -3.394789695739746, -3.2572147846221924, -3.1196401119232178, -2.982065200805664, -2.8444905281066895, -2.706915855407715, -2.569340944290161, -2.4317662715911865, -2.294191360473633, -2.156616687774658, -2.0190420150756836, -1.8814672231674194, -1.7438924312591553, -1.6063176393508911, -1.468742847442627, -1.3311681747436523, -1.1935933828353882, -1.056018590927124, -0.9184438586235046, -0.7808691263198853, -0.643294095993042, -0.5057193040847778, -0.36814457178115845, -0.23056980967521667, -0.0929950475692749, 0.04457974433898926, 0.18215447664260864, 0.319729208946228, 0.4573040008544922, 0.5948787927627563, 0.7324535250663757, 0.8700282573699951, 1.0076030492782593, 1.1451778411865234, 1.282752513885498, 1.4203273057937622, 1.5579020977020264, 1.6954768896102905, 1.8330516815185547, 1.9706263542175293, 2.108201026916504, 2.2457759380340576, 2.3833506107330322, 2.520925521850586, 2.6585001945495605, 2.796074867248535, 2.933649778366089, 3.0712244510650635, 3.208799362182617, 3.346374034881592, 3.4839487075805664, 3.621523380279541, 3.7590982913970947]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 7.0, 13.0, 17.0, 28.0, 34.0, 44.0, 63.0, 91.0, 146.0, 239.0, 374.0, 619.0, 1037.0, 1941.0, 4067.0, 10070.0, 35942.0, 238264.0, 2518564.0, 1230014.0, 115488.0, 22558.0, 7382.0, 3239.0, 1631.0, 886.0, 586.0, 346.0, 219.0, 138.0, 78.0, 66.0, 33.0, 20.0, 15.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.347808837890625, -0.33380126953125, -0.319793701171875, -0.3057861328125, -0.291778564453125, -0.27777099609375, -0.263763427734375, -0.249755859375, -0.235748291015625, -0.22174072265625, -0.207733154296875, -0.1937255859375, -0.179718017578125, -0.16571044921875, -0.151702880859375, -0.1376953125, -0.123687744140625, -0.10968017578125, -0.095672607421875, -0.0816650390625, -0.067657470703125, -0.05364990234375, -0.039642333984375, -0.025634765625, -0.011627197265625, 0.00238037109375, 0.016387939453125, 0.0303955078125, 0.044403076171875, 0.05841064453125, 0.072418212890625, 0.08642578125, 0.100433349609375, 0.11444091796875, 0.128448486328125, 0.1424560546875, 0.156463623046875, 0.17047119140625, 0.184478759765625, 0.198486328125, 0.212493896484375, 0.22650146484375, 0.240509033203125, 0.2545166015625, 0.268524169921875, 0.28253173828125, 0.296539306640625, 0.310546875, 0.324554443359375, 0.33856201171875, 0.352569580078125, 0.3665771484375, 0.380584716796875, 0.39459228515625, 0.408599853515625, 0.422607421875, 0.436614990234375, 0.45062255859375, 0.464630126953125, 0.4786376953125, 0.492645263671875, 0.50665283203125, 0.520660400390625, 0.53466796875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 6.0, 10.0, 16.0, 19.0, 20.0, 33.0, 33.0, 27.0, 31.0, 46.0, 47.0, 57.0, 55.0, 68.0, 67.0, 65.0, 51.0, 51.0, 41.0, 52.0, 37.0, 35.0, 22.0, 23.0, 20.0, 9.0, 15.0, 9.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.332275390625, -0.32083892822265625, -0.3094024658203125, -0.29796600341796875, -0.286529541015625, -0.27509307861328125, -0.2636566162109375, -0.25222015380859375, -0.24078369140625, -0.22934722900390625, -0.2179107666015625, -0.20647430419921875, -0.195037841796875, -0.18360137939453125, -0.1721649169921875, -0.16072845458984375, -0.1492919921875, -0.13785552978515625, -0.1264190673828125, -0.11498260498046875, -0.103546142578125, -0.09210968017578125, -0.0806732177734375, -0.06923675537109375, -0.05780029296875, -0.04636383056640625, -0.0349273681640625, -0.02349090576171875, -0.012054443359375, -0.00061798095703125, 0.0108184814453125, 0.02225494384765625, 0.03369140625, 0.04512786865234375, 0.0565643310546875, 0.06800079345703125, 0.079437255859375, 0.09087371826171875, 0.1023101806640625, 0.11374664306640625, 0.12518310546875, 0.13661956787109375, 0.1480560302734375, 0.15949249267578125, 0.170928955078125, 0.18236541748046875, 0.1938018798828125, 0.20523834228515625, 0.2166748046875, 0.22811126708984375, 0.2395477294921875, 0.25098419189453125, 0.262420654296875, 0.27385711669921875, 0.2852935791015625, 0.29673004150390625, 0.30816650390625, 0.31960296630859375, 0.3310394287109375, 0.34247589111328125, 0.353912353515625, 0.36534881591796875, 0.3767852783203125, 0.38822174072265625, 0.399658203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 10.0, 14.0, 19.0, 32.0, 51.0, 91.0, 99.0, 217.0, 377.0, 655.0, 1254.0, 2707.0, 6799.0, 20575.0, 107569.0, 2747142.0, 1211830.0, 69878.0, 15491.0, 5266.0, 2047.0, 964.0, 514.0, 267.0, 135.0, 96.0, 43.0, 40.0, 27.0, 22.0, 9.0, 12.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7422561645507812, -0.7203521728515625, -0.6984481811523438, -0.676544189453125, -0.6546401977539062, -0.6327362060546875, -0.6108322143554688, -0.58892822265625, -0.5670242309570312, -0.5451202392578125, -0.5232162475585938, -0.501312255859375, -0.47940826416015625, -0.4575042724609375, -0.43560028076171875, -0.4136962890625, -0.39179229736328125, -0.3698883056640625, -0.34798431396484375, -0.326080322265625, -0.30417633056640625, -0.2822723388671875, -0.26036834716796875, -0.23846435546875, -0.21656036376953125, -0.1946563720703125, -0.17275238037109375, -0.150848388671875, -0.12894439697265625, -0.1070404052734375, -0.08513641357421875, -0.063232421875, -0.04132843017578125, -0.0194244384765625, 0.00247955322265625, 0.024383544921875, 0.04628753662109375, 0.0681915283203125, 0.09009552001953125, 0.11199951171875, 0.13390350341796875, 0.1558074951171875, 0.17771148681640625, 0.199615478515625, 0.22151947021484375, 0.2434234619140625, 0.26532745361328125, 0.2872314453125, 0.30913543701171875, 0.3310394287109375, 0.35294342041015625, 0.374847412109375, 0.39675140380859375, 0.4186553955078125, 0.44055938720703125, 0.46246337890625, 0.48436737060546875, 0.5062713623046875, 0.5281753540039062, 0.550079345703125, 0.5719833374023438, 0.5938873291015625, 0.6157913208007812, 0.6376953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 2.0, 7.0, 9.0, 6.0, 11.0, 24.0, 38.0, 43.0, 73.0, 130.0, 274.0, 598.0, 1041.0, 862.0, 428.0, 218.0, 109.0, 65.0, 49.0, 27.0, 16.0, 14.0, 7.0, 4.0, 4.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75927734375, -0.7353897094726562, -0.7115020751953125, -0.6876144409179688, -0.663726806640625, -0.6398391723632812, -0.6159515380859375, -0.5920639038085938, -0.56817626953125, -0.5442886352539062, -0.5204010009765625, -0.49651336669921875, -0.472625732421875, -0.44873809814453125, -0.4248504638671875, -0.40096282958984375, -0.3770751953125, -0.35318756103515625, -0.3292999267578125, -0.30541229248046875, -0.281524658203125, -0.25763702392578125, -0.2337493896484375, -0.20986175537109375, -0.18597412109375, -0.16208648681640625, -0.1381988525390625, -0.11431121826171875, -0.090423583984375, -0.06653594970703125, -0.0426483154296875, -0.01876068115234375, 0.005126953125, 0.02901458740234375, 0.0529022216796875, 0.07678985595703125, 0.100677490234375, 0.12456512451171875, 0.1484527587890625, 0.17234039306640625, 0.19622802734375, 0.22011566162109375, 0.2440032958984375, 0.26789093017578125, 0.291778564453125, 0.31566619873046875, 0.3395538330078125, 0.36344146728515625, 0.3873291015625, 0.41121673583984375, 0.4351043701171875, 0.45899200439453125, 0.482879638671875, 0.5067672729492188, 0.5306549072265625, 0.5545425415039062, 0.57843017578125, 0.6023178100585938, 0.6262054443359375, 0.6500930786132812, 0.673980712890625, 0.6978683471679688, 0.7217559814453125, 0.7456436157226562, 0.76953125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 12.0, 37.0, 108.0, 235.0, 339.0, 168.0, 61.0, 15.0, 7.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.616809844970703, -16.29242515563965, -15.96804141998291, -15.643656730651855, -15.319272994995117, -14.994888305664062, -14.670503616333008, -14.346118927001953, -14.021735191345215, -13.69735050201416, -13.372966766357422, -13.048582077026367, -12.724197387695312, -12.399813652038574, -12.07542896270752, -11.751045227050781, -11.426660537719727, -11.102275848388672, -10.777892112731934, -10.453507423400879, -10.12912368774414, -9.804738998413086, -9.480354309082031, -9.155969619750977, -8.831585884094238, -8.507201194763184, -8.182817459106445, -7.858432769775391, -7.534048557281494, -7.209664344787598, -6.885279655456543, -6.5608954429626465, -6.23651123046875, -5.9121270179748535, -5.587742805480957, -5.263358116149902, -4.938973903656006, -4.614589691162109, -4.290205001831055, -3.965820789337158, -3.6414365768432617, -3.3170523643493652, -2.9926679134368896, -2.668283462524414, -2.3438992500305176, -2.019515037536621, -1.6951305866241455, -1.37074613571167, -1.0463619232177734, -0.7219775915145874, -0.39759325981140137, -0.07320892810821533, 0.2511754035949707, 0.5755597352981567, 0.8999440670013428, 1.2243285179138184, 1.5487127304077148, 1.8730970621109009, 2.197481393814087, 2.5218658447265625, 2.846250057220459, 3.1706342697143555, 3.495018720626831, 3.8194031715393066, 4.143787384033203]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 9.0, 10.0, 16.0, 16.0, 17.0, 31.0, 29.0, 34.0, 37.0, 30.0, 42.0, 42.0, 47.0, 55.0, 50.0, 66.0, 56.0, 47.0, 41.0, 43.0, 40.0, 32.0, 31.0, 26.0, 31.0, 22.0, 16.0, 18.0, 12.0, 8.0, 10.0, 8.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.011326789855957, -1.9330666065216064, -1.8548064231872559, -1.7765462398529053, -1.6982859373092651, -1.6200257539749146, -1.541765570640564, -1.4635052680969238, -1.3852450847625732, -1.3069849014282227, -1.228724718093872, -1.1504645347595215, -1.0722042322158813, -0.9939440488815308, -0.9156838655471802, -0.8374236226081848, -0.759163498878479, -0.6809033155441284, -0.6026430726051331, -0.5243828892707825, -0.4461226761341095, -0.3678624629974365, -0.28960227966308594, -0.21134203672409058, -0.13308185338974, -0.054821647703647614, 0.023438557982444763, 0.10169875621795654, 0.17995896935462952, 0.2582191824913025, 0.3364793658256531, 0.41473960876464844, 0.492999792098999, 0.5712599754333496, 0.649520218372345, 0.7277804017066956, 0.8060406446456909, 0.8843008279800415, 0.9625610113143921, 1.0408213138580322, 1.1190814971923828, 1.1973416805267334, 1.275601863861084, 1.3538620471954346, 1.4321223497390747, 1.5103825330734253, 1.5886427164077759, 1.666903018951416, 1.745163083076477, 1.8234232664108276, 1.9016834497451782, 1.9799437522888184, 2.058203935623169, 2.1364641189575195, 2.21472430229187, 2.2929844856262207, 2.3712446689605713, 2.449504852294922, 2.5277650356292725, 2.606025218963623, 2.6842854022979736, 2.762545585632324, 2.840806007385254, 2.9190661907196045, 2.997326374053955]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 2.0, 6.0, 9.0, 5.0, 22.0, 22.0, 37.0, 48.0, 73.0, 127.0, 170.0, 260.0, 446.0, 672.0, 1129.0, 1850.0, 3333.0, 6286.0, 13227.0, 33351.0, 104588.0, 407204.0, 337347.0, 85486.0, 28139.0, 11690.0, 5532.0, 3065.0, 1667.0, 1012.0, 594.0, 388.0, 259.0, 175.0, 95.0, 77.0, 51.0, 40.0, 20.0, 15.0, 11.0, 7.0, 9.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1728515625, -1.1372222900390625, -1.101593017578125, -1.0659637451171875, -1.03033447265625, -0.9947052001953125, -0.959075927734375, -0.9234466552734375, -0.8878173828125, -0.8521881103515625, -0.816558837890625, -0.7809295654296875, -0.74530029296875, -0.7096710205078125, -0.674041748046875, -0.6384124755859375, -0.602783203125, -0.5671539306640625, -0.531524658203125, -0.4958953857421875, -0.46026611328125, -0.4246368408203125, -0.389007568359375, -0.3533782958984375, -0.3177490234375, -0.2821197509765625, -0.246490478515625, -0.2108612060546875, -0.17523193359375, -0.1396026611328125, -0.103973388671875, -0.0683441162109375, -0.03271484375, 0.0029144287109375, 0.038543701171875, 0.0741729736328125, 0.10980224609375, 0.1454315185546875, 0.181060791015625, 0.2166900634765625, 0.2523193359375, 0.2879486083984375, 0.323577880859375, 0.3592071533203125, 0.39483642578125, 0.4304656982421875, 0.466094970703125, 0.5017242431640625, 0.537353515625, 0.5729827880859375, 0.608612060546875, 0.6442413330078125, 0.67987060546875, 0.7154998779296875, 0.751129150390625, 0.7867584228515625, 0.8223876953125, 0.8580169677734375, 0.893646240234375, 0.9292755126953125, 0.96490478515625, 1.0005340576171875, 1.036163330078125, 1.0717926025390625, 1.107421875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 1.0, 3.0, 4.0, 3.0, 13.0, 5.0, 13.0, 20.0, 23.0, 28.0, 24.0, 23.0, 26.0, 44.0, 47.0, 41.0, 45.0, 52.0, 72.0, 68.0, 52.0, 50.0, 43.0, 61.0, 35.0, 41.0, 36.0, 34.0, 17.0, 20.0, 16.0, 9.0, 9.0, 7.0, 8.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.3280754089355469, -0.31679534912109375, -0.3055152893066406, -0.2942352294921875, -0.2829551696777344, -0.27167510986328125, -0.2603950500488281, -0.249114990234375, -0.23783493041992188, -0.22655487060546875, -0.21527481079101562, -0.2039947509765625, -0.19271469116210938, -0.18143463134765625, -0.17015457153320312, -0.15887451171875, -0.14759445190429688, -0.13631439208984375, -0.12503433227539062, -0.1137542724609375, -0.10247421264648438, -0.09119415283203125, -0.07991409301757812, -0.068634033203125, -0.057353973388671875, -0.04607391357421875, -0.034793853759765625, -0.0235137939453125, -0.012233734130859375, -0.00095367431640625, 0.010326385498046875, 0.0216064453125, 0.032886505126953125, 0.04416656494140625, 0.055446624755859375, 0.0667266845703125, 0.07800674438476562, 0.08928680419921875, 0.10056686401367188, 0.111846923828125, 0.12312698364257812, 0.13440704345703125, 0.14568710327148438, 0.1569671630859375, 0.16824722290039062, 0.17952728271484375, 0.19080734252929688, 0.20208740234375, 0.21336746215820312, 0.22464752197265625, 0.23592758178710938, 0.2472076416015625, 0.2584877014160156, 0.26976776123046875, 0.2810478210449219, 0.292327880859375, 0.3036079406738281, 0.31488800048828125, 0.3261680603027344, 0.3374481201171875, 0.3487281799316406, 0.36000823974609375, 0.3712882995605469, 0.382568359375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 6.0, 11.0, 12.0, 17.0, 30.0, 36.0, 66.0, 104.0, 159.0, 297.0, 534.0, 947.0, 1922.0, 3929.0, 8836.0, 22284.0, 70780.0, 306272.0, 507415.0, 81552.0, 25013.0, 9620.0, 4166.0, 2064.0, 1023.0, 584.0, 334.0, 187.0, 114.0, 76.0, 46.0, 31.0, 20.0, 14.0, 17.0, 4.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.78662109375, -0.7575454711914062, -0.7284698486328125, -0.6993942260742188, -0.670318603515625, -0.6412429809570312, -0.6121673583984375, -0.5830917358398438, -0.55401611328125, -0.5249404907226562, -0.4958648681640625, -0.46678924560546875, -0.437713623046875, -0.40863800048828125, -0.3795623779296875, -0.35048675537109375, -0.3214111328125, -0.29233551025390625, -0.2632598876953125, -0.23418426513671875, -0.205108642578125, -0.17603302001953125, -0.1469573974609375, -0.11788177490234375, -0.08880615234375, -0.05973052978515625, -0.0306549072265625, -0.00157928466796875, 0.027496337890625, 0.05657196044921875, 0.0856475830078125, 0.11472320556640625, 0.143798828125, 0.17287445068359375, 0.2019500732421875, 0.23102569580078125, 0.260101318359375, 0.28917694091796875, 0.3182525634765625, 0.34732818603515625, 0.37640380859375, 0.40547943115234375, 0.4345550537109375, 0.46363067626953125, 0.492706298828125, 0.5217819213867188, 0.5508575439453125, 0.5799331665039062, 0.6090087890625, 0.6380844116210938, 0.6671600341796875, 0.6962356567382812, 0.725311279296875, 0.7543869018554688, 0.7834625244140625, 0.8125381469726562, 0.84161376953125, 0.8706893920898438, 0.8997650146484375, 0.9288406372070312, 0.957916259765625, 0.9869918823242188, 1.0160675048828125, 1.0451431274414062, 1.07421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 5.0, 10.0, 13.0, 15.0, 15.0, 25.0, 13.0, 23.0, 29.0, 42.0, 30.0, 42.0, 53.0, 44.0, 54.0, 36.0, 43.0, 54.0, 49.0, 54.0, 46.0, 48.0, 29.0, 42.0, 23.0, 19.0, 19.0, 21.0, 20.0, 16.0, 10.0, 3.0, 8.0, 10.0, 10.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94580078125, -0.9135360717773438, -0.8812713623046875, -0.8490066528320312, -0.816741943359375, -0.7844772338867188, -0.7522125244140625, -0.7199478149414062, -0.68768310546875, -0.6554183959960938, -0.6231536865234375, -0.5908889770507812, -0.558624267578125, -0.5263595581054688, -0.4940948486328125, -0.46183013916015625, -0.4295654296875, -0.39730072021484375, -0.3650360107421875, -0.33277130126953125, -0.300506591796875, -0.26824188232421875, -0.2359771728515625, -0.20371246337890625, -0.17144775390625, -0.13918304443359375, -0.1069183349609375, -0.07465362548828125, -0.042388916015625, -0.01012420654296875, 0.0221405029296875, 0.05440521240234375, 0.086669921875, 0.11893463134765625, 0.1511993408203125, 0.18346405029296875, 0.215728759765625, 0.24799346923828125, 0.2802581787109375, 0.31252288818359375, 0.34478759765625, 0.37705230712890625, 0.4093170166015625, 0.44158172607421875, 0.473846435546875, 0.5061111450195312, 0.5383758544921875, 0.5706405639648438, 0.6029052734375, 0.6351699829101562, 0.6674346923828125, 0.6996994018554688, 0.731964111328125, 0.7642288208007812, 0.7964935302734375, 0.8287582397460938, 0.86102294921875, 0.8932876586914062, 0.9255523681640625, 0.9578170776367188, 0.990081787109375, 1.0223464965820312, 1.0546112060546875, 1.0868759155273438, 1.119140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 14.0, 21.0, 30.0, 67.0, 119.0, 324.0, 782.0, 2422.0, 12862.0, 185455.0, 803920.0, 35640.0, 4784.0, 1264.0, 432.0, 183.0, 100.0, 42.0, 31.0, 13.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.69482421875, -0.6756439208984375, -0.656463623046875, -0.6372833251953125, -0.61810302734375, -0.5989227294921875, -0.579742431640625, -0.5605621337890625, -0.5413818359375, -0.5222015380859375, -0.503021240234375, -0.4838409423828125, -0.46466064453125, -0.4454803466796875, -0.426300048828125, -0.4071197509765625, -0.387939453125, -0.3687591552734375, -0.349578857421875, -0.3303985595703125, -0.31121826171875, -0.2920379638671875, -0.272857666015625, -0.2536773681640625, -0.2344970703125, -0.2153167724609375, -0.196136474609375, -0.1769561767578125, -0.15777587890625, -0.1385955810546875, -0.119415283203125, -0.1002349853515625, -0.0810546875, -0.0618743896484375, -0.042694091796875, -0.0235137939453125, -0.00433349609375, 0.0148468017578125, 0.034027099609375, 0.0532073974609375, 0.0723876953125, 0.0915679931640625, 0.110748291015625, 0.1299285888671875, 0.14910888671875, 0.1682891845703125, 0.187469482421875, 0.2066497802734375, 0.225830078125, 0.2450103759765625, 0.264190673828125, 0.2833709716796875, 0.30255126953125, 0.3217315673828125, 0.340911865234375, 0.3600921630859375, 0.3792724609375, 0.3984527587890625, 0.417633056640625, 0.4368133544921875, 0.45599365234375, 0.4751739501953125, 0.494354248046875, 0.5135345458984375, 0.53271484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 17.0, 24.0, 41.0, 83.0, 118.0, 180.0, 179.0, 148.0, 74.0, 47.0, 30.0, 23.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012767314910888672, -0.00012314878404140472, -0.00011862441897392273, -0.00011410005390644073, -0.00010957568883895874, -0.00010505132377147675, -0.00010052695870399475, -9.600259363651276e-05, -9.147822856903076e-05, -8.695386350154877e-05, -8.242949843406677e-05, -7.790513336658478e-05, -7.338076829910278e-05, -6.885640323162079e-05, -6.43320381641388e-05, -5.98076730966568e-05, -5.5283308029174805e-05, -5.075894296169281e-05, -4.6234577894210815e-05, -4.171021282672882e-05, -3.7185847759246826e-05, -3.266148269176483e-05, -2.8137117624282837e-05, -2.3612752556800842e-05, -1.9088387489318848e-05, -1.4564022421836853e-05, -1.0039657354354858e-05, -5.515292286872864e-06, -9.909272193908691e-07, 3.5334378480911255e-06, 8.05780291557312e-06, 1.2582167983055115e-05, 1.710653305053711e-05, 2.1630898118019104e-05, 2.61552631855011e-05, 3.067962825298309e-05, 3.520399332046509e-05, 3.972835838794708e-05, 4.425272345542908e-05, 4.877708852291107e-05, 5.3301453590393066e-05, 5.782581865787506e-05, 6.235018372535706e-05, 6.687454879283905e-05, 7.139891386032104e-05, 7.592327892780304e-05, 8.044764399528503e-05, 8.497200906276703e-05, 8.949637413024902e-05, 9.402073919773102e-05, 9.854510426521301e-05, 0.00010306946933269501, 0.000107593834400177, 0.000112118199467659, 0.00011664256453514099, 0.00012116692960262299, 0.00012569129467010498, 0.00013021565973758698, 0.00013474002480506897, 0.00013926438987255096, 0.00014378875494003296, 0.00014831312000751495, 0.00015283748507499695, 0.00015736185014247894, 0.00016188621520996094]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 8.0, 12.0, 16.0, 33.0, 74.0, 105.0, 168.0, 392.0, 858.0, 2126.0, 6610.0, 28692.0, 218383.0, 700778.0, 71190.0, 13091.0, 3598.0, 1250.0, 550.0, 288.0, 140.0, 80.0, 47.0, 22.0, 13.0, 10.0, 9.0, 4.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322998046875, -0.31069183349609375, -0.2983856201171875, -0.28607940673828125, -0.273773193359375, -0.26146697998046875, -0.2491607666015625, -0.23685455322265625, -0.22454833984375, -0.21224212646484375, -0.1999359130859375, -0.18762969970703125, -0.175323486328125, -0.16301727294921875, -0.1507110595703125, -0.13840484619140625, -0.1260986328125, -0.11379241943359375, -0.1014862060546875, -0.08917999267578125, -0.076873779296875, -0.06456756591796875, -0.0522613525390625, -0.03995513916015625, -0.02764892578125, -0.01534271240234375, -0.0030364990234375, 0.00926971435546875, 0.021575927734375, 0.03388214111328125, 0.0461883544921875, 0.05849456787109375, 0.07080078125, 0.08310699462890625, 0.0954132080078125, 0.10771942138671875, 0.120025634765625, 0.13233184814453125, 0.1446380615234375, 0.15694427490234375, 0.16925048828125, 0.18155670166015625, 0.1938629150390625, 0.20616912841796875, 0.218475341796875, 0.23078155517578125, 0.2430877685546875, 0.25539398193359375, 0.2677001953125, 0.28000640869140625, 0.2923126220703125, 0.30461883544921875, 0.316925048828125, 0.32923126220703125, 0.3415374755859375, 0.35384368896484375, 0.36614990234375, 0.37845611572265625, 0.3907623291015625, 0.40306854248046875, 0.415374755859375, 0.42768096923828125, 0.4399871826171875, 0.45229339599609375, 0.464599609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 7.0, 12.0, 13.0, 12.0, 17.0, 34.0, 46.0, 71.0, 77.0, 89.0, 101.0, 115.0, 87.0, 91.0, 52.0, 45.0, 29.0, 20.0, 24.0, 14.0, 7.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.288818359375, -0.2798004150390625, -0.270782470703125, -0.2617645263671875, -0.25274658203125, -0.2437286376953125, -0.234710693359375, -0.2256927490234375, -0.2166748046875, -0.2076568603515625, -0.198638916015625, -0.1896209716796875, -0.18060302734375, -0.1715850830078125, -0.162567138671875, -0.1535491943359375, -0.14453125, -0.1355133056640625, -0.126495361328125, -0.1174774169921875, -0.10845947265625, -0.0994415283203125, -0.090423583984375, -0.0814056396484375, -0.0723876953125, -0.0633697509765625, -0.054351806640625, -0.0453338623046875, -0.03631591796875, -0.0272979736328125, -0.018280029296875, -0.0092620849609375, -0.000244140625, 0.0087738037109375, 0.017791748046875, 0.0268096923828125, 0.03582763671875, 0.0448455810546875, 0.053863525390625, 0.0628814697265625, 0.0718994140625, 0.0809173583984375, 0.089935302734375, 0.0989532470703125, 0.10797119140625, 0.1169891357421875, 0.126007080078125, 0.1350250244140625, 0.14404296875, 0.1530609130859375, 0.162078857421875, 0.1710968017578125, 0.18011474609375, 0.1891326904296875, 0.198150634765625, 0.2071685791015625, 0.2161865234375, 0.2252044677734375, 0.234222412109375, 0.2432403564453125, 0.25225830078125, 0.2612762451171875, 0.270294189453125, 0.2793121337890625, 0.288330078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 20.0, 24.0, 57.0, 66.0, 184.0, 258.0, 137.0, 80.0, 69.0, 36.0, 27.0, 10.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.147005081176758, -6.918535232543945, -6.690065383911133, -6.4615960121154785, -6.233126163482666, -6.0046563148498535, -5.776186943054199, -5.547717094421387, -5.319247245788574, -5.090777397155762, -4.862307548522949, -4.633838176727295, -4.405368328094482, -4.17689847946167, -3.9484288692474365, -3.719959259033203, -3.4914894104003906, -3.263019561767578, -3.0345499515533447, -2.8060803413391113, -2.577610492706299, -2.3491406440734863, -2.120671033859253, -1.89220130443573, -1.663731575012207, -1.435261845588684, -1.2067921161651611, -0.9783223867416382, -0.7498526573181152, -0.5213829278945923, -0.29291319847106934, -0.06444346904754639, 0.16402673721313477, 0.3924964666366577, 0.6209661960601807, 0.8494359254837036, 1.0779056549072266, 1.3063753843307495, 1.5348451137542725, 1.7633148431777954, 1.9917845726013184, 2.220254421234131, 2.4487240314483643, 2.6771936416625977, 2.90566349029541, 3.1341333389282227, 3.362602949142456, 3.5910725593566895, 3.819542407989502, 4.0480122566223145, 4.276481628417969, 4.504951477050781, 4.733421325683594, 4.961891174316406, 5.190361022949219, 5.418830394744873, 5.6473002433776855, 5.875770092010498, 6.104239463806152, 6.332709312438965, 6.561179161071777, 6.78964900970459, 7.018118858337402, 7.246588230133057, 7.475058078765869]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 11.0, 3.0, 9.0, 5.0, 11.0, 13.0, 17.0, 16.0, 11.0, 17.0, 25.0, 23.0, 24.0, 21.0, 27.0, 33.0, 40.0, 41.0, 56.0, 69.0, 81.0, 65.0, 52.0, 39.0, 45.0, 34.0, 23.0, 29.0, 23.0, 26.0, 26.0, 8.0, 11.0, 13.0, 11.0, 8.0, 6.0, 7.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.6752586364746094, -3.5616910457611084, -3.4481232166290283, -3.3345556259155273, -3.2209877967834473, -3.1074202060699463, -2.9938526153564453, -2.8802847862243652, -2.7667171955108643, -2.6531496047973633, -2.539581775665283, -2.4260141849517822, -2.312446355819702, -2.198878765106201, -2.085310935974121, -1.9717433452606201, -1.8581756353378296, -1.744607925415039, -1.6310402154922485, -1.517472505569458, -1.403904914855957, -1.2903372049331665, -1.176769495010376, -1.063201904296875, -0.9496341347694397, -0.8360664248466492, -0.7224987745285034, -0.6089310646057129, -0.49536338448524475, -0.3817957043647766, -0.2682279944419861, -0.15466034412384033, -0.041092634201049805, 0.07247505336999893, 0.18604274094104767, 0.299610435962677, 0.41317811608314514, 0.5267457962036133, 0.6403135061264038, 0.7538811564445496, 0.8674488663673401, 0.9810165762901306, 1.0945842266082764, 1.208151936531067, 1.3217196464538574, 1.4352872371673584, 1.5488550662994385, 1.6624226570129395, 1.77599036693573, 1.8895580768585205, 2.0031256675720215, 2.1166934967041016, 2.2302610874176025, 2.3438286781311035, 2.4573965072631836, 2.5709640979766846, 2.6845319271087646, 2.7980995178222656, 2.9116673469543457, 3.0252349376678467, 3.1388027667999268, 3.2523703575134277, 3.365938186645508, 3.479505777359009, 3.5930733680725098]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 4.0, 3.0, 5.0, 11.0, 8.0, 9.0, 14.0, 21.0, 16.0, 14.0, 26.0, 26.0, 53.0, 55.0, 69.0, 84.0, 82.0, 145.0, 174.0, 303.0, 447.0, 832.0, 1904.0, 8558.0, 3216510.0, 954989.0, 6057.0, 1602.0, 776.0, 432.0, 266.0, 140.0, 120.0, 88.0, 93.0, 61.0, 41.0, 55.0, 38.0, 29.0, 24.0, 20.0, 15.0, 17.0, 18.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 4.0], "bins": [-2.234375, -2.1685028076171875, -2.102630615234375, -2.0367584228515625, -1.97088623046875, -1.9050140380859375, -1.839141845703125, -1.7732696533203125, -1.7073974609375, -1.6415252685546875, -1.575653076171875, -1.5097808837890625, -1.44390869140625, -1.3780364990234375, -1.312164306640625, -1.2462921142578125, -1.180419921875, -1.1145477294921875, -1.048675537109375, -0.9828033447265625, -0.91693115234375, -0.8510589599609375, -0.785186767578125, -0.7193145751953125, -0.6534423828125, -0.5875701904296875, -0.521697998046875, -0.4558258056640625, -0.38995361328125, -0.3240814208984375, -0.258209228515625, -0.1923370361328125, -0.12646484375, -0.0605926513671875, 0.005279541015625, 0.0711517333984375, 0.13702392578125, 0.2028961181640625, 0.268768310546875, 0.3346405029296875, 0.4005126953125, 0.4663848876953125, 0.532257080078125, 0.5981292724609375, 0.66400146484375, 0.7298736572265625, 0.795745849609375, 0.8616180419921875, 0.927490234375, 0.9933624267578125, 1.059234619140625, 1.1251068115234375, 1.19097900390625, 1.2568511962890625, 1.322723388671875, 1.3885955810546875, 1.4544677734375, 1.5203399658203125, 1.586212158203125, 1.6520843505859375, 1.71795654296875, 1.7838287353515625, 1.849700927734375, 1.9155731201171875, 1.9814453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 14.0, 14.0, 13.0, 22.0, 26.0, 26.0, 37.0, 50.0, 38.0, 45.0, 51.0, 51.0, 79.0, 53.0, 52.0, 60.0, 57.0, 44.0, 60.0, 35.0, 33.0, 30.0, 28.0, 16.0, 14.0, 20.0, 3.0, 6.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.346923828125, -0.3351325988769531, -0.32334136962890625, -0.3115501403808594, -0.2997589111328125, -0.2879676818847656, -0.27617645263671875, -0.2643852233886719, -0.252593994140625, -0.24080276489257812, -0.22901153564453125, -0.21722030639648438, -0.2054290771484375, -0.19363784790039062, -0.18184661865234375, -0.17005538940429688, -0.15826416015625, -0.14647293090820312, -0.13468170166015625, -0.12289047241210938, -0.1110992431640625, -0.09930801391601562, -0.08751678466796875, -0.07572555541992188, -0.063934326171875, -0.052143096923828125, -0.04035186767578125, -0.028560638427734375, -0.0167694091796875, -0.004978179931640625, 0.00681304931640625, 0.018604278564453125, 0.0303955078125, 0.042186737060546875, 0.05397796630859375, 0.06576919555664062, 0.0775604248046875, 0.08935165405273438, 0.10114288330078125, 0.11293411254882812, 0.124725341796875, 0.13651657104492188, 0.14830780029296875, 0.16009902954101562, 0.1718902587890625, 0.18368148803710938, 0.19547271728515625, 0.20726394653320312, 0.21905517578125, 0.23084640502929688, 0.24263763427734375, 0.2544288635253906, 0.2662200927734375, 0.2780113220214844, 0.28980255126953125, 0.3015937805175781, 0.313385009765625, 0.3251762390136719, 0.33696746826171875, 0.3487586975097656, 0.3605499267578125, 0.3723411560058594, 0.38413238525390625, 0.3959236145019531, 0.40771484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 5.0, 7.0, 11.0, 31.0, 58.0, 125.0, 253.0, 663.0, 1996.0, 19219.0, 4120966.0, 47242.0, 2440.0, 707.0, 311.0, 131.0, 56.0, 23.0, 14.0, 3.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.763671875, -2.673370361328125, -2.58306884765625, -2.492767333984375, -2.4024658203125, -2.312164306640625, -2.22186279296875, -2.131561279296875, -2.041259765625, -1.950958251953125, -1.86065673828125, -1.770355224609375, -1.6800537109375, -1.589752197265625, -1.49945068359375, -1.409149169921875, -1.31884765625, -1.228546142578125, -1.13824462890625, -1.047943115234375, -0.9576416015625, -0.867340087890625, -0.77703857421875, -0.686737060546875, -0.596435546875, -0.506134033203125, -0.41583251953125, -0.325531005859375, -0.2352294921875, -0.144927978515625, -0.05462646484375, 0.035675048828125, 0.1259765625, 0.216278076171875, 0.30657958984375, 0.396881103515625, 0.4871826171875, 0.577484130859375, 0.66778564453125, 0.758087158203125, 0.848388671875, 0.938690185546875, 1.02899169921875, 1.119293212890625, 1.2095947265625, 1.299896240234375, 1.39019775390625, 1.480499267578125, 1.57080078125, 1.661102294921875, 1.75140380859375, 1.841705322265625, 1.9320068359375, 2.022308349609375, 2.11260986328125, 2.202911376953125, 2.293212890625, 2.383514404296875, 2.47381591796875, 2.564117431640625, 2.6544189453125, 2.744720458984375, 2.83502197265625, 2.925323486328125, 3.015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 10.0, 20.0, 30.0, 50.0, 114.0, 345.0, 1354.0, 1480.0, 442.0, 115.0, 65.0, 22.0, 11.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8603515625, -1.8087310791015625, -1.757110595703125, -1.7054901123046875, -1.65386962890625, -1.6022491455078125, -1.550628662109375, -1.4990081787109375, -1.4473876953125, -1.3957672119140625, -1.344146728515625, -1.2925262451171875, -1.24090576171875, -1.1892852783203125, -1.137664794921875, -1.0860443115234375, -1.034423828125, -0.9828033447265625, -0.931182861328125, -0.8795623779296875, -0.82794189453125, -0.7763214111328125, -0.724700927734375, -0.6730804443359375, -0.6214599609375, -0.5698394775390625, -0.518218994140625, -0.4665985107421875, -0.41497802734375, -0.3633575439453125, -0.311737060546875, -0.2601165771484375, -0.20849609375, -0.1568756103515625, -0.105255126953125, -0.0536346435546875, -0.00201416015625, 0.0496063232421875, 0.101226806640625, 0.1528472900390625, 0.2044677734375, 0.2560882568359375, 0.307708740234375, 0.3593292236328125, 0.41094970703125, 0.4625701904296875, 0.514190673828125, 0.5658111572265625, 0.617431640625, 0.6690521240234375, 0.720672607421875, 0.7722930908203125, 0.82391357421875, 0.8755340576171875, 0.927154541015625, 0.9787750244140625, 1.0303955078125, 1.0820159912109375, 1.133636474609375, 1.1852569580078125, 1.23687744140625, 1.2884979248046875, 1.340118408203125, 1.3917388916015625, 1.443359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 15.0, 20.0, 41.0, 71.0, 131.0, 196.0, 221.0, 163.0, 73.0, 28.0, 8.0, 7.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.95085620880127, -13.605608940124512, -13.260361671447754, -12.915114402770996, -12.569867134094238, -12.22461986541748, -11.879372596740723, -11.534125328063965, -11.188878059387207, -10.84363079071045, -10.498383522033691, -10.153136253356934, -9.807888984680176, -9.462641716003418, -9.11739444732666, -8.772147178649902, -8.426899909973145, -8.081652641296387, -7.736405372619629, -7.391158103942871, -7.045910835266113, -6.7006635665893555, -6.355416297912598, -6.01016902923584, -5.664921760559082, -5.319674491882324, -4.974427223205566, -4.629179954528809, -4.283932685852051, -3.938685417175293, -3.593438148498535, -3.2481908798217773, -2.9029436111450195, -2.5576963424682617, -2.212449073791504, -1.867201805114746, -1.5219545364379883, -1.1767072677612305, -0.8314599990844727, -0.48621273040771484, -0.14096546173095703, 0.20428180694580078, 0.5495290756225586, 0.8947763442993164, 1.2400236129760742, 1.585270881652832, 1.9305181503295898, 2.2757654190063477, 2.6210126876831055, 2.9662599563598633, 3.311507225036621, 3.656754493713379, 4.002001762390137, 4.3472490310668945, 4.692496299743652, 5.03774356842041, 5.382990837097168, 5.728238105773926, 6.073485374450684, 6.418732643127441, 6.763979911804199, 7.109227180480957, 7.454474449157715, 7.799721717834473, 8.14496898651123]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 3.0, 3.0, 11.0, 7.0, 14.0, 12.0, 20.0, 27.0, 20.0, 28.0, 40.0, 30.0, 31.0, 33.0, 41.0, 41.0, 60.0, 49.0, 38.0, 39.0, 34.0, 41.0, 56.0, 38.0, 40.0, 37.0, 38.0, 28.0, 20.0, 22.0, 18.0, 14.0, 14.0, 14.0, 6.0, 9.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4690582752227783, -3.3464033603668213, -3.2237484455108643, -3.1010935306549072, -2.97843861579895, -2.855783700942993, -2.733128547668457, -2.6104736328125, -2.487818717956543, -2.365163803100586, -2.242508888244629, -2.119853973388672, -1.9971990585327148, -1.8745441436767578, -1.7518891096115112, -1.6292341947555542, -1.5065793991088867, -1.3839244842529297, -1.2612695693969727, -1.1386146545410156, -1.0159597396850586, -0.8933047652244568, -0.770649790763855, -0.647994875907898, -0.5253399610519409, -0.4026850461959839, -0.28003010153770447, -0.15737515687942505, -0.03472024202346802, 0.08793467283248901, 0.21058964729309082, 0.33324456214904785, 0.4558992385864258, 0.5785541534423828, 0.7012090682983398, 0.8238640427589417, 0.9465189576148987, 1.069173812866211, 1.1918288469314575, 1.3144837617874146, 1.4371386766433716, 1.5597935914993286, 1.6824485063552856, 1.8051035404205322, 1.9277584552764893, 2.0504133701324463, 2.1730682849884033, 2.2957231998443604, 2.4183781147003174, 2.5410330295562744, 2.6636879444122314, 2.7863428592681885, 2.9089977741241455, 3.0316526889801025, 3.1543078422546387, 3.2769627571105957, 3.3996176719665527, 3.5222725868225098, 3.644927501678467, 3.767582416534424, 3.890237331390381, 4.012892246246338, 4.135547161102295, 4.258202075958252, 4.380856990814209]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 7.0, 5.0, 14.0, 8.0, 17.0, 28.0, 39.0, 67.0, 74.0, 123.0, 200.0, 284.0, 407.0, 613.0, 957.0, 1611.0, 2766.0, 4785.0, 8634.0, 16518.0, 34073.0, 77404.0, 199343.0, 366065.0, 191739.0, 73736.0, 32943.0, 16079.0, 8366.0, 4613.0, 2671.0, 1507.0, 979.0, 632.0, 427.0, 236.0, 172.0, 128.0, 81.0, 58.0, 39.0, 35.0, 24.0, 16.0, 9.0, 6.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.6226654052734375, -0.600799560546875, -0.5789337158203125, -0.55706787109375, -0.5352020263671875, -0.513336181640625, -0.4914703369140625, -0.4696044921875, -0.4477386474609375, -0.425872802734375, -0.4040069580078125, -0.38214111328125, -0.3602752685546875, -0.338409423828125, -0.3165435791015625, -0.294677734375, -0.2728118896484375, -0.250946044921875, -0.2290802001953125, -0.20721435546875, -0.1853485107421875, -0.163482666015625, -0.1416168212890625, -0.1197509765625, -0.0978851318359375, -0.076019287109375, -0.0541534423828125, -0.03228759765625, -0.0104217529296875, 0.011444091796875, 0.0333099365234375, 0.05517578125, 0.0770416259765625, 0.098907470703125, 0.1207733154296875, 0.14263916015625, 0.1645050048828125, 0.186370849609375, 0.2082366943359375, 0.2301025390625, 0.2519683837890625, 0.273834228515625, 0.2957000732421875, 0.31756591796875, 0.3394317626953125, 0.361297607421875, 0.3831634521484375, 0.405029296875, 0.4268951416015625, 0.448760986328125, 0.4706268310546875, 0.49249267578125, 0.5143585205078125, 0.536224365234375, 0.5580902099609375, 0.5799560546875, 0.6018218994140625, 0.623687744140625, 0.6455535888671875, 0.66741943359375, 0.6892852783203125, 0.711151123046875, 0.7330169677734375, 0.7548828125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 8.0, 8.0, 2.0, 8.0, 17.0, 11.0, 14.0, 14.0, 21.0, 27.0, 28.0, 22.0, 35.0, 48.0, 43.0, 50.0, 30.0, 52.0, 36.0, 54.0, 46.0, 47.0, 46.0, 41.0, 40.0, 35.0, 35.0, 30.0, 20.0, 23.0, 38.0, 17.0, 16.0, 4.0, 7.0, 7.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2647056579589844, -0.25426483154296875, -0.24382400512695312, -0.2333831787109375, -0.22294235229492188, -0.21250152587890625, -0.20206069946289062, -0.191619873046875, -0.18117904663085938, -0.17073822021484375, -0.16029739379882812, -0.1498565673828125, -0.13941574096679688, -0.12897491455078125, -0.11853408813476562, -0.10809326171875, -0.09765243530273438, -0.08721160888671875, -0.07677078247070312, -0.0663299560546875, -0.055889129638671875, -0.04544830322265625, -0.035007476806640625, -0.024566650390625, -0.014125823974609375, -0.00368499755859375, 0.006755828857421875, 0.0171966552734375, 0.027637481689453125, 0.03807830810546875, 0.048519134521484375, 0.0589599609375, 0.06940078735351562, 0.07984161376953125, 0.09028244018554688, 0.1007232666015625, 0.11116409301757812, 0.12160491943359375, 0.13204574584960938, 0.142486572265625, 0.15292739868164062, 0.16336822509765625, 0.17380905151367188, 0.1842498779296875, 0.19469070434570312, 0.20513153076171875, 0.21557235717773438, 0.22601318359375, 0.23645401000976562, 0.24689483642578125, 0.2573356628417969, 0.2677764892578125, 0.2782173156738281, 0.28865814208984375, 0.2990989685058594, 0.309539794921875, 0.3199806213378906, 0.33042144775390625, 0.3408622741699219, 0.3513031005859375, 0.3617439270019531, 0.37218475341796875, 0.3826255798339844, 0.39306640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 8.0, 11.0, 12.0, 10.0, 22.0, 46.0, 45.0, 62.0, 106.0, 157.0, 310.0, 533.0, 1011.0, 2209.0, 5308.0, 15795.0, 64993.0, 587393.0, 298599.0, 50408.0, 13073.0, 4465.0, 1853.0, 960.0, 445.0, 279.0, 132.0, 102.0, 62.0, 42.0, 30.0, 17.0, 18.0, 11.0, 8.0, 7.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.90643310546875, -0.8714599609375, -0.83648681640625, -0.801513671875, -0.76654052734375, -0.7315673828125, -0.69659423828125, -0.66162109375, -0.62664794921875, -0.5916748046875, -0.55670166015625, -0.521728515625, -0.48675537109375, -0.4517822265625, -0.41680908203125, -0.3818359375, -0.34686279296875, -0.3118896484375, -0.27691650390625, -0.241943359375, -0.20697021484375, -0.1719970703125, -0.13702392578125, -0.10205078125, -0.06707763671875, -0.0321044921875, 0.00286865234375, 0.037841796875, 0.07281494140625, 0.1077880859375, 0.14276123046875, 0.177734375, 0.21270751953125, 0.2476806640625, 0.28265380859375, 0.317626953125, 0.35260009765625, 0.3875732421875, 0.42254638671875, 0.45751953125, 0.49249267578125, 0.5274658203125, 0.56243896484375, 0.597412109375, 0.63238525390625, 0.6673583984375, 0.70233154296875, 0.7373046875, 0.77227783203125, 0.8072509765625, 0.84222412109375, 0.877197265625, 0.91217041015625, 0.9471435546875, 0.98211669921875, 1.01708984375, 1.05206298828125, 1.0870361328125, 1.12200927734375, 1.156982421875, 1.19195556640625, 1.2269287109375, 1.26190185546875, 1.296875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 4.0, 11.0, 10.0, 7.0, 7.0, 15.0, 14.0, 18.0, 26.0, 34.0, 28.0, 37.0, 39.0, 43.0, 45.0, 60.0, 52.0, 52.0, 51.0, 55.0, 57.0, 46.0, 46.0, 44.0, 27.0, 17.0, 21.0, 24.0, 17.0, 19.0, 15.0, 8.0, 9.0, 7.0, 5.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.3046875, -1.264190673828125, -1.22369384765625, -1.183197021484375, -1.1427001953125, -1.102203369140625, -1.06170654296875, -1.021209716796875, -0.980712890625, -0.940216064453125, -0.89971923828125, -0.859222412109375, -0.8187255859375, -0.778228759765625, -0.73773193359375, -0.697235107421875, -0.65673828125, -0.616241455078125, -0.57574462890625, -0.535247802734375, -0.4947509765625, -0.454254150390625, -0.41375732421875, -0.373260498046875, -0.332763671875, -0.292266845703125, -0.25177001953125, -0.211273193359375, -0.1707763671875, -0.130279541015625, -0.08978271484375, -0.049285888671875, -0.0087890625, 0.031707763671875, 0.07220458984375, 0.112701416015625, 0.1531982421875, 0.193695068359375, 0.23419189453125, 0.274688720703125, 0.315185546875, 0.355682373046875, 0.39617919921875, 0.436676025390625, 0.4771728515625, 0.517669677734375, 0.55816650390625, 0.598663330078125, 0.63916015625, 0.679656982421875, 0.72015380859375, 0.760650634765625, 0.8011474609375, 0.841644287109375, 0.88214111328125, 0.922637939453125, 0.963134765625, 1.003631591796875, 1.04412841796875, 1.084625244140625, 1.1251220703125, 1.165618896484375, 1.20611572265625, 1.246612548828125, 1.287109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 12.0, 14.0, 16.0, 36.0, 42.0, 68.0, 107.0, 174.0, 306.0, 536.0, 1007.0, 2282.0, 6852.0, 36011.0, 740626.0, 230986.0, 20898.0, 4747.0, 1803.0, 857.0, 449.0, 265.0, 162.0, 99.0, 56.0, 40.0, 21.0, 17.0, 13.0, 3.0, 4.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.55322265625, -0.535858154296875, -0.51849365234375, -0.501129150390625, -0.4837646484375, -0.466400146484375, -0.44903564453125, -0.431671142578125, -0.414306640625, -0.396942138671875, -0.37957763671875, -0.362213134765625, -0.3448486328125, -0.327484130859375, -0.31011962890625, -0.292755126953125, -0.275390625, -0.258026123046875, -0.24066162109375, -0.223297119140625, -0.2059326171875, -0.188568115234375, -0.17120361328125, -0.153839111328125, -0.136474609375, -0.119110107421875, -0.10174560546875, -0.084381103515625, -0.0670166015625, -0.049652099609375, -0.03228759765625, -0.014923095703125, 0.00244140625, 0.019805908203125, 0.03717041015625, 0.054534912109375, 0.0718994140625, 0.089263916015625, 0.10662841796875, 0.123992919921875, 0.141357421875, 0.158721923828125, 0.17608642578125, 0.193450927734375, 0.2108154296875, 0.228179931640625, 0.24554443359375, 0.262908935546875, 0.2802734375, 0.297637939453125, 0.31500244140625, 0.332366943359375, 0.3497314453125, 0.367095947265625, 0.38446044921875, 0.401824951171875, 0.419189453125, 0.436553955078125, 0.45391845703125, 0.471282958984375, 0.4886474609375, 0.506011962890625, 0.52337646484375, 0.540740966796875, 0.55810546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 9.0, 10.0, 15.0, 16.0, 26.0, 37.0, 38.0, 67.0, 112.0, 162.0, 162.0, 102.0, 61.0, 52.0, 28.0, 16.0, 19.0, 8.0, 10.0, 8.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0001169443130493164, -0.0001135868951678276, -0.0001102294772863388, -0.00010687205940485, -0.0001035146415233612, -0.0001001572236418724, -9.67998057603836e-05, -9.34423878788948e-05, -9.0084969997406e-05, -8.67275521159172e-05, -8.33701342344284e-05, -8.00127163529396e-05, -7.66552984714508e-05, -7.3297880589962e-05, -6.99404627084732e-05, -6.65830448269844e-05, -6.32256269454956e-05, -5.9868209064006805e-05, -5.6510791182518005e-05, -5.3153373301029205e-05, -4.9795955419540405e-05, -4.6438537538051605e-05, -4.3081119656562805e-05, -3.9723701775074005e-05, -3.6366283893585205e-05, -3.3008866012096405e-05, -2.9651448130607605e-05, -2.6294030249118805e-05, -2.2936612367630005e-05, -1.9579194486141205e-05, -1.6221776604652405e-05, -1.2864358723163605e-05, -9.506940841674805e-06, -6.149522960186005e-06, -2.7921050786972046e-06, 5.653128027915955e-07, 3.9227306842803955e-06, 7.2801485657691956e-06, 1.0637566447257996e-05, 1.3994984328746796e-05, 1.7352402210235596e-05, 2.0709820091724396e-05, 2.4067237973213196e-05, 2.7424655854701996e-05, 3.0782073736190796e-05, 3.4139491617679596e-05, 3.7496909499168396e-05, 4.0854327380657196e-05, 4.4211745262145996e-05, 4.7569163143634796e-05, 5.0926581025123596e-05, 5.4283998906612396e-05, 5.7641416788101196e-05, 6.0998834669589996e-05, 6.43562525510788e-05, 6.77136704325676e-05, 7.10710883140564e-05, 7.44285061955452e-05, 7.7785924077034e-05, 8.11433419585228e-05, 8.45007598400116e-05, 8.78581777215004e-05, 9.12155956029892e-05, 9.4573013484478e-05, 9.79304313659668e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 3.0, 7.0, 11.0, 20.0, 17.0, 40.0, 46.0, 100.0, 177.0, 291.0, 606.0, 1295.0, 3454.0, 14307.0, 137348.0, 826779.0, 51986.0, 7886.0, 2265.0, 898.0, 426.0, 228.0, 129.0, 86.0, 43.0, 30.0, 21.0, 8.0, 13.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.47119140625, -0.45328521728515625, -0.4353790283203125, -0.41747283935546875, -0.399566650390625, -0.38166046142578125, -0.3637542724609375, -0.34584808349609375, -0.32794189453125, -0.31003570556640625, -0.2921295166015625, -0.27422332763671875, -0.256317138671875, -0.23841094970703125, -0.2205047607421875, -0.20259857177734375, -0.1846923828125, -0.16678619384765625, -0.1488800048828125, -0.13097381591796875, -0.113067626953125, -0.09516143798828125, -0.0772552490234375, -0.05934906005859375, -0.04144287109375, -0.02353668212890625, -0.0056304931640625, 0.01227569580078125, 0.030181884765625, 0.04808807373046875, 0.0659942626953125, 0.08390045166015625, 0.101806640625, 0.11971282958984375, 0.1376190185546875, 0.15552520751953125, 0.173431396484375, 0.19133758544921875, 0.2092437744140625, 0.22714996337890625, 0.24505615234375, 0.26296234130859375, 0.2808685302734375, 0.29877471923828125, 0.316680908203125, 0.33458709716796875, 0.3524932861328125, 0.37039947509765625, 0.3883056640625, 0.40621185302734375, 0.4241180419921875, 0.44202423095703125, 0.459930419921875, 0.47783660888671875, 0.4957427978515625, 0.5136489868164062, 0.53155517578125, 0.5494613647460938, 0.5673675537109375, 0.5852737426757812, 0.603179931640625, 0.6210861206054688, 0.6389923095703125, 0.6568984985351562, 0.6748046875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 1.0, 8.0, 11.0, 16.0, 17.0, 32.0, 52.0, 78.0, 99.0, 157.0, 170.0, 121.0, 82.0, 56.0, 35.0, 22.0, 20.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46044921875, -0.44362640380859375, -0.4268035888671875, -0.40998077392578125, -0.393157958984375, -0.37633514404296875, -0.3595123291015625, -0.34268951416015625, -0.32586669921875, -0.30904388427734375, -0.2922210693359375, -0.27539825439453125, -0.258575439453125, -0.24175262451171875, -0.2249298095703125, -0.20810699462890625, -0.1912841796875, -0.17446136474609375, -0.1576385498046875, -0.14081573486328125, -0.123992919921875, -0.10717010498046875, -0.0903472900390625, -0.07352447509765625, -0.05670166015625, -0.03987884521484375, -0.0230560302734375, -0.00623321533203125, 0.010589599609375, 0.02741241455078125, 0.0442352294921875, 0.06105804443359375, 0.077880859375, 0.09470367431640625, 0.1115264892578125, 0.12834930419921875, 0.145172119140625, 0.16199493408203125, 0.1788177490234375, 0.19564056396484375, 0.21246337890625, 0.22928619384765625, 0.2461090087890625, 0.26293182373046875, 0.279754638671875, 0.29657745361328125, 0.3134002685546875, 0.33022308349609375, 0.3470458984375, 0.36386871337890625, 0.3806915283203125, 0.39751434326171875, 0.414337158203125, 0.43115997314453125, 0.4479827880859375, 0.46480560302734375, 0.48162841796875, 0.49845123291015625, 0.5152740478515625, 0.5320968627929688, 0.548919677734375, 0.5657424926757812, 0.5825653076171875, 0.5993881225585938, 0.6162109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 16.0, 38.0, 67.0, 208.0, 508.0, 122.0, 22.0, 9.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.81678771972656, -36.1271858215332, -35.43758773803711, -34.74798583984375, -34.058387756347656, -33.3687858581543, -32.6791877746582, -31.989585876464844, -31.299985885620117, -30.61038589477539, -29.920785903930664, -29.231185913085938, -28.54158592224121, -27.851985931396484, -27.162384033203125, -26.4727840423584, -25.783184051513672, -25.093584060668945, -24.40398406982422, -23.714384078979492, -23.024784088134766, -22.335182189941406, -21.645584106445312, -20.955982208251953, -20.26638412475586, -19.576784133911133, -18.887184143066406, -18.19758415222168, -17.507984161376953, -16.818382263183594, -16.1287841796875, -15.43918228149414, -14.749581336975098, -14.059981346130371, -13.370381355285645, -12.680780410766602, -11.991180419921875, -11.301580429077148, -10.611980438232422, -9.922380447387695, -9.232780456542969, -8.543180465698242, -7.853579998016357, -7.163980007171631, -6.474379539489746, -5.7847795486450195, -5.095179557800293, -4.405579090118408, -3.7159786224365234, -3.0263783931732178, -2.336778163909912, -1.6471781730651855, -0.9575779438018799, -0.2679777145385742, 0.42162227630615234, 1.111222743988037, 1.8008227348327637, 2.4904229640960693, 3.180023193359375, 3.8696231842041016, 4.559223175048828, 5.248823642730713, 5.9384236335754395, 6.628024101257324, 7.317624092102051]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 8.0, 4.0, 7.0, 11.0, 12.0, 14.0, 14.0, 24.0, 19.0, 29.0, 25.0, 40.0, 42.0, 27.0, 48.0, 66.0, 108.0, 89.0, 81.0, 35.0, 34.0, 31.0, 38.0, 25.0, 14.0, 17.0, 20.0, 12.0, 16.0, 14.0, 14.0, 8.0, 8.0, 11.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.840521812438965, -4.6782732009887695, -4.516025066375732, -4.353776454925537, -4.191527843475342, -4.029279708862305, -3.8670310974121094, -3.704782485961914, -3.542534112930298, -3.3802857398986816, -3.2180371284484863, -3.05578875541687, -2.893540382385254, -2.7312917709350586, -2.5690433979034424, -2.406795024871826, -2.244546413421631, -2.0822980403900146, -1.9200494289398193, -1.7578010559082031, -1.5955525636672974, -1.4333040714263916, -1.2710556983947754, -1.1088072061538696, -0.9465587139129639, -0.7843102216720581, -0.6220617890357971, -0.45981332659721375, -0.29756486415863037, -0.1353163719177246, 0.026932060718536377, 0.18918049335479736, 0.3514285087585449, 0.5136770009994507, 0.6759254336357117, 0.8381738662719727, 1.0004223585128784, 1.1626708507537842, 1.3249192237854004, 1.4871677160263062, 1.649416208267212, 1.8116647005081177, 1.9739131927490234, 2.1361615657806396, 2.298409938812256, 2.460658550262451, 2.6229069232940674, 2.7851552963256836, 2.947403907775879, 3.109652280807495, 3.2719008922576904, 3.4341492652893066, 3.596397876739502, 3.758646249771118, 3.9208946228027344, 4.08314323425293, 4.245391845703125, 4.40764045715332, 4.569888591766357, 4.732137203216553, 4.894385814666748, 5.056633949279785, 5.2188825607299805, 5.381131172180176, 5.543379306793213]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 9.0, 14.0, 12.0, 22.0, 22.0, 42.0, 84.0, 97.0, 150.0, 304.0, 495.0, 969.0, 2000.0, 4362.0, 12032.0, 60338.0, 902658.0, 2878471.0, 288597.0, 29642.0, 7738.0, 3042.0, 1467.0, 723.0, 378.0, 228.0, 135.0, 72.0, 63.0, 44.0, 18.0, 16.0, 12.0, 5.0, 6.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58349609375, -0.561309814453125, -0.53912353515625, -0.516937255859375, -0.4947509765625, -0.472564697265625, -0.45037841796875, -0.428192138671875, -0.406005859375, -0.383819580078125, -0.36163330078125, -0.339447021484375, -0.3172607421875, -0.295074462890625, -0.27288818359375, -0.250701904296875, -0.228515625, -0.206329345703125, -0.18414306640625, -0.161956787109375, -0.1397705078125, -0.117584228515625, -0.09539794921875, -0.073211669921875, -0.051025390625, -0.028839111328125, -0.00665283203125, 0.015533447265625, 0.0377197265625, 0.059906005859375, 0.08209228515625, 0.104278564453125, 0.12646484375, 0.148651123046875, 0.17083740234375, 0.193023681640625, 0.2152099609375, 0.237396240234375, 0.25958251953125, 0.281768798828125, 0.303955078125, 0.326141357421875, 0.34832763671875, 0.370513916015625, 0.3927001953125, 0.414886474609375, 0.43707275390625, 0.459259033203125, 0.4814453125, 0.503631591796875, 0.52581787109375, 0.548004150390625, 0.5701904296875, 0.592376708984375, 0.61456298828125, 0.636749267578125, 0.658935546875, 0.681121826171875, 0.70330810546875, 0.725494384765625, 0.7476806640625, 0.769866943359375, 0.79205322265625, 0.814239501953125, 0.83642578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 6.0, 10.0, 6.0, 15.0, 10.0, 21.0, 18.0, 33.0, 38.0, 32.0, 35.0, 50.0, 30.0, 51.0, 36.0, 46.0, 58.0, 42.0, 53.0, 49.0, 48.0, 49.0, 42.0, 36.0, 29.0, 35.0, 28.0, 20.0, 13.0, 12.0, 9.0, 8.0, 5.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3609886169433594, -0.34917449951171875, -0.3373603820800781, -0.3255462646484375, -0.3137321472167969, -0.30191802978515625, -0.2901039123535156, -0.278289794921875, -0.2664756774902344, -0.25466156005859375, -0.24284744262695312, -0.2310333251953125, -0.21921920776367188, -0.20740509033203125, -0.19559097290039062, -0.18377685546875, -0.17196273803710938, -0.16014862060546875, -0.14833450317382812, -0.1365203857421875, -0.12470626831054688, -0.11289215087890625, -0.10107803344726562, -0.089263916015625, -0.07744979858398438, -0.06563568115234375, -0.053821563720703125, -0.0420074462890625, -0.030193328857421875, -0.01837921142578125, -0.006565093994140625, 0.0052490234375, 0.017063140869140625, 0.02887725830078125, 0.040691375732421875, 0.0525054931640625, 0.06431961059570312, 0.07613372802734375, 0.08794784545898438, 0.099761962890625, 0.11157608032226562, 0.12339019775390625, 0.13520431518554688, 0.1470184326171875, 0.15883255004882812, 0.17064666748046875, 0.18246078491210938, 0.19427490234375, 0.20608901977539062, 0.21790313720703125, 0.22971725463867188, 0.2415313720703125, 0.2533454895019531, 0.26515960693359375, 0.2769737243652344, 0.288787841796875, 0.3006019592285156, 0.31241607666015625, 0.3242301940917969, 0.3360443115234375, 0.3478584289550781, 0.35967254638671875, 0.3714866638183594, 0.38330078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 5.0, 11.0, 22.0, 50.0, 94.0, 213.0, 624.0, 3487.0, 217516.0, 3959905.0, 10818.0, 966.0, 339.0, 125.0, 60.0, 21.0, 16.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.501953125, -2.4132080078125, -2.324462890625, -2.2357177734375, -2.14697265625, -2.0582275390625, -1.969482421875, -1.8807373046875, -1.7919921875, -1.7032470703125, -1.614501953125, -1.5257568359375, -1.43701171875, -1.3482666015625, -1.259521484375, -1.1707763671875, -1.08203125, -0.9932861328125, -0.904541015625, -0.8157958984375, -0.72705078125, -0.6383056640625, -0.549560546875, -0.4608154296875, -0.3720703125, -0.2833251953125, -0.194580078125, -0.1058349609375, -0.01708984375, 0.0716552734375, 0.160400390625, 0.2491455078125, 0.337890625, 0.4266357421875, 0.515380859375, 0.6041259765625, 0.69287109375, 0.7816162109375, 0.870361328125, 0.9591064453125, 1.0478515625, 1.1365966796875, 1.225341796875, 1.3140869140625, 1.40283203125, 1.4915771484375, 1.580322265625, 1.6690673828125, 1.7578125, 1.8465576171875, 1.935302734375, 2.0240478515625, 2.11279296875, 2.2015380859375, 2.290283203125, 2.3790283203125, 2.4677734375, 2.5565185546875, 2.645263671875, 2.7340087890625, 2.82275390625, 2.9114990234375, 3.000244140625, 3.0889892578125, 3.177734375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 4.0, 18.0, 18.0, 35.0, 61.0, 146.0, 356.0, 959.0, 1330.0, 665.0, 228.0, 112.0, 61.0, 33.0, 17.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.046875, -1.997344970703125, -1.94781494140625, -1.898284912109375, -1.8487548828125, -1.799224853515625, -1.74969482421875, -1.700164794921875, -1.650634765625, -1.601104736328125, -1.55157470703125, -1.502044677734375, -1.4525146484375, -1.402984619140625, -1.35345458984375, -1.303924560546875, -1.25439453125, -1.204864501953125, -1.15533447265625, -1.105804443359375, -1.0562744140625, -1.006744384765625, -0.95721435546875, -0.907684326171875, -0.858154296875, -0.808624267578125, -0.75909423828125, -0.709564208984375, -0.6600341796875, -0.610504150390625, -0.56097412109375, -0.511444091796875, -0.4619140625, -0.412384033203125, -0.36285400390625, -0.313323974609375, -0.2637939453125, -0.214263916015625, -0.16473388671875, -0.115203857421875, -0.065673828125, -0.016143798828125, 0.03338623046875, 0.082916259765625, 0.1324462890625, 0.181976318359375, 0.23150634765625, 0.281036376953125, 0.33056640625, 0.380096435546875, 0.42962646484375, 0.479156494140625, 0.5286865234375, 0.578216552734375, 0.62774658203125, 0.677276611328125, 0.726806640625, 0.776336669921875, 0.82586669921875, 0.875396728515625, 0.9249267578125, 0.974456787109375, 1.02398681640625, 1.073516845703125, 1.123046875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 13.0, 34.0, 135.0, 394.0, 306.0, 82.0, 24.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.721954345703125, -13.120304107666016, -12.518653869628906, -11.917003631591797, -11.315353393554688, -10.713703155517578, -10.112052917480469, -9.51040267944336, -8.90875244140625, -8.30710220336914, -7.705451965332031, -7.103801727294922, -6.5021514892578125, -5.900501251220703, -5.298851013183594, -4.697200775146484, -4.095550537109375, -3.4939002990722656, -2.8922500610351562, -2.290599822998047, -1.6889495849609375, -1.0872993469238281, -0.48564910888671875, 0.11600112915039062, 0.7176513671875, 1.3193016052246094, 1.9209518432617188, 2.522602081298828, 3.1242523193359375, 3.725902557373047, 4.327552795410156, 4.929203033447266, 5.530853271484375, 6.132503509521484, 6.734153747558594, 7.335803985595703, 7.9374542236328125, 8.539104461669922, 9.140754699707031, 9.74240493774414, 10.34405517578125, 10.94570541381836, 11.547355651855469, 12.149005889892578, 12.750656127929688, 13.352306365966797, 13.953956604003906, 14.555606842041016, 15.157257080078125, 15.758907318115234, 16.360557556152344, 16.962207794189453, 17.563858032226562, 18.165508270263672, 18.76715850830078, 19.36880874633789, 19.970458984375, 20.57210922241211, 21.17375946044922, 21.775409698486328, 22.377059936523438, 22.978710174560547, 23.580360412597656, 24.182010650634766, 24.783660888671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 9.0, 6.0, 13.0, 16.0, 20.0, 24.0, 29.0, 27.0, 29.0, 42.0, 30.0, 43.0, 40.0, 53.0, 58.0, 55.0, 47.0, 64.0, 52.0, 35.0, 35.0, 44.0, 29.0, 32.0, 20.0, 23.0, 16.0, 22.0, 22.0, 11.0, 9.0, 5.0, 6.0, 3.0, 2.0, 11.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.170454502105713, -4.041761875152588, -3.913069248199463, -3.784376382827759, -3.655683755874634, -3.526991128921509, -3.3982982635498047, -3.2696056365966797, -3.1409130096435547, -3.0122203826904297, -2.8835277557373047, -2.7548348903656006, -2.6261422634124756, -2.4974496364593506, -2.3687567710876465, -2.2400641441345215, -2.1113715171813965, -1.9826788902282715, -1.853986144065857, -1.7252933979034424, -1.5966007709503174, -1.4679081439971924, -1.3392153978347778, -1.2105226516723633, -1.0818300247192383, -0.9531373381614685, -0.8244446516036987, -0.695751965045929, -0.5670592784881592, -0.4383665919303894, -0.30967390537261963, -0.18098121881484985, -0.05228900909423828, 0.0764036774635315, 0.20509636402130127, 0.33378905057907104, 0.4624817371368408, 0.5911744236946106, 0.7198671102523804, 0.8485597968101501, 0.9772524833679199, 1.105945110321045, 1.2346378564834595, 1.363330602645874, 1.492023229598999, 1.620715856552124, 1.7494086027145386, 1.8781013488769531, 2.006793975830078, 2.135486602783203, 2.264179229736328, 2.3928720951080322, 2.5215647220611572, 2.6502573490142822, 2.7789502143859863, 2.9076428413391113, 3.0363354682922363, 3.1650280952453613, 3.2937207221984863, 3.4224135875701904, 3.5511062145233154, 3.6797988414764404, 3.8084917068481445, 3.9371843338012695, 4.0658769607543945]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 5.0, 5.0, 7.0, 6.0, 24.0, 18.0, 35.0, 40.0, 75.0, 108.0, 176.0, 239.0, 469.0, 752.0, 1282.0, 2448.0, 4962.0, 10619.0, 25634.0, 71388.0, 234828.0, 444235.0, 162498.0, 52126.0, 19453.0, 8423.0, 3901.0, 2024.0, 1146.0, 560.0, 385.0, 218.0, 147.0, 98.0, 48.0, 48.0, 39.0, 24.0, 23.0, 14.0, 4.0, 7.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8310546875, -0.8061370849609375, -0.781219482421875, -0.7563018798828125, -0.73138427734375, -0.7064666748046875, -0.681549072265625, -0.6566314697265625, -0.6317138671875, -0.6067962646484375, -0.581878662109375, -0.5569610595703125, -0.53204345703125, -0.5071258544921875, -0.482208251953125, -0.4572906494140625, -0.432373046875, -0.4074554443359375, -0.382537841796875, -0.3576202392578125, -0.33270263671875, -0.3077850341796875, -0.282867431640625, -0.2579498291015625, -0.2330322265625, -0.2081146240234375, -0.183197021484375, -0.1582794189453125, -0.13336181640625, -0.1084442138671875, -0.083526611328125, -0.0586090087890625, -0.03369140625, -0.0087738037109375, 0.016143798828125, 0.0410614013671875, 0.06597900390625, 0.0908966064453125, 0.115814208984375, 0.1407318115234375, 0.1656494140625, 0.1905670166015625, 0.215484619140625, 0.2404022216796875, 0.26531982421875, 0.2902374267578125, 0.315155029296875, 0.3400726318359375, 0.364990234375, 0.3899078369140625, 0.414825439453125, 0.4397430419921875, 0.46466064453125, 0.4895782470703125, 0.514495849609375, 0.5394134521484375, 0.5643310546875, 0.5892486572265625, 0.614166259765625, 0.6390838623046875, 0.66400146484375, 0.6889190673828125, 0.713836669921875, 0.7387542724609375, 0.763671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 9.0, 7.0, 6.0, 5.0, 13.0, 13.0, 19.0, 21.0, 17.0, 22.0, 17.0, 33.0, 34.0, 38.0, 40.0, 37.0, 52.0, 47.0, 41.0, 42.0, 44.0, 50.0, 47.0, 49.0, 42.0, 31.0, 32.0, 23.0, 29.0, 23.0, 18.0, 20.0, 14.0, 14.0, 10.0, 7.0, 9.0, 6.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.39208984375, -0.3799552917480469, -0.36782073974609375, -0.3556861877441406, -0.3435516357421875, -0.3314170837402344, -0.31928253173828125, -0.3071479797363281, -0.295013427734375, -0.2828788757324219, -0.27074432373046875, -0.2586097717285156, -0.2464752197265625, -0.23434066772460938, -0.22220611572265625, -0.21007156372070312, -0.19793701171875, -0.18580245971679688, -0.17366790771484375, -0.16153335571289062, -0.1493988037109375, -0.13726425170898438, -0.12512969970703125, -0.11299514770507812, -0.100860595703125, -0.08872604370117188, -0.07659149169921875, -0.06445693969726562, -0.0523223876953125, -0.040187835693359375, -0.02805328369140625, -0.015918731689453125, -0.0037841796875, 0.008350372314453125, 0.02048492431640625, 0.032619476318359375, 0.0447540283203125, 0.056888580322265625, 0.06902313232421875, 0.08115768432617188, 0.093292236328125, 0.10542678833007812, 0.11756134033203125, 0.12969589233398438, 0.1418304443359375, 0.15396499633789062, 0.16609954833984375, 0.17823410034179688, 0.19036865234375, 0.20250320434570312, 0.21463775634765625, 0.22677230834960938, 0.2389068603515625, 0.2510414123535156, 0.26317596435546875, 0.2753105163574219, 0.287445068359375, 0.2995796203613281, 0.31171417236328125, 0.3238487243652344, 0.3359832763671875, 0.3481178283691406, 0.36025238037109375, 0.3723869323730469, 0.384521484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 15.0, 15.0, 21.0, 37.0, 37.0, 72.0, 93.0, 144.0, 201.0, 338.0, 560.0, 1182.0, 3243.0, 14931.0, 181810.0, 799960.0, 36517.0, 5680.0, 1697.0, 760.0, 422.0, 286.0, 167.0, 110.0, 70.0, 46.0, 41.0, 14.0, 20.0, 11.0, 9.0, 14.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.642578125, -1.5899505615234375, -1.537322998046875, -1.4846954345703125, -1.43206787109375, -1.3794403076171875, -1.326812744140625, -1.2741851806640625, -1.2215576171875, -1.1689300537109375, -1.116302490234375, -1.0636749267578125, -1.01104736328125, -0.9584197998046875, -0.905792236328125, -0.8531646728515625, -0.800537109375, -0.7479095458984375, -0.695281982421875, -0.6426544189453125, -0.59002685546875, -0.5373992919921875, -0.484771728515625, -0.4321441650390625, -0.3795166015625, -0.3268890380859375, -0.274261474609375, -0.2216339111328125, -0.16900634765625, -0.1163787841796875, -0.063751220703125, -0.0111236572265625, 0.04150390625, 0.0941314697265625, 0.146759033203125, 0.1993865966796875, 0.25201416015625, 0.3046417236328125, 0.357269287109375, 0.4098968505859375, 0.4625244140625, 0.5151519775390625, 0.567779541015625, 0.6204071044921875, 0.67303466796875, 0.7256622314453125, 0.778289794921875, 0.8309173583984375, 0.883544921875, 0.9361724853515625, 0.988800048828125, 1.0414276123046875, 1.09405517578125, 1.1466827392578125, 1.199310302734375, 1.2519378662109375, 1.3045654296875, 1.3571929931640625, 1.409820556640625, 1.4624481201171875, 1.51507568359375, 1.5677032470703125, 1.620330810546875, 1.6729583740234375, 1.7255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 9.0, 17.0, 26.0, 19.0, 44.0, 36.0, 53.0, 49.0, 71.0, 51.0, 74.0, 75.0, 71.0, 69.0, 61.0, 56.0, 43.0, 30.0, 21.0, 19.0, 25.0, 16.0, 10.0, 14.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.310546875, -2.244537353515625, -2.17852783203125, -2.112518310546875, -2.0465087890625, -1.980499267578125, -1.91448974609375, -1.848480224609375, -1.782470703125, -1.716461181640625, -1.65045166015625, -1.584442138671875, -1.5184326171875, -1.452423095703125, -1.38641357421875, -1.320404052734375, -1.25439453125, -1.188385009765625, -1.12237548828125, -1.056365966796875, -0.9903564453125, -0.924346923828125, -0.85833740234375, -0.792327880859375, -0.726318359375, -0.660308837890625, -0.59429931640625, -0.528289794921875, -0.4622802734375, -0.396270751953125, -0.33026123046875, -0.264251708984375, -0.1982421875, -0.132232666015625, -0.06622314453125, -0.000213623046875, 0.0657958984375, 0.131805419921875, 0.19781494140625, 0.263824462890625, 0.329833984375, 0.395843505859375, 0.46185302734375, 0.527862548828125, 0.5938720703125, 0.659881591796875, 0.72589111328125, 0.791900634765625, 0.85791015625, 0.923919677734375, 0.98992919921875, 1.055938720703125, 1.1219482421875, 1.187957763671875, 1.25396728515625, 1.319976806640625, 1.385986328125, 1.451995849609375, 1.51800537109375, 1.584014892578125, 1.6500244140625, 1.716033935546875, 1.78204345703125, 1.848052978515625, 1.9140625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 9.0, 14.0, 17.0, 20.0, 24.0, 36.0, 41.0, 83.0, 118.0, 186.0, 375.0, 781.0, 1650.0, 4599.0, 16054.0, 94716.0, 814050.0, 92018.0, 15731.0, 4682.0, 1688.0, 772.0, 360.0, 189.0, 107.0, 55.0, 40.0, 38.0, 19.0, 14.0, 11.0, 16.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.366943359375, -0.355987548828125, -0.34503173828125, -0.334075927734375, -0.3231201171875, -0.312164306640625, -0.30120849609375, -0.290252685546875, -0.279296875, -0.268341064453125, -0.25738525390625, -0.246429443359375, -0.2354736328125, -0.224517822265625, -0.21356201171875, -0.202606201171875, -0.191650390625, -0.180694580078125, -0.16973876953125, -0.158782958984375, -0.1478271484375, -0.136871337890625, -0.12591552734375, -0.114959716796875, -0.10400390625, -0.093048095703125, -0.08209228515625, -0.071136474609375, -0.0601806640625, -0.049224853515625, -0.03826904296875, -0.027313232421875, -0.016357421875, -0.005401611328125, 0.00555419921875, 0.016510009765625, 0.0274658203125, 0.038421630859375, 0.04937744140625, 0.060333251953125, 0.0712890625, 0.082244873046875, 0.09320068359375, 0.104156494140625, 0.1151123046875, 0.126068115234375, 0.13702392578125, 0.147979736328125, 0.158935546875, 0.169891357421875, 0.18084716796875, 0.191802978515625, 0.2027587890625, 0.213714599609375, 0.22467041015625, 0.235626220703125, 0.24658203125, 0.257537841796875, 0.26849365234375, 0.279449462890625, 0.2904052734375, 0.301361083984375, 0.31231689453125, 0.323272705078125, 0.334228515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 1.0, 6.0, 9.0, 10.0, 16.0, 12.0, 15.0, 23.0, 29.0, 42.0, 65.0, 86.0, 126.0, 119.0, 110.0, 90.0, 56.0, 42.0, 30.0, 23.0, 19.0, 13.0, 11.0, 12.0, 7.0, 6.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.671117782592773e-05, -7.435865700244904e-05, -7.200613617897034e-05, -6.965361535549164e-05, -6.730109453201294e-05, -6.494857370853424e-05, -6.259605288505554e-05, -6.024353206157684e-05, -5.7891011238098145e-05, -5.5538490414619446e-05, -5.318596959114075e-05, -5.083344876766205e-05, -4.848092794418335e-05, -4.612840712070465e-05, -4.377588629722595e-05, -4.1423365473747253e-05, -3.9070844650268555e-05, -3.6718323826789856e-05, -3.436580300331116e-05, -3.201328217983246e-05, -2.966076135635376e-05, -2.730824053287506e-05, -2.4955719709396362e-05, -2.2603198885917664e-05, -2.0250678062438965e-05, -1.7898157238960266e-05, -1.5545636415481567e-05, -1.3193115592002869e-05, -1.084059476852417e-05, -8.488073945045471e-06, -6.1355531215667725e-06, -3.7830322980880737e-06, -1.430511474609375e-06, 9.220093488693237e-07, 3.2745301723480225e-06, 5.627050995826721e-06, 7.97957181930542e-06, 1.0332092642784119e-05, 1.2684613466262817e-05, 1.5037134289741516e-05, 1.7389655113220215e-05, 1.9742175936698914e-05, 2.2094696760177612e-05, 2.444721758365631e-05, 2.679973840713501e-05, 2.915225923061371e-05, 3.150478005409241e-05, 3.3857300877571106e-05, 3.6209821701049805e-05, 3.8562342524528503e-05, 4.09148633480072e-05, 4.32673841714859e-05, 4.56199049949646e-05, 4.79724258184433e-05, 5.0324946641922e-05, 5.2677467465400696e-05, 5.5029988288879395e-05, 5.738250911235809e-05, 5.973502993583679e-05, 6.208755075931549e-05, 6.444007158279419e-05, 6.679259240627289e-05, 6.914511322975159e-05, 7.149763405323029e-05, 7.385015487670898e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 16.0, 23.0, 65.0, 93.0, 186.0, 438.0, 1053.0, 4061.0, 34537.0, 863753.0, 132624.0, 8717.0, 1804.0, 626.0, 256.0, 143.0, 60.0, 44.0, 22.0, 5.0, 5.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52734375, -0.5117034912109375, -0.496063232421875, -0.4804229736328125, -0.46478271484375, -0.4491424560546875, -0.433502197265625, -0.4178619384765625, -0.4022216796875, -0.3865814208984375, -0.370941162109375, -0.3553009033203125, -0.33966064453125, -0.3240203857421875, -0.308380126953125, -0.2927398681640625, -0.277099609375, -0.2614593505859375, -0.245819091796875, -0.2301788330078125, -0.21453857421875, -0.1988983154296875, -0.183258056640625, -0.1676177978515625, -0.1519775390625, -0.1363372802734375, -0.120697021484375, -0.1050567626953125, -0.08941650390625, -0.0737762451171875, -0.058135986328125, -0.0424957275390625, -0.02685546875, -0.0112152099609375, 0.004425048828125, 0.0200653076171875, 0.03570556640625, 0.0513458251953125, 0.066986083984375, 0.0826263427734375, 0.0982666015625, 0.1139068603515625, 0.129547119140625, 0.1451873779296875, 0.16082763671875, 0.1764678955078125, 0.192108154296875, 0.2077484130859375, 0.223388671875, 0.2390289306640625, 0.254669189453125, 0.2703094482421875, 0.28594970703125, 0.3015899658203125, 0.317230224609375, 0.3328704833984375, 0.3485107421875, 0.3641510009765625, 0.379791259765625, 0.3954315185546875, 0.41107177734375, 0.4267120361328125, 0.442352294921875, 0.4579925537109375, 0.4736328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 10.0, 7.0, 13.0, 10.0, 22.0, 21.0, 35.0, 31.0, 56.0, 42.0, 58.0, 68.0, 82.0, 94.0, 91.0, 65.0, 52.0, 47.0, 38.0, 22.0, 26.0, 24.0, 16.0, 9.0, 10.0, 8.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.279052734375, -0.2700996398925781, -0.26114654541015625, -0.2521934509277344, -0.2432403564453125, -0.23428726196289062, -0.22533416748046875, -0.21638107299804688, -0.207427978515625, -0.19847488403320312, -0.18952178955078125, -0.18056869506835938, -0.1716156005859375, -0.16266250610351562, -0.15370941162109375, -0.14475631713867188, -0.13580322265625, -0.12685012817382812, -0.11789703369140625, -0.10894393920898438, -0.0999908447265625, -0.09103775024414062, -0.08208465576171875, -0.07313156127929688, -0.064178466796875, -0.055225372314453125, -0.04627227783203125, -0.037319183349609375, -0.0283660888671875, -0.019412994384765625, -0.01045989990234375, -0.001506805419921875, 0.0074462890625, 0.016399383544921875, 0.02535247802734375, 0.034305572509765625, 0.0432586669921875, 0.052211761474609375, 0.06116485595703125, 0.07011795043945312, 0.079071044921875, 0.08802413940429688, 0.09697723388671875, 0.10593032836914062, 0.1148834228515625, 0.12383651733398438, 0.13278961181640625, 0.14174270629882812, 0.15069580078125, 0.15964889526367188, 0.16860198974609375, 0.17755508422851562, 0.1865081787109375, 0.19546127319335938, 0.20441436767578125, 0.21336746215820312, 0.222320556640625, 0.23127365112304688, 0.24022674560546875, 0.24917984008789062, 0.2581329345703125, 0.2670860290527344, 0.27603912353515625, 0.2849922180175781, 0.2939453125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 7.0, 13.0, 36.0, 74.0, 234.0, 495.0, 98.0, 32.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.056167602539062, -17.497779846191406, -16.939390182495117, -16.38100242614746, -15.822614669799805, -15.264225959777832, -14.70583724975586, -14.147449493408203, -13.589061737060547, -13.030673027038574, -12.472285270690918, -11.913896560668945, -11.355508804321289, -10.797120094299316, -10.238731384277344, -9.680343627929688, -9.121954917907715, -8.563566207885742, -8.005178451538086, -7.446789741516113, -6.888401985168457, -6.330013275146484, -5.77162504196167, -5.2132368087768555, -4.654848575592041, -4.096460342407227, -3.538072109222412, -2.9796836376190186, -2.421295404434204, -1.8629071712493896, -1.304518699645996, -0.7461304664611816, -0.1877422332763672, 0.37064605951309204, 0.9290343523025513, 1.4874227046966553, 2.0458109378814697, 2.604199171066284, 3.1625876426696777, 3.720975875854492, 4.279364109039307, 4.837752342224121, 5.3961405754089355, 5.95452880859375, 6.512917518615723, 7.071305274963379, 7.629693984985352, 8.188081741333008, 8.74647045135498, 9.304859161376953, 9.86324691772461, 10.421635627746582, 10.980023384094238, 11.538412094116211, 12.096799850463867, 12.65518856048584, 13.213577270507812, 13.771965980529785, 14.330353736877441, 14.888742446899414, 15.44713020324707, 16.005517959594727, 16.563907623291016, 17.122295379638672, 17.680683135986328]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 2.0, 8.0, 7.0, 10.0, 7.0, 10.0, 11.0, 7.0, 20.0, 27.0, 24.0, 21.0, 23.0, 27.0, 43.0, 49.0, 78.0, 119.0, 103.0, 62.0, 42.0, 29.0, 40.0, 27.0, 21.0, 23.0, 16.0, 15.0, 20.0, 8.0, 14.0, 14.0, 5.0, 6.0, 6.0, 16.0, 3.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.256782531738281, -6.059810638427734, -5.862838268280029, -5.665866374969482, -5.468894004821777, -5.2719221115112305, -5.074950218200684, -4.8779778480529785, -4.681005954742432, -4.484034061431885, -4.28706169128418, -4.090089797973633, -3.893117666244507, -3.696145534515381, -3.499173402786255, -3.302201271057129, -3.105229139328003, -2.908257007598877, -2.711284875869751, -2.514312744140625, -2.317340850830078, -2.120368719100952, -1.9233965873718262, -1.7264245748519897, -1.5294524431228638, -1.3324803113937378, -1.1355082988739014, -0.9385361671447754, -0.7415640950202942, -0.544592022895813, -0.347619891166687, -0.15064787864685059, 0.04632425308227539, 0.24329634010791779, 0.4402684271335602, 0.6372405290603638, 0.834212601184845, 1.0311846733093262, 1.2281568050384521, 1.4251288175582886, 1.6221009492874146, 1.8190730810165405, 2.016045093536377, 2.213017225265503, 2.409989356994629, 2.606961250305176, 2.803933620452881, 3.0009055137634277, 3.1978776454925537, 3.3948497772216797, 3.5918219089508057, 3.7887940406799316, 3.9857659339904785, 4.182738304138184, 4.3797101974487305, 4.576682090759277, 4.773654460906982, 4.970626354217529, 5.167598724365234, 5.364570617675781, 5.561542987823486, 5.758514881134033, 5.955487251281738, 6.152459144592285, 6.349431037902832]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 4.0, 8.0, 13.0, 10.0, 15.0, 21.0, 41.0, 53.0, 81.0, 109.0, 197.0, 306.0, 472.0, 802.0, 1305.0, 2279.0, 4301.0, 8690.0, 21904.0, 72343.0, 313818.0, 1159578.0, 1735770.0, 649837.0, 155152.0, 39654.0, 13952.0, 6168.0, 3118.0, 1724.0, 988.0, 604.0, 342.0, 233.0, 131.0, 79.0, 64.0, 46.0, 22.0, 17.0, 15.0, 10.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.52392578125, -0.5086326599121094, -0.49333953857421875, -0.4780464172363281, -0.4627532958984375, -0.4474601745605469, -0.43216705322265625, -0.4168739318847656, -0.401580810546875, -0.3862876892089844, -0.37099456787109375, -0.3557014465332031, -0.3404083251953125, -0.3251152038574219, -0.30982208251953125, -0.2945289611816406, -0.27923583984375, -0.2639427185058594, -0.24864959716796875, -0.23335647583007812, -0.2180633544921875, -0.20277023315429688, -0.18747711181640625, -0.17218399047851562, -0.156890869140625, -0.14159774780273438, -0.12630462646484375, -0.11101150512695312, -0.0957183837890625, -0.08042526245117188, -0.06513214111328125, -0.049839019775390625, -0.0345458984375, -0.019252777099609375, -0.00395965576171875, 0.011333465576171875, 0.0266265869140625, 0.041919708251953125, 0.05721282958984375, 0.07250595092773438, 0.087799072265625, 0.10309219360351562, 0.11838531494140625, 0.13367843627929688, 0.1489715576171875, 0.16426467895507812, 0.17955780029296875, 0.19485092163085938, 0.21014404296875, 0.22543716430664062, 0.24073028564453125, 0.2560234069824219, 0.2713165283203125, 0.2866096496582031, 0.30190277099609375, 0.3171958923339844, 0.332489013671875, 0.3477821350097656, 0.36307525634765625, 0.3783683776855469, 0.3936614990234375, 0.4089546203613281, 0.42424774169921875, 0.4395408630371094, 0.454833984375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 7.0, 9.0, 14.0, 14.0, 15.0, 13.0, 24.0, 19.0, 30.0, 33.0, 34.0, 31.0, 55.0, 43.0, 58.0, 60.0, 57.0, 43.0, 53.0, 64.0, 48.0, 35.0, 39.0, 32.0, 24.0, 25.0, 29.0, 17.0, 16.0, 14.0, 8.0, 11.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4033203125, -0.3900871276855469, -0.37685394287109375, -0.3636207580566406, -0.3503875732421875, -0.3371543884277344, -0.32392120361328125, -0.3106880187988281, -0.297454833984375, -0.2842216491699219, -0.27098846435546875, -0.2577552795410156, -0.2445220947265625, -0.23128890991210938, -0.21805572509765625, -0.20482254028320312, -0.19158935546875, -0.17835617065429688, -0.16512298583984375, -0.15188980102539062, -0.1386566162109375, -0.12542343139648438, -0.11219024658203125, -0.09895706176757812, -0.085723876953125, -0.07249069213867188, -0.05925750732421875, -0.046024322509765625, -0.0327911376953125, -0.019557952880859375, -0.00632476806640625, 0.006908416748046875, 0.0201416015625, 0.033374786376953125, 0.04660797119140625, 0.059841156005859375, 0.0730743408203125, 0.08630752563476562, 0.09954071044921875, 0.11277389526367188, 0.126007080078125, 0.13924026489257812, 0.15247344970703125, 0.16570663452148438, 0.1789398193359375, 0.19217300415039062, 0.20540618896484375, 0.21863937377929688, 0.23187255859375, 0.24510574340820312, 0.25833892822265625, 0.2715721130371094, 0.2848052978515625, 0.2980384826660156, 0.31127166748046875, 0.3245048522949219, 0.337738037109375, 0.3509712219238281, 0.36420440673828125, 0.3774375915527344, 0.3906707763671875, 0.4039039611816406, 0.41713714599609375, 0.4303703308105469, 0.443603515625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 3.0, 12.0, 12.0, 16.0, 20.0, 28.0, 61.0, 100.0, 199.0, 468.0, 1171.0, 4712.0, 81662.0, 4062770.0, 37373.0, 3714.0, 1044.0, 453.0, 210.0, 82.0, 74.0, 38.0, 24.0, 10.0, 5.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48828125, -2.403656005859375, -2.31903076171875, -2.234405517578125, -2.1497802734375, -2.065155029296875, -1.98052978515625, -1.895904541015625, -1.811279296875, -1.726654052734375, -1.64202880859375, -1.557403564453125, -1.4727783203125, -1.388153076171875, -1.30352783203125, -1.218902587890625, -1.13427734375, -1.049652099609375, -0.96502685546875, -0.880401611328125, -0.7957763671875, -0.711151123046875, -0.62652587890625, -0.541900634765625, -0.457275390625, -0.372650146484375, -0.28802490234375, -0.203399658203125, -0.1187744140625, -0.034149169921875, 0.05047607421875, 0.135101318359375, 0.2197265625, 0.304351806640625, 0.38897705078125, 0.473602294921875, 0.5582275390625, 0.642852783203125, 0.72747802734375, 0.812103271484375, 0.896728515625, 0.981353759765625, 1.06597900390625, 1.150604248046875, 1.2352294921875, 1.319854736328125, 1.40447998046875, 1.489105224609375, 1.57373046875, 1.658355712890625, 1.74298095703125, 1.827606201171875, 1.9122314453125, 1.996856689453125, 2.08148193359375, 2.166107177734375, 2.250732421875, 2.335357666015625, 2.41998291015625, 2.504608154296875, 2.5892333984375, 2.673858642578125, 2.75848388671875, 2.843109130859375, 2.927734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 11.0, 16.0, 21.0, 60.0, 93.0, 161.0, 281.0, 535.0, 846.0, 848.0, 513.0, 285.0, 154.0, 99.0, 53.0, 35.0, 19.0, 12.0, 4.0, 6.0, 8.0, 7.0, 1.0, 3.0, 3.0, 2.0], "bins": [-2.6875, -2.6300811767578125, -2.572662353515625, -2.5152435302734375, -2.45782470703125, -2.4004058837890625, -2.342987060546875, -2.2855682373046875, -2.2281494140625, -2.1707305908203125, -2.113311767578125, -2.0558929443359375, -1.99847412109375, -1.9410552978515625, -1.883636474609375, -1.8262176513671875, -1.768798828125, -1.7113800048828125, -1.653961181640625, -1.5965423583984375, -1.53912353515625, -1.4817047119140625, -1.424285888671875, -1.3668670654296875, -1.3094482421875, -1.2520294189453125, -1.194610595703125, -1.1371917724609375, -1.07977294921875, -1.0223541259765625, -0.964935302734375, -0.9075164794921875, -0.85009765625, -0.7926788330078125, -0.735260009765625, -0.6778411865234375, -0.62042236328125, -0.5630035400390625, -0.505584716796875, -0.4481658935546875, -0.3907470703125, -0.3333282470703125, -0.275909423828125, -0.2184906005859375, -0.16107177734375, -0.1036529541015625, -0.046234130859375, 0.0111846923828125, 0.068603515625, 0.1260223388671875, 0.183441162109375, 0.2408599853515625, 0.29827880859375, 0.3556976318359375, 0.413116455078125, 0.4705352783203125, 0.5279541015625, 0.5853729248046875, 0.642791748046875, 0.7002105712890625, 0.75762939453125, 0.8150482177734375, 0.872467041015625, 0.9298858642578125, 0.9873046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 10.0, 9.0, 16.0, 35.0, 44.0, 72.0, 170.0, 219.0, 170.0, 108.0, 57.0, 28.0, 15.0, 9.0, 12.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.74794864654541, -11.288476943969727, -10.829004287719727, -10.369531631469727, -9.910059928894043, -9.45058822631836, -8.99111557006836, -8.53164291381836, -8.072171211242676, -7.612699031829834, -7.153226852416992, -6.69375467300415, -6.234282493591309, -5.774810314178467, -5.315338134765625, -4.855865955352783, -4.396393775939941, -3.9369215965270996, -3.477449417114258, -3.017977237701416, -2.558505058288574, -2.0990328788757324, -1.6395606994628906, -1.1800885200500488, -0.720616340637207, -0.26114416122436523, 0.19832801818847656, 0.6578001976013184, 1.1172723770141602, 1.576744556427002, 2.0362167358398438, 2.4956889152526855, 2.955160140991211, 3.4146323204040527, 3.8741044998168945, 4.333576679229736, 4.793048858642578, 5.25252103805542, 5.711993217468262, 6.1714653968811035, 6.630937576293945, 7.090409755706787, 7.549881935119629, 8.009353637695312, 8.468826293945312, 8.928298950195312, 9.387770652770996, 9.84724235534668, 10.30671501159668, 10.76618766784668, 11.225659370422363, 11.685131072998047, 12.144603729248047, 12.604076385498047, 13.06354808807373, 13.523019790649414, 13.982492446899414, 14.441965103149414, 14.901436805725098, 15.360908508300781, 15.820381164550781, 16.27985382080078, 16.73932647705078, 17.19879722595215, 17.65826988220215]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 12.0, 9.0, 14.0, 16.0, 9.0, 20.0, 24.0, 36.0, 32.0, 40.0, 46.0, 59.0, 38.0, 57.0, 46.0, 75.0, 80.0, 60.0, 57.0, 40.0, 46.0, 39.0, 36.0, 18.0, 17.0, 16.0, 14.0, 10.0, 4.0, 5.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.849696159362793, -8.571756362915039, -8.293816566467285, -8.015877723693848, -7.737937927246094, -7.45999813079834, -7.182058334350586, -6.904118537902832, -6.626179218292236, -6.348239421844482, -6.070300102233887, -5.792360305786133, -5.514420509338379, -5.236481189727783, -4.958541393280029, -4.680602073669434, -4.40266227722168, -4.124722480773926, -3.84678316116333, -3.568843364715576, -3.2909038066864014, -3.0129642486572266, -2.7350244522094727, -2.457084894180298, -2.179145336151123, -1.9012057781219482, -1.6232661008834839, -1.3453264236450195, -1.0673868656158447, -0.7894473075866699, -0.5115076303482056, -0.2335679531097412, 0.04437065124511719, 0.32231026887893677, 0.6002498865127563, 0.8781895041465759, 1.1561291217803955, 1.4340686798095703, 1.7120083570480347, 1.989948034286499, 2.267887592315674, 2.5458271503448486, 2.8237667083740234, 3.1017065048217773, 3.379646062850952, 3.657585620880127, 3.935525417327881, 4.213464736938477, 4.4914045333862305, 4.769344329833984, 5.04728364944458, 5.325223445892334, 5.60316276550293, 5.881102561950684, 6.1590423583984375, 6.436982154846191, 6.714921474456787, 6.992861270904541, 7.270800590515137, 7.548740386962891, 7.8266801834106445, 8.104619979858398, 8.382558822631836, 8.66049861907959, 8.938438415527344]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 10.0, 10.0, 13.0, 18.0, 26.0, 65.0, 92.0, 198.0, 364.0, 897.0, 2307.0, 7551.0, 38909.0, 609468.0, 349376.0, 29433.0, 6296.0, 2030.0, 774.0, 369.0, 158.0, 80.0, 48.0, 23.0, 16.0, 5.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.40997314453125, -1.3707275390625, -1.33148193359375, -1.292236328125, -1.25299072265625, -1.2137451171875, -1.17449951171875, -1.13525390625, -1.09600830078125, -1.0567626953125, -1.01751708984375, -0.978271484375, -0.93902587890625, -0.8997802734375, -0.86053466796875, -0.8212890625, -0.78204345703125, -0.7427978515625, -0.70355224609375, -0.664306640625, -0.62506103515625, -0.5858154296875, -0.54656982421875, -0.50732421875, -0.46807861328125, -0.4288330078125, -0.38958740234375, -0.350341796875, -0.31109619140625, -0.2718505859375, -0.23260498046875, -0.193359375, -0.15411376953125, -0.1148681640625, -0.07562255859375, -0.036376953125, 0.00286865234375, 0.0421142578125, 0.08135986328125, 0.12060546875, 0.15985107421875, 0.1990966796875, 0.23834228515625, 0.277587890625, 0.31683349609375, 0.3560791015625, 0.39532470703125, 0.4345703125, 0.47381591796875, 0.5130615234375, 0.55230712890625, 0.591552734375, 0.63079833984375, 0.6700439453125, 0.70928955078125, 0.74853515625, 0.78778076171875, 0.8270263671875, 0.86627197265625, 0.905517578125, 0.94476318359375, 0.9840087890625, 1.02325439453125, 1.0625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 7.0, 12.0, 6.0, 21.0, 22.0, 28.0, 40.0, 30.0, 70.0, 51.0, 60.0, 92.0, 75.0, 71.0, 87.0, 65.0, 63.0, 55.0, 33.0, 31.0, 34.0, 18.0, 12.0, 13.0, 9.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86669921875, -0.842559814453125, -0.81842041015625, -0.794281005859375, -0.7701416015625, -0.746002197265625, -0.72186279296875, -0.697723388671875, -0.673583984375, -0.649444580078125, -0.62530517578125, -0.601165771484375, -0.5770263671875, -0.552886962890625, -0.52874755859375, -0.504608154296875, -0.48046875, -0.456329345703125, -0.43218994140625, -0.408050537109375, -0.3839111328125, -0.359771728515625, -0.33563232421875, -0.311492919921875, -0.287353515625, -0.263214111328125, -0.23907470703125, -0.214935302734375, -0.1907958984375, -0.166656494140625, -0.14251708984375, -0.118377685546875, -0.09423828125, -0.070098876953125, -0.04595947265625, -0.021820068359375, 0.0023193359375, 0.026458740234375, 0.05059814453125, 0.074737548828125, 0.098876953125, 0.123016357421875, 0.14715576171875, 0.171295166015625, 0.1954345703125, 0.219573974609375, 0.24371337890625, 0.267852783203125, 0.2919921875, 0.316131591796875, 0.34027099609375, 0.364410400390625, 0.3885498046875, 0.412689208984375, 0.43682861328125, 0.460968017578125, 0.485107421875, 0.509246826171875, 0.53338623046875, 0.557525634765625, 0.5816650390625, 0.605804443359375, 0.62994384765625, 0.654083251953125, 0.67822265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 9.0, 10.0, 7.0, 10.0, 12.0, 18.0, 18.0, 26.0, 38.0, 40.0, 68.0, 93.0, 129.0, 185.0, 288.0, 521.0, 1002.0, 2605.0, 10061.0, 69589.0, 904951.0, 46807.0, 7559.0, 2286.0, 883.0, 446.0, 263.0, 156.0, 120.0, 85.0, 73.0, 36.0, 40.0, 34.0, 18.0, 16.0, 17.0, 10.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.9829864501953125, -0.948394775390625, -0.9138031005859375, -0.87921142578125, -0.8446197509765625, -0.810028076171875, -0.7754364013671875, -0.7408447265625, -0.7062530517578125, -0.671661376953125, -0.6370697021484375, -0.60247802734375, -0.5678863525390625, -0.533294677734375, -0.4987030029296875, -0.464111328125, -0.4295196533203125, -0.394927978515625, -0.3603363037109375, -0.32574462890625, -0.2911529541015625, -0.256561279296875, -0.2219696044921875, -0.1873779296875, -0.1527862548828125, -0.118194580078125, -0.0836029052734375, -0.04901123046875, -0.0144195556640625, 0.020172119140625, 0.0547637939453125, 0.08935546875, 0.1239471435546875, 0.158538818359375, 0.1931304931640625, 0.22772216796875, 0.2623138427734375, 0.296905517578125, 0.3314971923828125, 0.3660888671875, 0.4006805419921875, 0.435272216796875, 0.4698638916015625, 0.50445556640625, 0.5390472412109375, 0.573638916015625, 0.6082305908203125, 0.642822265625, 0.6774139404296875, 0.712005615234375, 0.7465972900390625, 0.78118896484375, 0.8157806396484375, 0.850372314453125, 0.8849639892578125, 0.9195556640625, 0.9541473388671875, 0.988739013671875, 1.0233306884765625, 1.05792236328125, 1.0925140380859375, 1.127105712890625, 1.1616973876953125, 1.1962890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 3.0, 10.0, 6.0, 8.0, 10.0, 11.0, 9.0, 13.0, 16.0, 18.0, 18.0, 20.0, 15.0, 29.0, 41.0, 41.0, 56.0, 72.0, 67.0, 82.0, 64.0, 62.0, 66.0, 32.0, 35.0, 21.0, 24.0, 21.0, 18.0, 12.0, 8.0, 13.0, 9.0, 8.0, 3.0, 7.0, 7.0, 5.0, 6.0, 5.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-1.9619140625, -1.904754638671875, -1.84759521484375, -1.790435791015625, -1.7332763671875, -1.676116943359375, -1.61895751953125, -1.561798095703125, -1.504638671875, -1.447479248046875, -1.39031982421875, -1.333160400390625, -1.2760009765625, -1.218841552734375, -1.16168212890625, -1.104522705078125, -1.04736328125, -0.990203857421875, -0.93304443359375, -0.875885009765625, -0.8187255859375, -0.761566162109375, -0.70440673828125, -0.647247314453125, -0.590087890625, -0.532928466796875, -0.47576904296875, -0.418609619140625, -0.3614501953125, -0.304290771484375, -0.24713134765625, -0.189971923828125, -0.1328125, -0.075653076171875, -0.01849365234375, 0.038665771484375, 0.0958251953125, 0.152984619140625, 0.21014404296875, 0.267303466796875, 0.324462890625, 0.381622314453125, 0.43878173828125, 0.495941162109375, 0.5531005859375, 0.610260009765625, 0.66741943359375, 0.724578857421875, 0.78173828125, 0.838897705078125, 0.89605712890625, 0.953216552734375, 1.0103759765625, 1.067535400390625, 1.12469482421875, 1.181854248046875, 1.239013671875, 1.296173095703125, 1.35333251953125, 1.410491943359375, 1.4676513671875, 1.524810791015625, 1.58197021484375, 1.639129638671875, 1.6962890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 9.0, 5.0, 9.0, 16.0, 15.0, 35.0, 45.0, 76.0, 100.0, 211.0, 462.0, 1046.0, 3372.0, 23245.0, 963104.0, 49095.0, 5235.0, 1321.0, 540.0, 250.0, 144.0, 69.0, 48.0, 16.0, 16.0, 16.0, 7.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.377197265625, -0.3648834228515625, -0.352569580078125, -0.3402557373046875, -0.32794189453125, -0.3156280517578125, -0.303314208984375, -0.2910003662109375, -0.2786865234375, -0.2663726806640625, -0.254058837890625, -0.2417449951171875, -0.22943115234375, -0.2171173095703125, -0.204803466796875, -0.1924896240234375, -0.18017578125, -0.1678619384765625, -0.155548095703125, -0.1432342529296875, -0.13092041015625, -0.1186065673828125, -0.106292724609375, -0.0939788818359375, -0.0816650390625, -0.0693511962890625, -0.057037353515625, -0.0447235107421875, -0.03240966796875, -0.0200958251953125, -0.007781982421875, 0.0045318603515625, 0.016845703125, 0.0291595458984375, 0.041473388671875, 0.0537872314453125, 0.06610107421875, 0.0784149169921875, 0.090728759765625, 0.1030426025390625, 0.1153564453125, 0.1276702880859375, 0.139984130859375, 0.1522979736328125, 0.16461181640625, 0.1769256591796875, 0.189239501953125, 0.2015533447265625, 0.2138671875, 0.2261810302734375, 0.238494873046875, 0.2508087158203125, 0.26312255859375, 0.2754364013671875, 0.287750244140625, 0.3000640869140625, 0.3123779296875, 0.3246917724609375, 0.337005615234375, 0.3493194580078125, 0.36163330078125, 0.3739471435546875, 0.386260986328125, 0.3985748291015625, 0.410888671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 11.0, 27.0, 52.0, 117.0, 374.0, 248.0, 76.0, 45.0, 19.0, 16.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022208690643310547, -0.00021635927259922028, -0.00021063163876533508, -0.0002049040049314499, -0.0001991763710975647, -0.0001934487372636795, -0.0001877211034297943, -0.00018199346959590912, -0.00017626583576202393, -0.00017053820192813873, -0.00016481056809425354, -0.00015908293426036835, -0.00015335530042648315, -0.00014762766659259796, -0.00014190003275871277, -0.00013617239892482758, -0.00013044476509094238, -0.0001247171312570572, -0.000118989497423172, -0.0001132618635892868, -0.00010753422975540161, -0.00010180659592151642, -9.607896208763123e-05, -9.035132825374603e-05, -8.462369441986084e-05, -7.889606058597565e-05, -7.316842675209045e-05, -6.744079291820526e-05, -6.171315908432007e-05, -5.5985525250434875e-05, -5.025789141654968e-05, -4.453025758266449e-05, -3.88026237487793e-05, -3.3074989914894104e-05, -2.734735608100891e-05, -2.1619722247123718e-05, -1.5892088413238525e-05, -1.0164454579353333e-05, -4.43682074546814e-06, 1.2908130884170532e-06, 7.018446922302246e-06, 1.2746080756187439e-05, 1.8473714590072632e-05, 2.4201348423957825e-05, 2.9928982257843018e-05, 3.565661609172821e-05, 4.13842499256134e-05, 4.7111883759498596e-05, 5.283951759338379e-05, 5.856715142726898e-05, 6.429478526115417e-05, 7.002241909503937e-05, 7.575005292892456e-05, 8.147768676280975e-05, 8.720532059669495e-05, 9.293295443058014e-05, 9.866058826446533e-05, 0.00010438822209835052, 0.00011011585593223572, 0.00011584348976612091, 0.0001215711236000061, 0.0001272987574338913, 0.0001330263912677765, 0.00013875402510166168, 0.00014448165893554688]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 4.0, 6.0, 13.0, 18.0, 19.0, 33.0, 40.0, 77.0, 96.0, 167.0, 216.0, 430.0, 803.0, 1607.0, 4027.0, 13147.0, 75470.0, 888538.0, 47590.0, 9852.0, 3298.0, 1367.0, 684.0, 383.0, 222.0, 123.0, 97.0, 69.0, 45.0, 25.0, 21.0, 16.0, 7.0, 7.0, 11.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18359375, -0.17712783813476562, -0.17066192626953125, -0.16419601440429688, -0.1577301025390625, -0.15126419067382812, -0.14479827880859375, -0.13833236694335938, -0.131866455078125, -0.12540054321289062, -0.11893463134765625, -0.11246871948242188, -0.1060028076171875, -0.09953689575195312, -0.09307098388671875, -0.08660507202148438, -0.08013916015625, -0.07367324829101562, -0.06720733642578125, -0.060741424560546875, -0.0542755126953125, -0.047809600830078125, -0.04134368896484375, -0.034877777099609375, -0.028411865234375, -0.021945953369140625, -0.01548004150390625, -0.009014129638671875, -0.0025482177734375, 0.003917694091796875, 0.01038360595703125, 0.016849517822265625, 0.0233154296875, 0.029781341552734375, 0.03624725341796875, 0.042713165283203125, 0.0491790771484375, 0.055644989013671875, 0.06211090087890625, 0.06857681274414062, 0.075042724609375, 0.08150863647460938, 0.08797454833984375, 0.09444046020507812, 0.1009063720703125, 0.10737228393554688, 0.11383819580078125, 0.12030410766601562, 0.12677001953125, 0.13323593139648438, 0.13970184326171875, 0.14616775512695312, 0.1526336669921875, 0.15909957885742188, 0.16556549072265625, 0.17203140258789062, 0.178497314453125, 0.18496322631835938, 0.19142913818359375, 0.19789505004882812, 0.2043609619140625, 0.21082687377929688, 0.21729278564453125, 0.22375869750976562, 0.230224609375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 7.0, 11.0, 14.0, 19.0, 17.0, 29.0, 27.0, 42.0, 60.0, 134.0, 164.0, 149.0, 71.0, 63.0, 52.0, 30.0, 24.0, 15.0, 16.0, 6.0, 7.0, 2.0, 5.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23486328125, -0.22696685791015625, -0.2190704345703125, -0.21117401123046875, -0.203277587890625, -0.19538116455078125, -0.1874847412109375, -0.17958831787109375, -0.17169189453125, -0.16379547119140625, -0.1558990478515625, -0.14800262451171875, -0.140106201171875, -0.13220977783203125, -0.1243133544921875, -0.11641693115234375, -0.1085205078125, -0.10062408447265625, -0.0927276611328125, -0.08483123779296875, -0.076934814453125, -0.06903839111328125, -0.0611419677734375, -0.05324554443359375, -0.04534912109375, -0.03745269775390625, -0.0295562744140625, -0.02165985107421875, -0.013763427734375, -0.00586700439453125, 0.0020294189453125, 0.00992584228515625, 0.017822265625, 0.02571868896484375, 0.0336151123046875, 0.04151153564453125, 0.049407958984375, 0.05730438232421875, 0.0652008056640625, 0.07309722900390625, 0.08099365234375, 0.08889007568359375, 0.0967864990234375, 0.10468292236328125, 0.112579345703125, 0.12047576904296875, 0.1283721923828125, 0.13626861572265625, 0.1441650390625, 0.15206146240234375, 0.1599578857421875, 0.16785430908203125, 0.175750732421875, 0.18364715576171875, 0.1915435791015625, 0.19944000244140625, 0.20733642578125, 0.21523284912109375, 0.2231292724609375, 0.23102569580078125, 0.238922119140625, 0.24681854248046875, 0.2547149658203125, 0.26261138916015625, 0.2705078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 12.0, 17.0, 29.0, 75.0, 458.0, 230.0, 75.0, 48.0, 21.0, 9.0, 12.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2812445163726807, -2.948821544647217, -2.616398334503174, -2.28397536277771, -1.9515522718429565, -1.6191291809082031, -1.2867062091827393, -0.9542829990386963, -0.6218600273132324, -0.2894369661808014, 0.04298609495162964, 0.3754091262817383, 0.7078322172164917, 1.0402553081512451, 1.372678279876709, 1.705101490020752, 2.037524461746216, 2.3699474334716797, 2.7023706436157227, 3.0347936153411865, 3.3672165870666504, 3.6996397972106934, 4.032062530517578, 4.364485740661621, 4.696908950805664, 5.029332160949707, 5.361754894256592, 5.694178104400635, 6.026601314544678, 6.3590240478515625, 6.6914472579956055, 7.023870468139648, 7.356293678283691, 7.688716888427734, 8.021140098571777, 8.35356330871582, 8.685985565185547, 9.01840877532959, 9.350831985473633, 9.683255195617676, 10.015678405761719, 10.348101615905762, 10.680524826049805, 11.012947082519531, 11.345370292663574, 11.677793502807617, 12.01021671295166, 12.342639923095703, 12.67506217956543, 13.007485389709473, 13.339908599853516, 13.672330856323242, 14.004754066467285, 14.337177276611328, 14.669600486755371, 15.002023696899414, 15.334446907043457, 15.6668701171875, 15.999293327331543, 16.331716537475586, 16.664138793945312, 16.996562957763672, 17.3289852142334, 17.661407470703125, 17.993831634521484]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 9.0, 4.0, 6.0, 4.0, 7.0, 10.0, 13.0, 10.0, 22.0, 19.0, 15.0, 16.0, 26.0, 22.0, 24.0, 51.0, 200.0, 202.0, 85.0, 38.0, 28.0, 23.0, 24.0, 18.0, 14.0, 15.0, 19.0, 12.0, 6.0, 5.0, 6.0, 4.0, 7.0, 2.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0], "bins": [-5.5023298263549805, -5.335952281951904, -5.169575214385986, -5.00319766998291, -4.836820125579834, -4.670442581176758, -4.50406551361084, -4.337687969207764, -4.1713104248046875, -4.004932880401611, -3.8385555744171143, -3.672178268432617, -3.505800724029541, -3.339423418045044, -3.173046112060547, -3.0066685676574707, -2.8402915000915527, -2.6739141941070557, -2.5075366497039795, -2.3411593437194824, -2.1747817993164062, -2.008404493331909, -1.842027187347412, -1.6756497621536255, -1.5092723369598389, -1.3428949117660522, -1.1765174865722656, -1.0101401805877686, -0.8437627553939819, -0.6773853302001953, -0.5110079646110535, -0.3446305990219116, -0.178253173828125, -0.011875778436660767, 0.15450161695480347, 0.3208790123462677, 0.48725640773773193, 0.6536338329315186, 0.8200111985206604, 0.9863885641098022, 1.1527659893035889, 1.3191434144973755, 1.485520839691162, 1.6518981456756592, 1.8182755708694458, 1.9846529960632324, 2.1510303020477295, 2.3174076080322266, 2.4837851524353027, 2.6501624584198, 2.816540002822876, 2.982917308807373, 3.149294853210449, 3.3156721591949463, 3.4820494651794434, 3.6484270095825195, 3.8148043155670166, 3.9811816215515137, 4.14755916595459, 4.313936710357666, 4.480313777923584, 4.64669132232666, 4.813068866729736, 4.979445934295654, 5.1458234786987305]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 14.0, 10.0, 9.0, 8.0, 10.0, 15.0, 21.0, 25.0, 17.0, 20.0, 27.0, 28.0, 47.0, 82.0, 226.0, 118.0, 57.0, 30.0, 35.0, 32.0, 25.0, 14.0, 16.0, 17.0, 13.0, 14.0, 6.0, 14.0, 4.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.35546875, -0.3431510925292969, -0.33083343505859375, -0.3185157775878906, -0.3061981201171875, -0.2938804626464844, -0.28156280517578125, -0.2692451477050781, -0.256927490234375, -0.24460983276367188, -0.23229217529296875, -0.21997451782226562, -0.2076568603515625, -0.19533920288085938, -0.18302154541015625, -0.17070388793945312, -0.15838623046875, -0.14606857299804688, -0.13375091552734375, -0.12143325805664062, -0.1091156005859375, -0.09679794311523438, -0.08448028564453125, -0.07216262817382812, -0.059844970703125, -0.047527313232421875, -0.03520965576171875, -0.022891998291015625, -0.0105743408203125, 0.001743316650390625, 0.01406097412109375, 0.026378631591796875, 0.0386962890625, 0.051013946533203125, 0.06333160400390625, 0.07564926147460938, 0.0879669189453125, 0.10028457641601562, 0.11260223388671875, 0.12491989135742188, 0.137237548828125, 0.14955520629882812, 0.16187286376953125, 0.17419052124023438, 0.1865081787109375, 0.19882583618164062, 0.21114349365234375, 0.22346115112304688, 0.23577880859375, 0.24809646606445312, 0.26041412353515625, 0.2727317810058594, 0.2850494384765625, 0.2973670959472656, 0.30968475341796875, 0.3220024108886719, 0.334320068359375, 0.3466377258300781, 0.35895538330078125, 0.3712730407714844, 0.3835906982421875, 0.3959083557128906, 0.40822601318359375, 0.4205436706542969, 0.432861328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 14.0, 28.0, 33.0, 50.0, 117.0, 279.0, 1053.0, 8757.0, 8367406.0, 9316.0, 983.0, 263.0, 111.0, 66.0, 22.0, 16.0, 16.0, 12.0, 3.0, 1.0, 2.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-7.506015777587891, -7.294615745544434, -7.083215236663818, -6.871815204620361, -6.660415172576904, -6.449014663696289, -6.237614631652832, -6.026214599609375, -5.814814567565918, -5.603414535522461, -5.392014026641846, -5.180613994598389, -4.969213962554932, -4.757813453674316, -4.546413421630859, -4.335013389587402, -4.123613357543945, -3.912213087081909, -3.700813055038452, -3.489412784576416, -3.278012752532959, -3.066612482070923, -2.8552122116088867, -2.6438121795654297, -2.4324116706848145, -2.2210114002227783, -2.0096113681793213, -1.7982110977172852, -1.5868110656738281, -1.375410795211792, -1.1640106439590454, -0.9526104927062988, -0.7412104606628418, -0.5298103094100952, -0.31841012835502625, -0.10700994729995728, 0.1043902039527893, 0.31579041481018066, 0.5271905660629272, 0.7385907173156738, 0.9499908685684204, 1.161391019821167, 1.3727911710739136, 1.5841913223266602, 1.7955915927886963, 2.0069918632507324, 2.2183918952941895, 2.4297919273376465, 2.6411921977996826, 2.8525924682617188, 3.063992500305176, 3.275392770767212, 3.486792802810669, 3.698193073272705, 3.909593105316162, 4.120993614196777, 4.332393646240234, 4.543793678283691, 4.755194187164307, 4.966594219207764, 5.177994251251221, 5.389394760131836, 5.600794792175293, 5.81219482421875, 6.023594856262207]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 6.0, 1.0, 3.0, 2.0, 3.0, 8.0, 3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.252260684967041, -2.1556754112243652, -2.0590901374816895, -1.9625048637390137, -1.865919589996338, -1.769334316253662, -1.6727490425109863, -1.5761637687683105, -1.4795784950256348, -1.382993221282959, -1.2864079475402832, -1.1898226737976074, -1.0932374000549316, -0.9966521263122559, -0.9000668525695801, -0.8034815788269043, -0.7068963050842285, -0.6103110313415527, -0.513725757598877, -0.41714048385620117, -0.3205552101135254, -0.2239699363708496, -0.12738466262817383, -0.030799388885498047, 0.06578588485717773, 0.16237115859985352, 0.2589564323425293, 0.3555417060852051, 0.45212697982788086, 0.5487122535705566, 0.6452975273132324, 0.7418828010559082, 0.8384678363800049, 0.9350531101226807, 1.0316383838653564, 1.1282236576080322, 1.224808931350708, 1.3213942050933838, 1.4179794788360596, 1.5145647525787354, 1.6111500263214111, 1.707735300064087, 1.8043205738067627, 1.9009058475494385, 1.9974911212921143, 2.09407639503479, 2.190661668777466, 2.2872469425201416, 2.3838322162628174, 2.480417490005493, 2.577002763748169, 2.6735880374908447, 2.7701733112335205, 2.8667585849761963, 2.963343858718872, 3.059929132461548, 3.1565144062042236, 3.2530996799468994, 3.349684953689575, 3.446270227432251, 3.5428555011749268, 3.6394407749176025, 3.7360260486602783, 3.832611322402954, 3.92919659614563]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 16.0, 11.0, 25.0, 29.0, 49.0, 68.0, 127.0, 204.0, 431.0, 987.0, 3027.0, 13494.0, 78107.0, 306516.0, 98754.0, 16142.0, 3847.0, 1291.0, 471.0, 259.0, 132.0, 104.0, 54.0, 28.0, 24.0, 22.0, 9.0, 7.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.8515625, -5.69580078125, -5.5400390625, -5.38427734375, -5.228515625, -5.07275390625, -4.9169921875, -4.76123046875, -4.60546875, -4.44970703125, -4.2939453125, -4.13818359375, -3.982421875, -3.82666015625, -3.6708984375, -3.51513671875, -3.359375, -3.20361328125, -3.0478515625, -2.89208984375, -2.736328125, -2.58056640625, -2.4248046875, -2.26904296875, -2.11328125, -1.95751953125, -1.8017578125, -1.64599609375, -1.490234375, -1.33447265625, -1.1787109375, -1.02294921875, -0.8671875, -0.71142578125, -0.5556640625, -0.39990234375, -0.244140625, -0.08837890625, 0.0673828125, 0.22314453125, 0.37890625, 0.53466796875, 0.6904296875, 0.84619140625, 1.001953125, 1.15771484375, 1.3134765625, 1.46923828125, 1.625, 1.78076171875, 1.9365234375, 2.09228515625, 2.248046875, 2.40380859375, 2.5595703125, 2.71533203125, 2.87109375, 3.02685546875, 3.1826171875, 3.33837890625, 3.494140625, 3.64990234375, 3.8056640625, 3.96142578125, 4.1171875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 7.0, 18.0, 23.0, 40.0, 47.0, 58.0, 62.0, 90.0, 114.0, 89.0, 109.0, 73.0, 70.0, 49.0, 38.0, 22.0, 28.0, 16.0, 14.0, 8.0, 7.0, 7.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90087890625, -0.8756332397460938, -0.8503875732421875, -0.8251419067382812, -0.799896240234375, -0.7746505737304688, -0.7494049072265625, -0.7241592407226562, -0.69891357421875, -0.6736679077148438, -0.6484222412109375, -0.6231765747070312, -0.597930908203125, -0.5726852416992188, -0.5474395751953125, -0.5221939086914062, -0.4969482421875, -0.47170257568359375, -0.4464569091796875, -0.42121124267578125, -0.395965576171875, -0.37071990966796875, -0.3454742431640625, -0.32022857666015625, -0.29498291015625, -0.26973724365234375, -0.2444915771484375, -0.21924591064453125, -0.194000244140625, -0.16875457763671875, -0.1435089111328125, -0.11826324462890625, -0.093017578125, -0.06777191162109375, -0.0425262451171875, -0.01728057861328125, 0.007965087890625, 0.03321075439453125, 0.0584564208984375, 0.08370208740234375, 0.10894775390625, 0.13419342041015625, 0.1594390869140625, 0.18468475341796875, 0.209930419921875, 0.23517608642578125, 0.2604217529296875, 0.28566741943359375, 0.3109130859375, 0.33615875244140625, 0.3614044189453125, 0.38665008544921875, 0.411895751953125, 0.43714141845703125, 0.4623870849609375, 0.48763275146484375, 0.51287841796875, 0.5381240844726562, 0.5633697509765625, 0.5886154174804688, 0.613861083984375, 0.6391067504882812, 0.6643524169921875, 0.6895980834960938, 0.71484375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 13.0, 17.0, 18.0, 28.0, 60.0, 56.0, 73.0, 65.0, 51.0, 25.0, 16.0, 10.0, 11.0, 7.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.363767385482788, -2.2669224739074707, -2.170077323913574, -2.073232412338257, -1.97638738155365, -1.879542350769043, -1.7826974391937256, -1.6858524084091187, -1.5890073776245117, -1.4921623468399048, -1.3953173160552979, -1.2984724044799805, -1.2016273736953735, -1.1047823429107666, -1.0079374313354492, -0.9110924005508423, -0.8142473697662354, -0.7174023389816284, -0.6205573678016663, -0.5237123966217041, -0.42686736583709717, -0.3300223648548126, -0.23317736387252808, -0.13633239269256592, -0.039487361907958984, 0.05735763907432556, 0.1542026400566101, 0.25104764103889465, 0.3478926420211792, 0.44473764300346375, 0.5415826439857483, 0.6384276151657104, 0.7352724075317383, 0.8321174383163452, 0.9289624094963074, 1.0258073806762695, 1.1226524114608765, 1.2194974422454834, 1.3163423538208008, 1.4131873846054077, 1.5100324153900146, 1.6068774461746216, 1.7037224769592285, 1.800567388534546, 1.8974124193191528, 1.9942574501037598, 2.091102361679077, 2.1879472732543945, 2.284792423248291, 2.3816373348236084, 2.478482484817505, 2.5753273963928223, 2.6721725463867188, 2.769017457962036, 2.8658623695373535, 2.96270751953125, 3.0595524311065674, 3.1563973426818848, 3.2532424926757812, 3.3500874042510986, 3.446932315826416, 3.5437774658203125, 3.64062237739563, 3.7374672889709473, 3.8343124389648438]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 11.0, 32.0, 54.0, 83.0, 84.0, 74.0, 31.0, 22.0, 13.0, 11.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3969743251800537, -3.293792247772217, -3.190609931945801, -3.087427854537964, -2.984245538711548, -2.881063461303711, -2.777881145477295, -2.674699068069458, -2.571516990661621, -2.468334913253784, -2.365152597427368, -2.2619705200195312, -2.1587882041931152, -2.0556061267852783, -1.9524239301681519, -1.8492417335510254, -1.7460594177246094, -1.642877221107483, -1.5396950244903564, -1.4365129470825195, -1.3333306312561035, -1.2301485538482666, -1.1269663572311401, -1.0237841606140137, -0.9206019639968872, -0.8174197673797607, -0.7142375707626343, -0.6110554337501526, -0.5078732371330261, -0.40469104051589966, -0.30150890350341797, -0.1983267068862915, -0.09514427185058594, 0.008037909865379333, 0.1112200915813446, 0.21440225839614868, 0.31758445501327515, 0.4207666516304016, 0.5239487886428833, 0.6271309852600098, 0.7303131818771362, 0.8334953784942627, 0.9366775751113892, 1.0398597717285156, 1.1430418491363525, 1.2462241649627686, 1.3494062423706055, 1.452588438987732, 1.5557706356048584, 1.6589528322219849, 1.7621350288391113, 1.8653171062469482, 1.9684994220733643, 2.071681499481201, 2.174863815307617, 2.278045892715454, 2.381227970123291, 2.484410047531128, 2.587592363357544, 2.690774440765381, 2.793956756591797, 2.897138833999634, 3.0003209114074707, 3.1035032272338867, 3.2066855430603027]}, "train/train_runtime": 5087.4578, "train/train_samples_per_second": 5.609, "train/train_steps_per_second": 0.088, "train/total_flos": 0.0, "train/train_loss": 4.256010225535508, "eval/loss": 4.295446395874023, "eval/wer": 2.317671558905196, "eval/runtime": 1115.1949, "eval/samples_per_second": 2.369, "eval/steps_per_second": 0.297, "_wandb": {"runtime": 6545}} \ No newline at end of file