diff --git "a/wandb/run-20220302_154455-17zs7rwf/files/wandb-summary.json" "b/wandb/run-20220302_154455-17zs7rwf/files/wandb-summary.json" --- "a/wandb/run-20220302_154455-17zs7rwf/files/wandb-summary.json" +++ "b/wandb/run-20220302_154455-17zs7rwf/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.6367, "train/learning_rate": 8.403483309143686e-05, "train/epoch": 0.84, "train/global_step": 1000, "_runtime": 5821, "_timestamp": 1646241716, "_step": 1001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 46.0, 970.0, 2.0], "bins": [-1146.3345947265625, -1127.9237060546875, -1109.5128173828125, -1091.10205078125, -1072.691162109375, -1054.2802734375, -1035.869384765625, -1017.45849609375, -999.0476684570312, -980.6367797851562, -962.2259521484375, -943.8150634765625, -925.4041748046875, -906.9933471679688, -888.5824584960938, -870.171630859375, -851.7607421875, -833.349853515625, -814.9390258789062, -796.5281372070312, -778.1172485351562, -759.7064208984375, -741.2955322265625, -722.8846435546875, -704.4737548828125, -686.0628662109375, -667.6520385742188, -649.2411499023438, -630.8302612304688, -612.41943359375, -594.008544921875, -575.59765625, -557.1868286132812, -538.7759399414062, -520.3651123046875, -501.9542236328125, -483.5433654785156, -465.13250732421875, -446.72161865234375, -428.3107604980469, -409.89990234375, -391.4890441894531, -373.0781555175781, -354.66729736328125, -336.2564392089844, -317.8455810546875, -299.4346923828125, -281.0238342285156, -262.6129455566406, -244.2020721435547, -225.7912139892578, -207.38034057617188, -188.969482421875, -170.55860900878906, -152.14773559570312, -133.73687744140625, -115.32600402832031, -96.9151382446289, -78.5042724609375, -60.09339904785156, -41.682533264160156, -23.27166748046875, -4.8607940673828125, 13.550064086914062, 31.9609375]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 11.0, 19.0, 23.0, 38.0, 41.0, 41.0, 42.0, 65.0, 82.0, 80.0, 83.0, 81.0, 80.0, 75.0, 57.0, 56.0, 36.0, 27.0, 14.0, 14.0, 14.0, 5.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-100.40751647949219, -97.4805679321289, -94.55361938476562, -91.62667083740234, -88.69972229003906, -85.77277374267578, -82.8458251953125, -79.91888427734375, -76.99192810058594, -74.06497955322266, -71.13803100585938, -68.2110824584961, -65.28413391113281, -62.35718536376953, -59.430240631103516, -56.503292083740234, -53.57634735107422, -50.64939880371094, -47.722450256347656, -44.795501708984375, -41.868553161621094, -38.94160461425781, -36.0146598815918, -33.087711334228516, -30.160762786865234, -27.233814239501953, -24.306865692138672, -21.379919052124023, -18.452970504760742, -15.526021957397461, -12.599075317382812, -9.672126770019531, -6.74517822265625, -3.818230152130127, -0.8912820816040039, 2.035665512084961, 4.962614059448242, 7.889562606811523, 10.816509246826172, 13.743457794189453, 16.670406341552734, 19.597354888916016, 22.524303436279297, 25.451250076293945, 28.378198623657227, 31.305147171020508, 34.232093811035156, 37.15904235839844, 40.08599090576172, 43.012939453125, 45.93988800048828, 48.86683654785156, 51.793785095214844, 54.720733642578125, 57.64767837524414, 60.57462692260742, 63.5015754699707, 66.42852020263672, 69.35546875, 72.28241729736328, 75.20936584472656, 78.13631439208984, 81.06326293945312, 83.9902114868164, 86.91716003417969]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 14.0, 21.0, 19.0, 22.0, 23.0, 29.0, 30.0, 34.0, 48.0, 46.0, 52.0, 48.0, 57.0, 66.0, 54.0, 50.0, 48.0, 47.0, 49.0, 47.0, 47.0, 24.0, 28.0, 22.0, 7.0, 18.0, 11.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.267578125, -1.215728759765625, -1.16387939453125, -1.112030029296875, -1.0601806640625, -1.008331298828125, -0.95648193359375, -0.904632568359375, -0.852783203125, -0.800933837890625, -0.74908447265625, -0.697235107421875, -0.6453857421875, -0.593536376953125, -0.54168701171875, -0.489837646484375, -0.43798828125, -0.386138916015625, -0.33428955078125, -0.282440185546875, -0.2305908203125, -0.178741455078125, -0.12689208984375, -0.075042724609375, -0.023193359375, 0.028656005859375, 0.08050537109375, 0.132354736328125, 0.1842041015625, 0.236053466796875, 0.28790283203125, 0.339752197265625, 0.3916015625, 0.443450927734375, 0.49530029296875, 0.547149658203125, 0.5989990234375, 0.650848388671875, 0.70269775390625, 0.754547119140625, 0.806396484375, 0.858245849609375, 0.91009521484375, 0.961944580078125, 1.0137939453125, 1.065643310546875, 1.11749267578125, 1.169342041015625, 1.22119140625, 1.273040771484375, 1.32489013671875, 1.376739501953125, 1.4285888671875, 1.480438232421875, 1.53228759765625, 1.584136962890625, 1.635986328125, 1.687835693359375, 1.73968505859375, 1.791534423828125, 1.8433837890625, 1.895233154296875, 1.94708251953125, 1.998931884765625, 2.05078125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 8.0, 14.0, 13.0, 25.0, 29.0, 57.0, 81.0, 109.0, 130.0, 180.0, 336.0, 547.0, 869.0, 1563.0, 3563.0, 11708.0, 95709.0, 3263264.0, 769519.0, 34216.0, 6761.0, 2432.0, 1249.0, 688.0, 374.0, 271.0, 172.0, 125.0, 64.0, 56.0, 36.0, 30.0, 17.0, 18.0, 16.0, 7.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.6285400390625, -8.280517578125, -7.9324951171875, -7.58447265625, -7.2364501953125, -6.888427734375, -6.5404052734375, -6.1923828125, -5.8443603515625, -5.496337890625, -5.1483154296875, -4.80029296875, -4.4522705078125, -4.104248046875, -3.7562255859375, -3.408203125, -3.0601806640625, -2.712158203125, -2.3641357421875, -2.01611328125, -1.6680908203125, -1.320068359375, -0.9720458984375, -0.6240234375, -0.2760009765625, 0.072021484375, 0.4200439453125, 0.76806640625, 1.1160888671875, 1.464111328125, 1.8121337890625, 2.16015625, 2.5081787109375, 2.856201171875, 3.2042236328125, 3.55224609375, 3.9002685546875, 4.248291015625, 4.5963134765625, 4.9443359375, 5.2923583984375, 5.640380859375, 5.9884033203125, 6.33642578125, 6.6844482421875, 7.032470703125, 7.3804931640625, 7.728515625, 8.0765380859375, 8.424560546875, 8.7725830078125, 9.12060546875, 9.4686279296875, 9.816650390625, 10.1646728515625, 10.5126953125, 10.8607177734375, 11.208740234375, 11.5567626953125, 11.90478515625, 12.2528076171875, 12.600830078125, 12.9488525390625, 13.296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 7.0, 17.0, 51.0, 69.0, 155.0, 307.0, 658.0, 1053.0, 907.0, 432.0, 225.0, 98.0, 51.0, 25.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.203125, -17.7879638671875, -17.372802734375, -16.9576416015625, -16.54248046875, -16.1273193359375, -15.712158203125, -15.2969970703125, -14.8818359375, -14.4666748046875, -14.051513671875, -13.6363525390625, -13.22119140625, -12.8060302734375, -12.390869140625, -11.9757080078125, -11.560546875, -11.1453857421875, -10.730224609375, -10.3150634765625, -9.89990234375, -9.4847412109375, -9.069580078125, -8.6544189453125, -8.2392578125, -7.8240966796875, -7.408935546875, -6.9937744140625, -6.57861328125, -6.1634521484375, -5.748291015625, -5.3331298828125, -4.91796875, -4.5028076171875, -4.087646484375, -3.6724853515625, -3.25732421875, -2.8421630859375, -2.427001953125, -2.0118408203125, -1.5966796875, -1.1815185546875, -0.766357421875, -0.3511962890625, 0.06396484375, 0.4791259765625, 0.894287109375, 1.3094482421875, 1.724609375, 2.1397705078125, 2.554931640625, 2.9700927734375, 3.38525390625, 3.8004150390625, 4.215576171875, 4.6307373046875, 5.0458984375, 5.4610595703125, 5.876220703125, 6.2913818359375, 6.70654296875, 7.1217041015625, 7.536865234375, 7.9520263671875, 8.3671875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 9.0, 23.0, 36.0, 132.0, 347.0, 1030.0, 6477.0, 4100062.0, 83531.0, 1814.0, 471.0, 215.0, 70.0, 30.0, 11.0, 5.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5625, -43.06298828125, -41.5634765625, -40.06396484375, -38.564453125, -37.06494140625, -35.5654296875, -34.06591796875, -32.56640625, -31.06689453125, -29.5673828125, -28.06787109375, -26.568359375, -25.06884765625, -23.5693359375, -22.06982421875, -20.5703125, -19.07080078125, -17.5712890625, -16.07177734375, -14.572265625, -13.07275390625, -11.5732421875, -10.07373046875, -8.57421875, -7.07470703125, -5.5751953125, -4.07568359375, -2.576171875, -1.07666015625, 0.4228515625, 1.92236328125, 3.421875, 4.92138671875, 6.4208984375, 7.92041015625, 9.419921875, 10.91943359375, 12.4189453125, 13.91845703125, 15.41796875, 16.91748046875, 18.4169921875, 19.91650390625, 21.416015625, 22.91552734375, 24.4150390625, 25.91455078125, 27.4140625, 28.91357421875, 30.4130859375, 31.91259765625, 33.412109375, 34.91162109375, 36.4111328125, 37.91064453125, 39.41015625, 40.90966796875, 42.4091796875, 43.90869140625, 45.408203125, 46.90771484375, 48.4072265625, 49.90673828125, 51.40625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [16.0, 904.0, 96.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.488520622253418, -5.62855339050293, 2.2314138412475586, 10.091382026672363, 17.95134735107422, 25.81131362915039, 33.67128372192383, 41.53125, 49.39121627807617, 57.251182556152344, 65.11115264892578, 72.97111511230469, 80.83108520507812, 88.69105529785156, 96.551025390625, 104.4109878540039, 112.27095794677734, 120.13092803955078, 127.99089050292969, 135.85086059570312, 143.71083068847656, 151.57080078125, 159.43075561523438, 167.2907257080078, 175.15069580078125, 183.0106658935547, 190.87063598632812, 198.7305908203125, 206.59056091308594, 214.45053100585938, 222.3105010986328, 230.17047119140625, 238.03042602539062, 245.89039611816406, 253.7503662109375, 261.6103210449219, 269.4703063964844, 277.33026123046875, 285.19024658203125, 293.0502014160156, 300.91015625, 308.7701110839844, 316.6300964355469, 324.49005126953125, 332.35003662109375, 340.2099914550781, 348.0699462890625, 355.929931640625, 363.7899169921875, 371.6498718261719, 379.5098571777344, 387.36981201171875, 395.22979736328125, 403.0897521972656, 410.94970703125, 418.8096923828125, 426.6696472167969, 434.52960205078125, 442.38958740234375, 450.2495422363281, 458.1095275878906, 465.969482421875, 473.8294677734375, 481.6894226074219, 489.54937744140625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 7.0, 18.0, 27.0, 22.0, 18.0, 22.0, 33.0, 43.0, 33.0, 41.0, 40.0, 45.0, 61.0, 49.0, 64.0, 59.0, 38.0, 51.0, 55.0, 45.0, 33.0, 41.0, 33.0, 30.0, 22.0, 17.0, 16.0, 6.0, 4.0, 8.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.25786590576172, -26.28112030029297, -25.30437469482422, -24.32762908935547, -23.35088348388672, -22.37413787841797, -21.39739227294922, -20.42064666748047, -19.44390106201172, -18.46715545654297, -17.49040985107422, -16.51366424560547, -15.536918640136719, -14.560173034667969, -13.583428382873535, -12.606682777404785, -11.629938125610352, -10.653192520141602, -9.676446914672852, -8.699701309204102, -7.72295618057251, -6.74621057510376, -5.769465446472168, -4.792719841003418, -3.815974235534668, -2.839228630065918, -1.862483263015747, -0.8857378959655762, 0.09100770950317383, 1.0677533149719238, 2.0444984436035156, 3.0212440490722656, 3.9979896545410156, 4.974735260009766, 5.951480865478516, 6.928225994110107, 7.904971599578857, 8.881717681884766, 9.8584623336792, 10.83520793914795, 11.8119535446167, 12.78869915008545, 13.7654447555542, 14.742189407348633, 15.718935012817383, 16.695680618286133, 17.672426223754883, 18.649171829223633, 19.625917434692383, 20.602663040161133, 21.579408645629883, 22.556154251098633, 23.532899856567383, 24.509645462036133, 25.48638916015625, 26.463134765625, 27.43988037109375, 28.4166259765625, 29.39337158203125, 30.3701171875, 31.34686279296875, 32.3236083984375, 33.30035400390625, 34.277099609375, 35.25384521484375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 11.0, 11.0, 16.0, 11.0, 9.0, 25.0, 22.0, 22.0, 22.0, 21.0, 24.0, 37.0, 27.0, 39.0, 32.0, 26.0, 46.0, 38.0, 47.0, 40.0, 40.0, 42.0, 34.0, 40.0, 39.0, 31.0, 37.0, 31.0, 26.0, 28.0, 25.0, 20.0, 10.0, 13.0, 13.0, 5.0, 7.0, 2.0, 9.0, 7.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.244140625, -1.2050018310546875, -1.165863037109375, -1.1267242431640625, -1.08758544921875, -1.0484466552734375, -1.009307861328125, -0.9701690673828125, -0.9310302734375, -0.8918914794921875, -0.852752685546875, -0.8136138916015625, -0.77447509765625, -0.7353363037109375, -0.696197509765625, -0.6570587158203125, -0.617919921875, -0.5787811279296875, -0.539642333984375, -0.5005035400390625, -0.46136474609375, -0.4222259521484375, -0.383087158203125, -0.3439483642578125, -0.3048095703125, -0.2656707763671875, -0.226531982421875, -0.1873931884765625, -0.14825439453125, -0.1091156005859375, -0.069976806640625, -0.0308380126953125, 0.00830078125, 0.0474395751953125, 0.086578369140625, 0.1257171630859375, 0.16485595703125, 0.2039947509765625, 0.243133544921875, 0.2822723388671875, 0.3214111328125, 0.3605499267578125, 0.399688720703125, 0.4388275146484375, 0.47796630859375, 0.5171051025390625, 0.556243896484375, 0.5953826904296875, 0.634521484375, 0.6736602783203125, 0.712799072265625, 0.7519378662109375, 0.79107666015625, 0.8302154541015625, 0.869354248046875, 0.9084930419921875, 0.9476318359375, 0.9867706298828125, 1.025909423828125, 1.0650482177734375, 1.10418701171875, 1.1433258056640625, 1.182464599609375, 1.2216033935546875, 1.2607421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 15.0, 18.0, 23.0, 34.0, 51.0, 66.0, 129.0, 150.0, 208.0, 298.0, 409.0, 636.0, 892.0, 1359.0, 2011.0, 2919.0, 4337.0, 6816.0, 10455.0, 16208.0, 26225.0, 41745.0, 68201.0, 120558.0, 286110.0, 205881.0, 97356.0, 57504.0, 35196.0, 21982.0, 13746.0, 9152.0, 5812.0, 3838.0, 2563.0, 1768.0, 1262.0, 797.0, 519.0, 406.0, 269.0, 193.0, 131.0, 89.0, 68.0, 44.0, 27.0, 28.0, 11.0, 14.0, 13.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.01120758056640625, -0.010855436325073242, -0.010503292083740234, -0.010151147842407227, -0.009799003601074219, -0.009446859359741211, -0.009094715118408203, -0.008742570877075195, -0.008390426635742188, -0.00803828239440918, -0.007686138153076172, -0.007333993911743164, -0.006981849670410156, -0.0066297054290771484, -0.006277561187744141, -0.005925416946411133, -0.005573272705078125, -0.005221128463745117, -0.004868984222412109, -0.0045168399810791016, -0.004164695739746094, -0.003812551498413086, -0.003460407257080078, -0.0031082630157470703, -0.0027561187744140625, -0.0024039745330810547, -0.002051830291748047, -0.001699686050415039, -0.0013475418090820312, -0.0009953975677490234, -0.0006432533264160156, -0.0002911090850830078, 6.103515625e-05, 0.0004131793975830078, 0.0007653236389160156, 0.0011174678802490234, 0.0014696121215820312, 0.001821756362915039, 0.002173900604248047, 0.0025260448455810547, 0.0028781890869140625, 0.0032303333282470703, 0.003582477569580078, 0.003934621810913086, 0.004286766052246094, 0.0046389102935791016, 0.004991054534912109, 0.005343198776245117, 0.005695343017578125, 0.006047487258911133, 0.006399631500244141, 0.0067517757415771484, 0.007103919982910156, 0.007456064224243164, 0.007808208465576172, 0.00816035270690918, 0.008512496948242188, 0.008864641189575195, 0.009216785430908203, 0.009568929672241211, 0.009921073913574219, 0.010273218154907227, 0.010625362396240234, 0.010977506637573242, 0.01132965087890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 3.0, 5.0, 7.0, 12.0, 7.0, 6.0, 6.0, 14.0, 20.0, 16.0, 19.0, 27.0, 26.0, 25.0, 21.0, 24.0, 29.0, 35.0, 26.0, 48.0, 33.0, 29.0, 33.0, 1058.0, 27.0, 29.0, 37.0, 41.0, 36.0, 33.0, 19.0, 28.0, 36.0, 19.0, 22.0, 22.0, 25.0, 15.0, 18.0, 15.0, 11.0, 10.0, 9.0, 10.0, 3.0, 8.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0], "bins": [-0.79541015625, -0.7724990844726562, -0.7495880126953125, -0.7266769409179688, -0.703765869140625, -0.6808547973632812, -0.6579437255859375, -0.6350326538085938, -0.61212158203125, -0.5892105102539062, -0.5662994384765625, -0.5433883666992188, -0.520477294921875, -0.49756622314453125, -0.4746551513671875, -0.45174407958984375, -0.4288330078125, -0.40592193603515625, -0.3830108642578125, -0.36009979248046875, -0.337188720703125, -0.31427764892578125, -0.2913665771484375, -0.26845550537109375, -0.24554443359375, -0.22263336181640625, -0.1997222900390625, -0.17681121826171875, -0.153900146484375, -0.13098907470703125, -0.1080780029296875, -0.08516693115234375, -0.062255859375, -0.03934478759765625, -0.0164337158203125, 0.00647735595703125, 0.029388427734375, 0.05229949951171875, 0.0752105712890625, 0.09812164306640625, 0.12103271484375, 0.14394378662109375, 0.1668548583984375, 0.18976593017578125, 0.212677001953125, 0.23558807373046875, 0.2584991455078125, 0.28141021728515625, 0.3043212890625, 0.32723236083984375, 0.3501434326171875, 0.37305450439453125, 0.395965576171875, 0.41887664794921875, 0.4417877197265625, 0.46469879150390625, 0.48760986328125, 0.5105209350585938, 0.5334320068359375, 0.5563430786132812, 0.579254150390625, 0.6021652221679688, 0.6250762939453125, 0.6479873657226562, 0.6708984375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 9.0, 6.0, 9.0, 21.0, 33.0, 49.0, 68.0, 120.0, 177.0, 214.0, 341.0, 471.0, 646.0, 865.0, 1117.0, 1624.0, 2099.0, 2785.0, 4002.0, 5443.0, 7377.0, 10388.0, 14372.0, 19940.0, 29116.0, 42986.0, 66373.0, 111583.0, 1258953.0, 203638.0, 107256.0, 64464.0, 41424.0, 28398.0, 19782.0, 13968.0, 10139.0, 7292.0, 5339.0, 3839.0, 2783.0, 2083.0, 1523.0, 1119.0, 867.0, 593.0, 461.0, 328.0, 232.0, 157.0, 96.0, 70.0, 45.0, 28.0, 20.0, 9.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00537872314453125, -0.005205035209655762, -0.0050313472747802734, -0.004857659339904785, -0.004683971405029297, -0.004510283470153809, -0.00433659553527832, -0.004162907600402832, -0.003989219665527344, -0.0038155317306518555, -0.003641843795776367, -0.003468155860900879, -0.0032944679260253906, -0.0031207799911499023, -0.002947092056274414, -0.0027734041213989258, -0.0025997161865234375, -0.0024260282516479492, -0.002252340316772461, -0.0020786523818969727, -0.0019049644470214844, -0.001731276512145996, -0.0015575885772705078, -0.0013839006423950195, -0.0012102127075195312, -0.001036524772644043, -0.0008628368377685547, -0.0006891489028930664, -0.0005154609680175781, -0.00034177303314208984, -0.00016808509826660156, 5.602836608886719e-06, 0.000179290771484375, 0.0003529787063598633, 0.0005266666412353516, 0.0007003545761108398, 0.0008740425109863281, 0.0010477304458618164, 0.0012214183807373047, 0.001395106315612793, 0.0015687942504882812, 0.0017424821853637695, 0.0019161701202392578, 0.002089858055114746, 0.0022635459899902344, 0.0024372339248657227, 0.002610921859741211, 0.0027846097946166992, 0.0029582977294921875, 0.0031319856643676758, 0.003305673599243164, 0.0034793615341186523, 0.0036530494689941406, 0.003826737403869629, 0.004000425338745117, 0.0041741132736206055, 0.004347801208496094, 0.004521489143371582, 0.00469517707824707, 0.004868865013122559, 0.005042552947998047, 0.005216240882873535, 0.0053899288177490234, 0.005563616752624512, 0.0057373046875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 976.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 26.0, 19.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 8.0, 4.0, 12.0, 15.0, 6.0, 25.0, 110.0, 5189.0, 1042880.0, 124.0, 15.0, 3.0, 17.0, 11.0, 4.0, 10.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 19.0, 24.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0], "bins": [-2.086162567138672e-06, -2.0209699869155884e-06, -1.955777406692505e-06, -1.8905848264694214e-06, -1.8253922462463379e-06, -1.7601996660232544e-06, -1.695007085800171e-06, -1.6298145055770874e-06, -1.564621925354004e-06, -1.4994293451309204e-06, -1.434236764907837e-06, -1.3690441846847534e-06, -1.30385160446167e-06, -1.2386590242385864e-06, -1.173466444015503e-06, -1.1082738637924194e-06, -1.043081283569336e-06, -9.778887033462524e-07, -9.126961231231689e-07, -8.475035429000854e-07, -7.82310962677002e-07, -7.171183824539185e-07, -6.51925802230835e-07, -5.867332220077515e-07, -5.21540641784668e-07, -4.5634806156158447e-07, -3.91155481338501e-07, -3.259629011154175e-07, -2.60770320892334e-07, -1.955777406692505e-07, -1.30385160446167e-07, -6.51925802230835e-08, 0.0, 6.51925802230835e-08, 1.30385160446167e-07, 1.955777406692505e-07, 2.60770320892334e-07, 3.259629011154175e-07, 3.91155481338501e-07, 4.5634806156158447e-07, 5.21540641784668e-07, 5.867332220077515e-07, 6.51925802230835e-07, 7.171183824539185e-07, 7.82310962677002e-07, 8.475035429000854e-07, 9.126961231231689e-07, 9.778887033462524e-07, 1.043081283569336e-06, 1.1082738637924194e-06, 1.173466444015503e-06, 1.2386590242385864e-06, 1.30385160446167e-06, 1.3690441846847534e-06, 1.434236764907837e-06, 1.4994293451309204e-06, 1.564621925354004e-06, 1.6298145055770874e-06, 1.695007085800171e-06, 1.7601996660232544e-06, 1.8253922462463379e-06, 1.8905848264694214e-06, 1.955777406692505e-06, 2.0209699869155884e-06, 2.086162567138672e-06]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 11.0, 11.0, 16.0, 11.0, 9.0, 25.0, 22.0, 22.0, 22.0, 21.0, 24.0, 37.0, 27.0, 39.0, 32.0, 26.0, 46.0, 38.0, 47.0, 40.0, 40.0, 42.0, 34.0, 40.0, 39.0, 31.0, 37.0, 31.0, 26.0, 28.0, 25.0, 20.0, 10.0, 13.0, 13.0, 5.0, 7.0, 2.0, 9.0, 7.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.244140625, -1.2050018310546875, -1.165863037109375, -1.1267242431640625, -1.08758544921875, -1.0484466552734375, -1.009307861328125, -0.9701690673828125, -0.9310302734375, -0.8918914794921875, -0.852752685546875, -0.8136138916015625, -0.77447509765625, -0.7353363037109375, -0.696197509765625, -0.6570587158203125, -0.617919921875, -0.5787811279296875, -0.539642333984375, -0.5005035400390625, -0.46136474609375, -0.4222259521484375, -0.383087158203125, -0.3439483642578125, -0.3048095703125, -0.2656707763671875, -0.226531982421875, -0.1873931884765625, -0.14825439453125, -0.1091156005859375, -0.069976806640625, -0.0308380126953125, 0.00830078125, 0.0474395751953125, 0.086578369140625, 0.1257171630859375, 0.16485595703125, 0.2039947509765625, 0.243133544921875, 0.2822723388671875, 0.3214111328125, 0.3605499267578125, 0.399688720703125, 0.4388275146484375, 0.47796630859375, 0.5171051025390625, 0.556243896484375, 0.5953826904296875, 0.634521484375, 0.6736602783203125, 0.712799072265625, 0.7519378662109375, 0.79107666015625, 0.8302154541015625, 0.869354248046875, 0.9084930419921875, 0.9476318359375, 0.9867706298828125, 1.025909423828125, 1.0650482177734375, 1.10418701171875, 1.1433258056640625, 1.182464599609375, 1.2216033935546875, 1.2607421875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 3.0, 5.0, 7.0, 8.0, 19.0, 25.0, 43.0, 64.0, 81.0, 120.0, 188.0, 274.0, 420.0, 633.0, 999.0, 1484.0, 2371.0, 3815.0, 6510.0, 12217.0, 28979.0, 125566.0, 612887.0, 182954.0, 35869.0, 14077.0, 7259.0, 4334.0, 2693.0, 1590.0, 1066.0, 674.0, 446.0, 282.0, 195.0, 136.0, 74.0, 65.0, 42.0, 30.0, 9.0, 10.0, 5.0, 7.0, 3.0, 8.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.48828125, -5.3145751953125, -5.140869140625, -4.9671630859375, -4.79345703125, -4.6197509765625, -4.446044921875, -4.2723388671875, -4.0986328125, -3.9249267578125, -3.751220703125, -3.5775146484375, -3.40380859375, -3.2301025390625, -3.056396484375, -2.8826904296875, -2.708984375, -2.5352783203125, -2.361572265625, -2.1878662109375, -2.01416015625, -1.8404541015625, -1.666748046875, -1.4930419921875, -1.3193359375, -1.1456298828125, -0.971923828125, -0.7982177734375, -0.62451171875, -0.4508056640625, -0.277099609375, -0.1033935546875, 0.0703125, 0.2440185546875, 0.417724609375, 0.5914306640625, 0.76513671875, 0.9388427734375, 1.112548828125, 1.2862548828125, 1.4599609375, 1.6336669921875, 1.807373046875, 1.9810791015625, 2.15478515625, 2.3284912109375, 2.502197265625, 2.6759033203125, 2.849609375, 3.0233154296875, 3.197021484375, 3.3707275390625, 3.54443359375, 3.7181396484375, 3.891845703125, 4.0655517578125, 4.2392578125, 4.4129638671875, 4.586669921875, 4.7603759765625, 4.93408203125, 5.1077880859375, 5.281494140625, 5.4552001953125, 5.62890625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 5.0, 4.0, 7.0, 14.0, 12.0, 5.0, 20.0, 20.0, 20.0, 16.0, 23.0, 20.0, 30.0, 46.0, 29.0, 35.0, 53.0, 61.0, 68.0, 98.0, 165.0, 1429.0, 249.0, 125.0, 66.0, 49.0, 42.0, 57.0, 46.0, 35.0, 37.0, 25.0, 20.0, 27.0, 14.0, 15.0, 11.0, 7.0, 9.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.83984375, -3.71484375, -3.58984375, -3.46484375, -3.33984375, -3.21484375, -3.08984375, -2.96484375, -2.83984375, -2.71484375, -2.58984375, -2.46484375, -2.33984375, -2.21484375, -2.08984375, -1.96484375, -1.83984375, -1.71484375, -1.58984375, -1.46484375, -1.33984375, -1.21484375, -1.08984375, -0.96484375, -0.83984375, -0.71484375, -0.58984375, -0.46484375, -0.33984375, -0.21484375, -0.08984375, 0.03515625, 0.16015625, 0.28515625, 0.41015625, 0.53515625, 0.66015625, 0.78515625, 0.91015625, 1.03515625, 1.16015625, 1.28515625, 1.41015625, 1.53515625, 1.66015625, 1.78515625, 1.91015625, 2.03515625, 2.16015625, 2.28515625, 2.41015625, 2.53515625, 2.66015625, 2.78515625, 2.91015625, 3.03515625, 3.16015625, 3.28515625, 3.41015625, 3.53515625, 3.66015625, 3.78515625, 3.91015625, 4.03515625, 4.16015625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 7.0, 7.0, 15.0, 11.0, 16.0, 17.0, 21.0, 43.0, 30.0, 54.0, 68.0, 117.0, 170.0, 465.0, 2484.0, 139774.0, 2990174.0, 10438.0, 954.0, 270.0, 172.0, 75.0, 55.0, 41.0, 31.0, 25.0, 21.0, 16.0, 16.0, 10.0, 19.0, 15.0, 6.0, 5.0, 13.0, 8.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-20.546875, -19.94677734375, -19.3466796875, -18.74658203125, -18.146484375, -17.54638671875, -16.9462890625, -16.34619140625, -15.74609375, -15.14599609375, -14.5458984375, -13.94580078125, -13.345703125, -12.74560546875, -12.1455078125, -11.54541015625, -10.9453125, -10.34521484375, -9.7451171875, -9.14501953125, -8.544921875, -7.94482421875, -7.3447265625, -6.74462890625, -6.14453125, -5.54443359375, -4.9443359375, -4.34423828125, -3.744140625, -3.14404296875, -2.5439453125, -1.94384765625, -1.34375, -0.74365234375, -0.1435546875, 0.45654296875, 1.056640625, 1.65673828125, 2.2568359375, 2.85693359375, 3.45703125, 4.05712890625, 4.6572265625, 5.25732421875, 5.857421875, 6.45751953125, 7.0576171875, 7.65771484375, 8.2578125, 8.85791015625, 9.4580078125, 10.05810546875, 10.658203125, 11.25830078125, 11.8583984375, 12.45849609375, 13.05859375, 13.65869140625, 14.2587890625, 14.85888671875, 15.458984375, 16.05908203125, 16.6591796875, 17.25927734375, 17.859375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 23.0, 378.0, 555.0, 50.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.002107620239258, -5.278103828430176, -3.5541000366210938, -1.8300962448120117, -0.10609245300292969, 1.6179113388061523, 3.3419151306152344, 5.065918922424316, 6.789922714233398, 8.51392650604248, 10.237930297851562, 11.961934089660645, 13.685937881469727, 15.409941673278809, 17.13394546508789, 18.857948303222656, 20.581953048706055, 22.305957794189453, 24.02996063232422, 25.753963470458984, 27.477968215942383, 29.20197296142578, 30.925975799560547, 32.64997863769531, 34.373985290527344, 36.09798812866211, 37.821990966796875, 39.545997619628906, 41.27000045776367, 42.99400329589844, 44.71800994873047, 46.442012786865234, 48.166015625, 49.890018463134766, 51.61402130126953, 53.33802795410156, 55.06203079223633, 56.786033630371094, 58.510040283203125, 60.23404312133789, 61.958045959472656, 63.68204879760742, 65.40605163574219, 67.13005828857422, 68.85406494140625, 70.57806396484375, 72.30207061767578, 74.02606964111328, 75.75007629394531, 77.47408294677734, 79.19808197021484, 80.92208862304688, 82.64608764648438, 84.3700942993164, 86.09410095214844, 87.81809997558594, 89.54210662841797, 91.26611328125, 92.9901123046875, 94.71411895751953, 96.43812561035156, 98.16212463378906, 99.8861312866211, 101.6101303100586, 103.33413696289062]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 2.0, 4.0, 7.0, 8.0, 7.0, 6.0, 13.0, 11.0, 20.0, 27.0, 27.0, 30.0, 27.0, 41.0, 41.0, 61.0, 46.0, 48.0, 36.0, 48.0, 63.0, 48.0, 50.0, 52.0, 49.0, 37.0, 34.0, 39.0, 29.0, 25.0, 30.0, 11.0, 11.0, 9.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.738250732421875, -24.121013641357422, -23.50377655029297, -22.886539459228516, -22.269302368164062, -21.65206527709961, -21.034828186035156, -20.417591094970703, -19.80035400390625, -19.183116912841797, -18.565879821777344, -17.94864273071289, -17.331405639648438, -16.714168548583984, -16.09693145751953, -15.479693412780762, -14.862455368041992, -14.245218276977539, -13.627981185913086, -13.010744094848633, -12.39350700378418, -11.776269912719727, -11.159031867980957, -10.541794776916504, -9.92455768585205, -9.307320594787598, -8.690083503723145, -8.072846412658691, -7.45560884475708, -6.838371753692627, -6.221134185791016, -5.6038970947265625, -4.986660003662109, -4.369422912597656, -3.752185583114624, -3.134948253631592, -2.5177111625671387, -1.9004740715026855, -1.2832367420196533, -0.6659994125366211, -0.04876232147216797, 0.5684748888015747, 1.1857120990753174, 1.80294930934906, 2.4201865196228027, 3.037423610687256, 3.654660940170288, 4.27189826965332, 4.889135360717773, 5.506372451782227, 6.12360954284668, 6.740847110748291, 7.358084201812744, 7.975321292877197, 8.592558860778809, 9.209795951843262, 9.827033042907715, 10.444270133972168, 11.061507225036621, 11.678744316101074, 12.295982360839844, 12.913219451904297, 13.53045654296875, 14.147693634033203, 14.764930725097656]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 9.0, 16.0, 13.0, 7.0, 17.0, 25.0, 21.0, 18.0, 25.0, 23.0, 28.0, 31.0, 24.0, 42.0, 30.0, 37.0, 39.0, 44.0, 40.0, 45.0, 40.0, 37.0, 36.0, 42.0, 25.0, 34.0, 29.0, 38.0, 29.0, 30.0, 22.0, 18.0, 18.0, 11.0, 10.0, 8.0, 6.0, 9.0, 2.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.2724609375, -1.2309417724609375, -1.189422607421875, -1.1479034423828125, -1.10638427734375, -1.0648651123046875, -1.023345947265625, -0.9818267822265625, -0.9403076171875, -0.8987884521484375, -0.857269287109375, -0.8157501220703125, -0.77423095703125, -0.7327117919921875, -0.691192626953125, -0.6496734619140625, -0.608154296875, -0.5666351318359375, -0.525115966796875, -0.4835968017578125, -0.44207763671875, -0.4005584716796875, -0.359039306640625, -0.3175201416015625, -0.2760009765625, -0.2344818115234375, -0.192962646484375, -0.1514434814453125, -0.10992431640625, -0.0684051513671875, -0.026885986328125, 0.0146331787109375, 0.05615234375, 0.0976715087890625, 0.139190673828125, 0.1807098388671875, 0.22222900390625, 0.2637481689453125, 0.305267333984375, 0.3467864990234375, 0.3883056640625, 0.4298248291015625, 0.471343994140625, 0.5128631591796875, 0.55438232421875, 0.5959014892578125, 0.637420654296875, 0.6789398193359375, 0.720458984375, 0.7619781494140625, 0.803497314453125, 0.8450164794921875, 0.88653564453125, 0.9280548095703125, 0.969573974609375, 1.0110931396484375, 1.0526123046875, 1.0941314697265625, 1.135650634765625, 1.1771697998046875, 1.21868896484375, 1.2602081298828125, 1.301727294921875, 1.3432464599609375, 1.384765625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 13.0, 17.0, 10.0, 26.0, 49.0, 46.0, 79.0, 98.0, 156.0, 215.0, 389.0, 664.0, 1542.0, 5553.0, 33957.0, 386100.0, 3348133.0, 375294.0, 33036.0, 5409.0, 1609.0, 714.0, 416.0, 275.0, 155.0, 92.0, 62.0, 37.0, 26.0, 25.0, 24.0, 19.0, 11.0, 5.0, 2.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.5584716796875, -7.273193359375, -6.9879150390625, -6.70263671875, -6.4173583984375, -6.132080078125, -5.8468017578125, -5.5615234375, -5.2762451171875, -4.990966796875, -4.7056884765625, -4.42041015625, -4.1351318359375, -3.849853515625, -3.5645751953125, -3.279296875, -2.9940185546875, -2.708740234375, -2.4234619140625, -2.13818359375, -1.8529052734375, -1.567626953125, -1.2823486328125, -0.9970703125, -0.7117919921875, -0.426513671875, -0.1412353515625, 0.14404296875, 0.4293212890625, 0.714599609375, 0.9998779296875, 1.28515625, 1.5704345703125, 1.855712890625, 2.1409912109375, 2.42626953125, 2.7115478515625, 2.996826171875, 3.2821044921875, 3.5673828125, 3.8526611328125, 4.137939453125, 4.4232177734375, 4.70849609375, 4.9937744140625, 5.279052734375, 5.5643310546875, 5.849609375, 6.1348876953125, 6.420166015625, 6.7054443359375, 6.99072265625, 7.2760009765625, 7.561279296875, 7.8465576171875, 8.1318359375, 8.4171142578125, 8.702392578125, 8.9876708984375, 9.27294921875, 9.5582275390625, 9.843505859375, 10.1287841796875, 10.4140625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 11.0, 12.0, 16.0, 26.0, 34.0, 66.0, 84.0, 146.0, 220.0, 296.0, 381.0, 539.0, 604.0, 488.0, 354.0, 269.0, 190.0, 111.0, 90.0, 57.0, 23.0, 27.0, 15.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.5924072265625, -5.380126953125, -5.1678466796875, -4.95556640625, -4.7432861328125, -4.531005859375, -4.3187255859375, -4.1064453125, -3.8941650390625, -3.681884765625, -3.4696044921875, -3.25732421875, -3.0450439453125, -2.832763671875, -2.6204833984375, -2.408203125, -2.1959228515625, -1.983642578125, -1.7713623046875, -1.55908203125, -1.3468017578125, -1.134521484375, -0.9222412109375, -0.7099609375, -0.4976806640625, -0.285400390625, -0.0731201171875, 0.13916015625, 0.3514404296875, 0.563720703125, 0.7760009765625, 0.98828125, 1.2005615234375, 1.412841796875, 1.6251220703125, 1.83740234375, 2.0496826171875, 2.261962890625, 2.4742431640625, 2.6865234375, 2.8988037109375, 3.111083984375, 3.3233642578125, 3.53564453125, 3.7479248046875, 3.960205078125, 4.1724853515625, 4.384765625, 4.5970458984375, 4.809326171875, 5.0216064453125, 5.23388671875, 5.4461669921875, 5.658447265625, 5.8707275390625, 6.0830078125, 6.2952880859375, 6.507568359375, 6.7198486328125, 6.93212890625, 7.1444091796875, 7.356689453125, 7.5689697265625, 7.78125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 10.0, 16.0, 25.0, 27.0, 66.0, 88.0, 169.0, 284.0, 560.0, 1199.0, 3787.0, 28519.0, 494402.0, 3319305.0, 320048.0, 20355.0, 3137.0, 1119.0, 530.0, 266.0, 158.0, 80.0, 52.0, 24.0, 17.0, 14.0, 8.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9140625, -13.4412841796875, -12.968505859375, -12.4957275390625, -12.02294921875, -11.5501708984375, -11.077392578125, -10.6046142578125, -10.1318359375, -9.6590576171875, -9.186279296875, -8.7135009765625, -8.24072265625, -7.7679443359375, -7.295166015625, -6.8223876953125, -6.349609375, -5.8768310546875, -5.404052734375, -4.9312744140625, -4.45849609375, -3.9857177734375, -3.512939453125, -3.0401611328125, -2.5673828125, -2.0946044921875, -1.621826171875, -1.1490478515625, -0.67626953125, -0.2034912109375, 0.269287109375, 0.7420654296875, 1.21484375, 1.6876220703125, 2.160400390625, 2.6331787109375, 3.10595703125, 3.5787353515625, 4.051513671875, 4.5242919921875, 4.9970703125, 5.4698486328125, 5.942626953125, 6.4154052734375, 6.88818359375, 7.3609619140625, 7.833740234375, 8.3065185546875, 8.779296875, 9.2520751953125, 9.724853515625, 10.1976318359375, 10.67041015625, 11.1431884765625, 11.615966796875, 12.0887451171875, 12.5615234375, 13.0343017578125, 13.507080078125, 13.9798583984375, 14.45263671875, 14.9254150390625, 15.398193359375, 15.8709716796875, 16.34375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 79.0, 509.0, 389.0, 33.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.2435359954834, -20.943872451782227, -16.644208908081055, -12.344545364379883, -8.044881820678711, -3.745218276977539, 0.5544452667236328, 4.854108810424805, 9.153772354125977, 13.453435897827148, 17.75309944152832, 22.052762985229492, 26.352426528930664, 30.652090072631836, 34.951751708984375, 39.25141906738281, 43.55107879638672, 47.85074234008789, 52.15040588378906, 56.450069427490234, 60.749732971191406, 65.04939270019531, 69.34906005859375, 73.64872741699219, 77.9483871459961, 82.248046875, 86.54771423339844, 90.84738159179688, 95.14704132080078, 99.44670104980469, 103.74636840820312, 108.04603576660156, 112.345703125, 116.64537048339844, 120.94503021240234, 125.24468994140625, 129.5443572998047, 133.84402465820312, 138.1436767578125, 142.44334411621094, 146.74301147460938, 151.0426788330078, 155.34234619140625, 159.64199829101562, 163.94166564941406, 168.2413330078125, 172.54098510742188, 176.8406524658203, 181.14031982421875, 185.4399871826172, 189.73965454101562, 194.039306640625, 198.33897399902344, 202.63864135742188, 206.93829345703125, 211.2379608154297, 215.53762817382812, 219.83729553222656, 224.136962890625, 228.43661499023438, 232.7362823486328, 237.03594970703125, 241.33560180664062, 245.63526916503906, 249.9349365234375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 4.0, 11.0, 13.0, 18.0, 17.0, 18.0, 22.0, 27.0, 23.0, 27.0, 34.0, 29.0, 27.0, 31.0, 37.0, 38.0, 39.0, 47.0, 48.0, 40.0, 34.0, 38.0, 47.0, 31.0, 18.0, 30.0, 30.0, 26.0, 24.0, 30.0, 21.0, 13.0, 16.0, 13.0, 9.0, 15.0, 8.0, 14.0, 6.0, 6.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.82495880126953, -16.28693199157715, -15.748905181884766, -15.210878372192383, -14.6728515625, -14.134824752807617, -13.596796989440918, -13.058770179748535, -12.520743370056152, -11.98271656036377, -11.444689750671387, -10.906662940979004, -10.368635177612305, -9.830608367919922, -9.292581558227539, -8.754554748535156, -8.216527938842773, -7.678501129150391, -7.140474319458008, -6.602447032928467, -6.064420223236084, -5.526393413543701, -4.98836612701416, -4.450339317321777, -3.9123125076293945, -3.3742856979370117, -2.83625864982605, -2.298231601715088, -1.760204792022705, -1.2221779823303223, -0.6841509342193604, -0.14612388610839844, 0.3919029235839844, 0.9299298524856567, 1.467956781387329, 2.005983829498291, 2.544010639190674, 3.0820374488830566, 3.6200644969940186, 4.1580915451049805, 4.696118354797363, 5.234145164489746, 5.772171974182129, 6.31019926071167, 6.848226070404053, 7.3862528800964355, 7.924280166625977, 8.46230697631836, 9.000333786010742, 9.538360595703125, 10.076387405395508, 10.61441421508789, 11.152441024780273, 11.690467834472656, 12.228495597839355, 12.766522407531738, 13.304549217224121, 13.842576026916504, 14.380602836608887, 14.91862964630127, 15.456657409667969, 15.994684219360352, 16.532711029052734, 17.070737838745117, 17.6087646484375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 9.0, 14.0, 12.0, 13.0, 25.0, 19.0, 20.0, 16.0, 25.0, 28.0, 37.0, 43.0, 28.0, 30.0, 38.0, 54.0, 43.0, 43.0, 42.0, 34.0, 39.0, 41.0, 36.0, 46.0, 29.0, 32.0, 37.0, 24.0, 22.0, 23.0, 15.0, 19.0, 14.0, 7.0, 7.0, 8.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34765625, -1.3022918701171875, -1.256927490234375, -1.2115631103515625, -1.16619873046875, -1.1208343505859375, -1.075469970703125, -1.0301055908203125, -0.9847412109375, -0.9393768310546875, -0.894012451171875, -0.8486480712890625, -0.80328369140625, -0.7579193115234375, -0.712554931640625, -0.6671905517578125, -0.621826171875, -0.5764617919921875, -0.531097412109375, -0.4857330322265625, -0.44036865234375, -0.3950042724609375, -0.349639892578125, -0.3042755126953125, -0.2589111328125, -0.2135467529296875, -0.168182373046875, -0.1228179931640625, -0.07745361328125, -0.0320892333984375, 0.013275146484375, 0.0586395263671875, 0.10400390625, 0.1493682861328125, 0.194732666015625, 0.2400970458984375, 0.28546142578125, 0.3308258056640625, 0.376190185546875, 0.4215545654296875, 0.4669189453125, 0.5122833251953125, 0.557647705078125, 0.6030120849609375, 0.64837646484375, 0.6937408447265625, 0.739105224609375, 0.7844696044921875, 0.829833984375, 0.8751983642578125, 0.920562744140625, 0.9659271240234375, 1.01129150390625, 1.0566558837890625, 1.102020263671875, 1.1473846435546875, 1.1927490234375, 1.2381134033203125, 1.283477783203125, 1.3288421630859375, 1.37420654296875, 1.4195709228515625, 1.464935302734375, 1.5102996826171875, 1.5556640625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 12.0, 18.0, 27.0, 49.0, 69.0, 97.0, 163.0, 242.0, 351.0, 560.0, 891.0, 1366.0, 2258.0, 3623.0, 5864.0, 9137.0, 14882.0, 24992.0, 42857.0, 76356.0, 150194.0, 353426.0, 165175.0, 81920.0, 45735.0, 26492.0, 15779.0, 9625.0, 5998.0, 3826.0, 2430.0, 1472.0, 928.0, 585.0, 379.0, 276.0, 166.0, 129.0, 66.0, 48.0, 31.0, 19.0, 13.0, 11.0, 7.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0142364501953125, -0.013824462890625, -0.0134124755859375, -0.01300048828125, -0.0125885009765625, -0.012176513671875, -0.0117645263671875, -0.0113525390625, -0.0109405517578125, -0.010528564453125, -0.0101165771484375, -0.00970458984375, -0.0092926025390625, -0.008880615234375, -0.0084686279296875, -0.008056640625, -0.0076446533203125, -0.007232666015625, -0.0068206787109375, -0.00640869140625, -0.0059967041015625, -0.005584716796875, -0.0051727294921875, -0.0047607421875, -0.0043487548828125, -0.003936767578125, -0.0035247802734375, -0.00311279296875, -0.0027008056640625, -0.002288818359375, -0.0018768310546875, -0.00146484375, -0.0010528564453125, -0.000640869140625, -0.0002288818359375, 0.00018310546875, 0.0005950927734375, 0.001007080078125, 0.0014190673828125, 0.0018310546875, 0.0022430419921875, 0.002655029296875, 0.0030670166015625, 0.00347900390625, 0.0038909912109375, 0.004302978515625, 0.0047149658203125, 0.005126953125, 0.0055389404296875, 0.005950927734375, 0.0063629150390625, 0.00677490234375, 0.0071868896484375, 0.007598876953125, 0.0080108642578125, 0.0084228515625, 0.0088348388671875, 0.009246826171875, 0.0096588134765625, 0.01007080078125, 0.0104827880859375, 0.010894775390625, 0.0113067626953125, 0.01171875, 0.0121307373046875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 6.0, 11.0, 11.0, 7.0, 16.0, 16.0, 13.0, 16.0, 20.0, 16.0, 32.0, 23.0, 43.0, 36.0, 30.0, 39.0, 37.0, 38.0, 35.0, 1070.0, 44.0, 40.0, 40.0, 43.0, 42.0, 29.0, 30.0, 30.0, 29.0, 28.0, 21.0, 27.0, 19.0, 19.0, 15.0, 8.0, 9.0, 9.0, 3.0, 8.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9091796875, -0.88140869140625, -0.8536376953125, -0.82586669921875, -0.798095703125, -0.77032470703125, -0.7425537109375, -0.71478271484375, -0.68701171875, -0.65924072265625, -0.6314697265625, -0.60369873046875, -0.575927734375, -0.54815673828125, -0.5203857421875, -0.49261474609375, -0.46484375, -0.43707275390625, -0.4093017578125, -0.38153076171875, -0.353759765625, -0.32598876953125, -0.2982177734375, -0.27044677734375, -0.24267578125, -0.21490478515625, -0.1871337890625, -0.15936279296875, -0.131591796875, -0.10382080078125, -0.0760498046875, -0.04827880859375, -0.0205078125, 0.00726318359375, 0.0350341796875, 0.06280517578125, 0.090576171875, 0.11834716796875, 0.1461181640625, 0.17388916015625, 0.20166015625, 0.22943115234375, 0.2572021484375, 0.28497314453125, 0.312744140625, 0.34051513671875, 0.3682861328125, 0.39605712890625, 0.423828125, 0.45159912109375, 0.4793701171875, 0.50714111328125, 0.534912109375, 0.56268310546875, 0.5904541015625, 0.61822509765625, 0.64599609375, 0.67376708984375, 0.7015380859375, 0.72930908203125, 0.757080078125, 0.78485107421875, 0.8126220703125, 0.84039306640625, 0.8681640625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 9.0, 11.0, 8.0, 22.0, 41.0, 39.0, 67.0, 72.0, 114.0, 198.0, 248.0, 378.0, 526.0, 795.0, 1036.0, 1509.0, 2032.0, 2902.0, 3939.0, 5454.0, 7722.0, 11123.0, 15923.0, 23470.0, 35273.0, 54701.0, 92040.0, 179771.0, 1310124.0, 131963.0, 73357.0, 45736.0, 29468.0, 20122.0, 13615.0, 9699.0, 6740.0, 4788.0, 3505.0, 2457.0, 1814.0, 1235.0, 943.0, 621.0, 459.0, 341.0, 200.0, 160.0, 96.0, 96.0, 59.0, 38.0, 21.0, 19.0, 13.0, 13.0, 8.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.00623321533203125, -0.0060340166091918945, -0.005834817886352539, -0.005635619163513184, -0.005436420440673828, -0.005237221717834473, -0.005038022994995117, -0.004838824272155762, -0.004639625549316406, -0.004440426826477051, -0.004241228103637695, -0.00404202938079834, -0.0038428306579589844, -0.003643631935119629, -0.0034444332122802734, -0.003245234489440918, -0.0030460357666015625, -0.002846837043762207, -0.0026476383209228516, -0.002448439598083496, -0.0022492408752441406, -0.002050042152404785, -0.0018508434295654297, -0.0016516447067260742, -0.0014524459838867188, -0.0012532472610473633, -0.0010540485382080078, -0.0008548498153686523, -0.0006556510925292969, -0.0004564523696899414, -0.00025725364685058594, -5.805492401123047e-05, 0.000141143798828125, 0.00034034252166748047, 0.0005395412445068359, 0.0007387399673461914, 0.0009379386901855469, 0.0011371374130249023, 0.0013363361358642578, 0.0015355348587036133, 0.0017347335815429688, 0.0019339323043823242, 0.0021331310272216797, 0.002332329750061035, 0.0025315284729003906, 0.002730727195739746, 0.0029299259185791016, 0.003129124641418457, 0.0033283233642578125, 0.003527522087097168, 0.0037267208099365234, 0.003925919532775879, 0.004125118255615234, 0.00432431697845459, 0.004523515701293945, 0.004722714424133301, 0.004921913146972656, 0.005121111869812012, 0.005320310592651367, 0.005519509315490723, 0.005718708038330078, 0.005917906761169434, 0.006117105484008789, 0.0063163042068481445, 0.0065155029296875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 987.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 17.0, 18.0, 6.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 7.0, 652.0, 7397.0, 1032097.0, 8199.0, 69.0, 15.0, 8.0, 4.0, 1.0, 0.0, 0.0, 1.0, 22.0, 3.0, 11.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.603977918624878e-06, -2.5257468223571777e-06, -2.4475157260894775e-06, -2.3692846298217773e-06, -2.291053533554077e-06, -2.212822437286377e-06, -2.1345913410186768e-06, -2.0563602447509766e-06, -1.9781291484832764e-06, -1.8998980522155762e-06, -1.821666955947876e-06, -1.7434358596801758e-06, -1.6652047634124756e-06, -1.5869736671447754e-06, -1.5087425708770752e-06, -1.430511474609375e-06, -1.3522803783416748e-06, -1.2740492820739746e-06, -1.1958181858062744e-06, -1.1175870895385742e-06, -1.039355993270874e-06, -9.611248970031738e-07, -8.828938007354736e-07, -8.046627044677734e-07, -7.264316082000732e-07, -6.48200511932373e-07, -5.699694156646729e-07, -4.917383193969727e-07, -4.1350722312927246e-07, -3.3527612686157227e-07, -2.5704503059387207e-07, -1.7881393432617188e-07, -1.0058283805847168e-07, -2.2351741790771484e-08, 5.587935447692871e-08, 1.341104507446289e-07, 2.123415470123291e-07, 2.905726432800293e-07, 3.688037395477295e-07, 4.470348358154297e-07, 5.252659320831299e-07, 6.034970283508301e-07, 6.817281246185303e-07, 7.599592208862305e-07, 8.381903171539307e-07, 9.164214134216309e-07, 9.94652509689331e-07, 1.0728836059570312e-06, 1.1511147022247314e-06, 1.2293457984924316e-06, 1.3075768947601318e-06, 1.385807991027832e-06, 1.4640390872955322e-06, 1.5422701835632324e-06, 1.6205012798309326e-06, 1.6987323760986328e-06, 1.776963472366333e-06, 1.8551945686340332e-06, 1.9334256649017334e-06, 2.0116567611694336e-06, 2.089887857437134e-06, 2.168118953704834e-06, 2.246350049972534e-06, 2.3245811462402344e-06]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 9.0, 14.0, 12.0, 13.0, 25.0, 19.0, 20.0, 16.0, 25.0, 28.0, 37.0, 43.0, 28.0, 30.0, 38.0, 54.0, 43.0, 43.0, 42.0, 34.0, 39.0, 41.0, 36.0, 46.0, 29.0, 32.0, 37.0, 24.0, 22.0, 23.0, 15.0, 19.0, 14.0, 7.0, 7.0, 8.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34765625, -1.3022918701171875, -1.256927490234375, -1.2115631103515625, -1.16619873046875, -1.1208343505859375, -1.075469970703125, -1.0301055908203125, -0.9847412109375, -0.9393768310546875, -0.894012451171875, -0.8486480712890625, -0.80328369140625, -0.7579193115234375, -0.712554931640625, -0.6671905517578125, -0.621826171875, -0.5764617919921875, -0.531097412109375, -0.4857330322265625, -0.44036865234375, -0.3950042724609375, -0.349639892578125, -0.3042755126953125, -0.2589111328125, -0.2135467529296875, -0.168182373046875, -0.1228179931640625, -0.07745361328125, -0.0320892333984375, 0.013275146484375, 0.0586395263671875, 0.10400390625, 0.1493682861328125, 0.194732666015625, 0.2400970458984375, 0.28546142578125, 0.3308258056640625, 0.376190185546875, 0.4215545654296875, 0.4669189453125, 0.5122833251953125, 0.557647705078125, 0.6030120849609375, 0.64837646484375, 0.6937408447265625, 0.739105224609375, 0.7844696044921875, 0.829833984375, 0.8751983642578125, 0.920562744140625, 0.9659271240234375, 1.01129150390625, 1.0566558837890625, 1.102020263671875, 1.1473846435546875, 1.1927490234375, 1.2381134033203125, 1.283477783203125, 1.3288421630859375, 1.37420654296875, 1.4195709228515625, 1.464935302734375, 1.5102996826171875, 1.5556640625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 4.0, 8.0, 23.0, 30.0, 29.0, 45.0, 73.0, 92.0, 141.0, 208.0, 315.0, 407.0, 685.0, 1067.0, 1852.0, 3100.0, 6175.0, 13652.0, 34584.0, 105103.0, 364120.0, 353649.0, 101712.0, 33991.0, 13446.0, 6101.0, 3093.0, 1747.0, 1098.0, 680.0, 405.0, 278.0, 186.0, 133.0, 106.0, 67.0, 48.0, 36.0, 17.0, 17.0, 10.0, 4.0, 5.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.259765625, -1.214752197265625, -1.16973876953125, -1.124725341796875, -1.0797119140625, -1.034698486328125, -0.98968505859375, -0.944671630859375, -0.899658203125, -0.854644775390625, -0.80963134765625, -0.764617919921875, -0.7196044921875, -0.674591064453125, -0.62957763671875, -0.584564208984375, -0.53955078125, -0.494537353515625, -0.44952392578125, -0.404510498046875, -0.3594970703125, -0.314483642578125, -0.26947021484375, -0.224456787109375, -0.179443359375, -0.134429931640625, -0.08941650390625, -0.044403076171875, 0.0006103515625, 0.045623779296875, 0.09063720703125, 0.135650634765625, 0.1806640625, 0.225677490234375, 0.27069091796875, 0.315704345703125, 0.3607177734375, 0.405731201171875, 0.45074462890625, 0.495758056640625, 0.540771484375, 0.585784912109375, 0.63079833984375, 0.675811767578125, 0.7208251953125, 0.765838623046875, 0.81085205078125, 0.855865478515625, 0.90087890625, 0.945892333984375, 0.99090576171875, 1.035919189453125, 1.0809326171875, 1.125946044921875, 1.17095947265625, 1.215972900390625, 1.260986328125, 1.305999755859375, 1.35101318359375, 1.396026611328125, 1.4410400390625, 1.486053466796875, 1.53106689453125, 1.576080322265625, 1.62109375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 8.0, 10.0, 11.0, 19.0, 10.0, 19.0, 30.0, 36.0, 39.0, 36.0, 43.0, 45.0, 58.0, 86.0, 204.0, 1742.0, 196.0, 89.0, 62.0, 54.0, 37.0, 34.0, 25.0, 36.0, 25.0, 25.0, 16.0, 14.0, 7.0, 8.0, 12.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.90234375, -7.697021484375, -7.49169921875, -7.286376953125, -7.0810546875, -6.875732421875, -6.67041015625, -6.465087890625, -6.259765625, -6.054443359375, -5.84912109375, -5.643798828125, -5.4384765625, -5.233154296875, -5.02783203125, -4.822509765625, -4.6171875, -4.411865234375, -4.20654296875, -4.001220703125, -3.7958984375, -3.590576171875, -3.38525390625, -3.179931640625, -2.974609375, -2.769287109375, -2.56396484375, -2.358642578125, -2.1533203125, -1.947998046875, -1.74267578125, -1.537353515625, -1.33203125, -1.126708984375, -0.92138671875, -0.716064453125, -0.5107421875, -0.305419921875, -0.10009765625, 0.105224609375, 0.310546875, 0.515869140625, 0.72119140625, 0.926513671875, 1.1318359375, 1.337158203125, 1.54248046875, 1.747802734375, 1.953125, 2.158447265625, 2.36376953125, 2.569091796875, 2.7744140625, 2.979736328125, 3.18505859375, 3.390380859375, 3.595703125, 3.801025390625, 4.00634765625, 4.211669921875, 4.4169921875, 4.622314453125, 4.82763671875, 5.032958984375, 5.23828125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 8.0, 16.0, 14.0, 23.0, 36.0, 32.0, 44.0, 53.0, 77.0, 140.0, 340.0, 1016.0, 9387.0, 3085936.0, 45907.0, 1662.0, 415.0, 176.0, 107.0, 61.0, 54.0, 38.0, 35.0, 24.0, 21.0, 14.0, 15.0, 9.0, 10.0, 2.0, 7.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.140625, -10.72265625, -10.3046875, -9.88671875, -9.46875, -9.05078125, -8.6328125, -8.21484375, -7.796875, -7.37890625, -6.9609375, -6.54296875, -6.125, -5.70703125, -5.2890625, -4.87109375, -4.453125, -4.03515625, -3.6171875, -3.19921875, -2.78125, -2.36328125, -1.9453125, -1.52734375, -1.109375, -0.69140625, -0.2734375, 0.14453125, 0.5625, 0.98046875, 1.3984375, 1.81640625, 2.234375, 2.65234375, 3.0703125, 3.48828125, 3.90625, 4.32421875, 4.7421875, 5.16015625, 5.578125, 5.99609375, 6.4140625, 6.83203125, 7.25, 7.66796875, 8.0859375, 8.50390625, 8.921875, 9.33984375, 9.7578125, 10.17578125, 10.59375, 11.01171875, 11.4296875, 11.84765625, 12.265625, 12.68359375, 13.1015625, 13.51953125, 13.9375, 14.35546875, 14.7734375, 15.19140625, 15.609375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 53.0, 454.0, 467.0, 35.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.398746490478516, -34.41485595703125, -33.430965423583984, -32.44707489013672, -31.463186264038086, -30.479297637939453, -29.495407104492188, -28.511516571044922, -27.527626037597656, -26.54373550415039, -25.559846878051758, -24.575956344604492, -23.592065811157227, -22.608177185058594, -21.624286651611328, -20.640396118164062, -19.65650749206543, -18.672616958618164, -17.68872833251953, -16.704837799072266, -15.720947265625, -14.73705768585205, -13.753168106079102, -12.769277572631836, -11.785387992858887, -10.801498413085938, -9.817607879638672, -8.833718299865723, -7.849828243255615, -6.865938186645508, -5.882048606872559, -4.898158550262451, -3.9142704010009766, -2.930380344390869, -1.9464905261993408, -0.9626007080078125, 0.021289348602294922, 1.0051794052124023, 1.9890689849853516, 2.972959041595459, 3.9568490982055664, 4.940739154815674, 5.924629211425781, 6.9085187911987305, 7.892408847808838, 8.876298904418945, 9.860188484191895, 10.844078063964844, 11.82796859741211, 12.811858177185059, 13.795748710632324, 14.779638290405273, 15.763528823852539, 16.747417449951172, 17.731307983398438, 18.715198516845703, 19.69908905029297, 20.682979583740234, 21.666868209838867, 22.650758743286133, 23.6346492767334, 24.61853790283203, 25.602428436279297, 26.586318969726562, 27.570207595825195]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 7.0, 8.0, 8.0, 6.0, 14.0, 15.0, 19.0, 38.0, 22.0, 32.0, 24.0, 28.0, 34.0, 39.0, 42.0, 45.0, 38.0, 60.0, 39.0, 54.0, 54.0, 44.0, 34.0, 46.0, 39.0, 34.0, 22.0, 18.0, 23.0, 26.0, 10.0, 15.0, 14.0, 11.0, 5.0, 9.0, 4.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.646018981933594, -17.094154357910156, -16.542287826538086, -15.990423202514648, -15.438557624816895, -14.88669204711914, -14.334827423095703, -13.78296184539795, -13.231096267700195, -12.679230690002441, -12.127365112304688, -11.57550048828125, -11.023634910583496, -10.471769332885742, -9.919904708862305, -9.36803913116455, -8.816173553466797, -8.264307975769043, -7.712442874908447, -7.160577774047852, -6.608712196350098, -6.056846618652344, -5.504981517791748, -4.953116416931152, -4.401250839233398, -3.8493854999542236, -3.297520160675049, -2.745654821395874, -2.193789482116699, -1.6419241428375244, -1.0900588035583496, -0.5381934642791748, 0.013671875, 0.5655372142791748, 1.1174025535583496, 1.6692678928375244, 2.221133232116699, 2.772998571395874, 3.324863910675049, 3.8767292499542236, 4.428594589233398, 4.980460166931152, 5.532325267791748, 6.084190368652344, 6.636055946350098, 7.187921524047852, 7.739786624908447, 8.291651725769043, 8.843517303466797, 9.39538288116455, 9.947248458862305, 10.499113082885742, 11.050978660583496, 11.60284423828125, 12.154708862304688, 12.706574440002441, 13.258440017700195, 13.81030559539795, 14.362171173095703, 14.91403579711914, 15.465901374816895, 16.01776695251465, 16.569631576538086, 17.121498107910156, 17.673362731933594]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 10.0, 11.0, 15.0, 18.0, 15.0, 18.0, 28.0, 17.0, 30.0, 29.0, 36.0, 33.0, 35.0, 27.0, 46.0, 52.0, 47.0, 43.0, 42.0, 37.0, 31.0, 37.0, 43.0, 31.0, 34.0, 36.0, 41.0, 16.0, 27.0, 22.0, 21.0, 15.0, 10.0, 7.0, 8.0, 6.0, 6.0, 5.0, 0.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3671875, -1.32098388671875, -1.2747802734375, -1.22857666015625, -1.182373046875, -1.13616943359375, -1.0899658203125, -1.04376220703125, -0.99755859375, -0.95135498046875, -0.9051513671875, -0.85894775390625, -0.812744140625, -0.76654052734375, -0.7203369140625, -0.67413330078125, -0.6279296875, -0.58172607421875, -0.5355224609375, -0.48931884765625, -0.443115234375, -0.39691162109375, -0.3507080078125, -0.30450439453125, -0.25830078125, -0.21209716796875, -0.1658935546875, -0.11968994140625, -0.073486328125, -0.02728271484375, 0.0189208984375, 0.06512451171875, 0.111328125, 0.15753173828125, 0.2037353515625, 0.24993896484375, 0.296142578125, 0.34234619140625, 0.3885498046875, 0.43475341796875, 0.48095703125, 0.52716064453125, 0.5733642578125, 0.61956787109375, 0.665771484375, 0.71197509765625, 0.7581787109375, 0.80438232421875, 0.8505859375, 0.89678955078125, 0.9429931640625, 0.98919677734375, 1.035400390625, 1.08160400390625, 1.1278076171875, 1.17401123046875, 1.22021484375, 1.26641845703125, 1.3126220703125, 1.35882568359375, 1.405029296875, 1.45123291015625, 1.4974365234375, 1.54364013671875, 1.58984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 9.0, 7.0, 8.0, 9.0, 11.0, 14.0, 23.0, 23.0, 34.0, 45.0, 47.0, 54.0, 61.0, 88.0, 194.0, 387.0, 1290.0, 4719.0, 24345.0, 176270.0, 2255177.0, 1580759.0, 126365.0, 18275.0, 3850.0, 1117.0, 403.0, 205.0, 138.0, 92.0, 66.0, 52.0, 35.0, 29.0, 13.0, 24.0, 17.0, 8.0, 9.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.531982421875, -6.30615234375, -6.080322265625, -5.8544921875, -5.628662109375, -5.40283203125, -5.177001953125, -4.951171875, -4.725341796875, -4.49951171875, -4.273681640625, -4.0478515625, -3.822021484375, -3.59619140625, -3.370361328125, -3.14453125, -2.918701171875, -2.69287109375, -2.467041015625, -2.2412109375, -2.015380859375, -1.78955078125, -1.563720703125, -1.337890625, -1.112060546875, -0.88623046875, -0.660400390625, -0.4345703125, -0.208740234375, 0.01708984375, 0.242919921875, 0.46875, 0.694580078125, 0.92041015625, 1.146240234375, 1.3720703125, 1.597900390625, 1.82373046875, 2.049560546875, 2.275390625, 2.501220703125, 2.72705078125, 2.952880859375, 3.1787109375, 3.404541015625, 3.63037109375, 3.856201171875, 4.08203125, 4.307861328125, 4.53369140625, 4.759521484375, 4.9853515625, 5.211181640625, 5.43701171875, 5.662841796875, 5.888671875, 6.114501953125, 6.34033203125, 6.566162109375, 6.7919921875, 7.017822265625, 7.24365234375, 7.469482421875, 7.6953125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 11.0, 6.0, 15.0, 17.0, 18.0, 38.0, 46.0, 63.0, 81.0, 125.0, 168.0, 215.0, 270.0, 337.0, 392.0, 472.0, 406.0, 339.0, 288.0, 216.0, 163.0, 106.0, 83.0, 51.0, 49.0, 24.0, 13.0, 20.0, 10.0, 5.0, 7.0, 6.0, 1.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.1328125, -5.96929931640625, -5.8057861328125, -5.64227294921875, -5.478759765625, -5.31524658203125, -5.1517333984375, -4.98822021484375, -4.82470703125, -4.66119384765625, -4.4976806640625, -4.33416748046875, -4.170654296875, -4.00714111328125, -3.8436279296875, -3.68011474609375, -3.5166015625, -3.35308837890625, -3.1895751953125, -3.02606201171875, -2.862548828125, -2.69903564453125, -2.5355224609375, -2.37200927734375, -2.20849609375, -2.04498291015625, -1.8814697265625, -1.71795654296875, -1.554443359375, -1.39093017578125, -1.2274169921875, -1.06390380859375, -0.900390625, -0.73687744140625, -0.5733642578125, -0.40985107421875, -0.246337890625, -0.08282470703125, 0.0806884765625, 0.24420166015625, 0.40771484375, 0.57122802734375, 0.7347412109375, 0.89825439453125, 1.061767578125, 1.22528076171875, 1.3887939453125, 1.55230712890625, 1.7158203125, 1.87933349609375, 2.0428466796875, 2.20635986328125, 2.369873046875, 2.53338623046875, 2.6968994140625, 2.86041259765625, 3.02392578125, 3.18743896484375, 3.3509521484375, 3.51446533203125, 3.677978515625, 3.84149169921875, 4.0050048828125, 4.16851806640625, 4.33203125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 5.0, 4.0, 8.0, 8.0, 14.0, 9.0, 18.0, 25.0, 33.0, 61.0, 74.0, 108.0, 173.0, 314.0, 517.0, 1026.0, 2637.0, 9278.0, 46104.0, 323718.0, 2405414.0, 1222849.0, 148451.0, 24010.0, 5655.0, 1818.0, 786.0, 414.0, 264.0, 164.0, 111.0, 52.0, 49.0, 31.0, 23.0, 16.0, 6.0, 7.0, 6.0, 9.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.8046875, -10.485107421875, -10.16552734375, -9.845947265625, -9.5263671875, -9.206787109375, -8.88720703125, -8.567626953125, -8.248046875, -7.928466796875, -7.60888671875, -7.289306640625, -6.9697265625, -6.650146484375, -6.33056640625, -6.010986328125, -5.69140625, -5.371826171875, -5.05224609375, -4.732666015625, -4.4130859375, -4.093505859375, -3.77392578125, -3.454345703125, -3.134765625, -2.815185546875, -2.49560546875, -2.176025390625, -1.8564453125, -1.536865234375, -1.21728515625, -0.897705078125, -0.578125, -0.258544921875, 0.06103515625, 0.380615234375, 0.7001953125, 1.019775390625, 1.33935546875, 1.658935546875, 1.978515625, 2.298095703125, 2.61767578125, 2.937255859375, 3.2568359375, 3.576416015625, 3.89599609375, 4.215576171875, 4.53515625, 4.854736328125, 5.17431640625, 5.493896484375, 5.8134765625, 6.133056640625, 6.45263671875, 6.772216796875, 7.091796875, 7.411376953125, 7.73095703125, 8.050537109375, 8.3701171875, 8.689697265625, 9.00927734375, 9.328857421875, 9.6484375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 9.0, 21.0, 26.0, 37.0, 40.0, 63.0, 94.0, 101.0, 99.0, 100.0, 108.0, 91.0, 59.0, 51.0, 34.0, 21.0, 12.0, 14.0, 7.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.99664306640625, -14.2024507522583, -13.408258438110352, -12.614067077636719, -11.819873809814453, -11.02568244934082, -10.231490135192871, -9.437297821044922, -8.643105506896973, -7.848913192749023, -7.054720878601074, -6.260529041290283, -5.466336727142334, -4.672144412994385, -3.8779525756835938, -3.0837602615356445, -2.2895679473876953, -1.4953757524490356, -0.701183557510376, 0.09300851821899414, 0.8872008323669434, 1.6813931465148926, 2.4755849838256836, 3.269777297973633, 4.063969612121582, 4.858161926269531, 5.6523542404174805, 6.4465460777282715, 7.240738391876221, 8.034931182861328, 8.829122543334961, 9.62331485748291, 10.41750717163086, 11.211699485778809, 12.005891799926758, 12.80008316040039, 13.594276428222656, 14.388467788696289, 15.182660102844238, 15.976852416992188, 16.771045684814453, 17.565237045288086, 18.35943031311035, 19.153621673583984, 19.94781494140625, 20.742006301879883, 21.536197662353516, 22.33039093017578, 23.124582290649414, 23.918773651123047, 24.712966918945312, 25.507158279418945, 26.30135154724121, 27.095542907714844, 27.88973617553711, 28.683927536010742, 29.478118896484375, 30.272310256958008, 31.066503524780273, 31.860694885253906, 32.65488815307617, 33.44908142089844, 34.24327087402344, 35.0374641418457, 35.83165740966797]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 16.0, 16.0, 12.0, 24.0, 28.0, 25.0, 23.0, 28.0, 27.0, 37.0, 34.0, 32.0, 50.0, 41.0, 49.0, 55.0, 38.0, 44.0, 48.0, 34.0, 34.0, 40.0, 31.0, 40.0, 36.0, 20.0, 21.0, 16.0, 15.0, 11.0, 14.0, 4.0, 8.0, 4.0, 4.0, 11.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.592483520507812, -15.031974792480469, -14.471466064453125, -13.910957336425781, -13.350448608398438, -12.789939880371094, -12.22943115234375, -11.668922424316406, -11.108413696289062, -10.547904968261719, -9.987396240234375, -9.426887512207031, -8.866378784179688, -8.305870056152344, -7.745361328125, -7.184852600097656, -6.6243438720703125, -6.063835144042969, -5.503326416015625, -4.942817687988281, -4.3823089599609375, -3.8218002319335938, -3.26129150390625, -2.7007827758789062, -2.1402740478515625, -1.5797653198242188, -1.019256591796875, -0.45874786376953125, 0.1017608642578125, 0.6622695922851562, 1.2227783203125, 1.7832870483398438, 2.3437957763671875, 2.9043045043945312, 3.464813232421875, 4.025321960449219, 4.5858306884765625, 5.146339416503906, 5.70684814453125, 6.267356872558594, 6.8278656005859375, 7.388374328613281, 7.948883056640625, 8.509391784667969, 9.069900512695312, 9.630409240722656, 10.19091796875, 10.751426696777344, 11.311935424804688, 11.872444152832031, 12.432952880859375, 12.993461608886719, 13.553970336914062, 14.114479064941406, 14.67498779296875, 15.235496520996094, 15.796005249023438, 16.35651397705078, 16.917022705078125, 17.47753143310547, 18.038040161132812, 18.598548889160156, 19.1590576171875, 19.719566345214844, 20.280075073242188]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 4.0, 4.0, 7.0, 15.0, 25.0, 12.0, 13.0, 16.0, 24.0, 21.0, 25.0, 26.0, 30.0, 31.0, 43.0, 39.0, 46.0, 47.0, 44.0, 40.0, 44.0, 33.0, 45.0, 39.0, 37.0, 31.0, 34.0, 23.0, 20.0, 30.0, 21.0, 20.0, 19.0, 17.0, 14.0, 11.0, 8.0, 8.0, 8.0, 2.0, 2.0, 1.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.5537109375, -1.5074310302734375, -1.461151123046875, -1.4148712158203125, -1.36859130859375, -1.3223114013671875, -1.276031494140625, -1.2297515869140625, -1.1834716796875, -1.1371917724609375, -1.090911865234375, -1.0446319580078125, -0.99835205078125, -0.9520721435546875, -0.905792236328125, -0.8595123291015625, -0.813232421875, -0.7669525146484375, -0.720672607421875, -0.6743927001953125, -0.62811279296875, -0.5818328857421875, -0.535552978515625, -0.4892730712890625, -0.4429931640625, -0.3967132568359375, -0.350433349609375, -0.3041534423828125, -0.25787353515625, -0.2115936279296875, -0.165313720703125, -0.1190338134765625, -0.07275390625, -0.0264739990234375, 0.019805908203125, 0.0660858154296875, 0.11236572265625, 0.1586456298828125, 0.204925537109375, 0.2512054443359375, 0.2974853515625, 0.3437652587890625, 0.390045166015625, 0.4363250732421875, 0.48260498046875, 0.5288848876953125, 0.575164794921875, 0.6214447021484375, 0.667724609375, 0.7140045166015625, 0.760284423828125, 0.8065643310546875, 0.85284423828125, 0.8991241455078125, 0.945404052734375, 0.9916839599609375, 1.0379638671875, 1.0842437744140625, 1.130523681640625, 1.1768035888671875, 1.22308349609375, 1.2693634033203125, 1.315643310546875, 1.3619232177734375, 1.408203125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 14.0, 10.0, 23.0, 31.0, 43.0, 49.0, 88.0, 127.0, 166.0, 265.0, 396.0, 583.0, 931.0, 1449.0, 2348.0, 3571.0, 5793.0, 9439.0, 15540.0, 26634.0, 47207.0, 92620.0, 233423.0, 343389.0, 123437.0, 59707.0, 32387.0, 18733.0, 11282.0, 7002.0, 4269.0, 2631.0, 1684.0, 1188.0, 685.0, 394.0, 369.0, 200.0, 155.0, 87.0, 59.0, 50.0, 22.0, 17.0, 24.0, 9.0, 5.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.013519287109375, -0.013085722923278809, -0.012652158737182617, -0.012218594551086426, -0.011785030364990234, -0.011351466178894043, -0.010917901992797852, -0.01048433780670166, -0.010050773620605469, -0.009617209434509277, -0.009183645248413086, -0.008750081062316895, -0.008316516876220703, -0.007882952690124512, -0.00744938850402832, -0.007015824317932129, -0.0065822601318359375, -0.006148695945739746, -0.005715131759643555, -0.005281567573547363, -0.004848003387451172, -0.0044144392013549805, -0.003980875015258789, -0.0035473108291625977, -0.0031137466430664062, -0.002680182456970215, -0.0022466182708740234, -0.001813054084777832, -0.0013794898986816406, -0.0009459257125854492, -0.0005123615264892578, -7.87973403930664e-05, 0.000354766845703125, 0.0007883310317993164, 0.0012218952178955078, 0.0016554594039916992, 0.0020890235900878906, 0.002522587776184082, 0.0029561519622802734, 0.003389716148376465, 0.0038232803344726562, 0.004256844520568848, 0.004690408706665039, 0.0051239728927612305, 0.005557537078857422, 0.005991101264953613, 0.006424665451049805, 0.006858229637145996, 0.0072917938232421875, 0.007725358009338379, 0.00815892219543457, 0.008592486381530762, 0.009026050567626953, 0.009459614753723145, 0.009893178939819336, 0.010326743125915527, 0.010760307312011719, 0.01119387149810791, 0.011627435684204102, 0.012060999870300293, 0.012494564056396484, 0.012928128242492676, 0.013361692428588867, 0.013795256614685059, 0.01422882080078125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 10.0, 9.0, 5.0, 9.0, 4.0, 20.0, 15.0, 23.0, 21.0, 25.0, 26.0, 23.0, 32.0, 40.0, 27.0, 44.0, 30.0, 30.0, 37.0, 37.0, 1064.0, 51.0, 55.0, 24.0, 43.0, 23.0, 29.0, 26.0, 29.0, 29.0, 27.0, 28.0, 20.0, 14.0, 18.0, 15.0, 13.0, 9.0, 9.0, 10.0, 11.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.95947265625, -0.929046630859375, -0.89862060546875, -0.868194580078125, -0.8377685546875, -0.807342529296875, -0.77691650390625, -0.746490478515625, -0.716064453125, -0.685638427734375, -0.65521240234375, -0.624786376953125, -0.5943603515625, -0.563934326171875, -0.53350830078125, -0.503082275390625, -0.47265625, -0.442230224609375, -0.41180419921875, -0.381378173828125, -0.3509521484375, -0.320526123046875, -0.29010009765625, -0.259674072265625, -0.229248046875, -0.198822021484375, -0.16839599609375, -0.137969970703125, -0.1075439453125, -0.077117919921875, -0.04669189453125, -0.016265869140625, 0.01416015625, 0.044586181640625, 0.07501220703125, 0.105438232421875, 0.1358642578125, 0.166290283203125, 0.19671630859375, 0.227142333984375, 0.257568359375, 0.287994384765625, 0.31842041015625, 0.348846435546875, 0.3792724609375, 0.409698486328125, 0.44012451171875, 0.470550537109375, 0.5009765625, 0.531402587890625, 0.56182861328125, 0.592254638671875, 0.6226806640625, 0.653106689453125, 0.68353271484375, 0.713958740234375, 0.744384765625, 0.774810791015625, 0.80523681640625, 0.835662841796875, 0.8660888671875, 0.896514892578125, 0.92694091796875, 0.957366943359375, 0.98779296875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 7.0, 6.0, 12.0, 14.0, 26.0, 33.0, 62.0, 72.0, 116.0, 172.0, 202.0, 394.0, 476.0, 665.0, 960.0, 1380.0, 1916.0, 2620.0, 3759.0, 5210.0, 7275.0, 10250.0, 14768.0, 21021.0, 31211.0, 46480.0, 72405.0, 128739.0, 1310062.0, 175599.0, 88017.0, 54828.0, 35916.0, 24393.0, 16869.0, 11752.0, 8421.0, 6011.0, 4273.0, 3063.0, 2110.0, 1654.0, 1171.0, 805.0, 581.0, 422.0, 309.0, 180.0, 132.0, 108.0, 71.0, 55.0, 34.0, 16.0, 13.0, 13.0, 7.0, 6.0, 2.0, 2.0], "bins": [-0.0071868896484375, -0.006967067718505859, -0.006747245788574219, -0.006527423858642578, -0.0063076019287109375, -0.006087779998779297, -0.005867958068847656, -0.005648136138916016, -0.005428314208984375, -0.005208492279052734, -0.004988670349121094, -0.004768848419189453, -0.0045490264892578125, -0.004329204559326172, -0.004109382629394531, -0.0038895606994628906, -0.00366973876953125, -0.0034499168395996094, -0.0032300949096679688, -0.003010272979736328, -0.0027904510498046875, -0.002570629119873047, -0.0023508071899414062, -0.0021309852600097656, -0.001911163330078125, -0.0016913414001464844, -0.0014715194702148438, -0.0012516975402832031, -0.0010318756103515625, -0.0008120536804199219, -0.0005922317504882812, -0.0003724098205566406, -0.000152587890625, 6.723403930664062e-05, 0.00028705596923828125, 0.0005068778991699219, 0.0007266998291015625, 0.0009465217590332031, 0.0011663436889648438, 0.0013861656188964844, 0.001605987548828125, 0.0018258094787597656, 0.0020456314086914062, 0.002265453338623047, 0.0024852752685546875, 0.002705097198486328, 0.0029249191284179688, 0.0031447410583496094, 0.00336456298828125, 0.0035843849182128906, 0.0038042068481445312, 0.004024028778076172, 0.0042438507080078125, 0.004463672637939453, 0.004683494567871094, 0.004903316497802734, 0.005123138427734375, 0.005342960357666016, 0.005562782287597656, 0.005782604217529297, 0.0060024261474609375, 0.006222248077392578, 0.006442070007324219, 0.006661891937255859, 0.0068817138671875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 972.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 28.0, 18.0, 3.0, 1.0, 0.0, 0.0, 10.0, 0.0, 3.0, 10.0, 13.0, 73.0, 0.0, 1032.0, 12288.0, 1021499.0, 12357.0, 1022.0, 81.0, 0.0, 13.0, 5.0, 0.0, 1.0, 13.0, 0.0, 0.0, 0.0, 4.0, 23.0, 25.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-1.6093254089355469e-06, -1.5581026673316956e-06, -1.5068799257278442e-06, -1.455657184123993e-06, -1.4044344425201416e-06, -1.3532117009162903e-06, -1.301988959312439e-06, -1.2507662177085876e-06, -1.1995434761047363e-06, -1.148320734500885e-06, -1.0970979928970337e-06, -1.0458752512931824e-06, -9.94652509689331e-07, -9.434297680854797e-07, -8.922070264816284e-07, -8.409842848777771e-07, -7.897615432739258e-07, -7.385388016700745e-07, -6.873160600662231e-07, -6.360933184623718e-07, -5.848705768585205e-07, -5.336478352546692e-07, -4.824250936508179e-07, -4.3120235204696655e-07, -3.7997961044311523e-07, -3.287568688392639e-07, -2.775341272354126e-07, -2.2631138563156128e-07, -1.7508864402770996e-07, -1.2386590242385864e-07, -7.264316082000732e-08, -2.1420419216156006e-08, 2.9802322387695312e-08, 8.102506399154663e-08, 1.3224780559539795e-07, 1.8347054719924927e-07, 2.3469328880310059e-07, 2.859160304069519e-07, 3.371387720108032e-07, 3.8836151361465454e-07, 4.3958425521850586e-07, 4.908069968223572e-07, 5.420297384262085e-07, 5.932524800300598e-07, 6.444752216339111e-07, 6.956979632377625e-07, 7.469207048416138e-07, 7.981434464454651e-07, 8.493661880493164e-07, 9.005889296531677e-07, 9.51811671257019e-07, 1.0030344128608704e-06, 1.0542571544647217e-06, 1.105479896068573e-06, 1.1567026376724243e-06, 1.2079253792762756e-06, 1.259148120880127e-06, 1.3103708624839783e-06, 1.3615936040878296e-06, 1.412816345691681e-06, 1.4640390872955322e-06, 1.5152618288993835e-06, 1.5664845705032349e-06, 1.6177073121070862e-06, 1.6689300537109375e-06]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 4.0, 4.0, 7.0, 15.0, 25.0, 12.0, 13.0, 16.0, 24.0, 21.0, 25.0, 26.0, 30.0, 31.0, 43.0, 39.0, 46.0, 47.0, 44.0, 40.0, 44.0, 33.0, 45.0, 39.0, 37.0, 31.0, 34.0, 23.0, 20.0, 30.0, 21.0, 20.0, 19.0, 17.0, 14.0, 11.0, 8.0, 8.0, 8.0, 2.0, 2.0, 1.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.5537109375, -1.5074310302734375, -1.461151123046875, -1.4148712158203125, -1.36859130859375, -1.3223114013671875, -1.276031494140625, -1.2297515869140625, -1.1834716796875, -1.1371917724609375, -1.090911865234375, -1.0446319580078125, -0.99835205078125, -0.9520721435546875, -0.905792236328125, -0.8595123291015625, -0.813232421875, -0.7669525146484375, -0.720672607421875, -0.6743927001953125, -0.62811279296875, -0.5818328857421875, -0.535552978515625, -0.4892730712890625, -0.4429931640625, -0.3967132568359375, -0.350433349609375, -0.3041534423828125, -0.25787353515625, -0.2115936279296875, -0.165313720703125, -0.1190338134765625, -0.07275390625, -0.0264739990234375, 0.019805908203125, 0.0660858154296875, 0.11236572265625, 0.1586456298828125, 0.204925537109375, 0.2512054443359375, 0.2974853515625, 0.3437652587890625, 0.390045166015625, 0.4363250732421875, 0.48260498046875, 0.5288848876953125, 0.575164794921875, 0.6214447021484375, 0.667724609375, 0.7140045166015625, 0.760284423828125, 0.8065643310546875, 0.85284423828125, 0.8991241455078125, 0.945404052734375, 0.9916839599609375, 1.0379638671875, 1.0842437744140625, 1.130523681640625, 1.1768035888671875, 1.22308349609375, 1.2693634033203125, 1.315643310546875, 1.3619232177734375, 1.408203125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 10.0, 20.0, 16.0, 31.0, 25.0, 37.0, 47.0, 75.0, 93.0, 160.0, 212.0, 311.0, 492.0, 837.0, 1287.0, 2163.0, 3516.0, 5992.0, 10740.0, 21800.0, 57678.0, 339673.0, 480805.0, 69583.0, 24590.0, 11783.0, 6530.0, 3728.0, 2303.0, 1408.0, 899.0, 547.0, 361.0, 232.0, 175.0, 110.0, 85.0, 54.0, 40.0, 27.0, 21.0, 17.0, 10.0, 6.0, 11.0, 3.0, 3.0, 3.0, 4.0, 4.0, 1.0], "bins": [-2.697265625, -2.620361328125, -2.54345703125, -2.466552734375, -2.3896484375, -2.312744140625, -2.23583984375, -2.158935546875, -2.08203125, -2.005126953125, -1.92822265625, -1.851318359375, -1.7744140625, -1.697509765625, -1.62060546875, -1.543701171875, -1.466796875, -1.389892578125, -1.31298828125, -1.236083984375, -1.1591796875, -1.082275390625, -1.00537109375, -0.928466796875, -0.8515625, -0.774658203125, -0.69775390625, -0.620849609375, -0.5439453125, -0.467041015625, -0.39013671875, -0.313232421875, -0.236328125, -0.159423828125, -0.08251953125, -0.005615234375, 0.0712890625, 0.148193359375, 0.22509765625, 0.302001953125, 0.37890625, 0.455810546875, 0.53271484375, 0.609619140625, 0.6865234375, 0.763427734375, 0.84033203125, 0.917236328125, 0.994140625, 1.071044921875, 1.14794921875, 1.224853515625, 1.3017578125, 1.378662109375, 1.45556640625, 1.532470703125, 1.609375, 1.686279296875, 1.76318359375, 1.840087890625, 1.9169921875, 1.993896484375, 2.07080078125, 2.147705078125, 2.224609375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 14.0, 11.0, 10.0, 16.0, 14.0, 30.0, 20.0, 31.0, 37.0, 29.0, 40.0, 44.0, 57.0, 87.0, 118.0, 1473.0, 432.0, 115.0, 71.0, 59.0, 65.0, 50.0, 25.0, 34.0, 24.0, 20.0, 19.0, 11.0, 18.0, 17.0, 12.0, 9.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.12890625, -6.93621826171875, -6.7435302734375, -6.55084228515625, -6.358154296875, -6.16546630859375, -5.9727783203125, -5.78009033203125, -5.58740234375, -5.39471435546875, -5.2020263671875, -5.00933837890625, -4.816650390625, -4.62396240234375, -4.4312744140625, -4.23858642578125, -4.0458984375, -3.85321044921875, -3.6605224609375, -3.46783447265625, -3.275146484375, -3.08245849609375, -2.8897705078125, -2.69708251953125, -2.50439453125, -2.31170654296875, -2.1190185546875, -1.92633056640625, -1.733642578125, -1.54095458984375, -1.3482666015625, -1.15557861328125, -0.962890625, -0.77020263671875, -0.5775146484375, -0.38482666015625, -0.192138671875, 0.00054931640625, 0.1932373046875, 0.38592529296875, 0.57861328125, 0.77130126953125, 0.9639892578125, 1.15667724609375, 1.349365234375, 1.54205322265625, 1.7347412109375, 1.92742919921875, 2.1201171875, 2.31280517578125, 2.5054931640625, 2.69818115234375, 2.890869140625, 3.08355712890625, 3.2762451171875, 3.46893310546875, 3.66162109375, 3.85430908203125, 4.0469970703125, 4.23968505859375, 4.432373046875, 4.62506103515625, 4.8177490234375, 5.01043701171875, 5.203125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 7.0, 18.0, 10.0, 17.0, 25.0, 44.0, 44.0, 59.0, 89.0, 144.0, 299.0, 760.0, 3273.0, 26912.0, 1874077.0, 1209999.0, 25237.0, 3183.0, 719.0, 244.0, 158.0, 105.0, 56.0, 46.0, 37.0, 23.0, 23.0, 15.0, 19.0, 13.0, 12.0, 5.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.78125, -8.455810546875, -8.13037109375, -7.804931640625, -7.4794921875, -7.154052734375, -6.82861328125, -6.503173828125, -6.177734375, -5.852294921875, -5.52685546875, -5.201416015625, -4.8759765625, -4.550537109375, -4.22509765625, -3.899658203125, -3.57421875, -3.248779296875, -2.92333984375, -2.597900390625, -2.2724609375, -1.947021484375, -1.62158203125, -1.296142578125, -0.970703125, -0.645263671875, -0.31982421875, 0.005615234375, 0.3310546875, 0.656494140625, 0.98193359375, 1.307373046875, 1.6328125, 1.958251953125, 2.28369140625, 2.609130859375, 2.9345703125, 3.260009765625, 3.58544921875, 3.910888671875, 4.236328125, 4.561767578125, 4.88720703125, 5.212646484375, 5.5380859375, 5.863525390625, 6.18896484375, 6.514404296875, 6.83984375, 7.165283203125, 7.49072265625, 7.816162109375, 8.1416015625, 8.467041015625, 8.79248046875, 9.117919921875, 9.443359375, 9.768798828125, 10.09423828125, 10.419677734375, 10.7451171875, 11.070556640625, 11.39599609375, 11.721435546875, 12.046875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 630.0, 354.0, 6.0, 0.0, 0.0, 1.0], "bins": [-153.84768676757812, -151.2323455810547, -148.61700439453125, -146.0016632080078, -143.38632202148438, -140.77099609375, -138.15565490722656, -135.54031372070312, -132.9249725341797, -130.30963134765625, -127.69429016113281, -125.0789566040039, -122.46361541748047, -119.84827423095703, -117.23294067382812, -114.61759948730469, -112.00225830078125, -109.38691711425781, -106.77157592773438, -104.15624237060547, -101.54090118408203, -98.9255599975586, -96.31022644042969, -93.69488525390625, -91.07954406738281, -88.46420288085938, -85.84886169433594, -83.23352813720703, -80.6181869506836, -78.00284576416016, -75.38751220703125, -72.77217102050781, -70.15682983398438, -67.54148864746094, -64.9261474609375, -62.310813903808594, -59.695472717285156, -57.08013153076172, -54.46479415893555, -51.849456787109375, -49.2341194152832, -46.61878204345703, -44.003440856933594, -41.388099670410156, -38.772762298583984, -36.15742492675781, -33.542083740234375, -30.92674446105957, -28.311405181884766, -25.69606590270996, -23.080726623535156, -20.46538734436035, -17.850048065185547, -15.234708786010742, -12.619369506835938, -10.004030227661133, -7.388689994812012, -4.773350715637207, -2.1580114364624023, 0.45732784271240234, 3.072667121887207, 5.688006401062012, 8.303345680236816, 10.918684959411621, 13.534024238586426]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 12.0, 11.0, 13.0, 17.0, 15.0, 18.0, 25.0, 46.0, 30.0, 31.0, 33.0, 39.0, 44.0, 42.0, 55.0, 44.0, 45.0, 46.0, 44.0, 38.0, 47.0, 45.0, 37.0, 21.0, 31.0, 28.0, 32.0, 18.0, 16.0, 10.0, 7.0, 11.0, 5.0, 10.0, 5.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.57647132873535, -17.96932029724121, -17.36216926574707, -16.75501823425293, -16.147869110107422, -15.540717124938965, -14.93356704711914, -14.326416015625, -13.71926498413086, -13.112113952636719, -12.504962921142578, -11.897812843322754, -11.290661811828613, -10.683510780334473, -10.076360702514648, -9.469209671020508, -8.862058639526367, -8.254907608032227, -7.647757053375244, -7.040606498718262, -6.433455467224121, -5.8263044357299805, -5.219153881072998, -4.612003326416016, -4.004852294921875, -3.3977015018463135, -2.790550708770752, -2.1833999156951904, -1.576249122619629, -0.9690983295440674, -0.36194753646850586, 0.24520301818847656, 0.8523521423339844, 1.459502935409546, 2.0666537284851074, 2.673804521560669, 3.2809553146362305, 3.888106107711792, 4.4952569007873535, 5.102407455444336, 5.709558486938477, 6.316709518432617, 6.9238600730896, 7.531010627746582, 8.138161659240723, 8.745312690734863, 9.352462768554688, 9.959613800048828, 10.566764831542969, 11.17391586303711, 11.78106689453125, 12.388216972351074, 12.995368003845215, 13.602519035339355, 14.20966911315918, 14.81682014465332, 15.423971176147461, 16.0311222076416, 16.638273239135742, 17.245424270629883, 17.85257339477539, 18.45972442626953, 19.066875457763672, 19.674026489257812, 20.281177520751953]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 7.0, 17.0, 12.0, 14.0, 14.0, 24.0, 14.0, 21.0, 27.0, 20.0, 26.0, 26.0, 26.0, 42.0, 36.0, 55.0, 50.0, 33.0, 50.0, 38.0, 43.0, 36.0, 32.0, 40.0, 33.0, 27.0, 26.0, 29.0, 27.0, 18.0, 16.0, 21.0, 17.0, 9.0, 14.0, 15.0, 9.0, 7.0, 1.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.533203125, -1.4860687255859375, -1.438934326171875, -1.3917999267578125, -1.34466552734375, -1.2975311279296875, -1.250396728515625, -1.2032623291015625, -1.1561279296875, -1.1089935302734375, -1.061859130859375, -1.0147247314453125, -0.96759033203125, -0.9204559326171875, -0.873321533203125, -0.8261871337890625, -0.779052734375, -0.7319183349609375, -0.684783935546875, -0.6376495361328125, -0.59051513671875, -0.5433807373046875, -0.496246337890625, -0.4491119384765625, -0.4019775390625, -0.3548431396484375, -0.307708740234375, -0.2605743408203125, -0.21343994140625, -0.1663055419921875, -0.119171142578125, -0.0720367431640625, -0.02490234375, 0.0222320556640625, 0.069366455078125, 0.1165008544921875, 0.16363525390625, 0.2107696533203125, 0.257904052734375, 0.3050384521484375, 0.3521728515625, 0.3993072509765625, 0.446441650390625, 0.4935760498046875, 0.54071044921875, 0.5878448486328125, 0.634979248046875, 0.6821136474609375, 0.729248046875, 0.7763824462890625, 0.823516845703125, 0.8706512451171875, 0.91778564453125, 0.9649200439453125, 1.012054443359375, 1.0591888427734375, 1.1063232421875, 1.1534576416015625, 1.200592041015625, 1.2477264404296875, 1.29486083984375, 1.3419952392578125, 1.389129638671875, 1.4362640380859375, 1.4833984375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 9.0, 5.0, 10.0, 9.0, 11.0, 15.0, 27.0, 25.0, 35.0, 41.0, 43.0, 47.0, 84.0, 92.0, 183.0, 345.0, 953.0, 3523.0, 17916.0, 115241.0, 1392538.0, 2436957.0, 191948.0, 26664.0, 5082.0, 1253.0, 434.0, 228.0, 121.0, 106.0, 78.0, 58.0, 54.0, 33.0, 22.0, 17.0, 12.0, 14.0, 7.0, 14.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.625, -7.394775390625, -7.16455078125, -6.934326171875, -6.7041015625, -6.473876953125, -6.24365234375, -6.013427734375, -5.783203125, -5.552978515625, -5.32275390625, -5.092529296875, -4.8623046875, -4.632080078125, -4.40185546875, -4.171630859375, -3.94140625, -3.711181640625, -3.48095703125, -3.250732421875, -3.0205078125, -2.790283203125, -2.56005859375, -2.329833984375, -2.099609375, -1.869384765625, -1.63916015625, -1.408935546875, -1.1787109375, -0.948486328125, -0.71826171875, -0.488037109375, -0.2578125, -0.027587890625, 0.20263671875, 0.432861328125, 0.6630859375, 0.893310546875, 1.12353515625, 1.353759765625, 1.583984375, 1.814208984375, 2.04443359375, 2.274658203125, 2.5048828125, 2.735107421875, 2.96533203125, 3.195556640625, 3.42578125, 3.656005859375, 3.88623046875, 4.116455078125, 4.3466796875, 4.576904296875, 4.80712890625, 5.037353515625, 5.267578125, 5.497802734375, 5.72802734375, 5.958251953125, 6.1884765625, 6.418701171875, 6.64892578125, 6.879150390625, 7.109375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 12.0, 15.0, 27.0, 31.0, 46.0, 81.0, 119.0, 169.0, 239.0, 400.0, 496.0, 557.0, 553.0, 394.0, 283.0, 216.0, 131.0, 124.0, 69.0, 32.0, 19.0, 18.0, 10.0, 12.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -8.03466796875, -7.8271484375, -7.61962890625, -7.412109375, -7.20458984375, -6.9970703125, -6.78955078125, -6.58203125, -6.37451171875, -6.1669921875, -5.95947265625, -5.751953125, -5.54443359375, -5.3369140625, -5.12939453125, -4.921875, -4.71435546875, -4.5068359375, -4.29931640625, -4.091796875, -3.88427734375, -3.6767578125, -3.46923828125, -3.26171875, -3.05419921875, -2.8466796875, -2.63916015625, -2.431640625, -2.22412109375, -2.0166015625, -1.80908203125, -1.6015625, -1.39404296875, -1.1865234375, -0.97900390625, -0.771484375, -0.56396484375, -0.3564453125, -0.14892578125, 0.05859375, 0.26611328125, 0.4736328125, 0.68115234375, 0.888671875, 1.09619140625, 1.3037109375, 1.51123046875, 1.71875, 1.92626953125, 2.1337890625, 2.34130859375, 2.548828125, 2.75634765625, 2.9638671875, 3.17138671875, 3.37890625, 3.58642578125, 3.7939453125, 4.00146484375, 4.208984375, 4.41650390625, 4.6240234375, 4.83154296875, 5.0390625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 12.0, 20.0, 22.0, 48.0, 50.0, 87.0, 137.0, 205.0, 363.0, 663.0, 1703.0, 6921.0, 58849.0, 913683.0, 2965168.0, 221882.0, 18942.0, 3283.0, 1000.0, 490.0, 275.0, 166.0, 106.0, 82.0, 38.0, 25.0, 18.0, 13.0, 9.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4375, -10.984619140625, -10.53173828125, -10.078857421875, -9.6259765625, -9.173095703125, -8.72021484375, -8.267333984375, -7.814453125, -7.361572265625, -6.90869140625, -6.455810546875, -6.0029296875, -5.550048828125, -5.09716796875, -4.644287109375, -4.19140625, -3.738525390625, -3.28564453125, -2.832763671875, -2.3798828125, -1.927001953125, -1.47412109375, -1.021240234375, -0.568359375, -0.115478515625, 0.33740234375, 0.790283203125, 1.2431640625, 1.696044921875, 2.14892578125, 2.601806640625, 3.0546875, 3.507568359375, 3.96044921875, 4.413330078125, 4.8662109375, 5.319091796875, 5.77197265625, 6.224853515625, 6.677734375, 7.130615234375, 7.58349609375, 8.036376953125, 8.4892578125, 8.942138671875, 9.39501953125, 9.847900390625, 10.30078125, 10.753662109375, 11.20654296875, 11.659423828125, 12.1123046875, 12.565185546875, 13.01806640625, 13.470947265625, 13.923828125, 14.376708984375, 14.82958984375, 15.282470703125, 15.7353515625, 16.188232421875, 16.64111328125, 17.093994140625, 17.546875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 12.0, 46.0, 104.0, 172.0, 217.0, 230.0, 126.0, 72.0, 27.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.64372253417969, -60.66957092285156, -58.69541931152344, -56.72126770019531, -54.74711990356445, -52.77296829223633, -50.7988166809082, -48.82466506958008, -46.85051727294922, -44.876365661621094, -42.90221405029297, -40.928062438964844, -38.953914642333984, -36.97976303100586, -35.005611419677734, -33.03145980834961, -31.057308197021484, -29.08315658569336, -27.109006881713867, -25.134855270385742, -23.16070556640625, -21.186553955078125, -19.21240234375, -17.238250732421875, -15.264101028442383, -13.289950370788574, -11.315799713134766, -9.34164810180664, -7.367497444152832, -5.393346786499023, -3.4191951751708984, -1.4450445175170898, 0.5291099548339844, 2.503260850906372, 4.47741174697876, 6.451562881469727, 8.425713539123535, 10.399864196777344, 12.374015808105469, 14.348166465759277, 16.322317123413086, 18.29646873474121, 20.270618438720703, 22.244770050048828, 24.218921661376953, 26.193071365356445, 28.16722297668457, 30.141372680664062, 32.11552429199219, 34.08967590332031, 36.06382751464844, 38.03797912597656, 40.01212692260742, 41.98627853393555, 43.96043014526367, 45.9345817565918, 47.908729553222656, 49.88288116455078, 51.857032775878906, 53.83118438720703, 55.80533218383789, 57.779483795166016, 59.75363540649414, 61.727787017822266, 63.70193862915039]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 6.0, 13.0, 10.0, 10.0, 14.0, 16.0, 18.0, 20.0, 21.0, 32.0, 26.0, 22.0, 44.0, 41.0, 44.0, 30.0, 39.0, 47.0, 36.0, 42.0, 31.0, 32.0, 44.0, 37.0, 39.0, 29.0, 29.0, 21.0, 34.0, 29.0, 23.0, 19.0, 17.0, 17.0, 12.0, 5.0, 8.0, 9.0, 4.0, 11.0, 4.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.227069854736328, -15.661134719848633, -15.095198631286621, -14.529263496398926, -13.963327407836914, -13.397392272949219, -12.831457138061523, -12.265521049499512, -11.6995849609375, -11.133649826049805, -10.567713737487793, -10.001778602600098, -9.435842514038086, -8.86990737915039, -8.303972244262695, -7.738036155700684, -7.172101020812988, -6.606165409088135, -6.040229797363281, -5.474294662475586, -4.908358573913574, -4.342423439025879, -3.7764878273010254, -3.210552215576172, -2.6446166038513184, -2.078680992126465, -1.5127454996109009, -0.9468100070953369, -0.3808743953704834, 0.18506121635437012, 0.7509965896606445, 1.316932201385498, 1.8828678131103516, 2.448803424835205, 3.0147390365600586, 3.580674409866333, 4.146610260009766, 4.712545394897461, 5.2784810066223145, 5.844416618347168, 6.4103522300720215, 6.976287841796875, 7.5422234535217285, 8.108159065246582, 8.674094200134277, 9.240030288696289, 9.805965423583984, 10.37190055847168, 10.937836647033691, 11.503771781921387, 12.069707870483398, 12.635643005371094, 13.201579093933105, 13.7675142288208, 14.333450317382812, 14.899385452270508, 15.465320587158203, 16.0312557220459, 16.597190856933594, 17.163127899169922, 17.729063034057617, 18.294998168945312, 18.860933303833008, 19.426868438720703, 19.99280548095703]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 3.0, 7.0, 11.0, 18.0, 11.0, 13.0, 18.0, 14.0, 22.0, 22.0, 23.0, 29.0, 27.0, 36.0, 32.0, 43.0, 52.0, 33.0, 50.0, 49.0, 53.0, 35.0, 58.0, 36.0, 38.0, 29.0, 32.0, 35.0, 26.0, 16.0, 20.0, 20.0, 18.0, 13.0, 16.0, 9.0, 1.0, 11.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6279296875, -1.5745697021484375, -1.521209716796875, -1.4678497314453125, -1.41448974609375, -1.3611297607421875, -1.307769775390625, -1.2544097900390625, -1.2010498046875, -1.1476898193359375, -1.094329833984375, -1.0409698486328125, -0.98760986328125, -0.9342498779296875, -0.880889892578125, -0.8275299072265625, -0.774169921875, -0.7208099365234375, -0.667449951171875, -0.6140899658203125, -0.56072998046875, -0.5073699951171875, -0.454010009765625, -0.4006500244140625, -0.3472900390625, -0.2939300537109375, -0.240570068359375, -0.1872100830078125, -0.13385009765625, -0.0804901123046875, -0.027130126953125, 0.0262298583984375, 0.07958984375, 0.1329498291015625, 0.186309814453125, 0.2396697998046875, 0.29302978515625, 0.3463897705078125, 0.399749755859375, 0.4531097412109375, 0.5064697265625, 0.5598297119140625, 0.613189697265625, 0.6665496826171875, 0.71990966796875, 0.7732696533203125, 0.826629638671875, 0.8799896240234375, 0.933349609375, 0.9867095947265625, 1.040069580078125, 1.0934295654296875, 1.14678955078125, 1.2001495361328125, 1.253509521484375, 1.3068695068359375, 1.3602294921875, 1.4135894775390625, 1.466949462890625, 1.5203094482421875, 1.57366943359375, 1.6270294189453125, 1.680389404296875, 1.7337493896484375, 1.787109375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 20.0, 10.0, 23.0, 33.0, 51.0, 68.0, 97.0, 138.0, 192.0, 304.0, 420.0, 608.0, 901.0, 1290.0, 1906.0, 2890.0, 4257.0, 6542.0, 9762.0, 15376.0, 23752.0, 38351.0, 66336.0, 132174.0, 349787.0, 185317.0, 81701.0, 46373.0, 28004.0, 17757.0, 11430.0, 7456.0, 5063.0, 3177.0, 2196.0, 1563.0, 1017.0, 675.0, 472.0, 326.0, 222.0, 150.0, 111.0, 81.0, 49.0, 40.0, 20.0, 24.0, 16.0, 5.0, 10.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.01332855224609375, -0.012894034385681152, -0.012459516525268555, -0.012024998664855957, -0.01159048080444336, -0.011155962944030762, -0.010721445083618164, -0.010286927223205566, -0.009852409362792969, -0.009417891502380371, -0.008983373641967773, -0.008548855781555176, -0.008114337921142578, -0.0076798200607299805, -0.007245302200317383, -0.006810784339904785, -0.0063762664794921875, -0.00594174861907959, -0.005507230758666992, -0.0050727128982543945, -0.004638195037841797, -0.004203677177429199, -0.0037691593170166016, -0.003334641456604004, -0.0029001235961914062, -0.0024656057357788086, -0.002031087875366211, -0.0015965700149536133, -0.0011620521545410156, -0.000727534294128418, -0.0002930164337158203, 0.00014150142669677734, 0.000576019287109375, 0.0010105371475219727, 0.0014450550079345703, 0.001879572868347168, 0.0023140907287597656, 0.0027486085891723633, 0.003183126449584961, 0.0036176443099975586, 0.004052162170410156, 0.004486680030822754, 0.0049211978912353516, 0.005355715751647949, 0.005790233612060547, 0.0062247514724731445, 0.006659269332885742, 0.00709378719329834, 0.0075283050537109375, 0.007962822914123535, 0.008397340774536133, 0.00883185863494873, 0.009266376495361328, 0.009700894355773926, 0.010135412216186523, 0.010569930076599121, 0.011004447937011719, 0.011438965797424316, 0.011873483657836914, 0.012308001518249512, 0.01274251937866211, 0.013177037239074707, 0.013611555099487305, 0.014046072959899902, 0.0144805908203125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 8.0, 8.0, 8.0, 10.0, 8.0, 15.0, 18.0, 18.0, 21.0, 24.0, 25.0, 21.0, 25.0, 19.0, 32.0, 28.0, 34.0, 35.0, 37.0, 38.0, 36.0, 1067.0, 41.0, 37.0, 39.0, 44.0, 44.0, 33.0, 32.0, 23.0, 26.0, 18.0, 22.0, 23.0, 19.0, 18.0, 16.0, 18.0, 11.0, 5.0, 8.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0458984375, -1.0133209228515625, -0.980743408203125, -0.9481658935546875, -0.91558837890625, -0.8830108642578125, -0.850433349609375, -0.8178558349609375, -0.7852783203125, -0.7527008056640625, -0.720123291015625, -0.6875457763671875, -0.65496826171875, -0.6223907470703125, -0.589813232421875, -0.5572357177734375, -0.524658203125, -0.4920806884765625, -0.459503173828125, -0.4269256591796875, -0.39434814453125, -0.3617706298828125, -0.329193115234375, -0.2966156005859375, -0.2640380859375, -0.2314605712890625, -0.198883056640625, -0.1663055419921875, -0.13372802734375, -0.1011505126953125, -0.068572998046875, -0.0359954833984375, -0.00341796875, 0.0291595458984375, 0.061737060546875, 0.0943145751953125, 0.12689208984375, 0.1594696044921875, 0.192047119140625, 0.2246246337890625, 0.2572021484375, 0.2897796630859375, 0.322357177734375, 0.3549346923828125, 0.38751220703125, 0.4200897216796875, 0.452667236328125, 0.4852447509765625, 0.517822265625, 0.5503997802734375, 0.582977294921875, 0.6155548095703125, 0.64813232421875, 0.6807098388671875, 0.713287353515625, 0.7458648681640625, 0.7784423828125, 0.8110198974609375, 0.843597412109375, 0.8761749267578125, 0.90875244140625, 0.9413299560546875, 0.973907470703125, 1.0064849853515625, 1.0390625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 12.0, 21.0, 24.0, 45.0, 57.0, 94.0, 118.0, 210.0, 314.0, 438.0, 684.0, 985.0, 1396.0, 1934.0, 2811.0, 3929.0, 5439.0, 7400.0, 10588.0, 14543.0, 20925.0, 30706.0, 46661.0, 73543.0, 132244.0, 1307501.0, 173099.0, 88851.0, 54740.0, 35625.0, 24118.0, 16603.0, 11844.0, 8451.0, 6160.0, 4474.0, 3161.0, 2219.0, 1624.0, 1136.0, 776.0, 519.0, 379.0, 246.0, 153.0, 104.0, 71.0, 48.0, 35.0, 22.0, 12.0, 11.0, 9.0, 5.0, 4.0, 3.0, 0.0, 1.0], "bins": [-0.00746917724609375, -0.007233381271362305, -0.006997585296630859, -0.006761789321899414, -0.006525993347167969, -0.0062901973724365234, -0.006054401397705078, -0.005818605422973633, -0.0055828094482421875, -0.005347013473510742, -0.005111217498779297, -0.0048754215240478516, -0.004639625549316406, -0.004403829574584961, -0.004168033599853516, -0.00393223762512207, -0.003696441650390625, -0.0034606456756591797, -0.0032248497009277344, -0.002989053726196289, -0.0027532577514648438, -0.0025174617767333984, -0.002281665802001953, -0.002045869827270508, -0.0018100738525390625, -0.0015742778778076172, -0.0013384819030761719, -0.0011026859283447266, -0.0008668899536132812, -0.0006310939788818359, -0.0003952980041503906, -0.0001595020294189453, 7.62939453125e-05, 0.0003120899200439453, 0.0005478858947753906, 0.0007836818695068359, 0.0010194778442382812, 0.0012552738189697266, 0.0014910697937011719, 0.0017268657684326172, 0.0019626617431640625, 0.002198457717895508, 0.002434253692626953, 0.0026700496673583984, 0.0029058456420898438, 0.003141641616821289, 0.0033774375915527344, 0.0036132335662841797, 0.003849029541015625, 0.00408482551574707, 0.004320621490478516, 0.004556417465209961, 0.004792213439941406, 0.0050280094146728516, 0.005263805389404297, 0.005499601364135742, 0.0057353973388671875, 0.005971193313598633, 0.006206989288330078, 0.0064427852630615234, 0.006678581237792969, 0.006914377212524414, 0.007150173187255859, 0.007385969161987305, 0.00762176513671875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 946.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 8.0, 16.0, 0.0, 22.0, 18.0, 10.0, 19.0, 13.0, 10.0, 11.0, 34.0, 0.0, 89.0, 380.0, 3438.0, 21877.0, 996646.0, 21918.0, 3434.0, 359.0, 0.0, 90.0, 34.0, 10.0, 9.0, 7.0, 23.0, 10.0, 21.0, 0.0, 16.0, 15.0, 8.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6754493117332458e-06, -1.6223639249801636e-06, -1.5692785382270813e-06, -1.516193151473999e-06, -1.4631077647209167e-06, -1.4100223779678345e-06, -1.3569369912147522e-06, -1.30385160446167e-06, -1.2507662177085876e-06, -1.1976808309555054e-06, -1.144595444202423e-06, -1.0915100574493408e-06, -1.0384246706962585e-06, -9.853392839431763e-07, -9.32253897190094e-07, -8.791685104370117e-07, -8.260831236839294e-07, -7.729977369308472e-07, -7.199123501777649e-07, -6.668269634246826e-07, -6.137415766716003e-07, -5.606561899185181e-07, -5.075708031654358e-07, -4.544854164123535e-07, -4.0140002965927124e-07, -3.4831464290618896e-07, -2.952292561531067e-07, -2.421438694000244e-07, -1.8905848264694214e-07, -1.3597309589385986e-07, -8.288770914077759e-08, -2.9802322387695312e-08, 2.3283064365386963e-08, 7.636845111846924e-08, 1.2945383787155151e-07, 1.825392246246338e-07, 2.3562461137771606e-07, 2.8870999813079834e-07, 3.417953848838806e-07, 3.948807716369629e-07, 4.4796615839004517e-07, 5.010515451431274e-07, 5.541369318962097e-07, 6.07222318649292e-07, 6.603077054023743e-07, 7.133930921554565e-07, 7.664784789085388e-07, 8.195638656616211e-07, 8.726492524147034e-07, 9.257346391677856e-07, 9.78820025920868e-07, 1.0319054126739502e-06, 1.0849907994270325e-06, 1.1380761861801147e-06, 1.191161572933197e-06, 1.2442469596862793e-06, 1.2973323464393616e-06, 1.3504177331924438e-06, 1.4035031199455261e-06, 1.4565885066986084e-06, 1.5096738934516907e-06, 1.562759280204773e-06, 1.6158446669578552e-06, 1.6689300537109375e-06]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 3.0, 7.0, 11.0, 18.0, 11.0, 13.0, 18.0, 14.0, 22.0, 22.0, 23.0, 29.0, 27.0, 36.0, 32.0, 43.0, 52.0, 33.0, 50.0, 49.0, 53.0, 35.0, 58.0, 36.0, 38.0, 29.0, 32.0, 35.0, 26.0, 16.0, 20.0, 20.0, 18.0, 13.0, 16.0, 9.0, 1.0, 11.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6279296875, -1.5745697021484375, -1.521209716796875, -1.4678497314453125, -1.41448974609375, -1.3611297607421875, -1.307769775390625, -1.2544097900390625, -1.2010498046875, -1.1476898193359375, -1.094329833984375, -1.0409698486328125, -0.98760986328125, -0.9342498779296875, -0.880889892578125, -0.8275299072265625, -0.774169921875, -0.7208099365234375, -0.667449951171875, -0.6140899658203125, -0.56072998046875, -0.5073699951171875, -0.454010009765625, -0.4006500244140625, -0.3472900390625, -0.2939300537109375, -0.240570068359375, -0.1872100830078125, -0.13385009765625, -0.0804901123046875, -0.027130126953125, 0.0262298583984375, 0.07958984375, 0.1329498291015625, 0.186309814453125, 0.2396697998046875, 0.29302978515625, 0.3463897705078125, 0.399749755859375, 0.4531097412109375, 0.5064697265625, 0.5598297119140625, 0.613189697265625, 0.6665496826171875, 0.71990966796875, 0.7732696533203125, 0.826629638671875, 0.8799896240234375, 0.933349609375, 0.9867095947265625, 1.040069580078125, 1.0934295654296875, 1.14678955078125, 1.2001495361328125, 1.253509521484375, 1.3068695068359375, 1.3602294921875, 1.4135894775390625, 1.466949462890625, 1.5203094482421875, 1.57366943359375, 1.6270294189453125, 1.680389404296875, 1.7337493896484375, 1.787109375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 8.0, 21.0, 33.0, 67.0, 137.0, 248.0, 445.0, 895.0, 1771.0, 3882.0, 8410.0, 20381.0, 57107.0, 200932.0, 518110.0, 157621.0, 47416.0, 17240.0, 7194.0, 3339.0, 1616.0, 797.0, 405.0, 223.0, 120.0, 66.0, 23.0, 21.0, 8.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.636383056640625, -1.58428955078125, -1.532196044921875, -1.4801025390625, -1.428009033203125, -1.37591552734375, -1.323822021484375, -1.271728515625, -1.219635009765625, -1.16754150390625, -1.115447998046875, -1.0633544921875, -1.011260986328125, -0.95916748046875, -0.907073974609375, -0.85498046875, -0.802886962890625, -0.75079345703125, -0.698699951171875, -0.6466064453125, -0.594512939453125, -0.54241943359375, -0.490325927734375, -0.438232421875, -0.386138916015625, -0.33404541015625, -0.281951904296875, -0.2298583984375, -0.177764892578125, -0.12567138671875, -0.073577880859375, -0.021484375, 0.030609130859375, 0.08270263671875, 0.134796142578125, 0.1868896484375, 0.238983154296875, 0.29107666015625, 0.343170166015625, 0.395263671875, 0.447357177734375, 0.49945068359375, 0.551544189453125, 0.6036376953125, 0.655731201171875, 0.70782470703125, 0.759918212890625, 0.81201171875, 0.864105224609375, 0.91619873046875, 0.968292236328125, 1.0203857421875, 1.072479248046875, 1.12457275390625, 1.176666259765625, 1.228759765625, 1.280853271484375, 1.33294677734375, 1.385040283203125, 1.4371337890625, 1.489227294921875, 1.54132080078125, 1.593414306640625, 1.6455078125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 11.0, 8.0, 11.0, 18.0, 4.0, 17.0, 17.0, 19.0, 17.0, 25.0, 32.0, 32.0, 43.0, 42.0, 49.0, 48.0, 80.0, 141.0, 1575.0, 314.0, 103.0, 53.0, 41.0, 46.0, 46.0, 30.0, 28.0, 32.0, 31.0, 21.0, 18.0, 12.0, 11.0, 10.0, 13.0, 9.0, 8.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.7811279296875, -4.609130859375, -4.4371337890625, -4.26513671875, -4.0931396484375, -3.921142578125, -3.7491455078125, -3.5771484375, -3.4051513671875, -3.233154296875, -3.0611572265625, -2.88916015625, -2.7171630859375, -2.545166015625, -2.3731689453125, -2.201171875, -2.0291748046875, -1.857177734375, -1.6851806640625, -1.51318359375, -1.3411865234375, -1.169189453125, -0.9971923828125, -0.8251953125, -0.6531982421875, -0.481201171875, -0.3092041015625, -0.13720703125, 0.0347900390625, 0.206787109375, 0.3787841796875, 0.55078125, 0.7227783203125, 0.894775390625, 1.0667724609375, 1.23876953125, 1.4107666015625, 1.582763671875, 1.7547607421875, 1.9267578125, 2.0987548828125, 2.270751953125, 2.4427490234375, 2.61474609375, 2.7867431640625, 2.958740234375, 3.1307373046875, 3.302734375, 3.4747314453125, 3.646728515625, 3.8187255859375, 3.99072265625, 4.1627197265625, 4.334716796875, 4.5067138671875, 4.6787109375, 4.8507080078125, 5.022705078125, 5.1947021484375, 5.36669921875, 5.5386962890625, 5.710693359375, 5.8826904296875, 6.0546875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 6.0, 11.0, 14.0, 11.0, 13.0, 13.0, 17.0, 22.0, 37.0, 42.0, 62.0, 94.0, 137.0, 254.0, 481.0, 955.0, 2907.0, 20540.0, 1369798.0, 1723147.0, 21727.0, 3099.0, 1029.0, 501.0, 261.0, 152.0, 87.0, 71.0, 38.0, 31.0, 31.0, 16.0, 11.0, 11.0, 12.0, 11.0, 10.0, 12.0, 6.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-8.8046875, -8.5601806640625, -8.315673828125, -8.0711669921875, -7.82666015625, -7.5821533203125, -7.337646484375, -7.0931396484375, -6.8486328125, -6.6041259765625, -6.359619140625, -6.1151123046875, -5.87060546875, -5.6260986328125, -5.381591796875, -5.1370849609375, -4.892578125, -4.6480712890625, -4.403564453125, -4.1590576171875, -3.91455078125, -3.6700439453125, -3.425537109375, -3.1810302734375, -2.9365234375, -2.6920166015625, -2.447509765625, -2.2030029296875, -1.95849609375, -1.7139892578125, -1.469482421875, -1.2249755859375, -0.98046875, -0.7359619140625, -0.491455078125, -0.2469482421875, -0.00244140625, 0.2420654296875, 0.486572265625, 0.7310791015625, 0.9755859375, 1.2200927734375, 1.464599609375, 1.7091064453125, 1.95361328125, 2.1981201171875, 2.442626953125, 2.6871337890625, 2.931640625, 3.1761474609375, 3.420654296875, 3.6651611328125, 3.90966796875, 4.1541748046875, 4.398681640625, 4.6431884765625, 4.8876953125, 5.1322021484375, 5.376708984375, 5.6212158203125, 5.86572265625, 6.1102294921875, 6.354736328125, 6.5992431640625, 6.84375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 27.0, 167.0, 436.0, 317.0, 62.0, 9.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.762038230895996, -8.757911682128906, -7.7537841796875, -6.749657154083252, -5.745530128479004, -4.741403102874756, -3.737276077270508, -2.7331490516662598, -1.7290220260620117, -0.7248950004577637, 0.2792320251464844, 1.2833590507507324, 2.2874860763549805, 3.2916131019592285, 4.295740127563477, 5.299867153167725, 6.303994178771973, 7.308121204376221, 8.312248229980469, 9.316375732421875, 10.320502281188965, 11.324628829956055, 12.328756332397461, 13.332883834838867, 14.337010383605957, 15.341136932373047, 16.345264434814453, 17.34939193725586, 18.353519439697266, 19.35764503479004, 20.361772537231445, 21.36590003967285, 22.37002944946289, 23.374156951904297, 24.378284454345703, 25.382410049438477, 26.386537551879883, 27.39066505432129, 28.394790649414062, 29.39891815185547, 30.403045654296875, 31.40717315673828, 32.41130065917969, 33.415428161621094, 34.4195556640625, 35.42367935180664, 36.42780685424805, 37.43193435668945, 38.43606185913086, 39.440189361572266, 40.44431686401367, 41.44844436645508, 42.45256805419922, 43.456695556640625, 44.46082305908203, 45.46495056152344, 46.469078063964844, 47.47320556640625, 48.477333068847656, 49.48146057128906, 50.48558807373047, 51.48971176147461, 52.493839263916016, 53.49796676635742, 54.50209426879883]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 9.0, 11.0, 12.0, 19.0, 20.0, 22.0, 23.0, 33.0, 31.0, 36.0, 42.0, 36.0, 38.0, 39.0, 40.0, 47.0, 56.0, 48.0, 39.0, 43.0, 42.0, 34.0, 41.0, 29.0, 27.0, 29.0, 24.0, 19.0, 15.0, 17.0, 9.0, 6.0, 12.0, 6.0, 8.0, 6.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.299198150634766, -14.72690200805664, -14.154605865478516, -13.58230972290039, -13.010013580322266, -12.43771743774414, -11.865422248840332, -11.293126106262207, -10.720829963684082, -10.148533821105957, -9.576237678527832, -9.003941535949707, -8.431646347045898, -7.859349727630615, -7.287054061889648, -6.714757919311523, -6.142461776733398, -5.570165634155273, -4.997869491577148, -4.425573825836182, -3.8532776832580566, -3.2809815406799316, -2.7086856365203857, -2.13638973236084, -1.5640935897827148, -0.9917975664138794, -0.41950154304504395, 0.1527944803237915, 0.725090503692627, 1.297386646270752, 1.8696825504302979, 2.4419784545898438, 3.0142765045166016, 3.5865726470947266, 4.158868789672852, 4.731164455413818, 5.303460597991943, 5.875756740570068, 6.448052406311035, 7.02034854888916, 7.592644691467285, 8.16494083404541, 8.737236976623535, 9.30953311920166, 9.881828308105469, 10.454124450683594, 11.026420593261719, 11.598716735839844, 12.171012878417969, 12.743309020996094, 13.315605163574219, 13.887901306152344, 14.460197448730469, 15.032493591308594, 15.604788780212402, 16.177085876464844, 16.74938201904297, 17.321678161621094, 17.89397430419922, 18.466270446777344, 19.03856658935547, 19.610862731933594, 20.18315887451172, 20.755455017089844, 21.327749252319336]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 14.0, 12.0, 8.0, 16.0, 16.0, 14.0, 29.0, 20.0, 29.0, 27.0, 20.0, 38.0, 44.0, 44.0, 44.0, 36.0, 59.0, 50.0, 39.0, 40.0, 61.0, 35.0, 36.0, 27.0, 35.0, 39.0, 21.0, 15.0, 25.0, 16.0, 16.0, 15.0, 13.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6748046875, -1.619598388671875, -1.56439208984375, -1.509185791015625, -1.4539794921875, -1.398773193359375, -1.34356689453125, -1.288360595703125, -1.233154296875, -1.177947998046875, -1.12274169921875, -1.067535400390625, -1.0123291015625, -0.957122802734375, -0.90191650390625, -0.846710205078125, -0.79150390625, -0.736297607421875, -0.68109130859375, -0.625885009765625, -0.5706787109375, -0.515472412109375, -0.46026611328125, -0.405059814453125, -0.349853515625, -0.294647216796875, -0.23944091796875, -0.184234619140625, -0.1290283203125, -0.073822021484375, -0.01861572265625, 0.036590576171875, 0.091796875, 0.147003173828125, 0.20220947265625, 0.257415771484375, 0.3126220703125, 0.367828369140625, 0.42303466796875, 0.478240966796875, 0.533447265625, 0.588653564453125, 0.64385986328125, 0.699066162109375, 0.7542724609375, 0.809478759765625, 0.86468505859375, 0.919891357421875, 0.97509765625, 1.030303955078125, 1.08551025390625, 1.140716552734375, 1.1959228515625, 1.251129150390625, 1.30633544921875, 1.361541748046875, 1.416748046875, 1.471954345703125, 1.52716064453125, 1.582366943359375, 1.6375732421875, 1.692779541015625, 1.74798583984375, 1.803192138671875, 1.8583984375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 14.0, 14.0, 13.0, 26.0, 41.0, 74.0, 162.0, 368.0, 843.0, 2043.0, 6060.0, 19364.0, 72140.0, 329875.0, 2063740.0, 1407815.0, 218888.0, 50741.0, 14378.0, 4558.0, 1782.0, 640.0, 306.0, 152.0, 84.0, 53.0, 32.0, 19.0, 15.0, 11.0, 4.0, 10.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.83203125, -4.675537109375, -4.51904296875, -4.362548828125, -4.2060546875, -4.049560546875, -3.89306640625, -3.736572265625, -3.580078125, -3.423583984375, -3.26708984375, -3.110595703125, -2.9541015625, -2.797607421875, -2.64111328125, -2.484619140625, -2.328125, -2.171630859375, -2.01513671875, -1.858642578125, -1.7021484375, -1.545654296875, -1.38916015625, -1.232666015625, -1.076171875, -0.919677734375, -0.76318359375, -0.606689453125, -0.4501953125, -0.293701171875, -0.13720703125, 0.019287109375, 0.17578125, 0.332275390625, 0.48876953125, 0.645263671875, 0.8017578125, 0.958251953125, 1.11474609375, 1.271240234375, 1.427734375, 1.584228515625, 1.74072265625, 1.897216796875, 2.0537109375, 2.210205078125, 2.36669921875, 2.523193359375, 2.6796875, 2.836181640625, 2.99267578125, 3.149169921875, 3.3056640625, 3.462158203125, 3.61865234375, 3.775146484375, 3.931640625, 4.088134765625, 4.24462890625, 4.401123046875, 4.5576171875, 4.714111328125, 4.87060546875, 5.027099609375, 5.18359375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 17.0, 21.0, 37.0, 65.0, 111.0, 197.0, 265.0, 431.0, 579.0, 763.0, 538.0, 384.0, 257.0, 162.0, 94.0, 60.0, 35.0, 12.0, 13.0, 3.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.703125, -8.44903564453125, -8.1949462890625, -7.94085693359375, -7.686767578125, -7.43267822265625, -7.1785888671875, -6.92449951171875, -6.67041015625, -6.41632080078125, -6.1622314453125, -5.90814208984375, -5.654052734375, -5.39996337890625, -5.1458740234375, -4.89178466796875, -4.6376953125, -4.38360595703125, -4.1295166015625, -3.87542724609375, -3.621337890625, -3.36724853515625, -3.1131591796875, -2.85906982421875, -2.60498046875, -2.35089111328125, -2.0968017578125, -1.84271240234375, -1.588623046875, -1.33453369140625, -1.0804443359375, -0.82635498046875, -0.572265625, -0.31817626953125, -0.0640869140625, 0.19000244140625, 0.444091796875, 0.69818115234375, 0.9522705078125, 1.20635986328125, 1.46044921875, 1.71453857421875, 1.9686279296875, 2.22271728515625, 2.476806640625, 2.73089599609375, 2.9849853515625, 3.23907470703125, 3.4931640625, 3.74725341796875, 4.0013427734375, 4.25543212890625, 4.509521484375, 4.76361083984375, 5.0177001953125, 5.27178955078125, 5.52587890625, 5.77996826171875, 6.0340576171875, 6.28814697265625, 6.542236328125, 6.79632568359375, 7.0504150390625, 7.30450439453125, 7.55859375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 7.0, 7.0, 10.0, 13.0, 21.0, 35.0, 52.0, 75.0, 115.0, 188.0, 304.0, 484.0, 1012.0, 2331.0, 8984.0, 66510.0, 856458.0, 2940774.0, 281935.0, 26846.0, 4742.0, 1599.0, 724.0, 408.0, 234.0, 148.0, 70.0, 60.0, 47.0, 23.0, 21.0, 14.0, 9.0, 4.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.0234375, -14.6094970703125, -14.195556640625, -13.7816162109375, -13.36767578125, -12.9537353515625, -12.539794921875, -12.1258544921875, -11.7119140625, -11.2979736328125, -10.884033203125, -10.4700927734375, -10.05615234375, -9.6422119140625, -9.228271484375, -8.8143310546875, -8.400390625, -7.9864501953125, -7.572509765625, -7.1585693359375, -6.74462890625, -6.3306884765625, -5.916748046875, -5.5028076171875, -5.0888671875, -4.6749267578125, -4.260986328125, -3.8470458984375, -3.43310546875, -3.0191650390625, -2.605224609375, -2.1912841796875, -1.77734375, -1.3634033203125, -0.949462890625, -0.5355224609375, -0.12158203125, 0.2923583984375, 0.706298828125, 1.1202392578125, 1.5341796875, 1.9481201171875, 2.362060546875, 2.7760009765625, 3.18994140625, 3.6038818359375, 4.017822265625, 4.4317626953125, 4.845703125, 5.2596435546875, 5.673583984375, 6.0875244140625, 6.50146484375, 6.9154052734375, 7.329345703125, 7.7432861328125, 8.1572265625, 8.5711669921875, 8.985107421875, 9.3990478515625, 9.81298828125, 10.2269287109375, 10.640869140625, 11.0548095703125, 11.46875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 27.0, 100.0, 252.0, 313.0, 222.0, 72.0, 19.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.40717315673828, -99.50914764404297, -96.61112976074219, -93.71310424804688, -90.81507873535156, -87.91705322265625, -85.01902770996094, -82.12100982666016, -79.22298431396484, -76.32495880126953, -73.42694091796875, -70.52891540527344, -67.63088989257812, -64.73286437988281, -61.834842681884766, -58.93682098388672, -56.038795471191406, -53.140769958496094, -50.24274826049805, -47.3447265625, -44.44670104980469, -41.548675537109375, -38.65065383911133, -35.75263214111328, -32.85460662841797, -29.95658302307129, -27.05855941772461, -24.16053581237793, -21.26251220703125, -18.36448860168457, -15.46646499633789, -12.568441390991211, -9.67041015625, -6.77238655090332, -3.8743629455566406, -0.9763393402099609, 1.9216842651367188, 4.819707870483398, 7.717731475830078, 10.615755081176758, 13.513778686523438, 16.411802291870117, 19.309825897216797, 22.207849502563477, 25.105873107910156, 28.003896713256836, 30.901920318603516, 33.79994201660156, 36.697967529296875, 39.59599304199219, 42.494014739990234, 45.39203643798828, 48.290061950683594, 51.188087463378906, 54.08610916137695, 56.984130859375, 59.88215637207031, 62.780181884765625, 65.67820739746094, 68.57622528076172, 71.47425079345703, 74.37227630615234, 77.27029418945312, 80.16831970214844, 83.06634521484375]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 7.0, 5.0, 10.0, 9.0, 14.0, 13.0, 12.0, 6.0, 19.0, 29.0, 25.0, 17.0, 36.0, 27.0, 25.0, 26.0, 26.0, 43.0, 34.0, 44.0, 40.0, 29.0, 47.0, 37.0, 35.0, 38.0, 28.0, 36.0, 36.0, 33.0, 29.0, 24.0, 13.0, 23.0, 23.0, 8.0, 13.0, 15.0, 11.0, 11.0, 9.0, 8.0, 4.0, 3.0, 6.0, 3.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.128562927246094, -17.561918258666992, -16.995275497436523, -16.428630828857422, -15.86198616027832, -15.295342445373535, -14.72869873046875, -14.162054061889648, -13.595410346984863, -13.028766632080078, -12.462121963500977, -11.895478248596191, -11.328834533691406, -10.762189865112305, -10.19554615020752, -9.628902435302734, -9.062257766723633, -8.495614051818848, -7.928969383239746, -7.362325668334961, -6.795681476593018, -6.229037284851074, -5.662393569946289, -5.095749378204346, -4.529105186462402, -3.962460994720459, -3.3958170413970947, -2.8291730880737305, -2.262528896331787, -1.6958847045898438, -1.1292407512664795, -0.5625967979431152, 0.004047393798828125, 0.5706914663314819, 1.1373355388641357, 1.7039796113967896, 2.2706236839294434, 2.8372678756713867, 3.403911828994751, 3.9705557823181152, 4.537199974060059, 5.103844165802002, 5.670488357543945, 6.2371320724487305, 6.803776264190674, 7.370420455932617, 7.937064170837402, 8.503707885742188, 9.070352554321289, 9.636996269226074, 10.203640937805176, 10.770284652709961, 11.336929321289062, 11.903573036193848, 12.470216751098633, 13.036861419677734, 13.60350513458252, 14.170148849487305, 14.736793518066406, 15.303437232971191, 15.870080947875977, 16.436725616455078, 17.00337028503418, 17.57001304626465, 18.13665771484375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 5.0, 11.0, 11.0, 12.0, 21.0, 12.0, 31.0, 18.0, 20.0, 33.0, 24.0, 40.0, 31.0, 51.0, 42.0, 45.0, 56.0, 53.0, 45.0, 48.0, 45.0, 45.0, 32.0, 35.0, 25.0, 25.0, 27.0, 21.0, 13.0, 22.0, 23.0, 16.0, 11.0, 7.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71484375, -1.654327392578125, -1.59381103515625, -1.533294677734375, -1.4727783203125, -1.412261962890625, -1.35174560546875, -1.291229248046875, -1.230712890625, -1.170196533203125, -1.10968017578125, -1.049163818359375, -0.9886474609375, -0.928131103515625, -0.86761474609375, -0.807098388671875, -0.74658203125, -0.686065673828125, -0.62554931640625, -0.565032958984375, -0.5045166015625, -0.444000244140625, -0.38348388671875, -0.322967529296875, -0.262451171875, -0.201934814453125, -0.14141845703125, -0.080902099609375, -0.0203857421875, 0.040130615234375, 0.10064697265625, 0.161163330078125, 0.2216796875, 0.282196044921875, 0.34271240234375, 0.403228759765625, 0.4637451171875, 0.524261474609375, 0.58477783203125, 0.645294189453125, 0.705810546875, 0.766326904296875, 0.82684326171875, 0.887359619140625, 0.9478759765625, 1.008392333984375, 1.06890869140625, 1.129425048828125, 1.18994140625, 1.250457763671875, 1.31097412109375, 1.371490478515625, 1.4320068359375, 1.492523193359375, 1.55303955078125, 1.613555908203125, 1.674072265625, 1.734588623046875, 1.79510498046875, 1.855621337890625, 1.9161376953125, 1.976654052734375, 2.03717041015625, 2.097686767578125, 2.158203125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 17.0, 17.0, 39.0, 30.0, 78.0, 101.0, 157.0, 211.0, 332.0, 500.0, 718.0, 1138.0, 1674.0, 2586.0, 3881.0, 5990.0, 9407.0, 14610.0, 23075.0, 37832.0, 65151.0, 126686.0, 319290.0, 209169.0, 92152.0, 50534.0, 30112.0, 18998.0, 11927.0, 7698.0, 4896.0, 3222.0, 2136.0, 1361.0, 919.0, 615.0, 446.0, 254.0, 196.0, 123.0, 88.0, 63.0, 41.0, 26.0, 13.0, 19.0, 5.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.01514434814453125, -0.014667749404907227, -0.014191150665283203, -0.01371455192565918, -0.013237953186035156, -0.012761354446411133, -0.01228475570678711, -0.011808156967163086, -0.011331558227539062, -0.010854959487915039, -0.010378360748291016, -0.009901762008666992, -0.009425163269042969, -0.008948564529418945, -0.008471965789794922, -0.007995367050170898, -0.007518768310546875, -0.0070421695709228516, -0.006565570831298828, -0.006088972091674805, -0.005612373352050781, -0.005135774612426758, -0.004659175872802734, -0.004182577133178711, -0.0037059783935546875, -0.003229379653930664, -0.0027527809143066406, -0.002276182174682617, -0.0017995834350585938, -0.0013229846954345703, -0.0008463859558105469, -0.00036978721618652344, 0.0001068115234375, 0.0005834102630615234, 0.0010600090026855469, 0.0015366077423095703, 0.0020132064819335938, 0.002489805221557617, 0.0029664039611816406, 0.003443002700805664, 0.0039196014404296875, 0.004396200180053711, 0.004872798919677734, 0.005349397659301758, 0.005825996398925781, 0.006302595138549805, 0.006779193878173828, 0.0072557926177978516, 0.007732391357421875, 0.008208990097045898, 0.008685588836669922, 0.009162187576293945, 0.009638786315917969, 0.010115385055541992, 0.010591983795166016, 0.011068582534790039, 0.011545181274414062, 0.012021780014038086, 0.01249837875366211, 0.012974977493286133, 0.013451576232910156, 0.01392817497253418, 0.014404773712158203, 0.014881372451782227, 0.01535797119140625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 7.0, 5.0, 5.0, 12.0, 7.0, 11.0, 15.0, 16.0, 23.0, 27.0, 29.0, 31.0, 31.0, 37.0, 33.0, 39.0, 47.0, 37.0, 39.0, 1071.0, 33.0, 58.0, 53.0, 34.0, 26.0, 21.0, 34.0, 30.0, 39.0, 26.0, 20.0, 19.0, 15.0, 16.0, 17.0, 8.0, 14.0, 7.0, 9.0, 3.0, 5.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.283203125, -1.2464752197265625, -1.209747314453125, -1.1730194091796875, -1.13629150390625, -1.0995635986328125, -1.062835693359375, -1.0261077880859375, -0.9893798828125, -0.9526519775390625, -0.915924072265625, -0.8791961669921875, -0.84246826171875, -0.8057403564453125, -0.769012451171875, -0.7322845458984375, -0.695556640625, -0.6588287353515625, -0.622100830078125, -0.5853729248046875, -0.54864501953125, -0.5119171142578125, -0.475189208984375, -0.4384613037109375, -0.4017333984375, -0.3650054931640625, -0.328277587890625, -0.2915496826171875, -0.25482177734375, -0.2180938720703125, -0.181365966796875, -0.1446380615234375, -0.10791015625, -0.0711822509765625, -0.034454345703125, 0.0022735595703125, 0.03900146484375, 0.0757293701171875, 0.112457275390625, 0.1491851806640625, 0.1859130859375, 0.2226409912109375, 0.259368896484375, 0.2960968017578125, 0.33282470703125, 0.3695526123046875, 0.406280517578125, 0.4430084228515625, 0.479736328125, 0.5164642333984375, 0.553192138671875, 0.5899200439453125, 0.62664794921875, 0.6633758544921875, 0.700103759765625, 0.7368316650390625, 0.7735595703125, 0.8102874755859375, 0.847015380859375, 0.8837432861328125, 0.92047119140625, 0.9571990966796875, 0.993927001953125, 1.0306549072265625, 1.0673828125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 9.0, 22.0, 19.0, 38.0, 58.0, 72.0, 152.0, 219.0, 311.0, 428.0, 688.0, 962.0, 1285.0, 1881.0, 2708.0, 3812.0, 5587.0, 8118.0, 11956.0, 17950.0, 27445.0, 42806.0, 70711.0, 133256.0, 1335362.0, 189005.0, 90382.0, 52235.0, 32559.0, 21319.0, 14336.0, 9584.0, 6564.0, 4561.0, 3164.0, 2241.0, 1636.0, 1157.0, 803.0, 561.0, 388.0, 256.0, 189.0, 117.0, 87.0, 36.0, 39.0, 25.0, 17.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00872802734375, -0.008443832397460938, -0.008159637451171875, -0.007875442504882812, -0.00759124755859375, -0.0073070526123046875, -0.007022857666015625, -0.0067386627197265625, -0.0064544677734375, -0.0061702728271484375, -0.005886077880859375, -0.0056018829345703125, -0.00531768798828125, -0.0050334930419921875, -0.004749298095703125, -0.0044651031494140625, -0.004180908203125, -0.0038967132568359375, -0.003612518310546875, -0.0033283233642578125, -0.00304412841796875, -0.0027599334716796875, -0.002475738525390625, -0.0021915435791015625, -0.0019073486328125, -0.0016231536865234375, -0.001338958740234375, -0.0010547637939453125, -0.00077056884765625, -0.0004863739013671875, -0.000202178955078125, 8.20159912109375e-05, 0.0003662109375, 0.0006504058837890625, 0.000934600830078125, 0.0012187957763671875, 0.00150299072265625, 0.0017871856689453125, 0.002071380615234375, 0.0023555755615234375, 0.0026397705078125, 0.0029239654541015625, 0.003208160400390625, 0.0034923553466796875, 0.00377655029296875, 0.0040607452392578125, 0.004344940185546875, 0.0046291351318359375, 0.004913330078125, 0.0051975250244140625, 0.005481719970703125, 0.0057659149169921875, 0.00605010986328125, 0.0063343048095703125, 0.006618499755859375, 0.0069026947021484375, 0.0071868896484375, 0.0074710845947265625, 0.007755279541015625, 0.008039474487304688, 0.00832366943359375, 0.008607864379882812, 0.008892059326171875, 0.009176254272460938, 0.00946044921875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 939.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 18.0, 25.0, 14.0, 10.0, 26.0, 28.0, 76.0, 169.0, 4710.0, 21720.0, 1016647.0, 4077.0, 822.0, 40.0, 66.0, 26.0, 34.0, 6.0, 17.0, 5.0, 19.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3245811462402344e-06, -2.2351741790771484e-06, -2.1457672119140625e-06, -2.0563602447509766e-06, -1.9669532775878906e-06, -1.8775463104248047e-06, -1.7881393432617188e-06, -1.6987323760986328e-06, -1.6093254089355469e-06, -1.519918441772461e-06, -1.430511474609375e-06, -1.341104507446289e-06, -1.2516975402832031e-06, -1.1622905731201172e-06, -1.0728836059570312e-06, -9.834766387939453e-07, -8.940696716308594e-07, -8.046627044677734e-07, -7.152557373046875e-07, -6.258487701416016e-07, -5.364418029785156e-07, -4.470348358154297e-07, -3.5762786865234375e-07, -2.682209014892578e-07, -1.7881393432617188e-07, -8.940696716308594e-08, 0.0, 8.940696716308594e-08, 1.7881393432617188e-07, 2.682209014892578e-07, 3.5762786865234375e-07, 4.470348358154297e-07, 5.364418029785156e-07, 6.258487701416016e-07, 7.152557373046875e-07, 8.046627044677734e-07, 8.940696716308594e-07, 9.834766387939453e-07, 1.0728836059570312e-06, 1.1622905731201172e-06, 1.2516975402832031e-06, 1.341104507446289e-06, 1.430511474609375e-06, 1.519918441772461e-06, 1.6093254089355469e-06, 1.6987323760986328e-06, 1.7881393432617188e-06, 1.8775463104248047e-06, 1.9669532775878906e-06, 2.0563602447509766e-06, 2.1457672119140625e-06, 2.2351741790771484e-06, 2.3245811462402344e-06, 2.4139881134033203e-06, 2.5033950805664062e-06, 2.592802047729492e-06, 2.682209014892578e-06, 2.771615982055664e-06, 2.86102294921875e-06, 2.950429916381836e-06, 3.039836883544922e-06, 3.129243850708008e-06, 3.2186508178710938e-06, 3.3080577850341797e-06, 3.3974647521972656e-06]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 5.0, 11.0, 11.0, 12.0, 21.0, 12.0, 31.0, 18.0, 20.0, 33.0, 24.0, 40.0, 31.0, 51.0, 42.0, 45.0, 56.0, 53.0, 45.0, 48.0, 45.0, 45.0, 32.0, 35.0, 25.0, 25.0, 27.0, 21.0, 13.0, 22.0, 23.0, 16.0, 11.0, 7.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71484375, -1.654327392578125, -1.59381103515625, -1.533294677734375, -1.4727783203125, -1.412261962890625, -1.35174560546875, -1.291229248046875, -1.230712890625, -1.170196533203125, -1.10968017578125, -1.049163818359375, -0.9886474609375, -0.928131103515625, -0.86761474609375, -0.807098388671875, -0.74658203125, -0.686065673828125, -0.62554931640625, -0.565032958984375, -0.5045166015625, -0.444000244140625, -0.38348388671875, -0.322967529296875, -0.262451171875, -0.201934814453125, -0.14141845703125, -0.080902099609375, -0.0203857421875, 0.040130615234375, 0.10064697265625, 0.161163330078125, 0.2216796875, 0.282196044921875, 0.34271240234375, 0.403228759765625, 0.4637451171875, 0.524261474609375, 0.58477783203125, 0.645294189453125, 0.705810546875, 0.766326904296875, 0.82684326171875, 0.887359619140625, 0.9478759765625, 1.008392333984375, 1.06890869140625, 1.129425048828125, 1.18994140625, 1.250457763671875, 1.31097412109375, 1.371490478515625, 1.4320068359375, 1.492523193359375, 1.55303955078125, 1.613555908203125, 1.674072265625, 1.734588623046875, 1.79510498046875, 1.855621337890625, 1.9161376953125, 1.976654052734375, 2.03717041015625, 2.097686767578125, 2.158203125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 10.0, 9.0, 11.0, 17.0, 29.0, 36.0, 52.0, 69.0, 98.0, 178.0, 277.0, 430.0, 686.0, 1109.0, 1763.0, 3027.0, 5195.0, 9552.0, 18944.0, 40529.0, 104983.0, 337324.0, 336929.0, 105410.0, 40660.0, 18408.0, 9605.0, 5390.0, 3043.0, 1801.0, 1097.0, 665.0, 402.0, 258.0, 153.0, 125.0, 98.0, 59.0, 40.0, 22.0, 18.0, 15.0, 14.0, 7.0, 4.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.67828369140625, -1.6241455078125, -1.57000732421875, -1.515869140625, -1.46173095703125, -1.4075927734375, -1.35345458984375, -1.29931640625, -1.24517822265625, -1.1910400390625, -1.13690185546875, -1.082763671875, -1.02862548828125, -0.9744873046875, -0.92034912109375, -0.8662109375, -0.81207275390625, -0.7579345703125, -0.70379638671875, -0.649658203125, -0.59552001953125, -0.5413818359375, -0.48724365234375, -0.43310546875, -0.37896728515625, -0.3248291015625, -0.27069091796875, -0.216552734375, -0.16241455078125, -0.1082763671875, -0.05413818359375, 0.0, 0.05413818359375, 0.1082763671875, 0.16241455078125, 0.216552734375, 0.27069091796875, 0.3248291015625, 0.37896728515625, 0.43310546875, 0.48724365234375, 0.5413818359375, 0.59552001953125, 0.649658203125, 0.70379638671875, 0.7579345703125, 0.81207275390625, 0.8662109375, 0.92034912109375, 0.9744873046875, 1.02862548828125, 1.082763671875, 1.13690185546875, 1.1910400390625, 1.24517822265625, 1.29931640625, 1.35345458984375, 1.4075927734375, 1.46173095703125, 1.515869140625, 1.57000732421875, 1.6241455078125, 1.67828369140625, 1.732421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 1.0, 7.0, 6.0, 8.0, 13.0, 17.0, 21.0, 9.0, 13.0, 28.0, 20.0, 22.0, 36.0, 30.0, 38.0, 49.0, 45.0, 70.0, 116.0, 294.0, 1537.0, 171.0, 96.0, 54.0, 39.0, 52.0, 44.0, 29.0, 22.0, 29.0, 25.0, 27.0, 11.0, 10.0, 9.0, 9.0, 6.0, 8.0, 5.0, 6.0, 4.0, 8.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.484375, -6.2769775390625, -6.069580078125, -5.8621826171875, -5.65478515625, -5.4473876953125, -5.239990234375, -5.0325927734375, -4.8251953125, -4.6177978515625, -4.410400390625, -4.2030029296875, -3.99560546875, -3.7882080078125, -3.580810546875, -3.3734130859375, -3.166015625, -2.9586181640625, -2.751220703125, -2.5438232421875, -2.33642578125, -2.1290283203125, -1.921630859375, -1.7142333984375, -1.5068359375, -1.2994384765625, -1.092041015625, -0.8846435546875, -0.67724609375, -0.4698486328125, -0.262451171875, -0.0550537109375, 0.15234375, 0.3597412109375, 0.567138671875, 0.7745361328125, 0.98193359375, 1.1893310546875, 1.396728515625, 1.6041259765625, 1.8115234375, 2.0189208984375, 2.226318359375, 2.4337158203125, 2.64111328125, 2.8485107421875, 3.055908203125, 3.2633056640625, 3.470703125, 3.6781005859375, 3.885498046875, 4.0928955078125, 4.30029296875, 4.5076904296875, 4.715087890625, 4.9224853515625, 5.1298828125, 5.3372802734375, 5.544677734375, 5.7520751953125, 5.95947265625, 6.1668701171875, 6.374267578125, 6.5816650390625, 6.7890625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 3.0, 7.0, 7.0, 6.0, 10.0, 7.0, 15.0, 24.0, 27.0, 55.0, 46.0, 71.0, 89.0, 160.0, 267.0, 500.0, 1933.0, 21300.0, 2472625.0, 635274.0, 10771.0, 1351.0, 392.0, 218.0, 172.0, 95.0, 66.0, 43.0, 34.0, 26.0, 11.0, 22.0, 16.0, 19.0, 8.0, 9.0, 5.0, 2.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.609375, -10.2867431640625, -9.964111328125, -9.6414794921875, -9.31884765625, -8.9962158203125, -8.673583984375, -8.3509521484375, -8.0283203125, -7.7056884765625, -7.383056640625, -7.0604248046875, -6.73779296875, -6.4151611328125, -6.092529296875, -5.7698974609375, -5.447265625, -5.1246337890625, -4.802001953125, -4.4793701171875, -4.15673828125, -3.8341064453125, -3.511474609375, -3.1888427734375, -2.8662109375, -2.5435791015625, -2.220947265625, -1.8983154296875, -1.57568359375, -1.2530517578125, -0.930419921875, -0.6077880859375, -0.28515625, 0.0374755859375, 0.360107421875, 0.6827392578125, 1.00537109375, 1.3280029296875, 1.650634765625, 1.9732666015625, 2.2958984375, 2.6185302734375, 2.941162109375, 3.2637939453125, 3.58642578125, 3.9090576171875, 4.231689453125, 4.5543212890625, 4.876953125, 5.1995849609375, 5.522216796875, 5.8448486328125, 6.16748046875, 6.4901123046875, 6.812744140625, 7.1353759765625, 7.4580078125, 7.7806396484375, 8.103271484375, 8.4259033203125, 8.74853515625, 9.0711669921875, 9.393798828125, 9.7164306640625, 10.0390625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 78.0, 895.0, 42.0, 1.0, 0.0, 0.0, 1.0], "bins": [-207.54798889160156, -203.99278259277344, -200.43759155273438, -196.88238525390625, -193.32717895507812, -189.77198791503906, -186.21678161621094, -182.66159057617188, -179.10638427734375, -175.55117797851562, -171.99598693847656, -168.44078063964844, -164.88558959960938, -161.33038330078125, -157.77517700195312, -154.21998596191406, -150.66477966308594, -147.1095733642578, -143.55438232421875, -139.99917602539062, -136.4439697265625, -132.88877868652344, -129.3335723876953, -125.77837371826172, -122.22317504882812, -118.66797637939453, -115.11277770996094, -111.55757141113281, -108.00237274169922, -104.44717407226562, -100.8919677734375, -97.3367691040039, -93.78157043457031, -90.22637176513672, -86.67117309570312, -83.115966796875, -79.5607681274414, -76.00556945800781, -72.45036315917969, -68.8951644897461, -65.3399658203125, -61.784767150878906, -58.22956466674805, -54.67436218261719, -51.119163513183594, -47.56396484375, -44.00876235961914, -40.45355987548828, -36.89836502075195, -33.343162536621094, -29.7879638671875, -26.232763290405273, -22.677562713623047, -19.12236213684082, -15.567161560058594, -12.011960983276367, -8.45676040649414, -4.901559829711914, -1.3463592529296875, 2.208841323852539, 5.764041900634766, 9.319242477416992, 12.874443054199219, 16.429643630981445, 19.984844207763672]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 9.0, 6.0, 13.0, 8.0, 10.0, 11.0, 20.0, 21.0, 23.0, 25.0, 26.0, 38.0, 44.0, 32.0, 36.0, 42.0, 40.0, 36.0, 48.0, 37.0, 48.0, 34.0, 42.0, 32.0, 42.0, 33.0, 33.0, 33.0, 22.0, 22.0, 28.0, 16.0, 21.0, 13.0, 15.0, 9.0, 7.0, 6.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.67119026184082, -20.99648666381836, -20.321781158447266, -19.647077560424805, -18.97237205505371, -18.29766845703125, -17.622962951660156, -16.948259353637695, -16.2735538482666, -15.598849296569824, -14.924144744873047, -14.24944019317627, -13.574735641479492, -12.900031089782715, -12.225326538085938, -11.550622940063477, -10.8759183883667, -10.201213836669922, -9.526509284973145, -8.851804733276367, -8.17710018157959, -7.5023956298828125, -6.827691555023193, -6.152987003326416, -5.478282451629639, -4.803577899932861, -4.128873348236084, -3.4541690349578857, -2.7794644832611084, -2.104759931564331, -1.4300556182861328, -0.7553510665893555, -0.08064651489257812, 0.5940579771995544, 1.268762469291687, 1.9434669017791748, 2.618171453475952, 3.2928760051727295, 3.9675803184509277, 4.642284870147705, 5.316989421844482, 5.99169397354126, 6.666398525238037, 7.341102600097656, 8.015807151794434, 8.690511703491211, 9.365216255187988, 10.039920806884766, 10.714625358581543, 11.38932991027832, 12.064034461975098, 12.738739013671875, 13.413443565368652, 14.08814811706543, 14.76285171508789, 15.437557220458984, 16.112260818481445, 16.786964416503906, 17.461669921875, 18.13637351989746, 18.811079025268555, 19.485782623291016, 20.16048812866211, 20.83519172668457, 21.509897232055664]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 5.0, 8.0, 6.0, 7.0, 10.0, 12.0, 17.0, 16.0, 19.0, 23.0, 28.0, 18.0, 31.0, 33.0, 32.0, 45.0, 42.0, 43.0, 52.0, 48.0, 39.0, 45.0, 44.0, 50.0, 38.0, 43.0, 35.0, 21.0, 21.0, 16.0, 26.0, 20.0, 21.0, 15.0, 22.0, 8.0, 9.0, 9.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865234375, -1.6264495849609375, -1.566375732421875, -1.5063018798828125, -1.44622802734375, -1.3861541748046875, -1.326080322265625, -1.2660064697265625, -1.2059326171875, -1.1458587646484375, -1.085784912109375, -1.0257110595703125, -0.96563720703125, -0.9055633544921875, -0.845489501953125, -0.7854156494140625, -0.725341796875, -0.6652679443359375, -0.605194091796875, -0.5451202392578125, -0.48504638671875, -0.4249725341796875, -0.364898681640625, -0.3048248291015625, -0.2447509765625, -0.1846771240234375, -0.124603271484375, -0.0645294189453125, -0.00445556640625, 0.0556182861328125, 0.115692138671875, 0.1757659912109375, 0.23583984375, 0.2959136962890625, 0.355987548828125, 0.4160614013671875, 0.47613525390625, 0.5362091064453125, 0.596282958984375, 0.6563568115234375, 0.7164306640625, 0.7765045166015625, 0.836578369140625, 0.8966522216796875, 0.95672607421875, 1.0167999267578125, 1.076873779296875, 1.1369476318359375, 1.197021484375, 1.2570953369140625, 1.317169189453125, 1.3772430419921875, 1.43731689453125, 1.4973907470703125, 1.557464599609375, 1.6175384521484375, 1.6776123046875, 1.7376861572265625, 1.797760009765625, 1.8578338623046875, 1.91790771484375, 1.9779815673828125, 2.038055419921875, 2.0981292724609375, 2.158203125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 10.0, 8.0, 12.0, 12.0, 19.0, 14.0, 14.0, 25.0, 36.0, 41.0, 64.0, 152.0, 332.0, 867.0, 2783.0, 10161.0, 41822.0, 211890.0, 1567512.0, 2013271.0, 275712.0, 51977.0, 12294.0, 3320.0, 1073.0, 373.0, 184.0, 87.0, 65.0, 26.0, 20.0, 23.0, 15.0, 15.0, 8.0, 17.0, 11.0, 7.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.52337646484375, -5.3397216796875, -5.15606689453125, -4.972412109375, -4.78875732421875, -4.6051025390625, -4.42144775390625, -4.23779296875, -4.05413818359375, -3.8704833984375, -3.68682861328125, -3.503173828125, -3.31951904296875, -3.1358642578125, -2.95220947265625, -2.7685546875, -2.58489990234375, -2.4012451171875, -2.21759033203125, -2.033935546875, -1.85028076171875, -1.6666259765625, -1.48297119140625, -1.29931640625, -1.11566162109375, -0.9320068359375, -0.74835205078125, -0.564697265625, -0.38104248046875, -0.1973876953125, -0.01373291015625, 0.169921875, 0.35357666015625, 0.5372314453125, 0.72088623046875, 0.904541015625, 1.08819580078125, 1.2718505859375, 1.45550537109375, 1.63916015625, 1.82281494140625, 2.0064697265625, 2.19012451171875, 2.373779296875, 2.55743408203125, 2.7410888671875, 2.92474365234375, 3.1083984375, 3.29205322265625, 3.4757080078125, 3.65936279296875, 3.843017578125, 4.02667236328125, 4.2103271484375, 4.39398193359375, 4.57763671875, 4.76129150390625, 4.9449462890625, 5.12860107421875, 5.312255859375, 5.49591064453125, 5.6795654296875, 5.86322021484375, 6.046875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 12.0, 11.0, 15.0, 27.0, 51.0, 75.0, 112.0, 144.0, 198.0, 299.0, 425.0, 540.0, 599.0, 458.0, 366.0, 235.0, 153.0, 115.0, 83.0, 44.0, 32.0, 22.0, 16.0, 13.0, 3.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.83209228515625, -7.6094970703125, -7.38690185546875, -7.164306640625, -6.94171142578125, -6.7191162109375, -6.49652099609375, -6.27392578125, -6.05133056640625, -5.8287353515625, -5.60614013671875, -5.383544921875, -5.16094970703125, -4.9383544921875, -4.71575927734375, -4.4931640625, -4.27056884765625, -4.0479736328125, -3.82537841796875, -3.602783203125, -3.38018798828125, -3.1575927734375, -2.93499755859375, -2.71240234375, -2.48980712890625, -2.2672119140625, -2.04461669921875, -1.822021484375, -1.59942626953125, -1.3768310546875, -1.15423583984375, -0.931640625, -0.70904541015625, -0.4864501953125, -0.26385498046875, -0.041259765625, 0.18133544921875, 0.4039306640625, 0.62652587890625, 0.84912109375, 1.07171630859375, 1.2943115234375, 1.51690673828125, 1.739501953125, 1.96209716796875, 2.1846923828125, 2.40728759765625, 2.6298828125, 2.85247802734375, 3.0750732421875, 3.29766845703125, 3.520263671875, 3.74285888671875, 3.9654541015625, 4.18804931640625, 4.41064453125, 4.63323974609375, 4.8558349609375, 5.07843017578125, 5.301025390625, 5.52362060546875, 5.7462158203125, 5.96881103515625, 6.19140625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 7.0, 15.0, 27.0, 36.0, 74.0, 105.0, 166.0, 306.0, 541.0, 1108.0, 2743.0, 8722.0, 37763.0, 234685.0, 1848467.0, 1784173.0, 225101.0, 36845.0, 8383.0, 2661.0, 1063.0, 544.0, 303.0, 141.0, 125.0, 56.0, 38.0, 20.0, 20.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.1053466796875, -7.781005859375, -7.4566650390625, -7.13232421875, -6.8079833984375, -6.483642578125, -6.1593017578125, -5.8349609375, -5.5106201171875, -5.186279296875, -4.8619384765625, -4.53759765625, -4.2132568359375, -3.888916015625, -3.5645751953125, -3.240234375, -2.9158935546875, -2.591552734375, -2.2672119140625, -1.94287109375, -1.6185302734375, -1.294189453125, -0.9698486328125, -0.6455078125, -0.3211669921875, 0.003173828125, 0.3275146484375, 0.65185546875, 0.9761962890625, 1.300537109375, 1.6248779296875, 1.94921875, 2.2735595703125, 2.597900390625, 2.9222412109375, 3.24658203125, 3.5709228515625, 3.895263671875, 4.2196044921875, 4.5439453125, 4.8682861328125, 5.192626953125, 5.5169677734375, 5.84130859375, 6.1656494140625, 6.489990234375, 6.8143310546875, 7.138671875, 7.4630126953125, 7.787353515625, 8.1116943359375, 8.43603515625, 8.7603759765625, 9.084716796875, 9.4090576171875, 9.7333984375, 10.0577392578125, 10.382080078125, 10.7064208984375, 11.03076171875, 11.3551025390625, 11.679443359375, 12.0037841796875, 12.328125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 14.0, 22.0, 69.0, 131.0, 187.0, 229.0, 185.0, 109.0, 40.0, 19.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.75244903564453, -98.5795669555664, -96.40668487548828, -94.23381042480469, -92.06092834472656, -89.88804626464844, -87.71516418457031, -85.54228210449219, -83.36940002441406, -81.19651794433594, -79.02363586425781, -76.85076141357422, -74.6778793334961, -72.50499725341797, -70.33211517333984, -68.15923309326172, -65.98635864257812, -63.8134765625, -61.64059829711914, -59.467716217041016, -57.294837951660156, -55.12195587158203, -52.949073791503906, -50.77619171142578, -48.60331344604492, -46.4304313659668, -44.25755310058594, -42.08467102050781, -39.91178894042969, -37.73891067504883, -35.5660285949707, -33.393150329589844, -31.220260620117188, -29.047380447387695, -26.874500274658203, -24.701618194580078, -22.528738021850586, -20.355857849121094, -18.18297576904297, -16.010095596313477, -13.837215423583984, -11.664335250854492, -9.491454124450684, -7.318573474884033, -5.145692825317383, -2.9728126525878906, -0.799931526184082, 1.3729496002197266, 3.5458297729492188, 5.718710422515869, 7.8915910720825195, 10.064472198486328, 12.23735237121582, 14.410232543945312, 16.583114624023438, 18.75599479675293, 20.928874969482422, 23.101755142211914, 25.274635314941406, 27.44751739501953, 29.620397567749023, 31.793277740478516, 33.96615982055664, 36.1390380859375, 38.311920166015625]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 9.0, 13.0, 15.0, 15.0, 16.0, 22.0, 23.0, 25.0, 26.0, 28.0, 37.0, 31.0, 33.0, 40.0, 47.0, 57.0, 35.0, 44.0, 38.0, 43.0, 59.0, 30.0, 28.0, 40.0, 35.0, 32.0, 22.0, 25.0, 19.0, 17.0, 16.0, 13.0, 13.0, 6.0, 5.0, 10.0, 7.0, 4.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.508941650390625, -19.897199630737305, -19.28545570373535, -18.67371368408203, -18.06197166442871, -17.45022964477539, -16.838485717773438, -16.226743698120117, -15.61500072479248, -15.003257751464844, -14.391515731811523, -13.779772758483887, -13.16802978515625, -12.55628776550293, -11.944544792175293, -11.332801818847656, -10.721059799194336, -10.1093168258667, -9.497574806213379, -8.885831832885742, -8.274089813232422, -7.662346839904785, -7.050603866577148, -6.43886137008667, -5.827118873596191, -5.215376377105713, -4.603633880615234, -3.9918909072875977, -3.380148410797119, -2.7684059143066406, -2.156663179397583, -1.5449204444885254, -0.9331779479980469, -0.3214353322982788, 0.29030728340148926, 0.9020498991012573, 1.5137925148010254, 2.125535011291504, 2.7372777462005615, 3.349020481109619, 3.9607629776000977, 4.572505474090576, 5.184247970581055, 5.795990943908691, 6.40773344039917, 7.019475936889648, 7.631218910217285, 8.242961883544922, 8.854703903198242, 9.466446876525879, 10.0781888961792, 10.689931869506836, 11.301673889160156, 11.913416862487793, 12.52515983581543, 13.13690185546875, 13.748644828796387, 14.360387802124023, 14.972129821777344, 15.58387279510498, 16.195615768432617, 16.807357788085938, 17.419099807739258, 18.03084373474121, 18.64258575439453]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 17.0, 8.0, 11.0, 23.0, 17.0, 28.0, 17.0, 18.0, 26.0, 24.0, 33.0, 35.0, 44.0, 32.0, 37.0, 39.0, 53.0, 46.0, 33.0, 36.0, 37.0, 34.0, 39.0, 29.0, 28.0, 26.0, 23.0, 25.0, 21.0, 16.0, 10.0, 17.0, 14.0, 12.0, 10.0, 14.0, 5.0, 7.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6572265625, -1.602142333984375, -1.54705810546875, -1.491973876953125, -1.4368896484375, -1.381805419921875, -1.32672119140625, -1.271636962890625, -1.216552734375, -1.161468505859375, -1.10638427734375, -1.051300048828125, -0.9962158203125, -0.941131591796875, -0.88604736328125, -0.830963134765625, -0.77587890625, -0.720794677734375, -0.66571044921875, -0.610626220703125, -0.5555419921875, -0.500457763671875, -0.44537353515625, -0.390289306640625, -0.335205078125, -0.280120849609375, -0.22503662109375, -0.169952392578125, -0.1148681640625, -0.059783935546875, -0.00469970703125, 0.050384521484375, 0.10546875, 0.160552978515625, 0.21563720703125, 0.270721435546875, 0.3258056640625, 0.380889892578125, 0.43597412109375, 0.491058349609375, 0.546142578125, 0.601226806640625, 0.65631103515625, 0.711395263671875, 0.7664794921875, 0.821563720703125, 0.87664794921875, 0.931732177734375, 0.98681640625, 1.041900634765625, 1.09698486328125, 1.152069091796875, 1.2071533203125, 1.262237548828125, 1.31732177734375, 1.372406005859375, 1.427490234375, 1.482574462890625, 1.53765869140625, 1.592742919921875, 1.6478271484375, 1.702911376953125, 1.75799560546875, 1.813079833984375, 1.8681640625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 6.0, 11.0, 17.0, 24.0, 32.0, 46.0, 58.0, 74.0, 92.0, 163.0, 257.0, 341.0, 527.0, 612.0, 896.0, 1185.0, 1793.0, 2395.0, 3390.0, 4690.0, 6566.0, 8889.0, 12340.0, 17803.0, 24879.0, 35209.0, 53042.0, 84369.0, 159263.0, 273651.0, 125893.0, 72925.0, 46757.0, 31911.0, 22157.0, 15720.0, 11538.0, 8231.0, 5805.0, 4209.0, 3049.0, 2154.0, 1526.0, 1184.0, 857.0, 596.0, 406.0, 275.0, 209.0, 156.0, 126.0, 81.0, 73.0, 42.0, 25.0, 19.0, 10.0, 6.0, 4.0, 3.0, 1.0], "bins": [-0.01157379150390625, -0.011216044425964355, -0.010858297348022461, -0.010500550270080566, -0.010142803192138672, -0.009785056114196777, -0.009427309036254883, -0.009069561958312988, -0.008711814880371094, -0.0083540678024292, -0.007996320724487305, -0.00763857364654541, -0.007280826568603516, -0.006923079490661621, -0.0065653324127197266, -0.006207585334777832, -0.0058498382568359375, -0.005492091178894043, -0.0051343441009521484, -0.004776597023010254, -0.004418849945068359, -0.004061102867126465, -0.0037033557891845703, -0.0033456087112426758, -0.0029878616333007812, -0.0026301145553588867, -0.002272367477416992, -0.0019146203994750977, -0.0015568733215332031, -0.0011991262435913086, -0.0008413791656494141, -0.00048363208770751953, -0.000125885009765625, 0.00023186206817626953, 0.0005896091461181641, 0.0009473562240600586, 0.0013051033020019531, 0.0016628503799438477, 0.002020597457885742, 0.0023783445358276367, 0.0027360916137695312, 0.0030938386917114258, 0.0034515857696533203, 0.003809332847595215, 0.004167079925537109, 0.004524827003479004, 0.0048825740814208984, 0.005240321159362793, 0.0055980682373046875, 0.005955815315246582, 0.0063135623931884766, 0.006671309471130371, 0.007029056549072266, 0.00738680362701416, 0.007744550704956055, 0.00810229778289795, 0.008460044860839844, 0.008817791938781738, 0.009175539016723633, 0.009533286094665527, 0.009891033172607422, 0.010248780250549316, 0.010606527328491211, 0.010964274406433105, 0.011322021484375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 3.0, 9.0, 8.0, 10.0, 16.0, 7.0, 17.0, 19.0, 29.0, 26.0, 26.0, 32.0, 29.0, 37.0, 32.0, 31.0, 52.0, 43.0, 1072.0, 36.0, 57.0, 36.0, 40.0, 35.0, 41.0, 28.0, 37.0, 38.0, 24.0, 25.0, 17.0, 21.0, 19.0, 13.0, 15.0, 11.0, 7.0, 8.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.0840911865234375, -1.042205810546875, -1.0003204345703125, -0.95843505859375, -0.9165496826171875, -0.874664306640625, -0.8327789306640625, -0.7908935546875, -0.7490081787109375, -0.707122802734375, -0.6652374267578125, -0.62335205078125, -0.5814666748046875, -0.539581298828125, -0.4976959228515625, -0.455810546875, -0.4139251708984375, -0.372039794921875, -0.3301544189453125, -0.28826904296875, -0.2463836669921875, -0.204498291015625, -0.1626129150390625, -0.1207275390625, -0.0788421630859375, -0.036956787109375, 0.0049285888671875, 0.04681396484375, 0.0886993408203125, 0.130584716796875, 0.1724700927734375, 0.21435546875, 0.2562408447265625, 0.298126220703125, 0.3400115966796875, 0.38189697265625, 0.4237823486328125, 0.465667724609375, 0.5075531005859375, 0.5494384765625, 0.5913238525390625, 0.633209228515625, 0.6750946044921875, 0.71697998046875, 0.7588653564453125, 0.800750732421875, 0.8426361083984375, 0.884521484375, 0.9264068603515625, 0.968292236328125, 1.0101776123046875, 1.05206298828125, 1.0939483642578125, 1.135833740234375, 1.1777191162109375, 1.2196044921875, 1.2614898681640625, 1.303375244140625, 1.3452606201171875, 1.38714599609375, 1.4290313720703125, 1.470916748046875, 1.5128021240234375, 1.5546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 18.0, 21.0, 30.0, 51.0, 81.0, 145.0, 202.0, 332.0, 476.0, 751.0, 1142.0, 1689.0, 2593.0, 3790.0, 5729.0, 8642.0, 13196.0, 20425.0, 32696.0, 53617.0, 95336.0, 214563.0, 1342000.0, 123753.0, 65538.0, 39365.0, 24572.0, 15650.0, 10270.0, 6706.0, 4542.0, 3072.0, 2071.0, 1362.0, 931.0, 644.0, 384.0, 270.0, 168.0, 112.0, 63.0, 38.0, 34.0, 15.0, 12.0, 13.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.0114288330078125, -0.011084437370300293, -0.010740041732788086, -0.010395646095275879, -0.010051250457763672, -0.009706854820251465, -0.009362459182739258, -0.00901806354522705, -0.008673667907714844, -0.008329272270202637, -0.00798487663269043, -0.007640480995178223, -0.007296085357666016, -0.006951689720153809, -0.0066072940826416016, -0.0062628984451293945, -0.0059185028076171875, -0.0055741071701049805, -0.0052297115325927734, -0.004885315895080566, -0.004540920257568359, -0.004196524620056152, -0.0038521289825439453, -0.0035077333450317383, -0.0031633377075195312, -0.0028189420700073242, -0.002474546432495117, -0.00213015079498291, -0.0017857551574707031, -0.001441359519958496, -0.001096963882446289, -0.000752568244934082, -0.000408172607421875, -6.377696990966797e-05, 0.00028061866760253906, 0.0006250143051147461, 0.0009694099426269531, 0.0013138055801391602, 0.0016582012176513672, 0.0020025968551635742, 0.0023469924926757812, 0.0026913881301879883, 0.0030357837677001953, 0.0033801794052124023, 0.0037245750427246094, 0.004068970680236816, 0.0044133663177490234, 0.0047577619552612305, 0.0051021575927734375, 0.0054465532302856445, 0.0057909488677978516, 0.006135344505310059, 0.006479740142822266, 0.006824135780334473, 0.00716853141784668, 0.007512927055358887, 0.007857322692871094, 0.0082017183303833, 0.008546113967895508, 0.008890509605407715, 0.009234905242919922, 0.009579300880432129, 0.009923696517944336, 0.010268092155456543, 0.01061248779296875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 932.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.980232238769531e-07, -2.896413207054138e-07, -2.812594175338745e-07, -2.728775143623352e-07, -2.644956111907959e-07, -2.561137080192566e-07, -2.477318048477173e-07, -2.39349901676178e-07, -2.3096799850463867e-07, -2.2258609533309937e-07, -2.1420419216156006e-07, -2.0582228899002075e-07, -1.9744038581848145e-07, -1.8905848264694214e-07, -1.8067657947540283e-07, -1.7229467630386353e-07, -1.6391277313232422e-07, -1.555308699607849e-07, -1.471489667892456e-07, -1.387670636177063e-07, -1.30385160446167e-07, -1.2200325727462769e-07, -1.1362135410308838e-07, -1.0523945093154907e-07, -9.685754776000977e-08, -8.847564458847046e-08, -8.009374141693115e-08, -7.171183824539185e-08, -6.332993507385254e-08, -5.494803190231323e-08, -4.6566128730773926e-08, -3.818422555923462e-08, -2.9802322387695312e-08, -2.1420419216156006e-08, -1.30385160446167e-08, -4.6566128730773926e-09, 3.725290298461914e-09, 1.210719347000122e-08, 2.0489096641540527e-08, 2.8870999813079834e-08, 3.725290298461914e-08, 4.563480615615845e-08, 5.4016709327697754e-08, 6.239861249923706e-08, 7.078051567077637e-08, 7.916241884231567e-08, 8.754432201385498e-08, 9.592622518539429e-08, 1.043081283569336e-07, 1.126900315284729e-07, 1.210719347000122e-07, 1.2945383787155151e-07, 1.3783574104309082e-07, 1.4621764421463013e-07, 1.5459954738616943e-07, 1.6298145055770874e-07, 1.7136335372924805e-07, 1.7974525690078735e-07, 1.8812716007232666e-07, 1.9650906324386597e-07, 2.0489096641540527e-07, 2.1327286958694458e-07, 2.2165477275848389e-07, 2.300366759300232e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 35.0, 19.0, 8.0, 65.0, 39.0, 166.0, 5221.0, 1012725.0, 29236.0, 814.0, 72.0, 51.0, 41.0, 17.0, 30.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2782554626464844e-06, -3.155320882797241e-06, -3.032386302947998e-06, -2.909451723098755e-06, -2.7865171432495117e-06, -2.6635825634002686e-06, -2.5406479835510254e-06, -2.4177134037017822e-06, -2.294778823852539e-06, -2.171844244003296e-06, -2.0489096641540527e-06, -1.9259750843048096e-06, -1.8030405044555664e-06, -1.6801059246063232e-06, -1.55717134475708e-06, -1.434236764907837e-06, -1.3113021850585938e-06, -1.1883676052093506e-06, -1.0654330253601074e-06, -9.424984455108643e-07, -8.195638656616211e-07, -6.966292858123779e-07, -5.736947059631348e-07, -4.507601261138916e-07, -3.2782554626464844e-07, -2.0489096641540527e-07, -8.195638656616211e-08, 4.0978193283081055e-08, 1.6391277313232422e-07, 2.868473529815674e-07, 4.0978193283081055e-07, 5.327165126800537e-07, 6.556510925292969e-07, 7.7858567237854e-07, 9.015202522277832e-07, 1.0244548320770264e-06, 1.1473894119262695e-06, 1.2703239917755127e-06, 1.3932585716247559e-06, 1.516193151473999e-06, 1.6391277313232422e-06, 1.7620623111724854e-06, 1.8849968910217285e-06, 2.0079314708709717e-06, 2.130866050720215e-06, 2.253800630569458e-06, 2.376735210418701e-06, 2.4996697902679443e-06, 2.6226043701171875e-06, 2.7455389499664307e-06, 2.868473529815674e-06, 2.991408109664917e-06, 3.11434268951416e-06, 3.2372772693634033e-06, 3.3602118492126465e-06, 3.4831464290618896e-06, 3.606081008911133e-06, 3.729015588760376e-06, 3.851950168609619e-06, 3.974884748458862e-06, 4.0978193283081055e-06, 4.220753908157349e-06, 4.343688488006592e-06, 4.466623067855835e-06, 4.589557647705078e-06]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1021.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4226133866231976e-08, -4.295573319268442e-08, -4.1685332519136864e-08, -4.041493184558931e-08, -3.914453117204175e-08, -3.7874130498494196e-08, -3.660372982494664e-08, -3.5333329151399084e-08, -3.406292847785153e-08, -3.279252780430397e-08, -3.1522127130756417e-08, -3.025172645720886e-08, -2.8981325783661305e-08, -2.771092511011375e-08, -2.6440526212923032e-08, -2.5170125539375476e-08, -2.389972664218476e-08, -2.2629325968637204e-08, -2.1358925295089648e-08, -2.0088524621542092e-08, -1.8818123947994536e-08, -1.754772327444698e-08, -1.6277324377256264e-08, -1.5006923703708708e-08, -1.3736523030161152e-08, -1.2466122356613596e-08, -1.119572168306604e-08, -9.925321897696904e-09, -8.654921224149348e-09, -7.384520550601792e-09, -6.114120765232656e-09, -4.8437200916851e-09, -3.573319418137544e-09, -2.302918966634593e-09, -1.0325185151316418e-09, 2.3788171432670424e-10, 1.5082823878742602e-09, 2.778683061421816e-09, 4.049082846790952e-09, 5.319483520338508e-09, 6.589884193886064e-09, 7.86028486743362e-09, 9.130685540981176e-09, 1.0401085326350312e-08, 1.1671485999897868e-08, 1.2941886673445424e-08, 1.421228645881456e-08, 1.5482687132362116e-08, 1.6753087805909672e-08, 1.8023488479457228e-08, 1.9293889153004784e-08, 2.056428982655234e-08, 2.1834690500099896e-08, 2.3105091173647452e-08, 2.4375490070838168e-08, 2.5645890744385724e-08, 2.691629141793328e-08, 2.8186692091480836e-08, 2.9457092765028392e-08, 3.072749166221911e-08, 3.1997892335766664e-08, 3.326829300931422e-08, 3.4538693682861776e-08, 3.580909435640933e-08, 3.707949502995689e-08]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1021.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 17.0, 8.0, 11.0, 23.0, 17.0, 28.0, 17.0, 18.0, 26.0, 24.0, 33.0, 35.0, 44.0, 32.0, 37.0, 39.0, 53.0, 46.0, 33.0, 36.0, 37.0, 34.0, 39.0, 29.0, 28.0, 26.0, 23.0, 25.0, 21.0, 16.0, 10.0, 17.0, 14.0, 12.0, 10.0, 14.0, 5.0, 7.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6572265625, -1.602142333984375, -1.54705810546875, -1.491973876953125, -1.4368896484375, -1.381805419921875, -1.32672119140625, -1.271636962890625, -1.216552734375, -1.161468505859375, -1.10638427734375, -1.051300048828125, -0.9962158203125, -0.941131591796875, -0.88604736328125, -0.830963134765625, -0.77587890625, -0.720794677734375, -0.66571044921875, -0.610626220703125, -0.5555419921875, -0.500457763671875, -0.44537353515625, -0.390289306640625, -0.335205078125, -0.280120849609375, -0.22503662109375, -0.169952392578125, -0.1148681640625, -0.059783935546875, -0.00469970703125, 0.050384521484375, 0.10546875, 0.160552978515625, 0.21563720703125, 0.270721435546875, 0.3258056640625, 0.380889892578125, 0.43597412109375, 0.491058349609375, 0.546142578125, 0.601226806640625, 0.65631103515625, 0.711395263671875, 0.7664794921875, 0.821563720703125, 0.87664794921875, 0.931732177734375, 0.98681640625, 1.041900634765625, 1.09698486328125, 1.152069091796875, 1.2071533203125, 1.262237548828125, 1.31732177734375, 1.372406005859375, 1.427490234375, 1.482574462890625, 1.53765869140625, 1.592742919921875, 1.6478271484375, 1.702911376953125, 1.75799560546875, 1.813079833984375, 1.8681640625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 5.0, 13.0, 10.0, 17.0, 26.0, 27.0, 30.0, 48.0, 73.0, 98.0, 142.0, 209.0, 329.0, 474.0, 704.0, 1056.0, 1641.0, 2488.0, 3900.0, 6527.0, 12885.0, 29658.0, 83513.0, 367899.0, 388806.0, 86429.0, 30470.0, 12988.0, 6655.0, 3970.0, 2471.0, 1621.0, 1119.0, 726.0, 474.0, 358.0, 212.0, 127.0, 93.0, 54.0, 49.0, 41.0, 20.0, 19.0, 17.0, 12.0, 11.0, 17.0, 10.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.42578125, -2.347564697265625, -2.26934814453125, -2.191131591796875, -2.1129150390625, -2.034698486328125, -1.95648193359375, -1.878265380859375, -1.800048828125, -1.721832275390625, -1.64361572265625, -1.565399169921875, -1.4871826171875, -1.408966064453125, -1.33074951171875, -1.252532958984375, -1.17431640625, -1.096099853515625, -1.01788330078125, -0.939666748046875, -0.8614501953125, -0.783233642578125, -0.70501708984375, -0.626800537109375, -0.548583984375, -0.470367431640625, -0.39215087890625, -0.313934326171875, -0.2357177734375, -0.157501220703125, -0.07928466796875, -0.001068115234375, 0.0771484375, 0.155364990234375, 0.23358154296875, 0.311798095703125, 0.3900146484375, 0.468231201171875, 0.54644775390625, 0.624664306640625, 0.702880859375, 0.781097412109375, 0.85931396484375, 0.937530517578125, 1.0157470703125, 1.093963623046875, 1.17218017578125, 1.250396728515625, 1.32861328125, 1.406829833984375, 1.48504638671875, 1.563262939453125, 1.6414794921875, 1.719696044921875, 1.79791259765625, 1.876129150390625, 1.954345703125, 2.032562255859375, 2.11077880859375, 2.188995361328125, 2.2672119140625, 2.345428466796875, 2.42364501953125, 2.501861572265625, 2.580078125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 5.0, 7.0, 9.0, 8.0, 13.0, 14.0, 15.0, 18.0, 14.0, 25.0, 35.0, 36.0, 28.0, 46.0, 41.0, 35.0, 50.0, 61.0, 161.0, 1498.0, 367.0, 120.0, 84.0, 52.0, 50.0, 46.0, 30.0, 32.0, 37.0, 17.0, 18.0, 16.0, 17.0, 11.0, 9.0, 7.0, 6.0, 3.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.47265625, -7.24566650390625, -7.0186767578125, -6.79168701171875, -6.564697265625, -6.33770751953125, -6.1107177734375, -5.88372802734375, -5.65673828125, -5.42974853515625, -5.2027587890625, -4.97576904296875, -4.748779296875, -4.52178955078125, -4.2947998046875, -4.06781005859375, -3.8408203125, -3.61383056640625, -3.3868408203125, -3.15985107421875, -2.932861328125, -2.70587158203125, -2.4788818359375, -2.25189208984375, -2.02490234375, -1.79791259765625, -1.5709228515625, -1.34393310546875, -1.116943359375, -0.88995361328125, -0.6629638671875, -0.43597412109375, -0.208984375, 0.01800537109375, 0.2449951171875, 0.47198486328125, 0.698974609375, 0.92596435546875, 1.1529541015625, 1.37994384765625, 1.60693359375, 1.83392333984375, 2.0609130859375, 2.28790283203125, 2.514892578125, 2.74188232421875, 2.9688720703125, 3.19586181640625, 3.4228515625, 3.64984130859375, 3.8768310546875, 4.10382080078125, 4.330810546875, 4.55780029296875, 4.7847900390625, 5.01177978515625, 5.23876953125, 5.46575927734375, 5.6927490234375, 5.91973876953125, 6.146728515625, 6.37371826171875, 6.6007080078125, 6.82769775390625, 7.0546875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 8.0, 13.0, 8.0, 21.0, 22.0, 25.0, 41.0, 65.0, 75.0, 113.0, 190.0, 327.0, 847.0, 3113.0, 18085.0, 344052.0, 2720859.0, 48592.0, 6544.0, 1430.0, 470.0, 230.0, 142.0, 108.0, 77.0, 50.0, 38.0, 29.0, 31.0, 17.0, 22.0, 14.0, 8.0, 9.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.078125, -10.7232666015625, -10.368408203125, -10.0135498046875, -9.65869140625, -9.3038330078125, -8.948974609375, -8.5941162109375, -8.2392578125, -7.8843994140625, -7.529541015625, -7.1746826171875, -6.81982421875, -6.4649658203125, -6.110107421875, -5.7552490234375, -5.400390625, -5.0455322265625, -4.690673828125, -4.3358154296875, -3.98095703125, -3.6260986328125, -3.271240234375, -2.9163818359375, -2.5615234375, -2.2066650390625, -1.851806640625, -1.4969482421875, -1.14208984375, -0.7872314453125, -0.432373046875, -0.0775146484375, 0.27734375, 0.6322021484375, 0.987060546875, 1.3419189453125, 1.69677734375, 2.0516357421875, 2.406494140625, 2.7613525390625, 3.1162109375, 3.4710693359375, 3.825927734375, 4.1807861328125, 4.53564453125, 4.8905029296875, 5.245361328125, 5.6002197265625, 5.955078125, 6.3099365234375, 6.664794921875, 7.0196533203125, 7.37451171875, 7.7293701171875, 8.084228515625, 8.4390869140625, 8.7939453125, 9.1488037109375, 9.503662109375, 9.8585205078125, 10.21337890625, 10.5682373046875, 10.923095703125, 11.2779541015625, 11.6328125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [2.0, 56.0, 528.0, 390.0, 40.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.941797733306885, -4.52443790435791, -2.1070775985717773, 0.31028223037719727, 2.72764253616333, 5.145002841949463, 7.562362194061279, 9.97972297668457, 12.397083282470703, 14.814443588256836, 17.23180389404297, 19.64916229248047, 22.066524505615234, 24.483882904052734, 26.901243209838867, 29.318603515625, 31.735963821411133, 34.153324127197266, 36.570682525634766, 38.98804473876953, 41.40540313720703, 43.8227653503418, 46.2401237487793, 48.65748596191406, 51.07484436035156, 53.49220275878906, 55.90956497192383, 58.32692337036133, 60.744285583496094, 63.161643981933594, 65.5790023803711, 67.99636840820312, 70.4137191772461, 72.8310775756836, 75.2484359741211, 77.66580200195312, 80.08316040039062, 82.50051879882812, 84.91787719726562, 87.33523559570312, 89.75260162353516, 92.16996002197266, 94.58731842041016, 97.00468444824219, 99.42204284667969, 101.83940124511719, 104.25675964355469, 106.67411804199219, 109.09147644042969, 111.50883483886719, 113.92619323730469, 116.34355926513672, 118.76091766357422, 121.17827606201172, 123.59563446044922, 126.01300048828125, 128.43035888671875, 130.84771728515625, 133.26507568359375, 135.68243408203125, 138.09979248046875, 140.5171661376953, 142.9345245361328, 145.3518829345703, 147.7692413330078]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 8.0, 11.0, 14.0, 9.0, 7.0, 21.0, 17.0, 33.0, 21.0, 32.0, 16.0, 26.0, 32.0, 31.0, 39.0, 44.0, 52.0, 38.0, 59.0, 44.0, 36.0, 44.0, 34.0, 46.0, 35.0, 29.0, 22.0, 26.0, 25.0, 26.0, 17.0, 20.0, 12.0, 16.0, 12.0, 10.0, 7.0, 7.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-22.289552688598633, -21.63736343383789, -20.98517417907715, -20.332984924316406, -19.680797576904297, -19.028608322143555, -18.376419067382812, -17.72422981262207, -17.072040557861328, -16.419851303100586, -15.767662048339844, -15.115473747253418, -14.463284492492676, -13.811095237731934, -13.158906936645508, -12.506717681884766, -11.854528427124023, -11.202339172363281, -10.550149917602539, -9.897961616516113, -9.245772361755371, -8.593583106994629, -7.941394329071045, -7.289205551147461, -6.637016296386719, -5.984827041625977, -5.332638263702393, -4.680449485778809, -4.028260231018066, -3.3760712146759033, -2.7238821983337402, -2.0716934204101562, -1.4195022583007812, -0.7673132419586182, -0.11512422561645508, 0.537064790725708, 1.189253807067871, 1.8414428234100342, 2.4936318397521973, 3.1458206176757812, 3.7980098724365234, 4.450199127197266, 5.10238790512085, 5.754576683044434, 6.406765937805176, 7.058955192565918, 7.711143970489502, 8.363332748413086, 9.015522003173828, 9.66771125793457, 10.319900512695312, 10.972088813781738, 11.62427806854248, 12.276467323303223, 12.928655624389648, 13.58084487915039, 14.233034133911133, 14.885223388671875, 15.537412643432617, 16.18960189819336, 16.84178924560547, 17.49397850036621, 18.146167755126953, 18.798357009887695, 19.450546264648438]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 5.0, 6.0, 3.0, 12.0, 9.0, 9.0, 8.0, 16.0, 16.0, 11.0, 22.0, 29.0, 22.0, 29.0, 24.0, 30.0, 33.0, 33.0, 44.0, 32.0, 46.0, 37.0, 45.0, 37.0, 34.0, 37.0, 31.0, 32.0, 41.0, 31.0, 31.0, 23.0, 25.0, 17.0, 16.0, 13.0, 18.0, 12.0, 14.0, 10.0, 14.0, 5.0, 7.0, 7.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0], "bins": [-1.755859375, -1.7000274658203125, -1.644195556640625, -1.5883636474609375, -1.53253173828125, -1.4766998291015625, -1.420867919921875, -1.3650360107421875, -1.3092041015625, -1.2533721923828125, -1.197540283203125, -1.1417083740234375, -1.08587646484375, -1.0300445556640625, -0.974212646484375, -0.9183807373046875, -0.862548828125, -0.8067169189453125, -0.750885009765625, -0.6950531005859375, -0.63922119140625, -0.5833892822265625, -0.527557373046875, -0.4717254638671875, -0.4158935546875, -0.3600616455078125, -0.304229736328125, -0.2483978271484375, -0.19256591796875, -0.1367340087890625, -0.080902099609375, -0.0250701904296875, 0.03076171875, 0.0865936279296875, 0.142425537109375, 0.1982574462890625, 0.25408935546875, 0.3099212646484375, 0.365753173828125, 0.4215850830078125, 0.4774169921875, 0.5332489013671875, 0.589080810546875, 0.6449127197265625, 0.70074462890625, 0.7565765380859375, 0.812408447265625, 0.8682403564453125, 0.924072265625, 0.9799041748046875, 1.035736083984375, 1.0915679931640625, 1.14739990234375, 1.2032318115234375, 1.259063720703125, 1.3148956298828125, 1.3707275390625, 1.4265594482421875, 1.482391357421875, 1.5382232666015625, 1.59405517578125, 1.6498870849609375, 1.705718994140625, 1.7615509033203125, 1.8173828125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 7.0, 19.0, 28.0, 30.0, 56.0, 101.0, 139.0, 203.0, 333.0, 525.0, 953.0, 1600.0, 2783.0, 5217.0, 9988.0, 19897.0, 40377.0, 87542.0, 202370.0, 520696.0, 1232047.0, 1209243.0, 501032.0, 194955.0, 84593.0, 39387.0, 18952.0, 9478.0, 5056.0, 2739.0, 1545.0, 908.0, 570.0, 337.0, 173.0, 113.0, 96.0, 57.0, 43.0, 16.0, 23.0, 14.0, 15.0, 7.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0], "bins": [-3.00390625, -2.91802978515625, -2.8321533203125, -2.74627685546875, -2.660400390625, -2.57452392578125, -2.4886474609375, -2.40277099609375, -2.31689453125, -2.23101806640625, -2.1451416015625, -2.05926513671875, -1.973388671875, -1.88751220703125, -1.8016357421875, -1.71575927734375, -1.6298828125, -1.54400634765625, -1.4581298828125, -1.37225341796875, -1.286376953125, -1.20050048828125, -1.1146240234375, -1.02874755859375, -0.94287109375, -0.85699462890625, -0.7711181640625, -0.68524169921875, -0.599365234375, -0.51348876953125, -0.4276123046875, -0.34173583984375, -0.255859375, -0.16998291015625, -0.0841064453125, 0.00177001953125, 0.087646484375, 0.17352294921875, 0.2593994140625, 0.34527587890625, 0.43115234375, 0.51702880859375, 0.6029052734375, 0.68878173828125, 0.774658203125, 0.86053466796875, 0.9464111328125, 1.03228759765625, 1.1181640625, 1.20404052734375, 1.2899169921875, 1.37579345703125, 1.461669921875, 1.54754638671875, 1.6334228515625, 1.71929931640625, 1.80517578125, 1.89105224609375, 1.9769287109375, 2.06280517578125, 2.148681640625, 2.23455810546875, 2.3204345703125, 2.40631103515625, 2.4921875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 6.0, 4.0, 10.0, 11.0, 16.0, 34.0, 51.0, 63.0, 104.0, 157.0, 205.0, 291.0, 391.0, 462.0, 551.0, 509.0, 354.0, 255.0, 193.0, 124.0, 95.0, 70.0, 38.0, 20.0, 22.0, 11.0, 7.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.32769775390625, -6.1124267578125, -5.89715576171875, -5.681884765625, -5.46661376953125, -5.2513427734375, -5.03607177734375, -4.82080078125, -4.60552978515625, -4.3902587890625, -4.17498779296875, -3.959716796875, -3.74444580078125, -3.5291748046875, -3.31390380859375, -3.0986328125, -2.88336181640625, -2.6680908203125, -2.45281982421875, -2.237548828125, -2.02227783203125, -1.8070068359375, -1.59173583984375, -1.37646484375, -1.16119384765625, -0.9459228515625, -0.73065185546875, -0.515380859375, -0.30010986328125, -0.0848388671875, 0.13043212890625, 0.345703125, 0.56097412109375, 0.7762451171875, 0.99151611328125, 1.206787109375, 1.42205810546875, 1.6373291015625, 1.85260009765625, 2.06787109375, 2.28314208984375, 2.4984130859375, 2.71368408203125, 2.928955078125, 3.14422607421875, 3.3594970703125, 3.57476806640625, 3.7900390625, 4.00531005859375, 4.2205810546875, 4.43585205078125, 4.651123046875, 4.86639404296875, 5.0816650390625, 5.29693603515625, 5.51220703125, 5.72747802734375, 5.9427490234375, 6.15802001953125, 6.373291015625, 6.58856201171875, 6.8038330078125, 7.01910400390625, 7.234375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 3.0, 8.0, 9.0, 12.0, 18.0, 19.0, 30.0, 52.0, 94.0, 136.0, 248.0, 422.0, 942.0, 2288.0, 6986.0, 26922.0, 129837.0, 737991.0, 2402512.0, 721358.0, 126806.0, 26376.0, 6857.0, 2297.0, 964.0, 438.0, 248.0, 128.0, 90.0, 54.0, 36.0, 38.0, 22.0, 17.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-10.5703125, -10.29571533203125, -10.0211181640625, -9.74652099609375, -9.471923828125, -9.19732666015625, -8.9227294921875, -8.64813232421875, -8.37353515625, -8.09893798828125, -7.8243408203125, -7.54974365234375, -7.275146484375, -7.00054931640625, -6.7259521484375, -6.45135498046875, -6.1767578125, -5.90216064453125, -5.6275634765625, -5.35296630859375, -5.078369140625, -4.80377197265625, -4.5291748046875, -4.25457763671875, -3.97998046875, -3.70538330078125, -3.4307861328125, -3.15618896484375, -2.881591796875, -2.60699462890625, -2.3323974609375, -2.05780029296875, -1.783203125, -1.50860595703125, -1.2340087890625, -0.95941162109375, -0.684814453125, -0.41021728515625, -0.1356201171875, 0.13897705078125, 0.41357421875, 0.68817138671875, 0.9627685546875, 1.23736572265625, 1.511962890625, 1.78656005859375, 2.0611572265625, 2.33575439453125, 2.6103515625, 2.88494873046875, 3.1595458984375, 3.43414306640625, 3.708740234375, 3.98333740234375, 4.2579345703125, 4.53253173828125, 4.80712890625, 5.08172607421875, 5.3563232421875, 5.63092041015625, 5.905517578125, 6.18011474609375, 6.4547119140625, 6.72930908203125, 7.00390625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 24.0, 35.0, 58.0, 87.0, 132.0, 164.0, 167.0, 106.0, 103.0, 68.0, 37.0, 13.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.73130798339844, -59.140724182128906, -57.550140380859375, -55.959556579589844, -54.36897277832031, -52.77838897705078, -51.18780517578125, -49.59722137451172, -48.00663757324219, -46.416053771972656, -44.825469970703125, -43.234886169433594, -41.64430236816406, -40.05371856689453, -38.463134765625, -36.87255096435547, -35.2819709777832, -33.69138717651367, -32.10080337524414, -30.51021957397461, -28.919635772705078, -27.329051971435547, -25.73847007751465, -24.147886276245117, -22.557302474975586, -20.966718673706055, -19.376134872436523, -17.785552978515625, -16.194969177246094, -14.604384422302246, -13.013801574707031, -11.4232177734375, -9.832637786865234, -8.242053985595703, -6.65147066116333, -5.060887336730957, -3.470303535461426, -1.8797197341918945, -0.2891368865966797, 1.3014469146728516, 2.892030715942383, 4.482614517211914, 6.073197841644287, 7.66378116607666, 9.254364967346191, 10.844948768615723, 12.435531616210938, 14.026115417480469, 15.61669921875, 17.20728302001953, 18.797866821289062, 20.388450622558594, 21.979034423828125, 23.569618225097656, 25.160200119018555, 26.750783920288086, 28.341367721557617, 29.93195152282715, 31.52253532409668, 33.11311721801758, 34.70370101928711, 36.29428482055664, 37.88486862182617, 39.4754524230957, 41.066036224365234]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 8.0, 12.0, 6.0, 11.0, 11.0, 19.0, 15.0, 22.0, 16.0, 21.0, 19.0, 24.0, 31.0, 30.0, 23.0, 35.0, 36.0, 36.0, 40.0, 35.0, 46.0, 38.0, 26.0, 30.0, 34.0, 36.0, 32.0, 32.0, 32.0, 24.0, 28.0, 23.0, 26.0, 19.0, 15.0, 14.0, 21.0, 7.0, 19.0, 9.0, 10.0, 6.0, 4.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-18.88275909423828, -18.338769912719727, -17.794780731201172, -17.250791549682617, -16.706802368164062, -16.162813186645508, -15.618823051452637, -15.074833869934082, -14.530844688415527, -13.986855506896973, -13.442866325378418, -12.898877143859863, -12.354887008666992, -11.810897827148438, -11.266908645629883, -10.722919464111328, -10.178930282592773, -9.634941101074219, -9.090951919555664, -8.54696273803711, -8.002973556518555, -7.458983898162842, -6.914994239807129, -6.371005058288574, -5.8270158767700195, -5.283026695251465, -4.73903751373291, -4.195047855377197, -3.6510586738586426, -3.107069492340088, -2.563080072402954, -2.0190906524658203, -1.4751014709472656, -0.9311121702194214, -0.38712286949157715, 0.1568664312362671, 0.7008557319641113, 1.244844913482666, 1.7888343334197998, 2.3328237533569336, 2.8768129348754883, 3.420802116394043, 3.9647915363311768, 4.5087809562683105, 5.052770137786865, 5.59675931930542, 6.140748977661133, 6.6847381591796875, 7.228727340698242, 7.772716522216797, 8.316705703735352, 8.860694885253906, 9.404684066772461, 9.948673248291016, 10.492663383483887, 11.036652565002441, 11.580641746520996, 12.12463092803955, 12.668620109558105, 13.21260929107666, 13.756599426269531, 14.300588607788086, 14.84457778930664, 15.388566970825195, 15.93255615234375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 6.0, 8.0, 5.0, 11.0, 6.0, 11.0, 15.0, 14.0, 19.0, 18.0, 36.0, 31.0, 32.0, 32.0, 42.0, 48.0, 34.0, 50.0, 48.0, 43.0, 50.0, 40.0, 46.0, 46.0, 30.0, 31.0, 36.0, 37.0, 28.0, 20.0, 15.0, 16.0, 19.0, 18.0, 18.0, 10.0, 7.0, 7.0, 4.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.23046875, -2.162750244140625, -2.09503173828125, -2.027313232421875, -1.9595947265625, -1.891876220703125, -1.82415771484375, -1.756439208984375, -1.688720703125, -1.621002197265625, -1.55328369140625, -1.485565185546875, -1.4178466796875, -1.350128173828125, -1.28240966796875, -1.214691162109375, -1.14697265625, -1.079254150390625, -1.01153564453125, -0.943817138671875, -0.8760986328125, -0.808380126953125, -0.74066162109375, -0.672943115234375, -0.605224609375, -0.537506103515625, -0.46978759765625, -0.402069091796875, -0.3343505859375, -0.266632080078125, -0.19891357421875, -0.131195068359375, -0.0634765625, 0.004241943359375, 0.07196044921875, 0.139678955078125, 0.2073974609375, 0.275115966796875, 0.34283447265625, 0.410552978515625, 0.478271484375, 0.545989990234375, 0.61370849609375, 0.681427001953125, 0.7491455078125, 0.816864013671875, 0.88458251953125, 0.952301025390625, 1.02001953125, 1.087738037109375, 1.15545654296875, 1.223175048828125, 1.2908935546875, 1.358612060546875, 1.42633056640625, 1.494049072265625, 1.561767578125, 1.629486083984375, 1.69720458984375, 1.764923095703125, 1.8326416015625, 1.900360107421875, 1.96807861328125, 2.035797119140625, 2.103515625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 7.0, 10.0, 19.0, 19.0, 28.0, 54.0, 79.0, 101.0, 128.0, 210.0, 304.0, 358.0, 559.0, 758.0, 1094.0, 1577.0, 2318.0, 3204.0, 4677.0, 6511.0, 9355.0, 14163.0, 21068.0, 31518.0, 49941.0, 81952.0, 160209.0, 303169.0, 140503.0, 75428.0, 46648.0, 29921.0, 19723.0, 13240.0, 8947.0, 6132.0, 4505.0, 2939.0, 2171.0, 1477.0, 1069.0, 667.0, 548.0, 382.0, 245.0, 189.0, 156.0, 83.0, 59.0, 50.0, 34.0, 22.0, 10.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.01412200927734375, -0.013672590255737305, -0.01322317123413086, -0.012773752212524414, -0.012324333190917969, -0.011874914169311523, -0.011425495147705078, -0.010976076126098633, -0.010526657104492188, -0.010077238082885742, -0.009627819061279297, -0.009178400039672852, -0.008728981018066406, -0.008279561996459961, -0.007830142974853516, -0.00738072395324707, -0.006931304931640625, -0.00648188591003418, -0.006032466888427734, -0.005583047866821289, -0.005133628845214844, -0.0046842098236083984, -0.004234790802001953, -0.003785371780395508, -0.0033359527587890625, -0.002886533737182617, -0.002437114715576172, -0.0019876956939697266, -0.0015382766723632812, -0.001088857650756836, -0.0006394386291503906, -0.0001900196075439453, 0.0002593994140625, 0.0007088184356689453, 0.0011582374572753906, 0.001607656478881836, 0.0020570755004882812, 0.0025064945220947266, 0.002955913543701172, 0.003405332565307617, 0.0038547515869140625, 0.004304170608520508, 0.004753589630126953, 0.0052030086517333984, 0.005652427673339844, 0.006101846694946289, 0.006551265716552734, 0.00700068473815918, 0.007450103759765625, 0.00789952278137207, 0.008348941802978516, 0.008798360824584961, 0.009247779846191406, 0.009697198867797852, 0.010146617889404297, 0.010596036911010742, 0.011045455932617188, 0.011494874954223633, 0.011944293975830078, 0.012393712997436523, 0.012843132019042969, 0.013292551040649414, 0.01374197006225586, 0.014191389083862305, 0.01464080810546875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 11.0, 10.0, 9.0, 13.0, 11.0, 19.0, 22.0, 32.0, 24.0, 22.0, 29.0, 40.0, 47.0, 50.0, 43.0, 43.0, 48.0, 1066.0, 44.0, 45.0, 54.0, 41.0, 31.0, 30.0, 32.0, 22.0, 35.0, 25.0, 21.0, 33.0, 15.0, 15.0, 13.0, 6.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.6767578125, -1.6307220458984375, -1.584686279296875, -1.5386505126953125, -1.49261474609375, -1.4465789794921875, -1.400543212890625, -1.3545074462890625, -1.3084716796875, -1.2624359130859375, -1.216400146484375, -1.1703643798828125, -1.12432861328125, -1.0782928466796875, -1.032257080078125, -0.9862213134765625, -0.940185546875, -0.8941497802734375, -0.848114013671875, -0.8020782470703125, -0.75604248046875, -0.7100067138671875, -0.663970947265625, -0.6179351806640625, -0.5718994140625, -0.5258636474609375, -0.479827880859375, -0.4337921142578125, -0.38775634765625, -0.3417205810546875, -0.295684814453125, -0.2496490478515625, -0.20361328125, -0.1575775146484375, -0.111541748046875, -0.0655059814453125, -0.01947021484375, 0.0265655517578125, 0.072601318359375, 0.1186370849609375, 0.1646728515625, 0.2107086181640625, 0.256744384765625, 0.3027801513671875, 0.34881591796875, 0.3948516845703125, 0.440887451171875, 0.4869232177734375, 0.532958984375, 0.5789947509765625, 0.625030517578125, 0.6710662841796875, 0.71710205078125, 0.7631378173828125, 0.809173583984375, 0.8552093505859375, 0.9012451171875, 0.9472808837890625, 0.993316650390625, 1.0393524169921875, 1.08538818359375, 1.1314239501953125, 1.177459716796875, 1.2234954833984375, 1.26953125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 8.0, 10.0, 8.0, 24.0, 23.0, 38.0, 53.0, 83.0, 136.0, 199.0, 292.0, 446.0, 713.0, 1050.0, 1594.0, 2380.0, 3667.0, 5623.0, 8581.0, 12907.0, 19958.0, 32511.0, 54202.0, 98546.0, 222401.0, 1338752.0, 123620.0, 64769.0, 37623.0, 23496.0, 14994.0, 9693.0, 6512.0, 4222.0, 2825.0, 1803.0, 1127.0, 756.0, 495.0, 336.0, 213.0, 144.0, 105.0, 66.0, 40.0, 31.0, 20.0, 17.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01132965087890625, -0.010966062545776367, -0.010602474212646484, -0.010238885879516602, -0.009875297546386719, -0.009511709213256836, -0.009148120880126953, -0.00878453254699707, -0.008420944213867188, -0.008057355880737305, -0.007693767547607422, -0.007330179214477539, -0.006966590881347656, -0.0066030025482177734, -0.006239414215087891, -0.005875825881958008, -0.005512237548828125, -0.005148649215698242, -0.004785060882568359, -0.0044214725494384766, -0.004057884216308594, -0.003694295883178711, -0.003330707550048828, -0.0029671192169189453, -0.0026035308837890625, -0.0022399425506591797, -0.0018763542175292969, -0.001512765884399414, -0.0011491775512695312, -0.0007855892181396484, -0.0004220008850097656, -5.841255187988281e-05, 0.00030517578125, 0.0006687641143798828, 0.0010323524475097656, 0.0013959407806396484, 0.0017595291137695312, 0.002123117446899414, 0.002486705780029297, 0.0028502941131591797, 0.0032138824462890625, 0.0035774707794189453, 0.003941059112548828, 0.004304647445678711, 0.004668235778808594, 0.0050318241119384766, 0.005395412445068359, 0.005759000778198242, 0.006122589111328125, 0.006486177444458008, 0.006849765777587891, 0.0072133541107177734, 0.007576942443847656, 0.007940530776977539, 0.008304119110107422, 0.008667707443237305, 0.009031295776367188, 0.00939488410949707, 0.009758472442626953, 0.010122060775756836, 0.010485649108886719, 0.010849237442016602, 0.011212825775146484, 0.011576414108276367, 0.01194000244140625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 913.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 50.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 23.0, 6.0, 22.0, 7.0, 23.0, 54.0, 39.0, 281.0, 973.0, 34078.0, 1005848.0, 5729.0, 1190.0, 97.0, 61.0, 27.0, 18.0, 7.0, 31.0, 8.0, 20.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-06, -3.4803524613380432e-06, -3.384426236152649e-06, -3.2885000109672546e-06, -3.1925737857818604e-06, -3.096647560596466e-06, -3.0007213354110718e-06, -2.9047951102256775e-06, -2.808868885040283e-06, -2.712942659854889e-06, -2.6170164346694946e-06, -2.5210902094841003e-06, -2.425163984298706e-06, -2.3292377591133118e-06, -2.2333115339279175e-06, -2.137385308742523e-06, -2.041459083557129e-06, -1.9455328583717346e-06, -1.8496066331863403e-06, -1.753680408000946e-06, -1.6577541828155518e-06, -1.5618279576301575e-06, -1.4659017324447632e-06, -1.369975507259369e-06, -1.2740492820739746e-06, -1.1781230568885803e-06, -1.082196831703186e-06, -9.862706065177917e-07, -8.903443813323975e-07, -7.944181561470032e-07, -6.984919309616089e-07, -6.025657057762146e-07, -5.066394805908203e-07, -4.10713255405426e-07, -3.1478703022003174e-07, -2.1886080503463745e-07, -1.2293457984924316e-07, -2.7008354663848877e-08, 6.891787052154541e-08, 1.648440957069397e-07, 2.60770320892334e-07, 3.5669654607772827e-07, 4.5262277126312256e-07, 5.485489964485168e-07, 6.444752216339111e-07, 7.404014468193054e-07, 8.363276720046997e-07, 9.32253897190094e-07, 1.0281801223754883e-06, 1.1241063475608826e-06, 1.2200325727462769e-06, 1.3159587979316711e-06, 1.4118850231170654e-06, 1.5078112483024597e-06, 1.603737473487854e-06, 1.6996636986732483e-06, 1.7955899238586426e-06, 1.8915161490440369e-06, 1.987442374229431e-06, 2.0833685994148254e-06, 2.1792948246002197e-06, 2.275221049785614e-06, 2.3711472749710083e-06, 2.4670735001564026e-06, 2.562999725341797e-06]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 6.0, 8.0, 5.0, 11.0, 6.0, 11.0, 15.0, 14.0, 19.0, 18.0, 36.0, 31.0, 32.0, 32.0, 42.0, 48.0, 34.0, 50.0, 48.0, 43.0, 50.0, 40.0, 46.0, 46.0, 30.0, 31.0, 36.0, 37.0, 28.0, 20.0, 15.0, 16.0, 19.0, 18.0, 18.0, 10.0, 7.0, 7.0, 4.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.23046875, -2.162750244140625, -2.09503173828125, -2.027313232421875, -1.9595947265625, -1.891876220703125, -1.82415771484375, -1.756439208984375, -1.688720703125, -1.621002197265625, -1.55328369140625, -1.485565185546875, -1.4178466796875, -1.350128173828125, -1.28240966796875, -1.214691162109375, -1.14697265625, -1.079254150390625, -1.01153564453125, -0.943817138671875, -0.8760986328125, -0.808380126953125, -0.74066162109375, -0.672943115234375, -0.605224609375, -0.537506103515625, -0.46978759765625, -0.402069091796875, -0.3343505859375, -0.266632080078125, -0.19891357421875, -0.131195068359375, -0.0634765625, 0.004241943359375, 0.07196044921875, 0.139678955078125, 0.2073974609375, 0.275115966796875, 0.34283447265625, 0.410552978515625, 0.478271484375, 0.545989990234375, 0.61370849609375, 0.681427001953125, 0.7491455078125, 0.816864013671875, 0.88458251953125, 0.952301025390625, 1.02001953125, 1.087738037109375, 1.15545654296875, 1.223175048828125, 1.2908935546875, 1.358612060546875, 1.42633056640625, 1.494049072265625, 1.561767578125, 1.629486083984375, 1.69720458984375, 1.764923095703125, 1.8326416015625, 1.900360107421875, 1.96807861328125, 2.035797119140625, 2.103515625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 12.0, 11.0, 17.0, 24.0, 34.0, 58.0, 91.0, 136.0, 216.0, 328.0, 547.0, 887.0, 1389.0, 2092.0, 3377.0, 5337.0, 8894.0, 15846.0, 35123.0, 100985.0, 396972.0, 324823.0, 84487.0, 30598.0, 14732.0, 8126.0, 4931.0, 3073.0, 1860.0, 1297.0, 836.0, 511.0, 335.0, 182.0, 133.0, 79.0, 52.0, 41.0, 29.0, 15.0, 14.0, 9.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -1.994964599609375, -1.92352294921875, -1.852081298828125, -1.7806396484375, -1.709197998046875, -1.63775634765625, -1.566314697265625, -1.494873046875, -1.423431396484375, -1.35198974609375, -1.280548095703125, -1.2091064453125, -1.137664794921875, -1.06622314453125, -0.994781494140625, -0.92333984375, -0.851898193359375, -0.78045654296875, -0.709014892578125, -0.6375732421875, -0.566131591796875, -0.49468994140625, -0.423248291015625, -0.351806640625, -0.280364990234375, -0.20892333984375, -0.137481689453125, -0.0660400390625, 0.005401611328125, 0.07684326171875, 0.148284912109375, 0.2197265625, 0.291168212890625, 0.36260986328125, 0.434051513671875, 0.5054931640625, 0.576934814453125, 0.64837646484375, 0.719818115234375, 0.791259765625, 0.862701416015625, 0.93414306640625, 1.005584716796875, 1.0770263671875, 1.148468017578125, 1.21990966796875, 1.291351318359375, 1.36279296875, 1.434234619140625, 1.50567626953125, 1.577117919921875, 1.6485595703125, 1.720001220703125, 1.79144287109375, 1.862884521484375, 1.934326171875, 2.005767822265625, 2.07720947265625, 2.148651123046875, 2.2200927734375, 2.291534423828125, 2.36297607421875, 2.434417724609375, 2.505859375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 8.0, 11.0, 9.0, 14.0, 14.0, 14.0, 20.0, 19.0, 17.0, 33.0, 30.0, 32.0, 39.0, 41.0, 53.0, 71.0, 140.0, 389.0, 1520.0, 117.0, 87.0, 48.0, 45.0, 51.0, 38.0, 32.0, 27.0, 23.0, 21.0, 19.0, 10.0, 10.0, 14.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.341064453125, -8.08056640625, -7.820068359375, -7.5595703125, -7.299072265625, -7.03857421875, -6.778076171875, -6.517578125, -6.257080078125, -5.99658203125, -5.736083984375, -5.4755859375, -5.215087890625, -4.95458984375, -4.694091796875, -4.43359375, -4.173095703125, -3.91259765625, -3.652099609375, -3.3916015625, -3.131103515625, -2.87060546875, -2.610107421875, -2.349609375, -2.089111328125, -1.82861328125, -1.568115234375, -1.3076171875, -1.047119140625, -0.78662109375, -0.526123046875, -0.265625, -0.005126953125, 0.25537109375, 0.515869140625, 0.7763671875, 1.036865234375, 1.29736328125, 1.557861328125, 1.818359375, 2.078857421875, 2.33935546875, 2.599853515625, 2.8603515625, 3.120849609375, 3.38134765625, 3.641845703125, 3.90234375, 4.162841796875, 4.42333984375, 4.683837890625, 4.9443359375, 5.204833984375, 5.46533203125, 5.725830078125, 5.986328125, 6.246826171875, 6.50732421875, 6.767822265625, 7.0283203125, 7.288818359375, 7.54931640625, 7.809814453125, 8.0703125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 9.0, 7.0, 10.0, 8.0, 17.0, 30.0, 24.0, 29.0, 52.0, 78.0, 84.0, 137.0, 167.0, 361.0, 1136.0, 8578.0, 751134.0, 2369458.0, 11883.0, 1382.0, 389.0, 194.0, 121.0, 119.0, 54.0, 63.0, 48.0, 16.0, 22.0, 16.0, 17.0, 12.0, 16.0, 11.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9765625, -14.4783935546875, -13.980224609375, -13.4820556640625, -12.98388671875, -12.4857177734375, -11.987548828125, -11.4893798828125, -10.9912109375, -10.4930419921875, -9.994873046875, -9.4967041015625, -8.99853515625, -8.5003662109375, -8.002197265625, -7.5040283203125, -7.005859375, -6.5076904296875, -6.009521484375, -5.5113525390625, -5.01318359375, -4.5150146484375, -4.016845703125, -3.5186767578125, -3.0205078125, -2.5223388671875, -2.024169921875, -1.5260009765625, -1.02783203125, -0.5296630859375, -0.031494140625, 0.4666748046875, 0.96484375, 1.4630126953125, 1.961181640625, 2.4593505859375, 2.95751953125, 3.4556884765625, 3.953857421875, 4.4520263671875, 4.9501953125, 5.4483642578125, 5.946533203125, 6.4447021484375, 6.94287109375, 7.4410400390625, 7.939208984375, 8.4373779296875, 8.935546875, 9.4337158203125, 9.931884765625, 10.4300537109375, 10.92822265625, 11.4263916015625, 11.924560546875, 12.4227294921875, 12.9208984375, 13.4190673828125, 13.917236328125, 14.4154052734375, 14.91357421875, 15.4117431640625, 15.909912109375, 16.4080810546875, 16.90625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 14.0, 37.0, 85.0, 153.0, 218.0, 207.0, 145.0, 96.0, 39.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.816356658935547, -11.191030502319336, -10.565704345703125, -9.940378189086914, -9.315052032470703, -8.689725875854492, -8.064399719238281, -7.43907356262207, -6.813747406005859, -6.188421249389648, -5.5630950927734375, -4.937768936157227, -4.312442779541016, -3.6871166229248047, -3.0617904663085938, -2.436464309692383, -1.8111381530761719, -1.185811996459961, -0.56048583984375, 0.06484031677246094, 0.6901664733886719, 1.3154926300048828, 1.9408187866210938, 2.5661449432373047, 3.1914710998535156, 3.8167972564697266, 4.4421234130859375, 5.067449569702148, 5.692775726318359, 6.31810188293457, 6.943428039550781, 7.568754196166992, 8.19407844543457, 8.819404602050781, 9.444730758666992, 10.070056915283203, 10.695383071899414, 11.320709228515625, 11.946035385131836, 12.571361541748047, 13.196687698364258, 13.822013854980469, 14.44734001159668, 15.07266616821289, 15.697992324829102, 16.323318481445312, 16.948644638061523, 17.573970794677734, 18.199296951293945, 18.824623107910156, 19.449949264526367, 20.075275421142578, 20.70060157775879, 21.325927734375, 21.95125389099121, 22.576580047607422, 23.201906204223633, 23.827232360839844, 24.452558517456055, 25.077884674072266, 25.703210830688477, 26.328536987304688, 26.9538631439209, 27.57918930053711, 28.20451545715332]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 12.0, 11.0, 10.0, 11.0, 19.0, 20.0, 21.0, 27.0, 18.0, 35.0, 29.0, 33.0, 32.0, 36.0, 34.0, 53.0, 51.0, 45.0, 55.0, 39.0, 40.0, 43.0, 34.0, 28.0, 22.0, 30.0, 25.0, 26.0, 30.0, 16.0, 14.0, 14.0, 18.0, 9.0, 14.0, 6.0, 8.0, 9.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-20.193883895874023, -19.57158088684082, -18.949277877807617, -18.326974868774414, -17.70467185974121, -17.082368850708008, -16.460065841674805, -15.837761878967285, -15.215458869934082, -14.593155860900879, -13.970852851867676, -13.348549842834473, -12.726245880126953, -12.10394287109375, -11.481639862060547, -10.859336853027344, -10.23703384399414, -9.614730834960938, -8.992427825927734, -8.370124816894531, -7.74782133102417, -7.125518321990967, -6.5032148361206055, -5.880911827087402, -5.258608818054199, -4.636305809020996, -4.014002799987793, -3.3916993141174316, -2.7693963050842285, -2.1470932960510254, -1.5247900485992432, -0.9024868011474609, -0.2801856994628906, 0.34211742877960205, 0.9644205570220947, 1.5867236852645874, 2.20902681350708, 2.831329822540283, 3.4536330699920654, 4.075936317443848, 4.698239326477051, 5.320542335510254, 5.942845344543457, 6.565148830413818, 7.1874518394470215, 7.809754848480225, 8.432058334350586, 9.054361343383789, 9.676664352416992, 10.298967361450195, 10.921270370483398, 11.543573379516602, 12.165876388549805, 12.788179397583008, 13.410483360290527, 14.03278636932373, 14.655089378356934, 15.277392387390137, 15.89969539642334, 16.52199935913086, 17.144302368164062, 17.766605377197266, 18.38890838623047, 19.011211395263672, 19.633514404296875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 8.0, 7.0, 6.0, 6.0, 12.0, 8.0, 17.0, 22.0, 17.0, 14.0, 33.0, 24.0, 38.0, 33.0, 52.0, 41.0, 38.0, 47.0, 46.0, 54.0, 36.0, 43.0, 48.0, 34.0, 30.0, 41.0, 28.0, 32.0, 29.0, 26.0, 19.0, 18.0, 20.0, 14.0, 10.0, 15.0, 6.0, 8.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.267578125, -2.198577880859375, -2.12957763671875, -2.060577392578125, -1.9915771484375, -1.922576904296875, -1.85357666015625, -1.784576416015625, -1.715576171875, -1.646575927734375, -1.57757568359375, -1.508575439453125, -1.4395751953125, -1.370574951171875, -1.30157470703125, -1.232574462890625, -1.16357421875, -1.094573974609375, -1.02557373046875, -0.956573486328125, -0.8875732421875, -0.818572998046875, -0.74957275390625, -0.680572509765625, -0.611572265625, -0.542572021484375, -0.47357177734375, -0.404571533203125, -0.3355712890625, -0.266571044921875, -0.19757080078125, -0.128570556640625, -0.0595703125, 0.009429931640625, 0.07843017578125, 0.147430419921875, 0.2164306640625, 0.285430908203125, 0.35443115234375, 0.423431396484375, 0.492431640625, 0.561431884765625, 0.63043212890625, 0.699432373046875, 0.7684326171875, 0.837432861328125, 0.90643310546875, 0.975433349609375, 1.04443359375, 1.113433837890625, 1.18243408203125, 1.251434326171875, 1.3204345703125, 1.389434814453125, 1.45843505859375, 1.527435302734375, 1.596435546875, 1.665435791015625, 1.73443603515625, 1.803436279296875, 1.8724365234375, 1.941436767578125, 2.01043701171875, 2.079437255859375, 2.1484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 5.0, 6.0, 12.0, 19.0, 19.0, 23.0, 26.0, 53.0, 57.0, 89.0, 132.0, 231.0, 494.0, 1326.0, 4723.0, 20641.0, 125006.0, 1139974.0, 2517190.0, 325376.0, 45846.0, 9067.0, 2284.0, 774.0, 331.0, 183.0, 122.0, 56.0, 52.0, 40.0, 30.0, 12.0, 19.0, 11.0, 15.0, 8.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.3614501953125, -7.133056640625, -6.9046630859375, -6.67626953125, -6.4478759765625, -6.219482421875, -5.9910888671875, -5.7626953125, -5.5343017578125, -5.305908203125, -5.0775146484375, -4.84912109375, -4.6207275390625, -4.392333984375, -4.1639404296875, -3.935546875, -3.7071533203125, -3.478759765625, -3.2503662109375, -3.02197265625, -2.7935791015625, -2.565185546875, -2.3367919921875, -2.1083984375, -1.8800048828125, -1.651611328125, -1.4232177734375, -1.19482421875, -0.9664306640625, -0.738037109375, -0.5096435546875, -0.28125, -0.0528564453125, 0.175537109375, 0.4039306640625, 0.63232421875, 0.8607177734375, 1.089111328125, 1.3175048828125, 1.5458984375, 1.7742919921875, 2.002685546875, 2.2310791015625, 2.45947265625, 2.6878662109375, 2.916259765625, 3.1446533203125, 3.373046875, 3.6014404296875, 3.829833984375, 4.0582275390625, 4.28662109375, 4.5150146484375, 4.743408203125, 4.9718017578125, 5.2001953125, 5.4285888671875, 5.656982421875, 5.8853759765625, 6.11376953125, 6.3421630859375, 6.570556640625, 6.7989501953125, 7.02734375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 12.0, 8.0, 25.0, 53.0, 107.0, 189.0, 317.0, 552.0, 818.0, 845.0, 512.0, 290.0, 176.0, 78.0, 48.0, 25.0, 10.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -17.211181640625, -16.84423828125, -16.477294921875, -16.1103515625, -15.743408203125, -15.37646484375, -15.009521484375, -14.642578125, -14.275634765625, -13.90869140625, -13.541748046875, -13.1748046875, -12.807861328125, -12.44091796875, -12.073974609375, -11.70703125, -11.340087890625, -10.97314453125, -10.606201171875, -10.2392578125, -9.872314453125, -9.50537109375, -9.138427734375, -8.771484375, -8.404541015625, -8.03759765625, -7.670654296875, -7.3037109375, -6.936767578125, -6.56982421875, -6.202880859375, -5.8359375, -5.468994140625, -5.10205078125, -4.735107421875, -4.3681640625, -4.001220703125, -3.63427734375, -3.267333984375, -2.900390625, -2.533447265625, -2.16650390625, -1.799560546875, -1.4326171875, -1.065673828125, -0.69873046875, -0.331787109375, 0.03515625, 0.402099609375, 0.76904296875, 1.135986328125, 1.5029296875, 1.869873046875, 2.23681640625, 2.603759765625, 2.970703125, 3.337646484375, 3.70458984375, 4.071533203125, 4.4384765625, 4.805419921875, 5.17236328125, 5.539306640625, 5.90625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 7.0, 9.0, 12.0, 21.0, 59.0, 113.0, 269.0, 622.0, 3216.0, 117147.0, 3883210.0, 184398.0, 3987.0, 719.0, 275.0, 114.0, 61.0, 28.0, 13.0, 10.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.703125, -11.829833984375, -10.95654296875, -10.083251953125, -9.2099609375, -8.336669921875, -7.46337890625, -6.590087890625, -5.716796875, -4.843505859375, -3.97021484375, -3.096923828125, -2.2236328125, -1.350341796875, -0.47705078125, 0.396240234375, 1.26953125, 2.142822265625, 3.01611328125, 3.889404296875, 4.7626953125, 5.635986328125, 6.50927734375, 7.382568359375, 8.255859375, 9.129150390625, 10.00244140625, 10.875732421875, 11.7490234375, 12.622314453125, 13.49560546875, 14.368896484375, 15.2421875, 16.115478515625, 16.98876953125, 17.862060546875, 18.7353515625, 19.608642578125, 20.48193359375, 21.355224609375, 22.228515625, 23.101806640625, 23.97509765625, 24.848388671875, 25.7216796875, 26.594970703125, 27.46826171875, 28.341552734375, 29.21484375, 30.088134765625, 30.96142578125, 31.834716796875, 32.7080078125, 33.581298828125, 34.45458984375, 35.327880859375, 36.201171875, 37.074462890625, 37.94775390625, 38.821044921875, 39.6943359375, 40.567626953125, 41.44091796875, 42.314208984375, 43.1875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 18.0, 46.0, 55.0, 96.0, 119.0, 156.0, 173.0, 129.0, 92.0, 67.0, 34.0, 11.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.53192138671875, -55.8416862487793, -54.15144729614258, -52.461212158203125, -50.770973205566406, -49.08073806762695, -47.3905029296875, -45.70026397705078, -44.01002502441406, -42.31978988647461, -40.62955093383789, -38.93931579589844, -37.24907684326172, -35.558841705322266, -33.86860656738281, -32.178367614746094, -30.48813247680664, -28.797895431518555, -27.10765838623047, -25.417423248291016, -23.727184295654297, -22.036949157714844, -20.346712112426758, -18.656475067138672, -16.966238021850586, -15.2760009765625, -13.585763931274414, -11.895527839660645, -10.205290794372559, -8.515053749084473, -6.824817657470703, -5.134580612182617, -3.4443435668945312, -1.7541067600250244, -0.06386995315551758, 1.6263666152954102, 3.316603660583496, 5.006840705871582, 6.697076797485352, 8.387313842773438, 10.077550888061523, 11.76778793334961, 13.458024978637695, 15.148261070251465, 16.838497161865234, 18.528736114501953, 20.218971252441406, 21.909208297729492, 23.599445343017578, 25.289682388305664, 26.97991943359375, 28.670154571533203, 30.360393524169922, 32.050628662109375, 33.740867614746094, 35.43110275268555, 37.121337890625, 38.81157302856445, 40.50181198120117, 42.192047119140625, 43.882286071777344, 45.5725212097168, 47.26275634765625, 48.95299530029297, 50.64323425292969]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 10.0, 10.0, 10.0, 15.0, 14.0, 15.0, 23.0, 17.0, 30.0, 20.0, 32.0, 21.0, 34.0, 37.0, 34.0, 35.0, 33.0, 47.0, 34.0, 30.0, 53.0, 42.0, 36.0, 48.0, 40.0, 25.0, 33.0, 35.0, 37.0, 25.0, 24.0, 12.0, 13.0, 18.0, 8.0, 9.0, 7.0, 8.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.242210388183594, -18.595462799072266, -17.948715209960938, -17.30196762084961, -16.65522003173828, -16.008472442626953, -15.361723899841309, -14.714975357055664, -14.068227767944336, -13.421480178833008, -12.77473258972168, -12.127985000610352, -11.481236457824707, -10.834488868713379, -10.18774127960205, -9.540992736816406, -8.894246101379395, -8.247498512268066, -7.60075044631958, -6.954002857208252, -6.307254791259766, -5.6605072021484375, -5.013759613037109, -4.367011547088623, -3.720263957977295, -3.0735161304473877, -2.4267683029174805, -1.7800207138061523, -1.1332728862762451, -0.4865250587463379, 0.16022253036499023, 0.8069705963134766, 1.4537181854248047, 2.100466012954712, 2.747213840484619, 3.3939614295959473, 4.040709495544434, 4.687457084655762, 5.33420467376709, 5.980952739715576, 6.627700328826904, 7.274447917938232, 7.921195983886719, 8.567943572998047, 9.214691162109375, 9.861438751220703, 10.508186340332031, 11.154934883117676, 11.801682472229004, 12.448430061340332, 13.09517765045166, 13.741926193237305, 14.388673782348633, 15.035421371459961, 15.682168960571289, 16.328916549682617, 16.975664138793945, 17.622411727905273, 18.2691593170166, 18.91590690612793, 19.562654495239258, 20.20940399169922, 20.856151580810547, 21.502899169921875, 22.149646759033203]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 11.0, 8.0, 6.0, 13.0, 10.0, 25.0, 15.0, 20.0, 27.0, 21.0, 29.0, 38.0, 27.0, 31.0, 32.0, 38.0, 44.0, 51.0, 41.0, 37.0, 53.0, 38.0, 35.0, 39.0, 35.0, 31.0, 26.0, 25.0, 29.0, 25.0, 21.0, 19.0, 21.0, 14.0, 12.0, 11.0, 8.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-2.17578125, -2.108673095703125, -2.04156494140625, -1.974456787109375, -1.9073486328125, -1.840240478515625, -1.77313232421875, -1.706024169921875, -1.638916015625, -1.571807861328125, -1.50469970703125, -1.437591552734375, -1.3704833984375, -1.303375244140625, -1.23626708984375, -1.169158935546875, -1.10205078125, -1.034942626953125, -0.96783447265625, -0.900726318359375, -0.8336181640625, -0.766510009765625, -0.69940185546875, -0.632293701171875, -0.565185546875, -0.498077392578125, -0.43096923828125, -0.363861083984375, -0.2967529296875, -0.229644775390625, -0.16253662109375, -0.095428466796875, -0.0283203125, 0.038787841796875, 0.10589599609375, 0.173004150390625, 0.2401123046875, 0.307220458984375, 0.37432861328125, 0.441436767578125, 0.508544921875, 0.575653076171875, 0.64276123046875, 0.709869384765625, 0.7769775390625, 0.844085693359375, 0.91119384765625, 0.978302001953125, 1.04541015625, 1.112518310546875, 1.17962646484375, 1.246734619140625, 1.3138427734375, 1.380950927734375, 1.44805908203125, 1.515167236328125, 1.582275390625, 1.649383544921875, 1.71649169921875, 1.783599853515625, 1.8507080078125, 1.917816162109375, 1.98492431640625, 2.052032470703125, 2.119140625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 8.0, 6.0, 5.0, 12.0, 25.0, 24.0, 22.0, 37.0, 63.0, 71.0, 81.0, 134.0, 207.0, 261.0, 326.0, 447.0, 641.0, 904.0, 1286.0, 1834.0, 2560.0, 3680.0, 5348.0, 7826.0, 11110.0, 16637.0, 24173.0, 36579.0, 57241.0, 97888.0, 218158.0, 260935.0, 112131.0, 63525.0, 39993.0, 26359.0, 18028.0, 12204.0, 8394.0, 5830.0, 3889.0, 2796.0, 2056.0, 1339.0, 1010.0, 658.0, 519.0, 339.0, 273.0, 185.0, 157.0, 91.0, 60.0, 64.0, 40.0, 31.0, 16.0, 22.0, 11.0, 8.0, 3.0, 7.0, 5.0], "bins": [-0.015106201171875, -0.014635682106018066, -0.014165163040161133, -0.0136946439743042, -0.013224124908447266, -0.012753605842590332, -0.012283086776733398, -0.011812567710876465, -0.011342048645019531, -0.010871529579162598, -0.010401010513305664, -0.00993049144744873, -0.009459972381591797, -0.008989453315734863, -0.00851893424987793, -0.008048415184020996, -0.0075778961181640625, -0.007107377052307129, -0.006636857986450195, -0.006166338920593262, -0.005695819854736328, -0.0052253007888793945, -0.004754781723022461, -0.004284262657165527, -0.0038137435913085938, -0.00334322452545166, -0.0028727054595947266, -0.002402186393737793, -0.0019316673278808594, -0.0014611482620239258, -0.0009906291961669922, -0.0005201101303100586, -4.9591064453125e-05, 0.0004209280014038086, 0.0008914470672607422, 0.0013619661331176758, 0.0018324851989746094, 0.002303004264831543, 0.0027735233306884766, 0.00324404239654541, 0.0037145614624023438, 0.004185080528259277, 0.004655599594116211, 0.0051261186599731445, 0.005596637725830078, 0.006067156791687012, 0.006537675857543945, 0.007008194923400879, 0.0074787139892578125, 0.007949233055114746, 0.00841975212097168, 0.008890271186828613, 0.009360790252685547, 0.00983130931854248, 0.010301828384399414, 0.010772347450256348, 0.011242866516113281, 0.011713385581970215, 0.012183904647827148, 0.012654423713684082, 0.013124942779541016, 0.01359546184539795, 0.014065980911254883, 0.014536499977111816, 0.01500701904296875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 8.0, 7.0, 6.0, 12.0, 18.0, 9.0, 16.0, 13.0, 14.0, 28.0, 36.0, 29.0, 34.0, 39.0, 48.0, 30.0, 30.0, 37.0, 37.0, 1068.0, 38.0, 41.0, 32.0, 32.0, 47.0, 44.0, 28.0, 23.0, 22.0, 27.0, 15.0, 30.0, 25.0, 14.0, 15.0, 3.0, 12.0, 10.0, 11.0, 10.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0], "bins": [-1.51171875, -1.4696807861328125, -1.427642822265625, -1.3856048583984375, -1.34356689453125, -1.3015289306640625, -1.259490966796875, -1.2174530029296875, -1.1754150390625, -1.1333770751953125, -1.091339111328125, -1.0493011474609375, -1.00726318359375, -0.9652252197265625, -0.923187255859375, -0.8811492919921875, -0.839111328125, -0.7970733642578125, -0.755035400390625, -0.7129974365234375, -0.67095947265625, -0.6289215087890625, -0.586883544921875, -0.5448455810546875, -0.5028076171875, -0.4607696533203125, -0.418731689453125, -0.3766937255859375, -0.33465576171875, -0.2926177978515625, -0.250579833984375, -0.2085418701171875, -0.16650390625, -0.1244659423828125, -0.082427978515625, -0.0403900146484375, 0.00164794921875, 0.0436859130859375, 0.085723876953125, 0.1277618408203125, 0.1697998046875, 0.2118377685546875, 0.253875732421875, 0.2959136962890625, 0.33795166015625, 0.3799896240234375, 0.422027587890625, 0.4640655517578125, 0.506103515625, 0.5481414794921875, 0.590179443359375, 0.6322174072265625, 0.67425537109375, 0.7162933349609375, 0.758331298828125, 0.8003692626953125, 0.8424072265625, 0.8844451904296875, 0.926483154296875, 0.9685211181640625, 1.01055908203125, 1.0525970458984375, 1.094635009765625, 1.1366729736328125, 1.1787109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 14.0, 22.0, 29.0, 48.0, 66.0, 96.0, 156.0, 204.0, 292.0, 437.0, 637.0, 841.0, 1252.0, 1726.0, 2463.0, 3418.0, 4814.0, 6960.0, 10252.0, 14838.0, 22578.0, 34767.0, 55863.0, 94745.0, 191855.0, 1317946.0, 129343.0, 71474.0, 43752.0, 27606.0, 18246.0, 11999.0, 8402.0, 5903.0, 4183.0, 2942.0, 2009.0, 1504.0, 1054.0, 727.0, 533.0, 376.0, 260.0, 169.0, 110.0, 84.0, 49.0, 34.0, 17.0, 15.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01044464111328125, -0.01011037826538086, -0.009776115417480469, -0.009441852569580078, -0.009107589721679688, -0.008773326873779297, -0.008439064025878906, -0.008104801177978516, -0.007770538330078125, -0.007436275482177734, -0.007102012634277344, -0.006767749786376953, -0.0064334869384765625, -0.006099224090576172, -0.005764961242675781, -0.005430698394775391, -0.005096435546875, -0.004762172698974609, -0.004427909851074219, -0.004093647003173828, -0.0037593841552734375, -0.003425121307373047, -0.0030908584594726562, -0.0027565956115722656, -0.002422332763671875, -0.0020880699157714844, -0.0017538070678710938, -0.0014195442199707031, -0.0010852813720703125, -0.0007510185241699219, -0.00041675567626953125, -8.249282836914062e-05, 0.00025177001953125, 0.0005860328674316406, 0.0009202957153320312, 0.0012545585632324219, 0.0015888214111328125, 0.0019230842590332031, 0.0022573471069335938, 0.0025916099548339844, 0.002925872802734375, 0.0032601356506347656, 0.0035943984985351562, 0.003928661346435547, 0.0042629241943359375, 0.004597187042236328, 0.004931449890136719, 0.005265712738037109, 0.0055999755859375, 0.005934238433837891, 0.006268501281738281, 0.006602764129638672, 0.0069370269775390625, 0.007271289825439453, 0.007605552673339844, 0.007939815521240234, 0.008274078369140625, 0.008608341217041016, 0.008942604064941406, 0.009276866912841797, 0.009611129760742188, 0.009945392608642578, 0.010279655456542969, 0.01061391830444336, 0.01094818115234375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 877.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.300366759300232e-07, -2.2165477275848389e-07, -2.1327286958694458e-07, -2.0489096641540527e-07, -1.9650906324386597e-07, -1.8812716007232666e-07, -1.7974525690078735e-07, -1.7136335372924805e-07, -1.6298145055770874e-07, -1.5459954738616943e-07, -1.4621764421463013e-07, -1.3783574104309082e-07, -1.2945383787155151e-07, -1.210719347000122e-07, -1.126900315284729e-07, -1.043081283569336e-07, -9.592622518539429e-08, -8.754432201385498e-08, -7.916241884231567e-08, -7.078051567077637e-08, -6.239861249923706e-08, -5.4016709327697754e-08, -4.563480615615845e-08, -3.725290298461914e-08, -2.8870999813079834e-08, -2.0489096641540527e-08, -1.210719347000122e-08, -3.725290298461914e-09, 4.6566128730773926e-09, 1.30385160446167e-08, 2.1420419216156006e-08, 2.9802322387695312e-08, 3.818422555923462e-08, 4.6566128730773926e-08, 5.494803190231323e-08, 6.332993507385254e-08, 7.171183824539185e-08, 8.009374141693115e-08, 8.847564458847046e-08, 9.685754776000977e-08, 1.0523945093154907e-07, 1.1362135410308838e-07, 1.2200325727462769e-07, 1.30385160446167e-07, 1.387670636177063e-07, 1.471489667892456e-07, 1.555308699607849e-07, 1.6391277313232422e-07, 1.7229467630386353e-07, 1.8067657947540283e-07, 1.8905848264694214e-07, 1.9744038581848145e-07, 2.0582228899002075e-07, 2.1420419216156006e-07, 2.2258609533309937e-07, 2.3096799850463867e-07, 2.39349901676178e-07, 2.477318048477173e-07, 2.561137080192566e-07, 2.644956111907959e-07, 2.728775143623352e-07, 2.812594175338745e-07, 2.896413207054138e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 25.0, 37.0, 17.0, 21.0, 157.0, 2262.0, 45453.0, 989843.0, 9841.0, 698.0, 78.0, 18.0, 12.0, 47.0, 20.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.589557647705078e-06, -4.455447196960449e-06, -4.32133674621582e-06, -4.187226295471191e-06, -4.0531158447265625e-06, -3.919005393981934e-06, -3.7848949432373047e-06, -3.6507844924926758e-06, -3.516674041748047e-06, -3.382563591003418e-06, -3.248453140258789e-06, -3.11434268951416e-06, -2.9802322387695312e-06, -2.8461217880249023e-06, -2.7120113372802734e-06, -2.5779008865356445e-06, -2.4437904357910156e-06, -2.3096799850463867e-06, -2.175569534301758e-06, -2.041459083557129e-06, -1.9073486328125e-06, -1.773238182067871e-06, -1.6391277313232422e-06, -1.5050172805786133e-06, -1.3709068298339844e-06, -1.2367963790893555e-06, -1.1026859283447266e-06, -9.685754776000977e-07, -8.344650268554688e-07, -7.003545761108398e-07, -5.662441253662109e-07, -4.3213367462158203e-07, -2.980232238769531e-07, -1.6391277313232422e-07, -2.9802322387695312e-08, 1.043081283569336e-07, 2.384185791015625e-07, 3.725290298461914e-07, 5.066394805908203e-07, 6.407499313354492e-07, 7.748603820800781e-07, 9.08970832824707e-07, 1.043081283569336e-06, 1.1771917343139648e-06, 1.3113021850585938e-06, 1.4454126358032227e-06, 1.5795230865478516e-06, 1.7136335372924805e-06, 1.8477439880371094e-06, 1.9818544387817383e-06, 2.115964889526367e-06, 2.250075340270996e-06, 2.384185791015625e-06, 2.518296241760254e-06, 2.652406692504883e-06, 2.7865171432495117e-06, 2.9206275939941406e-06, 3.0547380447387695e-06, 3.1888484954833984e-06, 3.3229589462280273e-06, 3.4570693969726562e-06, 3.591179847717285e-06, 3.725290298461914e-06, 3.859400749206543e-06, 3.993511199951172e-06]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1021.0], "bins": [-8.291275577221313e-08, -8.161724451838381e-08, -8.03217332645545e-08, -7.902622201072518e-08, -7.773071075689586e-08, -7.643519950306654e-08, -7.513968114380987e-08, -7.38441769954079e-08, -7.254865863615123e-08, -7.125314738232191e-08, -6.99576361284926e-08, -6.866212487466328e-08, -6.736661362083396e-08, -6.607110236700464e-08, -6.477559111317532e-08, -6.348007275391865e-08, -6.218456860551669e-08, -6.088905735168737e-08, -5.959354609785805e-08, -5.8298034844028734e-08, -5.700252003748574e-08, -5.570700878365642e-08, -5.44114975298271e-08, -5.3115986275997784e-08, -5.182047146945479e-08, -5.052496021562547e-08, -4.922944896179615e-08, -4.7933937707966834e-08, -4.663842290142384e-08, -4.534291164759452e-08, -4.40474003937652e-08, -4.2751889139935884e-08, -4.1456377886106566e-08, -4.016086663227725e-08, -3.886535537844793e-08, -3.7569840571904933e-08, -3.6274329318075615e-08, -3.49788180642463e-08, -3.368330681041698e-08, -3.238779555658766e-08, -3.1092284302758344e-08, -2.9796773048929026e-08, -2.850126001874287e-08, -2.720574876491355e-08, -2.5910237511084233e-08, -2.4614724480898076e-08, -2.3319213227068758e-08, -2.202370197323944e-08, -2.0728188943053283e-08, -1.9432677689223965e-08, -1.8137164659037808e-08, -1.684165340520849e-08, -1.5546142151379172e-08, -1.4250630009371434e-08, -1.2955117867363697e-08, -1.1659606613534379e-08, -1.0364094471526641e-08, -9.068582329518904e-09, -7.773071075689586e-09, -6.4775589336818484e-09, -5.182047235763321e-09, -3.886535537844793e-09, -2.5910233958370554e-09, -1.2955121420077376e-09, 0.0]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1021.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 11.0, 8.0, 6.0, 13.0, 10.0, 25.0, 15.0, 20.0, 27.0, 21.0, 29.0, 38.0, 27.0, 31.0, 32.0, 38.0, 44.0, 51.0, 41.0, 37.0, 53.0, 38.0, 35.0, 39.0, 35.0, 31.0, 26.0, 25.0, 29.0, 25.0, 21.0, 19.0, 21.0, 14.0, 12.0, 11.0, 8.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-2.17578125, -2.108673095703125, -2.04156494140625, -1.974456787109375, -1.9073486328125, -1.840240478515625, -1.77313232421875, -1.706024169921875, -1.638916015625, -1.571807861328125, -1.50469970703125, -1.437591552734375, -1.3704833984375, -1.303375244140625, -1.23626708984375, -1.169158935546875, -1.10205078125, -1.034942626953125, -0.96783447265625, -0.900726318359375, -0.8336181640625, -0.766510009765625, -0.69940185546875, -0.632293701171875, -0.565185546875, -0.498077392578125, -0.43096923828125, -0.363861083984375, -0.2967529296875, -0.229644775390625, -0.16253662109375, -0.095428466796875, -0.0283203125, 0.038787841796875, 0.10589599609375, 0.173004150390625, 0.2401123046875, 0.307220458984375, 0.37432861328125, 0.441436767578125, 0.508544921875, 0.575653076171875, 0.64276123046875, 0.709869384765625, 0.7769775390625, 0.844085693359375, 0.91119384765625, 0.978302001953125, 1.04541015625, 1.112518310546875, 1.17962646484375, 1.246734619140625, 1.3138427734375, 1.380950927734375, 1.44805908203125, 1.515167236328125, 1.582275390625, 1.649383544921875, 1.71649169921875, 1.783599853515625, 1.8507080078125, 1.917816162109375, 1.98492431640625, 2.052032470703125, 2.119140625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 7.0, 14.0, 18.0, 24.0, 30.0, 39.0, 61.0, 107.0, 120.0, 224.0, 380.0, 598.0, 1004.0, 1625.0, 2828.0, 4887.0, 8651.0, 15489.0, 29694.0, 63847.0, 180322.0, 432030.0, 178317.0, 63118.0, 29126.0, 15470.0, 8568.0, 4879.0, 2811.0, 1640.0, 965.0, 597.0, 356.0, 233.0, 146.0, 104.0, 63.0, 62.0, 34.0, 13.0, 15.0, 15.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.3525390625, -2.275390625, -2.1982421875, -2.12109375, -2.0439453125, -1.966796875, -1.8896484375, -1.8125, -1.7353515625, -1.658203125, -1.5810546875, -1.50390625, -1.4267578125, -1.349609375, -1.2724609375, -1.1953125, -1.1181640625, -1.041015625, -0.9638671875, -0.88671875, -0.8095703125, -0.732421875, -0.6552734375, -0.578125, -0.5009765625, -0.423828125, -0.3466796875, -0.26953125, -0.1923828125, -0.115234375, -0.0380859375, 0.0390625, 0.1162109375, 0.193359375, 0.2705078125, 0.34765625, 0.4248046875, 0.501953125, 0.5791015625, 0.65625, 0.7333984375, 0.810546875, 0.8876953125, 0.96484375, 1.0419921875, 1.119140625, 1.1962890625, 1.2734375, 1.3505859375, 1.427734375, 1.5048828125, 1.58203125, 1.6591796875, 1.736328125, 1.8134765625, 1.890625, 1.9677734375, 2.044921875, 2.1220703125, 2.19921875, 2.2763671875, 2.353515625, 2.4306640625, 2.5078125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 11.0, 9.0, 16.0, 13.0, 17.0, 25.0, 23.0, 25.0, 36.0, 48.0, 34.0, 35.0, 44.0, 60.0, 122.0, 260.0, 1552.0, 172.0, 98.0, 67.0, 55.0, 45.0, 38.0, 29.0, 35.0, 23.0, 29.0, 21.0, 20.0, 14.0, 15.0, 8.0, 11.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.671875, -8.403564453125, -8.13525390625, -7.866943359375, -7.5986328125, -7.330322265625, -7.06201171875, -6.793701171875, -6.525390625, -6.257080078125, -5.98876953125, -5.720458984375, -5.4521484375, -5.183837890625, -4.91552734375, -4.647216796875, -4.37890625, -4.110595703125, -3.84228515625, -3.573974609375, -3.3056640625, -3.037353515625, -2.76904296875, -2.500732421875, -2.232421875, -1.964111328125, -1.69580078125, -1.427490234375, -1.1591796875, -0.890869140625, -0.62255859375, -0.354248046875, -0.0859375, 0.182373046875, 0.45068359375, 0.718994140625, 0.9873046875, 1.255615234375, 1.52392578125, 1.792236328125, 2.060546875, 2.328857421875, 2.59716796875, 2.865478515625, 3.1337890625, 3.402099609375, 3.67041015625, 3.938720703125, 4.20703125, 4.475341796875, 4.74365234375, 5.011962890625, 5.2802734375, 5.548583984375, 5.81689453125, 6.085205078125, 6.353515625, 6.621826171875, 6.89013671875, 7.158447265625, 7.4267578125, 7.695068359375, 7.96337890625, 8.231689453125, 8.5]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 7.0, 19.0, 32.0, 40.0, 59.0, 93.0, 122.0, 263.0, 468.0, 1321.0, 23592.0, 3027863.0, 88340.0, 2218.0, 528.0, 267.0, 168.0, 109.0, 58.0, 34.0, 27.0, 33.0, 9.0, 8.0, 9.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.0625, -26.362060546875, -25.66162109375, -24.961181640625, -24.2607421875, -23.560302734375, -22.85986328125, -22.159423828125, -21.458984375, -20.758544921875, -20.05810546875, -19.357666015625, -18.6572265625, -17.956787109375, -17.25634765625, -16.555908203125, -15.85546875, -15.155029296875, -14.45458984375, -13.754150390625, -13.0537109375, -12.353271484375, -11.65283203125, -10.952392578125, -10.251953125, -9.551513671875, -8.85107421875, -8.150634765625, -7.4501953125, -6.749755859375, -6.04931640625, -5.348876953125, -4.6484375, -3.947998046875, -3.24755859375, -2.547119140625, -1.8466796875, -1.146240234375, -0.44580078125, 0.254638671875, 0.955078125, 1.655517578125, 2.35595703125, 3.056396484375, 3.7568359375, 4.457275390625, 5.15771484375, 5.858154296875, 6.55859375, 7.259033203125, 7.95947265625, 8.659912109375, 9.3603515625, 10.060791015625, 10.76123046875, 11.461669921875, 12.162109375, 12.862548828125, 13.56298828125, 14.263427734375, 14.9638671875, 15.664306640625, 16.36474609375, 17.065185546875, 17.765625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 6.0, 21.0, 63.0, 160.0, 243.0, 233.0, 164.0, 77.0, 33.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.620804786682129, -7.565092086791992, -6.509378910064697, -5.453665733337402, -4.397953033447266, -3.342240333557129, -2.286527156829834, -1.230813980102539, -0.17510128021240234, 0.8806116580963135, 1.9363245964050293, 2.992037534713745, 4.047750473022461, 5.103463172912598, 6.159176349639893, 7.2148895263671875, 8.270602226257324, 9.326314926147461, 10.382028579711914, 11.43774127960205, 12.493453979492188, 13.549166679382324, 14.604879379272461, 15.660593032836914, 16.716304779052734, 17.772018432617188, 18.827730178833008, 19.88344383239746, 20.93915557861328, 21.994869232177734, 23.050582885742188, 24.10629653930664, 25.162010192871094, 26.217723846435547, 27.273435592651367, 28.32914924621582, 29.38486099243164, 30.440574645996094, 31.496288299560547, 32.552001953125, 33.60771179199219, 34.66342544555664, 35.719139099121094, 36.77484893798828, 37.830562591552734, 38.88627624511719, 39.94198989868164, 40.997703552246094, 42.05341720581055, 43.109130859375, 44.16484451293945, 45.22055435180664, 46.276268005371094, 47.33198165893555, 48.3876953125, 49.44340896606445, 50.499122619628906, 51.55483627319336, 52.61054992675781, 53.666259765625, 54.72197341918945, 55.777687072753906, 56.83340072631836, 57.88911437988281, 58.94482421875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 2.0, 4.0, 1.0, 10.0, 11.0, 12.0, 12.0, 14.0, 13.0, 27.0, 30.0, 35.0, 41.0, 36.0, 34.0, 34.0, 38.0, 39.0, 41.0, 50.0, 39.0, 35.0, 39.0, 43.0, 38.0, 40.0, 43.0, 22.0, 27.0, 22.0, 20.0, 33.0, 31.0, 15.0, 12.0, 19.0, 10.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.871963500976562, -24.077754974365234, -23.283546447753906, -22.48933982849121, -21.695131301879883, -20.900922775268555, -20.10671615600586, -19.31250762939453, -18.518299102783203, -17.724090576171875, -16.929882049560547, -16.13567543029785, -15.341466903686523, -14.547258377075195, -13.753050804138184, -12.958843231201172, -12.164634704589844, -11.370426177978516, -10.576218605041504, -9.782011032104492, -8.987802505493164, -8.193593978881836, -7.399386405944824, -6.605178356170654, -5.810970306396484, -5.0167622566223145, -4.2225542068481445, -3.4283461570739746, -2.6341381072998047, -1.8399300575256348, -1.0457220077514648, -0.2515139579772949, 0.5426959991455078, 1.3369040489196777, 2.1311120986938477, 2.9253201484680176, 3.7195281982421875, 4.513736248016357, 5.307944297790527, 6.102152347564697, 6.896360397338867, 7.690568447113037, 8.484776496887207, 9.278984069824219, 10.073192596435547, 10.867401123046875, 11.661608695983887, 12.455816268920898, 13.250024795532227, 14.044233322143555, 14.838440895080566, 15.632648468017578, 16.426856994628906, 17.221065521240234, 18.015274047851562, 18.809480667114258, 19.603689193725586, 20.397897720336914, 21.19210433959961, 21.986312866210938, 22.780521392822266, 23.574729919433594, 24.368938446044922, 25.163145065307617, 25.957353591918945]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 16.0, 16.0, 14.0, 21.0, 21.0, 26.0, 29.0, 23.0, 36.0, 29.0, 32.0, 39.0, 37.0, 45.0, 52.0, 47.0, 49.0, 42.0, 34.0, 36.0, 57.0, 30.0, 32.0, 29.0, 21.0, 22.0, 22.0, 25.0, 19.0, 13.0, 14.0, 10.0, 12.0, 6.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.419921875, -2.346649169921875, -2.27337646484375, -2.200103759765625, -2.1268310546875, -2.053558349609375, -1.98028564453125, -1.907012939453125, -1.833740234375, -1.760467529296875, -1.68719482421875, -1.613922119140625, -1.5406494140625, -1.467376708984375, -1.39410400390625, -1.320831298828125, -1.24755859375, -1.174285888671875, -1.10101318359375, -1.027740478515625, -0.9544677734375, -0.881195068359375, -0.80792236328125, -0.734649658203125, -0.661376953125, -0.588104248046875, -0.51483154296875, -0.441558837890625, -0.3682861328125, -0.295013427734375, -0.22174072265625, -0.148468017578125, -0.0751953125, -0.001922607421875, 0.07135009765625, 0.144622802734375, 0.2178955078125, 0.291168212890625, 0.36444091796875, 0.437713623046875, 0.510986328125, 0.584259033203125, 0.65753173828125, 0.730804443359375, 0.8040771484375, 0.877349853515625, 0.95062255859375, 1.023895263671875, 1.09716796875, 1.170440673828125, 1.24371337890625, 1.316986083984375, 1.3902587890625, 1.463531494140625, 1.53680419921875, 1.610076904296875, 1.683349609375, 1.756622314453125, 1.82989501953125, 1.903167724609375, 1.9764404296875, 2.049713134765625, 2.12298583984375, 2.196258544921875, 2.26953125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 10.0, 10.0, 24.0, 32.0, 43.0, 58.0, 94.0, 114.0, 191.0, 305.0, 512.0, 904.0, 1867.0, 4149.0, 9338.0, 23700.0, 62594.0, 181126.0, 580364.0, 1527151.0, 1211796.0, 388921.0, 125151.0, 44290.0, 17465.0, 7244.0, 3237.0, 1586.0, 770.0, 411.0, 251.0, 177.0, 114.0, 75.0, 58.0, 38.0, 26.0, 15.0, 19.0, 14.0, 7.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.755859375, -3.63787841796875, -3.5198974609375, -3.40191650390625, -3.283935546875, -3.16595458984375, -3.0479736328125, -2.92999267578125, -2.81201171875, -2.69403076171875, -2.5760498046875, -2.45806884765625, -2.340087890625, -2.22210693359375, -2.1041259765625, -1.98614501953125, -1.8681640625, -1.75018310546875, -1.6322021484375, -1.51422119140625, -1.396240234375, -1.27825927734375, -1.1602783203125, -1.04229736328125, -0.92431640625, -0.80633544921875, -0.6883544921875, -0.57037353515625, -0.452392578125, -0.33441162109375, -0.2164306640625, -0.09844970703125, 0.01953125, 0.13751220703125, 0.2554931640625, 0.37347412109375, 0.491455078125, 0.60943603515625, 0.7274169921875, 0.84539794921875, 0.96337890625, 1.08135986328125, 1.1993408203125, 1.31732177734375, 1.435302734375, 1.55328369140625, 1.6712646484375, 1.78924560546875, 1.9072265625, 2.02520751953125, 2.1431884765625, 2.26116943359375, 2.379150390625, 2.49713134765625, 2.6151123046875, 2.73309326171875, 2.85107421875, 2.96905517578125, 3.0870361328125, 3.20501708984375, 3.322998046875, 3.44097900390625, 3.5589599609375, 3.67694091796875, 3.794921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 9.0, 7.0, 13.0, 12.0, 22.0, 30.0, 33.0, 57.0, 65.0, 75.0, 119.0, 126.0, 181.0, 226.0, 303.0, 327.0, 402.0, 387.0, 377.0, 305.0, 244.0, 194.0, 139.0, 104.0, 79.0, 56.0, 49.0, 37.0, 27.0, 22.0, 20.0, 8.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.875, -4.70709228515625, -4.5391845703125, -4.37127685546875, -4.203369140625, -4.03546142578125, -3.8675537109375, -3.69964599609375, -3.53173828125, -3.36383056640625, -3.1959228515625, -3.02801513671875, -2.860107421875, -2.69219970703125, -2.5242919921875, -2.35638427734375, -2.1884765625, -2.02056884765625, -1.8526611328125, -1.68475341796875, -1.516845703125, -1.34893798828125, -1.1810302734375, -1.01312255859375, -0.84521484375, -0.67730712890625, -0.5093994140625, -0.34149169921875, -0.173583984375, -0.00567626953125, 0.1622314453125, 0.33013916015625, 0.498046875, 0.66595458984375, 0.8338623046875, 1.00177001953125, 1.169677734375, 1.33758544921875, 1.5054931640625, 1.67340087890625, 1.84130859375, 2.00921630859375, 2.1771240234375, 2.34503173828125, 2.512939453125, 2.68084716796875, 2.8487548828125, 3.01666259765625, 3.1845703125, 3.35247802734375, 3.5203857421875, 3.68829345703125, 3.856201171875, 4.02410888671875, 4.1920166015625, 4.35992431640625, 4.52783203125, 4.69573974609375, 4.8636474609375, 5.03155517578125, 5.199462890625, 5.36737060546875, 5.5352783203125, 5.70318603515625, 5.87109375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 8.0, 10.0, 11.0, 17.0, 20.0, 34.0, 35.0, 59.0, 63.0, 112.0, 134.0, 219.0, 343.0, 731.0, 2066.0, 8034.0, 41910.0, 277658.0, 1899579.0, 1679335.0, 236948.0, 36166.0, 7121.0, 1836.0, 711.0, 379.0, 223.0, 150.0, 87.0, 82.0, 64.0, 39.0, 23.0, 27.0, 14.0, 10.0, 2.0, 6.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.1953125, -9.885986328125, -9.57666015625, -9.267333984375, -8.9580078125, -8.648681640625, -8.33935546875, -8.030029296875, -7.720703125, -7.411376953125, -7.10205078125, -6.792724609375, -6.4833984375, -6.174072265625, -5.86474609375, -5.555419921875, -5.24609375, -4.936767578125, -4.62744140625, -4.318115234375, -4.0087890625, -3.699462890625, -3.39013671875, -3.080810546875, -2.771484375, -2.462158203125, -2.15283203125, -1.843505859375, -1.5341796875, -1.224853515625, -0.91552734375, -0.606201171875, -0.296875, 0.012451171875, 0.32177734375, 0.631103515625, 0.9404296875, 1.249755859375, 1.55908203125, 1.868408203125, 2.177734375, 2.487060546875, 2.79638671875, 3.105712890625, 3.4150390625, 3.724365234375, 4.03369140625, 4.343017578125, 4.65234375, 4.961669921875, 5.27099609375, 5.580322265625, 5.8896484375, 6.198974609375, 6.50830078125, 6.817626953125, 7.126953125, 7.436279296875, 7.74560546875, 8.054931640625, 8.3642578125, 8.673583984375, 8.98291015625, 9.292236328125, 9.6015625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 7.0, 6.0, 23.0, 34.0, 38.0, 50.0, 53.0, 88.0, 87.0, 96.0, 91.0, 64.0, 64.0, 70.0, 44.0, 56.0, 38.0, 39.0, 13.0, 11.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.618549346923828, -26.770231246948242, -25.921911239624023, -25.073593139648438, -24.22527503967285, -23.376956939697266, -22.528636932373047, -21.68031883239746, -20.832000732421875, -19.98368263244629, -19.13536262512207, -18.287044525146484, -17.4387264251709, -16.590408325195312, -15.742088317871094, -14.893770217895508, -14.045450210571289, -13.197131156921387, -12.3488130569458, -11.500494003295898, -10.652175903320312, -9.80385684967041, -8.955537796020508, -8.107219696044922, -7.2589006423950195, -6.410582065582275, -5.562263488769531, -4.713944435119629, -3.8656258583068848, -3.0173072814941406, -2.1689882278442383, -1.3206696510314941, -0.4723491668701172, 0.3759695291519165, 1.2242882251739502, 2.0726070404052734, 2.9209256172180176, 3.7692441940307617, 4.617563247680664, 5.465881824493408, 6.314200401306152, 7.1625189781188965, 8.01083755493164, 8.859156608581543, 9.707475662231445, 10.555793762207031, 11.404112815856934, 12.252431869506836, 13.100749969482422, 13.949069023132324, 14.79738712310791, 15.645706176757812, 16.4940242767334, 17.342342376708984, 18.190662384033203, 19.03898048400879, 19.887298583984375, 20.73561668395996, 21.58393669128418, 22.432254791259766, 23.28057289123535, 24.128890991210938, 24.977210998535156, 25.825529098510742, 26.67384910583496]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 7.0, 7.0, 13.0, 7.0, 9.0, 11.0, 10.0, 17.0, 19.0, 30.0, 15.0, 20.0, 31.0, 26.0, 37.0, 27.0, 36.0, 45.0, 32.0, 41.0, 29.0, 33.0, 45.0, 46.0, 36.0, 35.0, 30.0, 35.0, 26.0, 35.0, 34.0, 28.0, 22.0, 20.0, 14.0, 17.0, 18.0, 15.0, 6.0, 5.0, 4.0, 5.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.818429946899414, -18.250732421875, -17.683032989501953, -17.11533546447754, -16.547637939453125, -15.979938507080078, -15.412240982055664, -14.844542503356934, -14.276844024658203, -13.709145545959473, -13.141447067260742, -12.573749542236328, -12.006051063537598, -11.438352584838867, -10.870655059814453, -10.302956581115723, -9.735258102416992, -9.167559623718262, -8.599861145019531, -8.032163619995117, -7.464465141296387, -6.896766662597656, -6.329068660736084, -5.761370658874512, -5.193672180175781, -4.625973701477051, -4.0582756996154785, -3.490577459335327, -2.922879219055176, -2.3551809787750244, -1.787482738494873, -1.2197844982147217, -0.6520843505859375, -0.08438611030578613, 0.48331212997436523, 1.0510103702545166, 1.618708610534668, 2.1864068508148193, 2.7541050910949707, 3.321803331375122, 3.8895015716552734, 4.457200050354004, 5.024898052215576, 5.592596054077148, 6.160294532775879, 6.727993011474609, 7.295691013336182, 7.863389015197754, 8.431087493896484, 8.998785972595215, 9.566484451293945, 10.13418197631836, 10.70188045501709, 11.26957893371582, 11.837276458740234, 12.404974937438965, 12.972673416137695, 13.540371894836426, 14.108070373535156, 14.67576789855957, 15.2434663772583, 15.811164855957031, 16.378862380981445, 16.946561813354492, 17.514259338378906]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 7.0, 10.0, 17.0, 16.0, 21.0, 30.0, 27.0, 25.0, 38.0, 37.0, 33.0, 35.0, 50.0, 46.0, 42.0, 51.0, 52.0, 48.0, 41.0, 51.0, 44.0, 35.0, 40.0, 28.0, 28.0, 17.0, 26.0, 25.0, 13.0, 13.0, 9.0, 9.0, 11.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6640625, -2.5810546875, -2.498046875, -2.4150390625, -2.33203125, -2.2490234375, -2.166015625, -2.0830078125, -2.0, -1.9169921875, -1.833984375, -1.7509765625, -1.66796875, -1.5849609375, -1.501953125, -1.4189453125, -1.3359375, -1.2529296875, -1.169921875, -1.0869140625, -1.00390625, -0.9208984375, -0.837890625, -0.7548828125, -0.671875, -0.5888671875, -0.505859375, -0.4228515625, -0.33984375, -0.2568359375, -0.173828125, -0.0908203125, -0.0078125, 0.0751953125, 0.158203125, 0.2412109375, 0.32421875, 0.4072265625, 0.490234375, 0.5732421875, 0.65625, 0.7392578125, 0.822265625, 0.9052734375, 0.98828125, 1.0712890625, 1.154296875, 1.2373046875, 1.3203125, 1.4033203125, 1.486328125, 1.5693359375, 1.65234375, 1.7353515625, 1.818359375, 1.9013671875, 1.984375, 2.0673828125, 2.150390625, 2.2333984375, 2.31640625, 2.3994140625, 2.482421875, 2.5654296875, 2.6484375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 6.0, 9.0, 25.0, 14.0, 29.0, 34.0, 49.0, 66.0, 119.0, 142.0, 164.0, 293.0, 414.0, 632.0, 877.0, 1425.0, 2107.0, 3112.0, 4838.0, 7586.0, 12094.0, 19812.0, 32876.0, 55878.0, 101938.0, 232302.0, 293508.0, 118153.0, 63588.0, 36996.0, 21988.0, 13608.0, 8289.0, 5222.0, 3469.0, 2235.0, 1491.0, 952.0, 682.0, 468.0, 317.0, 207.0, 163.0, 111.0, 79.0, 53.0, 43.0, 29.0, 13.0, 24.0, 15.0, 8.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.02001953125, -0.019396066665649414, -0.018772602081298828, -0.018149137496948242, -0.017525672912597656, -0.01690220832824707, -0.016278743743896484, -0.0156552791595459, -0.015031814575195312, -0.014408349990844727, -0.01378488540649414, -0.013161420822143555, -0.012537956237792969, -0.011914491653442383, -0.011291027069091797, -0.010667562484741211, -0.010044097900390625, -0.009420633316040039, -0.008797168731689453, -0.008173704147338867, -0.007550239562988281, -0.006926774978637695, -0.006303310394287109, -0.0056798458099365234, -0.0050563812255859375, -0.0044329166412353516, -0.0038094520568847656, -0.0031859874725341797, -0.0025625228881835938, -0.0019390583038330078, -0.0013155937194824219, -0.0006921291351318359, -6.866455078125e-05, 0.0005548000335693359, 0.0011782646179199219, 0.0018017292022705078, 0.0024251937866210938, 0.0030486583709716797, 0.0036721229553222656, 0.0042955875396728516, 0.0049190521240234375, 0.0055425167083740234, 0.006165981292724609, 0.006789445877075195, 0.007412910461425781, 0.008036375045776367, 0.008659839630126953, 0.009283304214477539, 0.009906768798828125, 0.010530233383178711, 0.011153697967529297, 0.011777162551879883, 0.012400627136230469, 0.013024091720581055, 0.01364755630493164, 0.014271020889282227, 0.014894485473632812, 0.015517950057983398, 0.016141414642333984, 0.01676487922668457, 0.017388343811035156, 0.018011808395385742, 0.018635272979736328, 0.019258737564086914, 0.0198822021484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 4.0, 4.0, 6.0, 9.0, 13.0, 15.0, 22.0, 28.0, 22.0, 29.0, 23.0, 31.0, 44.0, 37.0, 40.0, 50.0, 43.0, 44.0, 37.0, 1069.0, 43.0, 53.0, 39.0, 38.0, 42.0, 44.0, 20.0, 34.0, 26.0, 28.0, 21.0, 6.0, 14.0, 7.0, 7.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3779296875, -1.32696533203125, -1.2760009765625, -1.22503662109375, -1.174072265625, -1.12310791015625, -1.0721435546875, -1.02117919921875, -0.97021484375, -0.91925048828125, -0.8682861328125, -0.81732177734375, -0.766357421875, -0.71539306640625, -0.6644287109375, -0.61346435546875, -0.5625, -0.51153564453125, -0.4605712890625, -0.40960693359375, -0.358642578125, -0.30767822265625, -0.2567138671875, -0.20574951171875, -0.15478515625, -0.10382080078125, -0.0528564453125, -0.00189208984375, 0.049072265625, 0.10003662109375, 0.1510009765625, 0.20196533203125, 0.2529296875, 0.30389404296875, 0.3548583984375, 0.40582275390625, 0.456787109375, 0.50775146484375, 0.5587158203125, 0.60968017578125, 0.66064453125, 0.71160888671875, 0.7625732421875, 0.81353759765625, 0.864501953125, 0.91546630859375, 0.9664306640625, 1.01739501953125, 1.068359375, 1.11932373046875, 1.1702880859375, 1.22125244140625, 1.272216796875, 1.32318115234375, 1.3741455078125, 1.42510986328125, 1.47607421875, 1.52703857421875, 1.5780029296875, 1.62896728515625, 1.679931640625, 1.73089599609375, 1.7818603515625, 1.83282470703125, 1.8837890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 9.0, 3.0, 13.0, 21.0, 32.0, 35.0, 55.0, 94.0, 149.0, 203.0, 280.0, 462.0, 685.0, 974.0, 1474.0, 2337.0, 3486.0, 5437.0, 8232.0, 12662.0, 20282.0, 33234.0, 57280.0, 106454.0, 246058.0, 1322908.0, 117375.0, 61588.0, 35691.0, 21417.0, 13350.0, 8629.0, 5569.0, 3587.0, 2307.0, 1574.0, 1052.0, 712.0, 450.0, 330.0, 212.0, 139.0, 88.0, 60.0, 47.0, 32.0, 16.0, 12.0, 12.0, 14.0, 3.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.0137176513671875, -0.013302803039550781, -0.012887954711914062, -0.012473106384277344, -0.012058258056640625, -0.011643409729003906, -0.011228561401367188, -0.010813713073730469, -0.01039886474609375, -0.009984016418457031, -0.009569168090820312, -0.009154319763183594, -0.008739471435546875, -0.008324623107910156, -0.007909774780273438, -0.007494926452636719, -0.007080078125, -0.006665229797363281, -0.0062503814697265625, -0.005835533142089844, -0.005420684814453125, -0.005005836486816406, -0.0045909881591796875, -0.004176139831542969, -0.00376129150390625, -0.0033464431762695312, -0.0029315948486328125, -0.0025167465209960938, -0.002101898193359375, -0.0016870498657226562, -0.0012722015380859375, -0.0008573532104492188, -0.0004425048828125, -2.765655517578125e-05, 0.0003871917724609375, 0.0008020401000976562, 0.001216888427734375, 0.0016317367553710938, 0.0020465850830078125, 0.0024614334106445312, 0.00287628173828125, 0.0032911300659179688, 0.0037059783935546875, 0.004120826721191406, 0.004535675048828125, 0.004950523376464844, 0.0053653717041015625, 0.005780220031738281, 0.006195068359375, 0.006609916687011719, 0.0070247650146484375, 0.007439613342285156, 0.007854461669921875, 0.008269309997558594, 0.008684158325195312, 0.009099006652832031, 0.00951385498046875, 0.009928703308105469, 0.010343551635742188, 0.010758399963378906, 0.011173248291015625, 0.011588096618652344, 0.012002944946289062, 0.012417793273925781, 0.0128326416015625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.0, 0.0, 0.0, 0.0, 0.0, 0.0, 812.0, 0.0, 0.0, 0.0, 0.0, 0.0, 80.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4831464290618896e-07, -3.390014171600342e-07, -3.296881914138794e-07, -3.203749656677246e-07, -3.110617399215698e-07, -3.0174851417541504e-07, -2.9243528842926025e-07, -2.8312206268310547e-07, -2.738088369369507e-07, -2.644956111907959e-07, -2.551823854446411e-07, -2.4586915969848633e-07, -2.3655593395233154e-07, -2.2724270820617676e-07, -2.1792948246002197e-07, -2.086162567138672e-07, -1.993030309677124e-07, -1.8998980522155762e-07, -1.8067657947540283e-07, -1.7136335372924805e-07, -1.6205012798309326e-07, -1.5273690223693848e-07, -1.434236764907837e-07, -1.341104507446289e-07, -1.2479722499847412e-07, -1.1548399925231934e-07, -1.0617077350616455e-07, -9.685754776000977e-08, -8.754432201385498e-08, -7.82310962677002e-08, -6.891787052154541e-08, -5.960464477539063e-08, -5.029141902923584e-08, -4.0978193283081055e-08, -3.166496753692627e-08, -2.2351741790771484e-08, -1.30385160446167e-08, -3.725290298461914e-09, 5.587935447692871e-09, 1.4901161193847656e-08, 2.421438694000244e-08, 3.3527612686157227e-08, 4.284083843231201e-08, 5.21540641784668e-08, 6.146728992462158e-08, 7.078051567077637e-08, 8.009374141693115e-08, 8.940696716308594e-08, 9.872019290924072e-08, 1.0803341865539551e-07, 1.1734664440155029e-07, 1.2665987014770508e-07, 1.3597309589385986e-07, 1.4528632164001465e-07, 1.5459954738616943e-07, 1.6391277313232422e-07, 1.73225998878479e-07, 1.825392246246338e-07, 1.9185245037078857e-07, 2.0116567611694336e-07, 2.1047890186309814e-07, 2.1979212760925293e-07, 2.2910535335540771e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 10.0, 6.0, 2.0, 3.0, 4.0, 5.0, 17.0, 67.0, 29.0, 40.0, 255.0, 900.0, 68758.0, 974617.0, 3147.0, 496.0, 57.0, 28.0, 66.0, 16.0, 18.0, 3.0, 1.0, 1.0, 6.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.993511199951172e-06, -3.8351863622665405e-06, -3.676861524581909e-06, -3.518536686897278e-06, -3.3602118492126465e-06, -3.201887011528015e-06, -3.043562173843384e-06, -2.8852373361587524e-06, -2.726912498474121e-06, -2.5685876607894897e-06, -2.4102628231048584e-06, -2.251937985420227e-06, -2.0936131477355957e-06, -1.9352883100509644e-06, -1.776963472366333e-06, -1.6186386346817017e-06, -1.4603137969970703e-06, -1.301988959312439e-06, -1.1436641216278076e-06, -9.853392839431763e-07, -8.270144462585449e-07, -6.686896085739136e-07, -5.103647708892822e-07, -3.520399332046509e-07, -1.9371509552001953e-07, -3.5390257835388184e-08, 1.2293457984924316e-07, 2.812594175338745e-07, 4.3958425521850586e-07, 5.979090929031372e-07, 7.562339305877686e-07, 9.145587682723999e-07, 1.0728836059570312e-06, 1.2312084436416626e-06, 1.389533281326294e-06, 1.5478581190109253e-06, 1.7061829566955566e-06, 1.864507794380188e-06, 2.0228326320648193e-06, 2.1811574697494507e-06, 2.339482307434082e-06, 2.4978071451187134e-06, 2.6561319828033447e-06, 2.814456820487976e-06, 2.9727816581726074e-06, 3.1311064958572388e-06, 3.28943133354187e-06, 3.4477561712265015e-06, 3.606081008911133e-06, 3.764405846595764e-06, 3.9227306842803955e-06, 4.081055521965027e-06, 4.239380359649658e-06, 4.3977051973342896e-06, 4.556030035018921e-06, 4.714354872703552e-06, 4.872679710388184e-06, 5.031004548072815e-06, 5.189329385757446e-06, 5.347654223442078e-06, 5.505979061126709e-06, 5.66430389881134e-06, 5.822628736495972e-06, 5.980953574180603e-06, 6.139278411865234e-06]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 973.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9522666150351142e-07, -1.9050148125643318e-07, -1.8577630100935494e-07, -1.810511349731314e-07, -1.7632595472605317e-07, -1.7160077447897493e-07, -1.6687559423189668e-07, -1.6215041398481844e-07, -1.574252337377402e-07, -1.5270005349066196e-07, -1.4797487324358372e-07, -1.432497072073602e-07, -1.3852452696028195e-07, -1.337993467132037e-07, -1.2907416646612546e-07, -1.2434898621904722e-07, -1.196238201828237e-07, -1.1489863993574545e-07, -1.1017346679409457e-07, -1.0544828654701632e-07, -1.0072311340536544e-07, -9.59979331582872e-08, -9.127275291120895e-08, -8.654757266413071e-08, -8.182239952247983e-08, -7.709721927540159e-08, -7.23720461337507e-08, -6.764686588667246e-08, -6.292168563959422e-08, -5.819651249794333e-08, -5.347133225086509e-08, -4.8746155556500526e-08, -4.402099307299068e-08, -3.9295816378626114e-08, -3.457063968426155e-08, -2.984545943718331e-08, -2.5120282742818745e-08, -2.039510604845418e-08, -1.566992757773278e-08, -1.0944749107011376e-08, -6.219572412646812e-09, -1.494394830103829e-09, 3.230782752439154e-09, 7.955960334982137e-09, 1.268113791752512e-08, 1.7406314611889684e-08, 2.2131493082611087e-08, 2.685667155333249e-08, 3.158184824769705e-08, 3.6307024942061616e-08, 4.103220163642618e-08, 4.575738188350442e-08, 5.0482558577868986e-08, 5.520773527223355e-08, 5.993291551931179e-08, 6.465809576639003e-08, 6.938326890804092e-08, 7.410844915511916e-08, 7.883362229677005e-08, 8.355880254384829e-08, 8.828398279092653e-08, 9.300915593257741e-08, 9.773433617965566e-08, 1.0245950932130654e-07, 1.0718468956838478e-07]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 973.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 7.0, 10.0, 17.0, 16.0, 21.0, 30.0, 27.0, 25.0, 38.0, 37.0, 33.0, 35.0, 50.0, 46.0, 42.0, 51.0, 52.0, 48.0, 41.0, 51.0, 44.0, 35.0, 40.0, 28.0, 28.0, 17.0, 26.0, 25.0, 13.0, 13.0, 9.0, 9.0, 11.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6640625, -2.5810546875, -2.498046875, -2.4150390625, -2.33203125, -2.2490234375, -2.166015625, -2.0830078125, -2.0, -1.9169921875, -1.833984375, -1.7509765625, -1.66796875, -1.5849609375, -1.501953125, -1.4189453125, -1.3359375, -1.2529296875, -1.169921875, -1.0869140625, -1.00390625, -0.9208984375, -0.837890625, -0.7548828125, -0.671875, -0.5888671875, -0.505859375, -0.4228515625, -0.33984375, -0.2568359375, -0.173828125, -0.0908203125, -0.0078125, 0.0751953125, 0.158203125, 0.2412109375, 0.32421875, 0.4072265625, 0.490234375, 0.5732421875, 0.65625, 0.7392578125, 0.822265625, 0.9052734375, 0.98828125, 1.0712890625, 1.154296875, 1.2373046875, 1.3203125, 1.4033203125, 1.486328125, 1.5693359375, 1.65234375, 1.7353515625, 1.818359375, 1.9013671875, 1.984375, 2.0673828125, 2.150390625, 2.2333984375, 2.31640625, 2.3994140625, 2.482421875, 2.5654296875, 2.6484375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 10.0, 26.0, 35.0, 63.0, 141.0, 235.0, 445.0, 894.0, 1849.0, 3688.0, 7474.0, 16973.0, 39253.0, 99249.0, 327746.0, 365186.0, 108658.0, 42687.0, 17966.0, 8130.0, 3850.0, 1936.0, 984.0, 526.0, 256.0, 139.0, 82.0, 42.0, 10.0, 12.0, 3.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.381317138671875, -3.27239990234375, -3.163482666015625, -3.0545654296875, -2.945648193359375, -2.83673095703125, -2.727813720703125, -2.618896484375, -2.509979248046875, -2.40106201171875, -2.292144775390625, -2.1832275390625, -2.074310302734375, -1.96539306640625, -1.856475830078125, -1.74755859375, -1.638641357421875, -1.52972412109375, -1.420806884765625, -1.3118896484375, -1.202972412109375, -1.09405517578125, -0.985137939453125, -0.876220703125, -0.767303466796875, -0.65838623046875, -0.549468994140625, -0.4405517578125, -0.331634521484375, -0.22271728515625, -0.113800048828125, -0.0048828125, 0.104034423828125, 0.21295166015625, 0.321868896484375, 0.4307861328125, 0.539703369140625, 0.64862060546875, 0.757537841796875, 0.866455078125, 0.975372314453125, 1.08428955078125, 1.193206787109375, 1.3021240234375, 1.411041259765625, 1.51995849609375, 1.628875732421875, 1.73779296875, 1.846710205078125, 1.95562744140625, 2.064544677734375, 2.1734619140625, 2.282379150390625, 2.39129638671875, 2.500213623046875, 2.609130859375, 2.718048095703125, 2.82696533203125, 2.935882568359375, 3.0447998046875, 3.153717041015625, 3.26263427734375, 3.371551513671875, 3.48046875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 5.0, 1.0, 8.0, 15.0, 17.0, 19.0, 25.0, 30.0, 24.0, 35.0, 30.0, 44.0, 62.0, 78.0, 128.0, 234.0, 1576.0, 227.0, 108.0, 77.0, 47.0, 44.0, 43.0, 41.0, 32.0, 23.0, 15.0, 12.0, 9.0, 12.0, 4.0, 9.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.5220947265625, -10.177001953125, -9.8319091796875, -9.48681640625, -9.1417236328125, -8.796630859375, -8.4515380859375, -8.1064453125, -7.7613525390625, -7.416259765625, -7.0711669921875, -6.72607421875, -6.3809814453125, -6.035888671875, -5.6907958984375, -5.345703125, -5.0006103515625, -4.655517578125, -4.3104248046875, -3.96533203125, -3.6202392578125, -3.275146484375, -2.9300537109375, -2.5849609375, -2.2398681640625, -1.894775390625, -1.5496826171875, -1.20458984375, -0.8594970703125, -0.514404296875, -0.1693115234375, 0.17578125, 0.5208740234375, 0.865966796875, 1.2110595703125, 1.55615234375, 1.9012451171875, 2.246337890625, 2.5914306640625, 2.9365234375, 3.2816162109375, 3.626708984375, 3.9718017578125, 4.31689453125, 4.6619873046875, 5.007080078125, 5.3521728515625, 5.697265625, 6.0423583984375, 6.387451171875, 6.7325439453125, 7.07763671875, 7.4227294921875, 7.767822265625, 8.1129150390625, 8.4580078125, 8.8031005859375, 9.148193359375, 9.4932861328125, 9.83837890625, 10.1834716796875, 10.528564453125, 10.8736572265625, 11.21875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 7.0, 10.0, 11.0, 16.0, 14.0, 18.0, 43.0, 47.0, 66.0, 101.0, 121.0, 194.0, 340.0, 974.0, 6166.0, 832190.0, 2293590.0, 9472.0, 1216.0, 377.0, 201.0, 155.0, 105.0, 64.0, 63.0, 34.0, 33.0, 24.0, 12.0, 13.0, 6.0, 2.0, 7.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -21.01123046875, -20.3349609375, -19.65869140625, -18.982421875, -18.30615234375, -17.6298828125, -16.95361328125, -16.27734375, -15.60107421875, -14.9248046875, -14.24853515625, -13.572265625, -12.89599609375, -12.2197265625, -11.54345703125, -10.8671875, -10.19091796875, -9.5146484375, -8.83837890625, -8.162109375, -7.48583984375, -6.8095703125, -6.13330078125, -5.45703125, -4.78076171875, -4.1044921875, -3.42822265625, -2.751953125, -2.07568359375, -1.3994140625, -0.72314453125, -0.046875, 0.62939453125, 1.3056640625, 1.98193359375, 2.658203125, 3.33447265625, 4.0107421875, 4.68701171875, 5.36328125, 6.03955078125, 6.7158203125, 7.39208984375, 8.068359375, 8.74462890625, 9.4208984375, 10.09716796875, 10.7734375, 11.44970703125, 12.1259765625, 12.80224609375, 13.478515625, 14.15478515625, 14.8310546875, 15.50732421875, 16.18359375, 16.85986328125, 17.5361328125, 18.21240234375, 18.888671875, 19.56494140625, 20.2412109375, 20.91748046875, 21.59375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 16.0, 37.0, 64.0, 107.0, 135.0, 144.0, 151.0, 129.0, 82.0, 63.0, 36.0, 12.0, 7.0, 6.0, 1.0, 6.0, 1.0, 0.0, 2.0], "bins": [-33.42950439453125, -32.77307891845703, -32.11665344238281, -31.46022605895996, -30.803800582885742, -30.147375106811523, -29.490949630737305, -28.834524154663086, -28.178096771240234, -27.521671295166016, -26.865245819091797, -26.208818435668945, -25.552392959594727, -24.895967483520508, -24.23954200744629, -23.58311653137207, -22.92669105529785, -22.270265579223633, -21.613840103149414, -20.957412719726562, -20.300987243652344, -19.644561767578125, -18.988136291503906, -18.331710815429688, -17.67528533935547, -17.01885986328125, -16.36243438720703, -15.706007957458496, -15.049581527709961, -14.393156051635742, -13.736730575561523, -13.080305099487305, -12.423877716064453, -11.767452239990234, -11.1110258102417, -10.45460033416748, -9.798173904418945, -9.141748428344727, -8.485322952270508, -7.828896999359131, -7.172471046447754, -6.516045093536377, -5.859619140625, -5.203193664550781, -4.546767711639404, -3.8903417587280273, -3.2339160442352295, -2.5774903297424316, -1.9210643768310547, -1.2646385431289673, -0.6082127094268799, 0.04821312427520752, 0.7046389579772949, 1.3610649108886719, 2.0174906253814697, 2.6739163398742676, 3.3303422927856445, 3.9867682456970215, 4.643194198608398, 5.299619674682617, 5.956045627593994, 6.612471580505371, 7.26889705657959, 7.925323009490967, 8.581748962402344]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 6.0, 9.0, 7.0, 19.0, 12.0, 20.0, 15.0, 19.0, 18.0, 21.0, 26.0, 30.0, 23.0, 29.0, 25.0, 36.0, 38.0, 42.0, 40.0, 41.0, 41.0, 39.0, 40.0, 38.0, 39.0, 28.0, 32.0, 32.0, 27.0, 31.0, 15.0, 24.0, 19.0, 20.0, 22.0, 13.0, 7.0, 6.0, 16.0, 12.0, 5.0, 7.0, 3.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.224117279052734, -17.59691047668457, -16.969703674316406, -16.342496871948242, -15.715290069580078, -15.088083267211914, -14.46087646484375, -13.833669662475586, -13.206462860107422, -12.579256057739258, -11.952049255371094, -11.32484245300293, -10.697635650634766, -10.070428848266602, -9.443222045898438, -8.816015243530273, -8.18880844116211, -7.561601638793945, -6.934394836425781, -6.307188034057617, -5.679981231689453, -5.052774429321289, -4.425567626953125, -3.798360824584961, -3.171154022216797, -2.543947219848633, -1.9167404174804688, -1.2895336151123047, -0.6623268127441406, -0.03512001037597656, 0.5920867919921875, 1.2192935943603516, 1.8464984893798828, 2.473705291748047, 3.100912094116211, 3.728118896484375, 4.355325698852539, 4.982532501220703, 5.609739303588867, 6.236946105957031, 6.864152908325195, 7.491359710693359, 8.118566513061523, 8.745773315429688, 9.372980117797852, 10.000186920166016, 10.62739372253418, 11.254600524902344, 11.881807327270508, 12.509014129638672, 13.136220932006836, 13.763427734375, 14.390634536743164, 15.017841339111328, 15.645048141479492, 16.272254943847656, 16.89946174621582, 17.526668548583984, 18.15387535095215, 18.781082153320312, 19.408288955688477, 20.03549575805664, 20.662702560424805, 21.28990936279297, 21.917116165161133]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 9.0, 12.0, 16.0, 20.0, 28.0, 19.0, 28.0, 34.0, 35.0, 37.0, 38.0, 36.0, 44.0, 39.0, 55.0, 35.0, 66.0, 56.0, 45.0, 35.0, 34.0, 38.0, 37.0, 36.0, 25.0, 26.0, 17.0, 10.0, 17.0, 12.0, 12.0, 8.0, 10.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.818359375, -2.732177734375, -2.64599609375, -2.559814453125, -2.4736328125, -2.387451171875, -2.30126953125, -2.215087890625, -2.12890625, -2.042724609375, -1.95654296875, -1.870361328125, -1.7841796875, -1.697998046875, -1.61181640625, -1.525634765625, -1.439453125, -1.353271484375, -1.26708984375, -1.180908203125, -1.0947265625, -1.008544921875, -0.92236328125, -0.836181640625, -0.75, -0.663818359375, -0.57763671875, -0.491455078125, -0.4052734375, -0.319091796875, -0.23291015625, -0.146728515625, -0.060546875, 0.025634765625, 0.11181640625, 0.197998046875, 0.2841796875, 0.370361328125, 0.45654296875, 0.542724609375, 0.62890625, 0.715087890625, 0.80126953125, 0.887451171875, 0.9736328125, 1.059814453125, 1.14599609375, 1.232177734375, 1.318359375, 1.404541015625, 1.49072265625, 1.576904296875, 1.6630859375, 1.749267578125, 1.83544921875, 1.921630859375, 2.0078125, 2.093994140625, 2.18017578125, 2.266357421875, 2.3525390625, 2.438720703125, 2.52490234375, 2.611083984375, 2.697265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 12.0, 6.0, 10.0, 9.0, 21.0, 18.0, 28.0, 28.0, 32.0, 48.0, 89.0, 179.0, 489.0, 1966.0, 9438.0, 63260.0, 636276.0, 2871181.0, 544889.0, 55010.0, 8555.0, 1774.0, 515.0, 148.0, 71.0, 40.0, 36.0, 19.0, 25.0, 19.0, 17.0, 13.0, 8.0, 10.0, 8.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.640625, -8.37451171875, -8.1083984375, -7.84228515625, -7.576171875, -7.31005859375, -7.0439453125, -6.77783203125, -6.51171875, -6.24560546875, -5.9794921875, -5.71337890625, -5.447265625, -5.18115234375, -4.9150390625, -4.64892578125, -4.3828125, -4.11669921875, -3.8505859375, -3.58447265625, -3.318359375, -3.05224609375, -2.7861328125, -2.52001953125, -2.25390625, -1.98779296875, -1.7216796875, -1.45556640625, -1.189453125, -0.92333984375, -0.6572265625, -0.39111328125, -0.125, 0.14111328125, 0.4072265625, 0.67333984375, 0.939453125, 1.20556640625, 1.4716796875, 1.73779296875, 2.00390625, 2.27001953125, 2.5361328125, 2.80224609375, 3.068359375, 3.33447265625, 3.6005859375, 3.86669921875, 4.1328125, 4.39892578125, 4.6650390625, 4.93115234375, 5.197265625, 5.46337890625, 5.7294921875, 5.99560546875, 6.26171875, 6.52783203125, 6.7939453125, 7.06005859375, 7.326171875, 7.59228515625, 7.8583984375, 8.12451171875, 8.390625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 9.0, 10.0, 8.0, 23.0, 14.0, 34.0, 45.0, 49.0, 65.0, 94.0, 131.0, 149.0, 197.0, 204.0, 303.0, 356.0, 412.0, 373.0, 364.0, 276.0, 211.0, 179.0, 138.0, 114.0, 81.0, 52.0, 47.0, 43.0, 30.0, 19.0, 11.0, 12.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.27734375, -6.1156005859375, -5.953857421875, -5.7921142578125, -5.63037109375, -5.4686279296875, -5.306884765625, -5.1451416015625, -4.9833984375, -4.8216552734375, -4.659912109375, -4.4981689453125, -4.33642578125, -4.1746826171875, -4.012939453125, -3.8511962890625, -3.689453125, -3.5277099609375, -3.365966796875, -3.2042236328125, -3.04248046875, -2.8807373046875, -2.718994140625, -2.5572509765625, -2.3955078125, -2.2337646484375, -2.072021484375, -1.9102783203125, -1.74853515625, -1.5867919921875, -1.425048828125, -1.2633056640625, -1.1015625, -0.9398193359375, -0.778076171875, -0.6163330078125, -0.45458984375, -0.2928466796875, -0.131103515625, 0.0306396484375, 0.1923828125, 0.3541259765625, 0.515869140625, 0.6776123046875, 0.83935546875, 1.0010986328125, 1.162841796875, 1.3245849609375, 1.486328125, 1.6480712890625, 1.809814453125, 1.9715576171875, 2.13330078125, 2.2950439453125, 2.456787109375, 2.6185302734375, 2.7802734375, 2.9420166015625, 3.103759765625, 3.2655029296875, 3.42724609375, 3.5889892578125, 3.750732421875, 3.9124755859375, 4.07421875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 18.0, 27.0, 41.0, 54.0, 97.0, 130.0, 228.0, 383.0, 1003.0, 5052.0, 61978.0, 1284479.0, 2671432.0, 156596.0, 10017.0, 1524.0, 514.0, 230.0, 168.0, 85.0, 67.0, 48.0, 36.0, 19.0, 19.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1328125, -14.6622314453125, -14.191650390625, -13.7210693359375, -13.25048828125, -12.7799072265625, -12.309326171875, -11.8387451171875, -11.3681640625, -10.8975830078125, -10.427001953125, -9.9564208984375, -9.48583984375, -9.0152587890625, -8.544677734375, -8.0740966796875, -7.603515625, -7.1329345703125, -6.662353515625, -6.1917724609375, -5.72119140625, -5.2506103515625, -4.780029296875, -4.3094482421875, -3.8388671875, -3.3682861328125, -2.897705078125, -2.4271240234375, -1.95654296875, -1.4859619140625, -1.015380859375, -0.5447998046875, -0.07421875, 0.3963623046875, 0.866943359375, 1.3375244140625, 1.80810546875, 2.2786865234375, 2.749267578125, 3.2198486328125, 3.6904296875, 4.1610107421875, 4.631591796875, 5.1021728515625, 5.57275390625, 6.0433349609375, 6.513916015625, 6.9844970703125, 7.455078125, 7.9256591796875, 8.396240234375, 8.8668212890625, 9.33740234375, 9.8079833984375, 10.278564453125, 10.7491455078125, 11.2197265625, 11.6903076171875, 12.160888671875, 12.6314697265625, 13.10205078125, 13.5726318359375, 14.043212890625, 14.5137939453125, 14.984375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [2.0, 9.0, 16.0, 66.0, 139.0, 244.0, 254.0, 189.0, 68.0, 26.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.429969787597656, -13.760418891906738, -11.09086799621582, -8.421317100524902, -5.751766204833984, -3.0822153091430664, -0.41266441345214844, 2.256885528564453, 4.9264373779296875, 7.5959882736206055, 10.265539169311523, 12.935090065002441, 15.60464096069336, 18.274192810058594, 20.943742752075195, 23.613292694091797, 26.28284454345703, 28.952396392822266, 31.621946334838867, 34.29149627685547, 36.9610481262207, 39.63059997558594, 42.300148010253906, 44.96969985961914, 47.639251708984375, 50.30880355834961, 52.978355407714844, 55.64790344238281, 58.31745529174805, 60.98700714111328, 63.65655517578125, 66.32611083984375, 68.99565124511719, 71.66519927978516, 74.33475494384766, 77.00430297851562, 79.67385864257812, 82.3434066772461, 85.01295471191406, 87.68251037597656, 90.35205841064453, 93.0216064453125, 95.691162109375, 98.36071014404297, 101.03025817871094, 103.69981384277344, 106.3693618774414, 109.03890991210938, 111.70846557617188, 114.37801361083984, 117.04756927490234, 119.71711730957031, 122.38667297363281, 125.05622100830078, 127.72576904296875, 130.39532470703125, 133.06488037109375, 135.73443603515625, 138.4039764404297, 141.0735321044922, 143.7430877685547, 146.41262817382812, 149.08218383789062, 151.75173950195312, 154.42127990722656]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 9.0, 6.0, 13.0, 9.0, 9.0, 19.0, 23.0, 25.0, 27.0, 22.0, 22.0, 29.0, 23.0, 39.0, 29.0, 27.0, 43.0, 38.0, 35.0, 42.0, 48.0, 38.0, 33.0, 46.0, 31.0, 33.0, 27.0, 23.0, 31.0, 23.0, 27.0, 25.0, 12.0, 17.0, 9.0, 12.0, 14.0, 8.0, 9.0, 9.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-17.674179077148438, -17.130205154418945, -16.586231231689453, -16.04225730895996, -15.498283386230469, -14.954309463500977, -14.410335540771484, -13.866361618041992, -13.3223876953125, -12.778413772583008, -12.234439849853516, -11.690465927124023, -11.146492004394531, -10.602518081665039, -10.058544158935547, -9.514570236206055, -8.970596313476562, -8.42662239074707, -7.882648468017578, -7.338674545288086, -6.794700622558594, -6.250726699829102, -5.706752777099609, -5.162778854370117, -4.618804931640625, -4.074831008911133, -3.5308570861816406, -2.9868831634521484, -2.4429092407226562, -1.898935317993164, -1.3549613952636719, -0.8109874725341797, -0.2670135498046875, 0.2769603729248047, 0.8209342956542969, 1.364908218383789, 1.9088821411132812, 2.4528560638427734, 2.9968299865722656, 3.540803909301758, 4.08477783203125, 4.628751754760742, 5.172725677490234, 5.716699600219727, 6.260673522949219, 6.804647445678711, 7.348621368408203, 7.892595291137695, 8.436569213867188, 8.98054313659668, 9.524517059326172, 10.068490982055664, 10.612464904785156, 11.156438827514648, 11.70041275024414, 12.244386672973633, 12.788360595703125, 13.332334518432617, 13.87630844116211, 14.420282363891602, 14.964256286621094, 15.508230209350586, 16.052204132080078, 16.59617805480957, 17.140151977539062]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 13.0, 14.0, 20.0, 15.0, 37.0, 26.0, 31.0, 39.0, 35.0, 31.0, 55.0, 41.0, 42.0, 50.0, 46.0, 41.0, 41.0, 47.0, 52.0, 35.0, 45.0, 29.0, 33.0, 20.0, 20.0, 32.0, 12.0, 24.0, 12.0, 12.0, 7.0, 4.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.828125, -2.742156982421875, -2.65618896484375, -2.570220947265625, -2.4842529296875, -2.398284912109375, -2.31231689453125, -2.226348876953125, -2.140380859375, -2.054412841796875, -1.96844482421875, -1.882476806640625, -1.7965087890625, -1.710540771484375, -1.62457275390625, -1.538604736328125, -1.45263671875, -1.366668701171875, -1.28070068359375, -1.194732666015625, -1.1087646484375, -1.022796630859375, -0.93682861328125, -0.850860595703125, -0.764892578125, -0.678924560546875, -0.59295654296875, -0.506988525390625, -0.4210205078125, -0.335052490234375, -0.24908447265625, -0.163116455078125, -0.0771484375, 0.008819580078125, 0.09478759765625, 0.180755615234375, 0.2667236328125, 0.352691650390625, 0.43865966796875, 0.524627685546875, 0.610595703125, 0.696563720703125, 0.78253173828125, 0.868499755859375, 0.9544677734375, 1.040435791015625, 1.12640380859375, 1.212371826171875, 1.29833984375, 1.384307861328125, 1.47027587890625, 1.556243896484375, 1.6422119140625, 1.728179931640625, 1.81414794921875, 1.900115966796875, 1.986083984375, 2.072052001953125, 2.15802001953125, 2.243988037109375, 2.3299560546875, 2.415924072265625, 2.50189208984375, 2.587860107421875, 2.673828125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 12.0, 14.0, 26.0, 43.0, 52.0, 89.0, 99.0, 154.0, 227.0, 328.0, 525.0, 691.0, 1148.0, 1778.0, 2765.0, 4313.0, 7034.0, 11362.0, 19289.0, 32843.0, 57928.0, 108862.0, 261298.0, 278642.0, 113530.0, 59656.0, 34210.0, 19776.0, 11999.0, 7216.0, 4590.0, 2780.0, 1867.0, 1149.0, 726.0, 505.0, 323.0, 239.0, 137.0, 106.0, 63.0, 45.0, 28.0, 24.0, 18.0, 14.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0209808349609375, -0.02030467987060547, -0.019628524780273438, -0.018952369689941406, -0.018276214599609375, -0.017600059509277344, -0.016923904418945312, -0.01624774932861328, -0.01557159423828125, -0.014895439147949219, -0.014219284057617188, -0.013543128967285156, -0.012866973876953125, -0.012190818786621094, -0.011514663696289062, -0.010838508605957031, -0.010162353515625, -0.009486198425292969, -0.008810043334960938, -0.008133888244628906, -0.007457733154296875, -0.006781578063964844, -0.0061054229736328125, -0.005429267883300781, -0.00475311279296875, -0.004076957702636719, -0.0034008026123046875, -0.0027246475219726562, -0.002048492431640625, -0.0013723373413085938, -0.0006961822509765625, -2.002716064453125e-05, 0.0006561279296875, 0.0013322830200195312, 0.0020084381103515625, 0.0026845932006835938, 0.003360748291015625, 0.004036903381347656, 0.0047130584716796875, 0.005389213562011719, 0.00606536865234375, 0.006741523742675781, 0.0074176788330078125, 0.008093833923339844, 0.008769989013671875, 0.009446144104003906, 0.010122299194335938, 0.010798454284667969, 0.011474609375, 0.012150764465332031, 0.012826919555664062, 0.013503074645996094, 0.014179229736328125, 0.014855384826660156, 0.015531539916992188, 0.01620769500732422, 0.01688385009765625, 0.01756000518798828, 0.018236160278320312, 0.018912315368652344, 0.019588470458984375, 0.020264625549316406, 0.020940780639648438, 0.02161693572998047, 0.0222930908203125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 10.0, 5.0, 12.0, 7.0, 14.0, 20.0, 15.0, 26.0, 20.0, 27.0, 37.0, 24.0, 29.0, 21.0, 48.0, 38.0, 37.0, 32.0, 34.0, 45.0, 1065.0, 41.0, 36.0, 40.0, 27.0, 35.0, 24.0, 27.0, 30.0, 30.0, 25.0, 19.0, 19.0, 12.0, 15.0, 8.0, 14.0, 10.0, 6.0, 7.0, 4.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.4775390625, -1.43023681640625, -1.3829345703125, -1.33563232421875, -1.288330078125, -1.24102783203125, -1.1937255859375, -1.14642333984375, -1.09912109375, -1.05181884765625, -1.0045166015625, -0.95721435546875, -0.909912109375, -0.86260986328125, -0.8153076171875, -0.76800537109375, -0.720703125, -0.67340087890625, -0.6260986328125, -0.57879638671875, -0.531494140625, -0.48419189453125, -0.4368896484375, -0.38958740234375, -0.34228515625, -0.29498291015625, -0.2476806640625, -0.20037841796875, -0.153076171875, -0.10577392578125, -0.0584716796875, -0.01116943359375, 0.0361328125, 0.08343505859375, 0.1307373046875, 0.17803955078125, 0.225341796875, 0.27264404296875, 0.3199462890625, 0.36724853515625, 0.41455078125, 0.46185302734375, 0.5091552734375, 0.55645751953125, 0.603759765625, 0.65106201171875, 0.6983642578125, 0.74566650390625, 0.79296875, 0.84027099609375, 0.8875732421875, 0.93487548828125, 0.982177734375, 1.02947998046875, 1.0767822265625, 1.12408447265625, 1.17138671875, 1.21868896484375, 1.2659912109375, 1.31329345703125, 1.360595703125, 1.40789794921875, 1.4552001953125, 1.50250244140625, 1.5498046875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 8.0, 7.0, 13.0, 25.0, 25.0, 55.0, 71.0, 95.0, 143.0, 187.0, 274.0, 375.0, 557.0, 739.0, 985.0, 1349.0, 1843.0, 2502.0, 3502.0, 4734.0, 6570.0, 9106.0, 12695.0, 18057.0, 25789.0, 38290.0, 57819.0, 94009.0, 185691.0, 1291227.0, 121786.0, 70266.0, 45189.0, 30191.0, 20568.0, 14659.0, 10446.0, 7421.0, 5413.0, 3771.0, 2844.0, 2101.0, 1554.0, 1126.0, 839.0, 643.0, 449.0, 322.0, 235.0, 178.0, 128.0, 81.0, 65.0, 37.0, 31.0, 26.0, 13.0, 10.0, 7.0, 2.0, 2.0], "bins": [-0.0108795166015625, -0.010541796684265137, -0.010204076766967773, -0.00986635684967041, -0.009528636932373047, -0.009190917015075684, -0.00885319709777832, -0.008515477180480957, -0.008177757263183594, -0.00784003734588623, -0.007502317428588867, -0.007164597511291504, -0.006826877593994141, -0.006489157676696777, -0.006151437759399414, -0.005813717842102051, -0.0054759979248046875, -0.005138278007507324, -0.004800558090209961, -0.004462838172912598, -0.004125118255615234, -0.003787398338317871, -0.003449678421020508, -0.0031119585037231445, -0.0027742385864257812, -0.002436518669128418, -0.0020987987518310547, -0.0017610788345336914, -0.0014233589172363281, -0.0010856389999389648, -0.0007479190826416016, -0.0004101991653442383, -7.2479248046875e-05, 0.0002652406692504883, 0.0006029605865478516, 0.0009406805038452148, 0.0012784004211425781, 0.0016161203384399414, 0.0019538402557373047, 0.002291560173034668, 0.0026292800903320312, 0.0029670000076293945, 0.003304719924926758, 0.003642439842224121, 0.003980159759521484, 0.004317879676818848, 0.004655599594116211, 0.004993319511413574, 0.0053310394287109375, 0.005668759346008301, 0.006006479263305664, 0.006344199180603027, 0.006681919097900391, 0.007019639015197754, 0.007357358932495117, 0.0076950788497924805, 0.008032798767089844, 0.008370518684387207, 0.00870823860168457, 0.009045958518981934, 0.009383678436279297, 0.00972139835357666, 0.010059118270874023, 0.010396838188171387, 0.01073455810546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 105.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 769.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 113.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 10.0, 101.0, 13.0, 20.0, 17.0, 103.0, 426.0, 4010.0, 79906.0, 945116.0, 17174.0, 1221.0, 253.0, 18.0, 13.0, 18.0, 79.0, 22.0, 10.0, 3.0, 1.0, 0.0, 0.0, 2.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.112720489501953e-06, -3.9851292967796326e-06, -3.857538104057312e-06, -3.7299469113349915e-06, -3.602355718612671e-06, -3.4747645258903503e-06, -3.3471733331680298e-06, -3.2195821404457092e-06, -3.0919909477233887e-06, -2.964399755001068e-06, -2.8368085622787476e-06, -2.709217369556427e-06, -2.5816261768341064e-06, -2.454034984111786e-06, -2.3264437913894653e-06, -2.1988525986671448e-06, -2.0712614059448242e-06, -1.9436702132225037e-06, -1.816079020500183e-06, -1.6884878277778625e-06, -1.560896635055542e-06, -1.4333054423332214e-06, -1.3057142496109009e-06, -1.1781230568885803e-06, -1.0505318641662598e-06, -9.229406714439392e-07, -7.953494787216187e-07, -6.677582859992981e-07, -5.401670932769775e-07, -4.12575900554657e-07, -2.849847078323364e-07, -1.5739351511001587e-07, -2.9802322387695312e-08, 9.778887033462524e-08, 2.253800630569458e-07, 3.5297125577926636e-07, 4.805624485015869e-07, 6.081536412239075e-07, 7.35744833946228e-07, 8.633360266685486e-07, 9.909272193908691e-07, 1.1185184121131897e-06, 1.2461096048355103e-06, 1.3737007975578308e-06, 1.5012919902801514e-06, 1.628883183002472e-06, 1.7564743757247925e-06, 1.884065568447113e-06, 2.0116567611694336e-06, 2.139247953891754e-06, 2.2668391466140747e-06, 2.3944303393363953e-06, 2.522021532058716e-06, 2.6496127247810364e-06, 2.777203917503357e-06, 2.9047951102256775e-06, 3.032386302947998e-06, 3.1599774956703186e-06, 3.287568688392639e-06, 3.4151598811149597e-06, 3.5427510738372803e-06, 3.670342266559601e-06, 3.7979334592819214e-06, 3.925524652004242e-06, 4.0531158447265625e-06]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 944.0, 2.0, 4.0, 1.0, 6.0, 3.0, 4.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.008131960134051e-07, -9.528780253731384e-08, -8.976241616664993e-08, -8.423702269055866e-08, -7.87116292144674e-08, -7.318624284380348e-08, -6.766084936771222e-08, -6.213545589162095e-08, -5.661006596824336e-08, -5.108467604486577e-08, -4.5559282568774506e-08, -4.003389264539692e-08, -3.450850272201933e-08, -2.8983109245928063e-08, -2.3457719322550474e-08, -1.7932325846459207e-08, -1.2406935923081619e-08, -6.881544667436401e-09, -1.3561534117911833e-09, 4.169237399764825e-09, 9.694629099499252e-09, 1.522002079923368e-08, 2.0745410722611268e-08, 2.6270804198702535e-08, 3.1796194122080124e-08, 3.732158404545771e-08, 4.284697752154898e-08, 4.837236744492657e-08, 5.3897757368304156e-08, 5.942315084439542e-08, 6.494853721505933e-08, 7.04739306911506e-08, 7.599932416724187e-08, 8.152471764333313e-08, 8.705010401399704e-08, 9.257549749008831e-08, 9.810089096617958e-08, 1.0362627733684349e-07, 1.0915167081293475e-07, 1.1467706428902602e-07, 1.202024577651173e-07, 1.2572785124120855e-07, 1.3125324471729982e-07, 1.3677862398253637e-07, 1.4230401745862764e-07, 1.478294109347189e-07, 1.5335480441081017e-07, 1.5888019788690144e-07, 1.64405577152138e-07, 1.6993097062822926e-07, 1.7545636410432053e-07, 1.8098174336955708e-07, 1.8650713684564835e-07, 1.9203253032173961e-07, 1.9755792379783088e-07, 2.0308331727392215e-07, 2.0860871075001342e-07, 2.1413410422610468e-07, 2.1965949770219595e-07, 2.2518489117828722e-07, 2.3071027044352377e-07, 2.3623566391961504e-07, 2.417610573957063e-07, 2.4728643666094285e-07, 2.5281184434788884e-07]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 941.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 13.0, 14.0, 20.0, 15.0, 37.0, 26.0, 31.0, 39.0, 35.0, 31.0, 55.0, 41.0, 42.0, 50.0, 46.0, 41.0, 41.0, 47.0, 52.0, 35.0, 45.0, 29.0, 33.0, 20.0, 20.0, 32.0, 12.0, 24.0, 12.0, 12.0, 7.0, 4.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.828125, -2.742156982421875, -2.65618896484375, -2.570220947265625, -2.4842529296875, -2.398284912109375, -2.31231689453125, -2.226348876953125, -2.140380859375, -2.054412841796875, -1.96844482421875, -1.882476806640625, -1.7965087890625, -1.710540771484375, -1.62457275390625, -1.538604736328125, -1.45263671875, -1.366668701171875, -1.28070068359375, -1.194732666015625, -1.1087646484375, -1.022796630859375, -0.93682861328125, -0.850860595703125, -0.764892578125, -0.678924560546875, -0.59295654296875, -0.506988525390625, -0.4210205078125, -0.335052490234375, -0.24908447265625, -0.163116455078125, -0.0771484375, 0.008819580078125, 0.09478759765625, 0.180755615234375, 0.2667236328125, 0.352691650390625, 0.43865966796875, 0.524627685546875, 0.610595703125, 0.696563720703125, 0.78253173828125, 0.868499755859375, 0.9544677734375, 1.040435791015625, 1.12640380859375, 1.212371826171875, 1.29833984375, 1.384307861328125, 1.47027587890625, 1.556243896484375, 1.6422119140625, 1.728179931640625, 1.81414794921875, 1.900115966796875, 1.986083984375, 2.072052001953125, 2.15802001953125, 2.243988037109375, 2.3299560546875, 2.415924072265625, 2.50189208984375, 2.587860107421875, 2.673828125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 33.0, 52.0, 76.0, 100.0, 187.0, 314.0, 521.0, 863.0, 1488.0, 2538.0, 4096.0, 6838.0, 11602.0, 19430.0, 35498.0, 69441.0, 166319.0, 413583.0, 163573.0, 69240.0, 34916.0, 19681.0, 11404.0, 6776.0, 3972.0, 2431.0, 1437.0, 806.0, 543.0, 285.0, 181.0, 101.0, 67.0, 47.0, 26.0, 21.0, 13.0, 8.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.97265625, -2.88116455078125, -2.7896728515625, -2.69818115234375, -2.606689453125, -2.51519775390625, -2.4237060546875, -2.33221435546875, -2.24072265625, -2.14923095703125, -2.0577392578125, -1.96624755859375, -1.874755859375, -1.78326416015625, -1.6917724609375, -1.60028076171875, -1.5087890625, -1.41729736328125, -1.3258056640625, -1.23431396484375, -1.142822265625, -1.05133056640625, -0.9598388671875, -0.86834716796875, -0.77685546875, -0.68536376953125, -0.5938720703125, -0.50238037109375, -0.410888671875, -0.31939697265625, -0.2279052734375, -0.13641357421875, -0.044921875, 0.04656982421875, 0.1380615234375, 0.22955322265625, 0.321044921875, 0.41253662109375, 0.5040283203125, 0.59552001953125, 0.68701171875, 0.77850341796875, 0.8699951171875, 0.96148681640625, 1.052978515625, 1.14447021484375, 1.2359619140625, 1.32745361328125, 1.4189453125, 1.51043701171875, 1.6019287109375, 1.69342041015625, 1.784912109375, 1.87640380859375, 1.9678955078125, 2.05938720703125, 2.15087890625, 2.24237060546875, 2.3338623046875, 2.42535400390625, 2.516845703125, 2.60833740234375, 2.6998291015625, 2.79132080078125, 2.8828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 10.0, 6.0, 11.0, 17.0, 23.0, 19.0, 19.0, 30.0, 36.0, 28.0, 41.0, 54.0, 58.0, 57.0, 81.0, 150.0, 1472.0, 312.0, 141.0, 98.0, 53.0, 47.0, 38.0, 32.0, 31.0, 38.0, 28.0, 25.0, 13.0, 16.0, 14.0, 11.0, 8.0, 1.0, 6.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41796875, -7.14154052734375, -6.8651123046875, -6.58868408203125, -6.312255859375, -6.03582763671875, -5.7593994140625, -5.48297119140625, -5.20654296875, -4.93011474609375, -4.6536865234375, -4.37725830078125, -4.100830078125, -3.82440185546875, -3.5479736328125, -3.27154541015625, -2.9951171875, -2.71868896484375, -2.4422607421875, -2.16583251953125, -1.889404296875, -1.61297607421875, -1.3365478515625, -1.06011962890625, -0.78369140625, -0.50726318359375, -0.2308349609375, 0.04559326171875, 0.322021484375, 0.59844970703125, 0.8748779296875, 1.15130615234375, 1.427734375, 1.70416259765625, 1.9805908203125, 2.25701904296875, 2.533447265625, 2.80987548828125, 3.0863037109375, 3.36273193359375, 3.63916015625, 3.91558837890625, 4.1920166015625, 4.46844482421875, 4.744873046875, 5.02130126953125, 5.2977294921875, 5.57415771484375, 5.8505859375, 6.12701416015625, 6.4034423828125, 6.67987060546875, 6.956298828125, 7.23272705078125, 7.5091552734375, 7.78558349609375, 8.06201171875, 8.33843994140625, 8.6148681640625, 8.89129638671875, 9.167724609375, 9.44415283203125, 9.7205810546875, 9.99700927734375, 10.2734375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 5.0, 8.0, 8.0, 19.0, 27.0, 23.0, 34.0, 41.0, 71.0, 81.0, 99.0, 140.0, 224.0, 387.0, 1531.0, 17663.0, 1255616.0, 1846992.0, 19921.0, 1549.0, 393.0, 260.0, 143.0, 105.0, 90.0, 70.0, 45.0, 35.0, 30.0, 22.0, 21.0, 10.0, 11.0, 8.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.3125, -20.73681640625, -20.1611328125, -19.58544921875, -19.009765625, -18.43408203125, -17.8583984375, -17.28271484375, -16.70703125, -16.13134765625, -15.5556640625, -14.97998046875, -14.404296875, -13.82861328125, -13.2529296875, -12.67724609375, -12.1015625, -11.52587890625, -10.9501953125, -10.37451171875, -9.798828125, -9.22314453125, -8.6474609375, -8.07177734375, -7.49609375, -6.92041015625, -6.3447265625, -5.76904296875, -5.193359375, -4.61767578125, -4.0419921875, -3.46630859375, -2.890625, -2.31494140625, -1.7392578125, -1.16357421875, -0.587890625, -0.01220703125, 0.5634765625, 1.13916015625, 1.71484375, 2.29052734375, 2.8662109375, 3.44189453125, 4.017578125, 4.59326171875, 5.1689453125, 5.74462890625, 6.3203125, 6.89599609375, 7.4716796875, 8.04736328125, 8.623046875, 9.19873046875, 9.7744140625, 10.35009765625, 10.92578125, 11.50146484375, 12.0771484375, 12.65283203125, 13.228515625, 13.80419921875, 14.3798828125, 14.95556640625, 15.53125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 25.0, 17.0, 45.0, 78.0, 106.0, 109.0, 140.0, 145.0, 130.0, 84.0, 58.0, 33.0, 14.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.611065864562988, -8.951837539672852, -8.292609214782715, -7.633380889892578, -6.974152565002441, -6.314924240112305, -5.65569543838501, -4.996467113494873, -4.337238788604736, -3.6780104637145996, -3.018782138824463, -2.359553575515747, -1.7003252506256104, -1.0410969257354736, -0.3818683624267578, 0.2773599624633789, 0.9365882873535156, 1.5958166122436523, 2.255044937133789, 2.914273500442505, 3.5735018253326416, 4.232729911804199, 4.891958713531494, 5.551187038421631, 6.210415363311768, 6.869643688201904, 7.528872013092041, 8.188100814819336, 8.847329139709473, 9.50655746459961, 10.165785789489746, 10.825014114379883, 11.484243392944336, 12.143471717834473, 12.80270004272461, 13.461928367614746, 14.121156692504883, 14.78038501739502, 15.439613342285156, 16.09884262084961, 16.75806999206543, 17.417299270629883, 18.076526641845703, 18.735755920410156, 19.394983291625977, 20.05421257019043, 20.71343994140625, 21.372669219970703, 22.031898498535156, 22.69112777709961, 23.35035514831543, 24.009584426879883, 24.668811798095703, 25.328041076660156, 25.987268447875977, 26.64649772644043, 27.30572509765625, 27.964954376220703, 28.624181747436523, 29.283411026000977, 29.942638397216797, 30.60186767578125, 31.26109504699707, 31.920324325561523, 32.579551696777344]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 7.0, 5.0, 7.0, 5.0, 10.0, 20.0, 11.0, 17.0, 32.0, 38.0, 27.0, 41.0, 41.0, 40.0, 51.0, 40.0, 49.0, 55.0, 60.0, 58.0, 58.0, 43.0, 43.0, 27.0, 36.0, 29.0, 24.0, 27.0, 25.0, 20.0, 17.0, 12.0, 8.0, 11.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.664934158325195, -28.733346939086914, -27.801761627197266, -26.870174407958984, -25.938587188720703, -25.006999969482422, -24.07541275024414, -23.143827438354492, -22.21224021911621, -21.28065299987793, -20.34906768798828, -19.41748046875, -18.48589324951172, -17.554306030273438, -16.622718811035156, -15.691133499145508, -14.759546279907227, -13.827959060668945, -12.89637279510498, -11.964786529541016, -11.033199310302734, -10.101612091064453, -9.170025825500488, -8.238439559936523, -7.306852340698242, -6.375265598297119, -5.443678855895996, -4.512092113494873, -3.58050537109375, -2.648918628692627, -1.717331886291504, -0.7857451438903809, 0.1458415985107422, 1.0774283409118652, 2.0090150833129883, 2.9406018257141113, 3.8721885681152344, 4.803775310516357, 5.7353620529174805, 6.6669487953186035, 7.598535537719727, 8.530122756958008, 9.461709022521973, 10.393295288085938, 11.324882507324219, 12.2564697265625, 13.188055992126465, 14.11964225769043, 15.051229476928711, 15.982816696166992, 16.91440200805664, 17.845989227294922, 18.777576446533203, 19.709163665771484, 20.640750885009766, 21.572336196899414, 22.503923416137695, 23.435510635375977, 24.367095947265625, 25.298683166503906, 26.230270385742188, 27.16185760498047, 28.09344482421875, 29.0250301361084, 29.95661735534668]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 9.0, 8.0, 8.0, 23.0, 21.0, 22.0, 30.0, 32.0, 36.0, 33.0, 27.0, 44.0, 48.0, 43.0, 45.0, 43.0, 42.0, 50.0, 44.0, 40.0, 43.0, 48.0, 35.0, 28.0, 24.0, 24.0, 32.0, 16.0, 19.0, 17.0, 19.0, 6.0, 14.0, 7.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.06640625, -2.975067138671875, -2.88372802734375, -2.792388916015625, -2.7010498046875, -2.609710693359375, -2.51837158203125, -2.427032470703125, -2.335693359375, -2.244354248046875, -2.15301513671875, -2.061676025390625, -1.9703369140625, -1.878997802734375, -1.78765869140625, -1.696319580078125, -1.60498046875, -1.513641357421875, -1.42230224609375, -1.330963134765625, -1.2396240234375, -1.148284912109375, -1.05694580078125, -0.965606689453125, -0.874267578125, -0.782928466796875, -0.69158935546875, -0.600250244140625, -0.5089111328125, -0.417572021484375, -0.32623291015625, -0.234893798828125, -0.1435546875, -0.052215576171875, 0.03912353515625, 0.130462646484375, 0.2218017578125, 0.313140869140625, 0.40447998046875, 0.495819091796875, 0.587158203125, 0.678497314453125, 0.76983642578125, 0.861175537109375, 0.9525146484375, 1.043853759765625, 1.13519287109375, 1.226531982421875, 1.31787109375, 1.409210205078125, 1.50054931640625, 1.591888427734375, 1.6832275390625, 1.774566650390625, 1.86590576171875, 1.957244873046875, 2.048583984375, 2.139923095703125, 2.23126220703125, 2.322601318359375, 2.4139404296875, 2.505279541015625, 2.59661865234375, 2.687957763671875, 2.779296875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 13.0, 15.0, 18.0, 40.0, 53.0, 54.0, 99.0, 167.0, 281.0, 540.0, 1372.0, 4212.0, 16101.0, 73890.0, 431672.0, 2106328.0, 1303572.0, 202669.0, 38907.0, 9435.0, 2713.0, 955.0, 474.0, 219.0, 127.0, 88.0, 66.0, 30.0, 30.0, 20.0, 18.0, 15.0, 13.0, 13.0, 10.0, 3.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.73046875, -6.5252685546875, -6.320068359375, -6.1148681640625, -5.90966796875, -5.7044677734375, -5.499267578125, -5.2940673828125, -5.0888671875, -4.8836669921875, -4.678466796875, -4.4732666015625, -4.26806640625, -4.0628662109375, -3.857666015625, -3.6524658203125, -3.447265625, -3.2420654296875, -3.036865234375, -2.8316650390625, -2.62646484375, -2.4212646484375, -2.216064453125, -2.0108642578125, -1.8056640625, -1.6004638671875, -1.395263671875, -1.1900634765625, -0.98486328125, -0.7796630859375, -0.574462890625, -0.3692626953125, -0.1640625, 0.0411376953125, 0.246337890625, 0.4515380859375, 0.65673828125, 0.8619384765625, 1.067138671875, 1.2723388671875, 1.4775390625, 1.6827392578125, 1.887939453125, 2.0931396484375, 2.29833984375, 2.5035400390625, 2.708740234375, 2.9139404296875, 3.119140625, 3.3243408203125, 3.529541015625, 3.7347412109375, 3.93994140625, 4.1451416015625, 4.350341796875, 4.5555419921875, 4.7607421875, 4.9659423828125, 5.171142578125, 5.3763427734375, 5.58154296875, 5.7867431640625, 5.991943359375, 6.1971435546875, 6.40234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 8.0, 8.0, 23.0, 26.0, 41.0, 51.0, 55.0, 85.0, 102.0, 160.0, 193.0, 232.0, 297.0, 341.0, 411.0, 426.0, 360.0, 277.0, 221.0, 165.0, 160.0, 112.0, 85.0, 62.0, 36.0, 28.0, 21.0, 13.0, 14.0, 11.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.70703125, -5.5386962890625, -5.370361328125, -5.2020263671875, -5.03369140625, -4.8653564453125, -4.697021484375, -4.5286865234375, -4.3603515625, -4.1920166015625, -4.023681640625, -3.8553466796875, -3.68701171875, -3.5186767578125, -3.350341796875, -3.1820068359375, -3.013671875, -2.8453369140625, -2.677001953125, -2.5086669921875, -2.34033203125, -2.1719970703125, -2.003662109375, -1.8353271484375, -1.6669921875, -1.4986572265625, -1.330322265625, -1.1619873046875, -0.99365234375, -0.8253173828125, -0.656982421875, -0.4886474609375, -0.3203125, -0.1519775390625, 0.016357421875, 0.1846923828125, 0.35302734375, 0.5213623046875, 0.689697265625, 0.8580322265625, 1.0263671875, 1.1947021484375, 1.363037109375, 1.5313720703125, 1.69970703125, 1.8680419921875, 2.036376953125, 2.2047119140625, 2.373046875, 2.5413818359375, 2.709716796875, 2.8780517578125, 3.04638671875, 3.2147216796875, 3.383056640625, 3.5513916015625, 3.7197265625, 3.8880615234375, 4.056396484375, 4.2247314453125, 4.39306640625, 4.5614013671875, 4.729736328125, 4.8980712890625, 5.06640625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 17.0, 15.0, 17.0, 39.0, 45.0, 50.0, 61.0, 126.0, 142.0, 234.0, 384.0, 664.0, 2702.0, 30475.0, 858870.0, 3125928.0, 163511.0, 8274.0, 1233.0, 543.0, 288.0, 178.0, 127.0, 89.0, 68.0, 39.0, 45.0, 30.0, 21.0, 10.0, 15.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.5, -15.97216796875, -15.4443359375, -14.91650390625, -14.388671875, -13.86083984375, -13.3330078125, -12.80517578125, -12.27734375, -11.74951171875, -11.2216796875, -10.69384765625, -10.166015625, -9.63818359375, -9.1103515625, -8.58251953125, -8.0546875, -7.52685546875, -6.9990234375, -6.47119140625, -5.943359375, -5.41552734375, -4.8876953125, -4.35986328125, -3.83203125, -3.30419921875, -2.7763671875, -2.24853515625, -1.720703125, -1.19287109375, -0.6650390625, -0.13720703125, 0.390625, 0.91845703125, 1.4462890625, 1.97412109375, 2.501953125, 3.02978515625, 3.5576171875, 4.08544921875, 4.61328125, 5.14111328125, 5.6689453125, 6.19677734375, 6.724609375, 7.25244140625, 7.7802734375, 8.30810546875, 8.8359375, 9.36376953125, 9.8916015625, 10.41943359375, 10.947265625, 11.47509765625, 12.0029296875, 12.53076171875, 13.05859375, 13.58642578125, 14.1142578125, 14.64208984375, 15.169921875, 15.69775390625, 16.2255859375, 16.75341796875, 17.28125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 7.0, 13.0, 20.0, 42.0, 53.0, 79.0, 105.0, 134.0, 123.0, 121.0, 100.0, 75.0, 57.0, 33.0, 20.0, 13.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.02088165283203, -21.828243255615234, -20.63560676574707, -19.442968368530273, -18.25033187866211, -17.057693481445312, -15.865055084228516, -14.672417640686035, -13.479780197143555, -12.287142753601074, -11.094505310058594, -9.901866912841797, -8.709229469299316, -7.516592025756836, -6.323954105377197, -5.131316184997559, -3.938678741455078, -2.7460410594940186, -1.553403377532959, -0.3607656955718994, 0.8318719863891602, 2.0245094299316406, 3.2171473503112793, 4.409785270690918, 5.602422714233398, 6.795060157775879, 7.987698078155518, 9.180335998535156, 10.372973442077637, 11.565610885620117, 12.758249282836914, 13.950886726379395, 15.143524169921875, 16.336162567138672, 17.528799057006836, 18.721437454223633, 19.914073944091797, 21.106712341308594, 22.29935073852539, 23.491989135742188, 24.68462562561035, 25.87726402282715, 27.069900512695312, 28.26253890991211, 29.455177307128906, 30.64781379699707, 31.840452194213867, 33.03308868408203, 34.22572708129883, 35.418365478515625, 36.61100387573242, 37.80363845825195, 38.99627685546875, 40.18891525268555, 41.381553649902344, 42.57419204711914, 43.76683044433594, 44.959468841552734, 46.15210723876953, 47.34474182128906, 48.53738021850586, 49.730018615722656, 50.92265701293945, 52.11529541015625, 53.30792999267578]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 6.0, 8.0, 17.0, 9.0, 5.0, 20.0, 15.0, 29.0, 23.0, 30.0, 26.0, 24.0, 33.0, 36.0, 25.0, 35.0, 37.0, 43.0, 41.0, 35.0, 39.0, 41.0, 44.0, 39.0, 41.0, 28.0, 32.0, 36.0, 22.0, 23.0, 31.0, 26.0, 12.0, 15.0, 10.0, 14.0, 12.0, 8.0, 5.0, 9.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.776592254638672, -18.217782974243164, -17.658973693847656, -17.10016441345215, -16.54135513305664, -15.98254680633545, -15.423738479614258, -14.86492919921875, -14.306119918823242, -13.747310638427734, -13.188501358032227, -12.629693031311035, -12.070883750915527, -11.51207447052002, -10.953266143798828, -10.39445686340332, -9.835647583007812, -9.276838302612305, -8.718029022216797, -8.159220695495605, -7.600411415100098, -7.04160213470459, -6.48279333114624, -5.923984527587891, -5.365175247192383, -4.806365966796875, -4.247557163238525, -3.6887481212615967, -3.129939079284668, -2.5711300373077393, -2.0123209953308105, -1.4535119533538818, -0.8947029113769531, -0.3358938694000244, 0.2229151725769043, 0.781724214553833, 1.3405332565307617, 1.8993422985076904, 2.458151340484619, 3.016960382461548, 3.5757694244384766, 4.134578704833984, 4.693387508392334, 5.252196311950684, 5.811005592346191, 6.369814872741699, 6.928623676300049, 7.487432479858398, 8.046241760253906, 8.605051040649414, 9.163860321044922, 9.722668647766113, 10.281477928161621, 10.840287208557129, 11.39909553527832, 11.957904815673828, 12.516714096069336, 13.075523376464844, 13.634332656860352, 14.193140983581543, 14.75195026397705, 15.310759544372559, 15.86956787109375, 16.428377151489258, 16.987186431884766]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 8.0, 10.0, 12.0, 13.0, 26.0, 22.0, 28.0, 32.0, 28.0, 29.0, 43.0, 44.0, 47.0, 41.0, 39.0, 41.0, 39.0, 43.0, 39.0, 45.0, 27.0, 44.0, 42.0, 21.0, 34.0, 31.0, 17.0, 27.0, 16.0, 16.0, 12.0, 20.0, 8.0, 10.0, 4.0, 7.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.736328125, -2.65240478515625, -2.5684814453125, -2.48455810546875, -2.400634765625, -2.31671142578125, -2.2327880859375, -2.14886474609375, -2.06494140625, -1.98101806640625, -1.8970947265625, -1.81317138671875, -1.729248046875, -1.64532470703125, -1.5614013671875, -1.47747802734375, -1.3935546875, -1.30963134765625, -1.2257080078125, -1.14178466796875, -1.057861328125, -0.97393798828125, -0.8900146484375, -0.80609130859375, -0.72216796875, -0.63824462890625, -0.5543212890625, -0.47039794921875, -0.386474609375, -0.30255126953125, -0.2186279296875, -0.13470458984375, -0.05078125, 0.03314208984375, 0.1170654296875, 0.20098876953125, 0.284912109375, 0.36883544921875, 0.4527587890625, 0.53668212890625, 0.62060546875, 0.70452880859375, 0.7884521484375, 0.87237548828125, 0.956298828125, 1.04022216796875, 1.1241455078125, 1.20806884765625, 1.2919921875, 1.37591552734375, 1.4598388671875, 1.54376220703125, 1.627685546875, 1.71160888671875, 1.7955322265625, 1.87945556640625, 1.96337890625, 2.04730224609375, 2.1312255859375, 2.21514892578125, 2.299072265625, 2.38299560546875, 2.4669189453125, 2.55084228515625, 2.634765625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 22.0, 14.0, 35.0, 32.0, 69.0, 88.0, 118.0, 187.0, 269.0, 431.0, 616.0, 870.0, 1290.0, 2020.0, 2914.0, 4244.0, 6512.0, 9776.0, 14721.0, 22027.0, 33646.0, 52325.0, 86049.0, 158841.0, 285513.0, 143189.0, 79803.0, 48921.0, 31545.0, 20875.0, 13690.0, 9185.0, 6103.0, 4174.0, 2723.0, 1824.0, 1245.0, 841.0, 573.0, 413.0, 257.0, 175.0, 130.0, 84.0, 55.0, 40.0, 25.0, 19.0, 12.0, 8.0, 10.0, 6.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.018524169921875, -0.017952919006347656, -0.017381668090820312, -0.01681041717529297, -0.016239166259765625, -0.01566791534423828, -0.015096664428710938, -0.014525413513183594, -0.01395416259765625, -0.013382911682128906, -0.012811660766601562, -0.012240409851074219, -0.011669158935546875, -0.011097908020019531, -0.010526657104492188, -0.009955406188964844, -0.0093841552734375, -0.008812904357910156, -0.008241653442382812, -0.007670402526855469, -0.007099151611328125, -0.006527900695800781, -0.0059566497802734375, -0.005385398864746094, -0.00481414794921875, -0.004242897033691406, -0.0036716461181640625, -0.0031003952026367188, -0.002529144287109375, -0.0019578933715820312, -0.0013866424560546875, -0.0008153915405273438, -0.000244140625, 0.00032711029052734375, 0.0008983612060546875, 0.0014696121215820312, 0.002040863037109375, 0.0026121139526367188, 0.0031833648681640625, 0.0037546157836914062, 0.00432586669921875, 0.004897117614746094, 0.0054683685302734375, 0.006039619445800781, 0.006610870361328125, 0.007182121276855469, 0.0077533721923828125, 0.008324623107910156, 0.0088958740234375, 0.009467124938964844, 0.010038375854492188, 0.010609626770019531, 0.011180877685546875, 0.011752128601074219, 0.012323379516601562, 0.012894630432128906, 0.01346588134765625, 0.014037132263183594, 0.014608383178710938, 0.015179634094238281, 0.015750885009765625, 0.01632213592529297, 0.016893386840820312, 0.017464637756347656, 0.018035888671875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 7.0, 11.0, 15.0, 10.0, 15.0, 15.0, 19.0, 28.0, 32.0, 38.0, 26.0, 26.0, 33.0, 37.0, 40.0, 44.0, 46.0, 52.0, 1073.0, 47.0, 30.0, 25.0, 50.0, 35.0, 25.0, 34.0, 33.0, 22.0, 22.0, 17.0, 20.0, 14.0, 10.0, 9.0, 12.0, 8.0, 8.0, 9.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5263671875, -1.47406005859375, -1.4217529296875, -1.36944580078125, -1.317138671875, -1.26483154296875, -1.2125244140625, -1.16021728515625, -1.10791015625, -1.05560302734375, -1.0032958984375, -0.95098876953125, -0.898681640625, -0.84637451171875, -0.7940673828125, -0.74176025390625, -0.689453125, -0.63714599609375, -0.5848388671875, -0.53253173828125, -0.480224609375, -0.42791748046875, -0.3756103515625, -0.32330322265625, -0.27099609375, -0.21868896484375, -0.1663818359375, -0.11407470703125, -0.061767578125, -0.00946044921875, 0.0428466796875, 0.09515380859375, 0.1474609375, 0.19976806640625, 0.2520751953125, 0.30438232421875, 0.356689453125, 0.40899658203125, 0.4613037109375, 0.51361083984375, 0.56591796875, 0.61822509765625, 0.6705322265625, 0.72283935546875, 0.775146484375, 0.82745361328125, 0.8797607421875, 0.93206787109375, 0.984375, 1.03668212890625, 1.0889892578125, 1.14129638671875, 1.193603515625, 1.24591064453125, 1.2982177734375, 1.35052490234375, 1.40283203125, 1.45513916015625, 1.5074462890625, 1.55975341796875, 1.612060546875, 1.66436767578125, 1.7166748046875, 1.76898193359375, 1.8212890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 13.0, 13.0, 29.0, 36.0, 39.0, 74.0, 104.0, 142.0, 217.0, 303.0, 441.0, 644.0, 921.0, 1372.0, 1938.0, 2672.0, 3766.0, 5472.0, 7994.0, 11679.0, 17410.0, 26111.0, 41304.0, 67868.0, 123759.0, 1328033.0, 203321.0, 93833.0, 54649.0, 34218.0, 21838.0, 14762.0, 9912.0, 6687.0, 4588.0, 3229.0, 2287.0, 1641.0, 1197.0, 807.0, 562.0, 374.0, 261.0, 187.0, 125.0, 91.0, 65.0, 53.0, 27.0, 33.0, 16.0, 5.0, 8.0, 6.0, 2.0, 0.0, 2.0], "bins": [-0.0132293701171875, -0.012825965881347656, -0.012422561645507812, -0.012019157409667969, -0.011615753173828125, -0.011212348937988281, -0.010808944702148438, -0.010405540466308594, -0.01000213623046875, -0.009598731994628906, -0.009195327758789062, -0.008791923522949219, -0.008388519287109375, -0.007985115051269531, -0.0075817108154296875, -0.007178306579589844, -0.00677490234375, -0.006371498107910156, -0.0059680938720703125, -0.005564689636230469, -0.005161285400390625, -0.004757881164550781, -0.0043544769287109375, -0.003951072692871094, -0.00354766845703125, -0.0031442642211914062, -0.0027408599853515625, -0.0023374557495117188, -0.001934051513671875, -0.0015306472778320312, -0.0011272430419921875, -0.0007238388061523438, -0.0003204345703125, 8.296966552734375e-05, 0.0004863739013671875, 0.0008897781372070312, 0.001293182373046875, 0.0016965866088867188, 0.0020999908447265625, 0.0025033950805664062, 0.00290679931640625, 0.0033102035522460938, 0.0037136077880859375, 0.004117012023925781, 0.004520416259765625, 0.004923820495605469, 0.0053272247314453125, 0.005730628967285156, 0.006134033203125, 0.006537437438964844, 0.0069408416748046875, 0.007344245910644531, 0.007747650146484375, 0.008151054382324219, 0.008554458618164062, 0.008957862854003906, 0.00936126708984375, 0.009764671325683594, 0.010168075561523438, 0.010571479797363281, 0.010974884033203125, 0.011378288269042969, 0.011781692504882812, 0.012185096740722656, 0.0125885009765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 95.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 776.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 100.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0], "bins": [-3.5762786865234375e-07, -3.4924596548080444e-07, -3.4086406230926514e-07, -3.3248215913772583e-07, -3.241002559661865e-07, -3.157183527946472e-07, -3.073364496231079e-07, -2.989545464515686e-07, -2.905726432800293e-07, -2.8219074010849e-07, -2.738088369369507e-07, -2.654269337654114e-07, -2.5704503059387207e-07, -2.4866312742233276e-07, -2.4028122425079346e-07, -2.3189932107925415e-07, -2.2351741790771484e-07, -2.1513551473617554e-07, -2.0675361156463623e-07, -1.9837170839309692e-07, -1.8998980522155762e-07, -1.816079020500183e-07, -1.73225998878479e-07, -1.648440957069397e-07, -1.564621925354004e-07, -1.4808028936386108e-07, -1.3969838619232178e-07, -1.3131648302078247e-07, -1.2293457984924316e-07, -1.1455267667770386e-07, -1.0617077350616455e-07, -9.778887033462524e-08, -8.940696716308594e-08, -8.102506399154663e-08, -7.264316082000732e-08, -6.426125764846802e-08, -5.587935447692871e-08, -4.7497451305389404e-08, -3.91155481338501e-08, -3.073364496231079e-08, -2.2351741790771484e-08, -1.3969838619232178e-08, -5.587935447692871e-09, 2.7939677238464355e-09, 1.1175870895385742e-08, 1.955777406692505e-08, 2.7939677238464355e-08, 3.632158041000366e-08, 4.470348358154297e-08, 5.3085386753082275e-08, 6.146728992462158e-08, 6.984919309616089e-08, 7.82310962677002e-08, 8.66129994392395e-08, 9.499490261077881e-08, 1.0337680578231812e-07, 1.1175870895385742e-07, 1.2014061212539673e-07, 1.2852251529693604e-07, 1.3690441846847534e-07, 1.4528632164001465e-07, 1.5366822481155396e-07, 1.6205012798309326e-07, 1.7043203115463257e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 18.0, 83.0, 14.0, 29.0, 39.0, 278.0, 1136.0, 85041.0, 957172.0, 4261.0, 213.0, 92.0, 25.0, 26.0, 65.0, 23.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.933906555175781e-06, -3.7709251046180725e-06, -3.6079436540603638e-06, -3.444962203502655e-06, -3.2819807529449463e-06, -3.1189993023872375e-06, -2.956017851829529e-06, -2.79303640127182e-06, -2.6300549507141113e-06, -2.4670735001564026e-06, -2.304092049598694e-06, -2.141110599040985e-06, -1.9781291484832764e-06, -1.8151476979255676e-06, -1.6521662473678589e-06, -1.4891847968101501e-06, -1.3262033462524414e-06, -1.1632218956947327e-06, -1.000240445137024e-06, -8.372589945793152e-07, -6.742775440216064e-07, -5.112960934638977e-07, -3.4831464290618896e-07, -1.8533319234848022e-07, -2.2351741790771484e-08, 1.4062970876693726e-07, 3.03611159324646e-07, 4.6659260988235474e-07, 6.295740604400635e-07, 7.925555109977722e-07, 9.55536961555481e-07, 1.1185184121131897e-06, 1.2814998626708984e-06, 1.4444813132286072e-06, 1.607462763786316e-06, 1.7704442143440247e-06, 1.9334256649017334e-06, 2.096407115459442e-06, 2.259388566017151e-06, 2.4223700165748596e-06, 2.5853514671325684e-06, 2.748332917690277e-06, 2.911314368247986e-06, 3.0742958188056946e-06, 3.2372772693634033e-06, 3.400258719921112e-06, 3.563240170478821e-06, 3.7262216210365295e-06, 3.889203071594238e-06, 4.052184522151947e-06, 4.215165972709656e-06, 4.3781474232673645e-06, 4.541128873825073e-06, 4.704110324382782e-06, 4.867091774940491e-06, 5.0300732254981995e-06, 5.193054676055908e-06, 5.356036126613617e-06, 5.519017577171326e-06, 5.6819990277290344e-06, 5.844980478286743e-06, 6.007961928844452e-06, 6.170943379402161e-06, 6.333924829959869e-06, 6.496906280517578e-06]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 982.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2714042441075435e-07, -1.2371306468139665e-07, -1.2028571916289366e-07, -1.1685835943353595e-07, -1.134310068096056e-07, -1.100036470802479e-07, -1.0657629445631756e-07, -1.0314893472695985e-07, -9.97215821030295e-08, -9.629422947909916e-08, -9.286686974974145e-08, -8.943951712581111e-08, -8.601216450188076e-08, -8.258480477252306e-08, -7.915745214859271e-08, -7.573009952466236e-08, -7.230273979530466e-08, -6.887538717137431e-08, -6.544802744201661e-08, -6.202067481808626e-08, -5.859331864144224e-08, -5.516596246479821e-08, -5.1738609840867866e-08, -4.831125366422384e-08, -4.4883904593007173e-08, -4.145654841636315e-08, -3.80291957924328e-08, -3.4601839615788776e-08, -3.117448343914475e-08, -2.7747129038857565e-08, -2.431977463857038e-08, -2.0892418461926354e-08, -1.746506228528233e-08, -1.4037706996816723e-08, -1.0610351708351118e-08, -7.182997308063932e-09, -3.7556420195983264e-09, -3.282867311327209e-10, 3.099067669154465e-09, 6.52642384579849e-09, 9.953778246085676e-09, 1.3381133534551282e-08, 1.6808488823016887e-08, 2.0235843223304073e-08, 2.366319762359126e-08, 2.7090553800235284e-08, 3.051790997687931e-08, 3.3945262600809656e-08, 3.737261877745368e-08, 4.0799974954097706e-08, 4.422732757802805e-08, 4.765468375467208e-08, 5.1082039931316103e-08, 5.450939255524645e-08, 5.7936748731890475e-08, 6.13641049085345e-08, 6.479145753246485e-08, 6.821881015639519e-08, 7.16461698857529e-08, 7.507352250968324e-08, 7.850087513361359e-08, 8.19282348629713e-08, 8.535558748690164e-08, 8.878294011083199e-08, 9.221029984018969e-08]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [26.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 982.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 8.0, 10.0, 12.0, 13.0, 26.0, 22.0, 28.0, 32.0, 28.0, 29.0, 43.0, 44.0, 47.0, 41.0, 39.0, 41.0, 39.0, 43.0, 39.0, 45.0, 27.0, 44.0, 42.0, 21.0, 34.0, 31.0, 17.0, 27.0, 16.0, 16.0, 12.0, 20.0, 8.0, 10.0, 4.0, 7.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.736328125, -2.65240478515625, -2.5684814453125, -2.48455810546875, -2.400634765625, -2.31671142578125, -2.2327880859375, -2.14886474609375, -2.06494140625, -1.98101806640625, -1.8970947265625, -1.81317138671875, -1.729248046875, -1.64532470703125, -1.5614013671875, -1.47747802734375, -1.3935546875, -1.30963134765625, -1.2257080078125, -1.14178466796875, -1.057861328125, -0.97393798828125, -0.8900146484375, -0.80609130859375, -0.72216796875, -0.63824462890625, -0.5543212890625, -0.47039794921875, -0.386474609375, -0.30255126953125, -0.2186279296875, -0.13470458984375, -0.05078125, 0.03314208984375, 0.1170654296875, 0.20098876953125, 0.284912109375, 0.36883544921875, 0.4527587890625, 0.53668212890625, 0.62060546875, 0.70452880859375, 0.7884521484375, 0.87237548828125, 0.956298828125, 1.04022216796875, 1.1241455078125, 1.20806884765625, 1.2919921875, 1.37591552734375, 1.4598388671875, 1.54376220703125, 1.627685546875, 1.71160888671875, 1.7955322265625, 1.87945556640625, 1.96337890625, 2.04730224609375, 2.1312255859375, 2.21514892578125, 2.299072265625, 2.38299560546875, 2.4669189453125, 2.55084228515625, 2.634765625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 6.0, 18.0, 26.0, 45.0, 64.0, 82.0, 171.0, 267.0, 428.0, 754.0, 1209.0, 1966.0, 3204.0, 5650.0, 9652.0, 18370.0, 36991.0, 91050.0, 277635.0, 380307.0, 123735.0, 46661.0, 22246.0, 11886.0, 6539.0, 3793.0, 2320.0, 1328.0, 826.0, 487.0, 304.0, 188.0, 118.0, 95.0, 42.0, 32.0, 22.0, 14.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.838165283203125, -2.74078369140625, -2.643402099609375, -2.5460205078125, -2.448638916015625, -2.35125732421875, -2.253875732421875, -2.156494140625, -2.059112548828125, -1.96173095703125, -1.864349365234375, -1.7669677734375, -1.669586181640625, -1.57220458984375, -1.474822998046875, -1.37744140625, -1.280059814453125, -1.18267822265625, -1.085296630859375, -0.9879150390625, -0.890533447265625, -0.79315185546875, -0.695770263671875, -0.598388671875, -0.501007080078125, -0.40362548828125, -0.306243896484375, -0.2088623046875, -0.111480712890625, -0.01409912109375, 0.083282470703125, 0.1806640625, 0.278045654296875, 0.37542724609375, 0.472808837890625, 0.5701904296875, 0.667572021484375, 0.76495361328125, 0.862335205078125, 0.959716796875, 1.057098388671875, 1.15447998046875, 1.251861572265625, 1.3492431640625, 1.446624755859375, 1.54400634765625, 1.641387939453125, 1.73876953125, 1.836151123046875, 1.93353271484375, 2.030914306640625, 2.1282958984375, 2.225677490234375, 2.32305908203125, 2.420440673828125, 2.517822265625, 2.615203857421875, 2.71258544921875, 2.809967041015625, 2.9073486328125, 3.004730224609375, 3.10211181640625, 3.199493408203125, 3.296875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 4.0, 5.0, 8.0, 8.0, 10.0, 10.0, 22.0, 12.0, 21.0, 21.0, 28.0, 38.0, 38.0, 38.0, 52.0, 54.0, 59.0, 90.0, 202.0, 1494.0, 277.0, 120.0, 86.0, 55.0, 47.0, 38.0, 31.0, 28.0, 34.0, 22.0, 17.0, 13.0, 11.0, 12.0, 3.0, 11.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.3984375, -9.1109619140625, -8.823486328125, -8.5360107421875, -8.24853515625, -7.9610595703125, -7.673583984375, -7.3861083984375, -7.0986328125, -6.8111572265625, -6.523681640625, -6.2362060546875, -5.94873046875, -5.6612548828125, -5.373779296875, -5.0863037109375, -4.798828125, -4.5113525390625, -4.223876953125, -3.9364013671875, -3.64892578125, -3.3614501953125, -3.073974609375, -2.7864990234375, -2.4990234375, -2.2115478515625, -1.924072265625, -1.6365966796875, -1.34912109375, -1.0616455078125, -0.774169921875, -0.4866943359375, -0.19921875, 0.0882568359375, 0.375732421875, 0.6632080078125, 0.95068359375, 1.2381591796875, 1.525634765625, 1.8131103515625, 2.1005859375, 2.3880615234375, 2.675537109375, 2.9630126953125, 3.25048828125, 3.5379638671875, 3.825439453125, 4.1129150390625, 4.400390625, 4.6878662109375, 4.975341796875, 5.2628173828125, 5.55029296875, 5.8377685546875, 6.125244140625, 6.4127197265625, 6.7001953125, 6.9876708984375, 7.275146484375, 7.5626220703125, 7.85009765625, 8.1375732421875, 8.425048828125, 8.7125244140625, 9.0]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 6.0, 8.0, 7.0, 10.0, 14.0, 15.0, 19.0, 19.0, 30.0, 32.0, 42.0, 50.0, 85.0, 97.0, 143.0, 176.0, 240.0, 406.0, 1223.0, 8377.0, 211502.0, 2855543.0, 61253.0, 4260.0, 810.0, 354.0, 212.0, 151.0, 145.0, 104.0, 61.0, 54.0, 58.0, 43.0, 30.0, 28.0, 24.0, 21.0, 5.0, 15.0, 9.0, 6.0, 6.0, 5.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-16.0, -15.50537109375, -15.0107421875, -14.51611328125, -14.021484375, -13.52685546875, -13.0322265625, -12.53759765625, -12.04296875, -11.54833984375, -11.0537109375, -10.55908203125, -10.064453125, -9.56982421875, -9.0751953125, -8.58056640625, -8.0859375, -7.59130859375, -7.0966796875, -6.60205078125, -6.107421875, -5.61279296875, -5.1181640625, -4.62353515625, -4.12890625, -3.63427734375, -3.1396484375, -2.64501953125, -2.150390625, -1.65576171875, -1.1611328125, -0.66650390625, -0.171875, 0.32275390625, 0.8173828125, 1.31201171875, 1.806640625, 2.30126953125, 2.7958984375, 3.29052734375, 3.78515625, 4.27978515625, 4.7744140625, 5.26904296875, 5.763671875, 6.25830078125, 6.7529296875, 7.24755859375, 7.7421875, 8.23681640625, 8.7314453125, 9.22607421875, 9.720703125, 10.21533203125, 10.7099609375, 11.20458984375, 11.69921875, 12.19384765625, 12.6884765625, 13.18310546875, 13.677734375, 14.17236328125, 14.6669921875, 15.16162109375, 15.65625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 20.0, 227.0, 433.0, 267.0, 63.0, 3.0, 1.0, 1.0], "bins": [-116.76702880859375, -114.77269744873047, -112.77835845947266, -110.78402709960938, -108.7896957397461, -106.79535675048828, -104.801025390625, -102.80669403076172, -100.8123550415039, -98.81802368164062, -96.82368469238281, -94.82935333251953, -92.83502197265625, -90.84068298339844, -88.84635162353516, -86.85202026367188, -84.85768127441406, -82.86334991455078, -80.86901092529297, -78.87467956542969, -76.8803482055664, -74.8860092163086, -72.89167785644531, -70.89734649658203, -68.90301513671875, -66.90868377685547, -64.91434478759766, -62.920013427734375, -60.92567825317383, -58.93134307861328, -56.93701171875, -54.94267654418945, -52.948341369628906, -50.95400619506836, -48.95967483520508, -46.96533966064453, -44.971004486083984, -42.97666931152344, -40.982337951660156, -38.98800277709961, -36.99366760253906, -34.999332427978516, -33.005001068115234, -31.010665893554688, -29.01633071899414, -27.021997451782227, -25.027664184570312, -23.033329010009766, -21.03899574279785, -19.044662475585938, -17.05032730102539, -15.055994033813477, -13.061659812927246, -11.067325592041016, -9.072992324829102, -7.078658103942871, -5.084323883056641, -3.0899899005889893, -1.095655918121338, 0.8986778259277344, 2.893012046813965, 4.887346267700195, 6.881679534912109, 8.87601375579834, 10.87034797668457]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 5.0, 6.0, 9.0, 10.0, 12.0, 12.0, 18.0, 22.0, 19.0, 20.0, 22.0, 35.0, 40.0, 38.0, 30.0, 37.0, 40.0, 30.0, 30.0, 42.0, 37.0, 42.0, 42.0, 45.0, 43.0, 38.0, 34.0, 35.0, 21.0, 30.0, 21.0, 21.0, 14.0, 9.0, 21.0, 15.0, 12.0, 8.0, 10.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-25.356788635253906, -24.58197784423828, -23.80716896057129, -23.032358169555664, -22.25754737854004, -21.482736587524414, -20.707927703857422, -19.933116912841797, -19.158306121826172, -18.383495330810547, -17.608686447143555, -16.83387565612793, -16.059064865112305, -15.284255027770996, -14.509445190429688, -13.734634399414062, -12.959824562072754, -12.185014724731445, -11.41020393371582, -10.635394096374512, -9.860583305358887, -9.085773468017578, -8.310962677001953, -7.5361528396606445, -6.761342525482178, -5.986532211303711, -5.211721897125244, -4.436911582946777, -3.6621015071868896, -2.887291193008423, -2.112481117248535, -1.3376708030700684, -0.5628604888916016, 0.21194976568222046, 0.9867600202560425, 1.7615702152252197, 2.5363805294036865, 3.3111908435821533, 4.086000919342041, 4.860811233520508, 5.635621547698975, 6.410431861877441, 7.185242176055908, 7.960052490234375, 8.734862327575684, 9.509673118591309, 10.284482955932617, 11.059293746948242, 11.83410358428955, 12.60891342163086, 13.383724212646484, 14.158534049987793, 14.933344841003418, 15.708154678344727, 16.48296546936035, 17.257774353027344, 18.03258514404297, 18.807395935058594, 19.582204818725586, 20.35701560974121, 21.131826400756836, 21.90663719177246, 22.681446075439453, 23.456256866455078, 24.231067657470703]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 7.0, 7.0, 6.0, 15.0, 11.0, 16.0, 15.0, 25.0, 29.0, 28.0, 34.0, 38.0, 34.0, 30.0, 39.0, 51.0, 39.0, 48.0, 34.0, 39.0, 45.0, 33.0, 45.0, 35.0, 38.0, 29.0, 27.0, 27.0, 24.0, 27.0, 14.0, 20.0, 13.0, 12.0, 13.0, 6.0, 10.0, 7.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.697265625, -2.6121826171875, -2.527099609375, -2.4420166015625, -2.35693359375, -2.2718505859375, -2.186767578125, -2.1016845703125, -2.0166015625, -1.9315185546875, -1.846435546875, -1.7613525390625, -1.67626953125, -1.5911865234375, -1.506103515625, -1.4210205078125, -1.3359375, -1.2508544921875, -1.165771484375, -1.0806884765625, -0.99560546875, -0.9105224609375, -0.825439453125, -0.7403564453125, -0.6552734375, -0.5701904296875, -0.485107421875, -0.4000244140625, -0.31494140625, -0.2298583984375, -0.144775390625, -0.0596923828125, 0.025390625, 0.1104736328125, 0.195556640625, 0.2806396484375, 0.36572265625, 0.4508056640625, 0.535888671875, 0.6209716796875, 0.7060546875, 0.7911376953125, 0.876220703125, 0.9613037109375, 1.04638671875, 1.1314697265625, 1.216552734375, 1.3016357421875, 1.38671875, 1.4718017578125, 1.556884765625, 1.6419677734375, 1.72705078125, 1.8121337890625, 1.897216796875, 1.9822998046875, 2.0673828125, 2.1524658203125, 2.237548828125, 2.3226318359375, 2.40771484375, 2.4927978515625, 2.577880859375, 2.6629638671875, 2.748046875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 8.0, 9.0, 7.0, 11.0, 11.0, 16.0, 49.0, 49.0, 78.0, 110.0, 169.0, 312.0, 532.0, 1107.0, 2430.0, 5795.0, 14689.0, 40795.0, 129146.0, 462280.0, 1439730.0, 1447557.0, 456529.0, 126634.0, 40784.0, 14636.0, 5672.0, 2502.0, 1102.0, 629.0, 340.0, 177.0, 114.0, 73.0, 47.0, 30.0, 31.0, 17.0, 12.0, 11.0, 12.0, 10.0, 10.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-4.7890625, -4.6522216796875, -4.515380859375, -4.3785400390625, -4.24169921875, -4.1048583984375, -3.968017578125, -3.8311767578125, -3.6943359375, -3.5574951171875, -3.420654296875, -3.2838134765625, -3.14697265625, -3.0101318359375, -2.873291015625, -2.7364501953125, -2.599609375, -2.4627685546875, -2.325927734375, -2.1890869140625, -2.05224609375, -1.9154052734375, -1.778564453125, -1.6417236328125, -1.5048828125, -1.3680419921875, -1.231201171875, -1.0943603515625, -0.95751953125, -0.8206787109375, -0.683837890625, -0.5469970703125, -0.41015625, -0.2733154296875, -0.136474609375, 0.0003662109375, 0.13720703125, 0.2740478515625, 0.410888671875, 0.5477294921875, 0.6845703125, 0.8214111328125, 0.958251953125, 1.0950927734375, 1.23193359375, 1.3687744140625, 1.505615234375, 1.6424560546875, 1.779296875, 1.9161376953125, 2.052978515625, 2.1898193359375, 2.32666015625, 2.4635009765625, 2.600341796875, 2.7371826171875, 2.8740234375, 3.0108642578125, 3.147705078125, 3.2845458984375, 3.42138671875, 3.5582275390625, 3.695068359375, 3.8319091796875, 3.96875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 15.0, 13.0, 8.0, 18.0, 34.0, 50.0, 81.0, 89.0, 147.0, 191.0, 262.0, 364.0, 482.0, 486.0, 463.0, 421.0, 269.0, 177.0, 149.0, 119.0, 86.0, 51.0, 31.0, 16.0, 21.0, 11.0, 6.0, 3.0, 1.0, 1.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90234375, -7.69732666015625, -7.4923095703125, -7.28729248046875, -7.082275390625, -6.87725830078125, -6.6722412109375, -6.46722412109375, -6.26220703125, -6.05718994140625, -5.8521728515625, -5.64715576171875, -5.442138671875, -5.23712158203125, -5.0321044921875, -4.82708740234375, -4.6220703125, -4.41705322265625, -4.2120361328125, -4.00701904296875, -3.802001953125, -3.59698486328125, -3.3919677734375, -3.18695068359375, -2.98193359375, -2.77691650390625, -2.5718994140625, -2.36688232421875, -2.161865234375, -1.95684814453125, -1.7518310546875, -1.54681396484375, -1.341796875, -1.13677978515625, -0.9317626953125, -0.72674560546875, -0.521728515625, -0.31671142578125, -0.1116943359375, 0.09332275390625, 0.29833984375, 0.50335693359375, 0.7083740234375, 0.91339111328125, 1.118408203125, 1.32342529296875, 1.5284423828125, 1.73345947265625, 1.9384765625, 2.14349365234375, 2.3485107421875, 2.55352783203125, 2.758544921875, 2.96356201171875, 3.1685791015625, 3.37359619140625, 3.57861328125, 3.78363037109375, 3.9886474609375, 4.19366455078125, 4.398681640625, 4.60369873046875, 4.8087158203125, 5.01373291015625, 5.21875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 2.0, 9.0, 9.0, 22.0, 34.0, 34.0, 76.0, 124.0, 194.0, 284.0, 458.0, 1355.0, 19436.0, 1665558.0, 2474404.0, 29413.0, 1543.0, 521.0, 286.0, 179.0, 126.0, 78.0, 46.0, 28.0, 23.0, 15.0, 12.0, 5.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0, -16.293212890625, -15.58642578125, -14.879638671875, -14.1728515625, -13.466064453125, -12.75927734375, -12.052490234375, -11.345703125, -10.638916015625, -9.93212890625, -9.225341796875, -8.5185546875, -7.811767578125, -7.10498046875, -6.398193359375, -5.69140625, -4.984619140625, -4.27783203125, -3.571044921875, -2.8642578125, -2.157470703125, -1.45068359375, -0.743896484375, -0.037109375, 0.669677734375, 1.37646484375, 2.083251953125, 2.7900390625, 3.496826171875, 4.20361328125, 4.910400390625, 5.6171875, 6.323974609375, 7.03076171875, 7.737548828125, 8.4443359375, 9.151123046875, 9.85791015625, 10.564697265625, 11.271484375, 11.978271484375, 12.68505859375, 13.391845703125, 14.0986328125, 14.805419921875, 15.51220703125, 16.218994140625, 16.92578125, 17.632568359375, 18.33935546875, 19.046142578125, 19.7529296875, 20.459716796875, 21.16650390625, 21.873291015625, 22.580078125, 23.286865234375, 23.99365234375, 24.700439453125, 25.4072265625, 26.114013671875, 26.82080078125, 27.527587890625, 28.234375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 6.0, 7.0, 11.0, 18.0, 30.0, 28.0, 42.0, 51.0, 74.0, 81.0, 69.0, 80.0, 85.0, 87.0, 54.0, 69.0, 51.0, 45.0, 43.0, 26.0, 14.0, 14.0, 10.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.18958854675293, -15.41402530670166, -14.63846206665039, -13.862899780273438, -13.087335586547852, -12.311773300170898, -11.536210060119629, -10.76064682006836, -9.98508358001709, -9.20952033996582, -8.43395709991455, -7.6583943367004395, -6.88283109664917, -6.1072678565979, -5.331705093383789, -4.5561418533325195, -3.78057861328125, -3.0050153732299805, -2.22945237159729, -1.4538893699645996, -0.6783261299133301, 0.09723711013793945, 0.8727998733520508, 1.6483631134033203, 2.42392635345459, 3.1994895935058594, 3.97505259513855, 4.75061559677124, 5.52617883682251, 6.301742076873779, 7.077304840087891, 7.85286808013916, 8.628433227539062, 9.403996467590332, 10.179559707641602, 10.955121994018555, 11.73068618774414, 12.506248474121094, 13.281811714172363, 14.057374954223633, 14.832938194274902, 15.608501434326172, 16.384063720703125, 17.15962791442871, 17.935190200805664, 18.71075439453125, 19.486316680908203, 20.261878967285156, 21.037443161010742, 21.813005447387695, 22.58856964111328, 23.364131927490234, 24.13969612121582, 24.915258407592773, 25.69082260131836, 26.466384887695312, 27.241947174072266, 28.01750946044922, 28.793073654174805, 29.568635940551758, 30.344200134277344, 31.119762420654297, 31.89532470703125, 32.67089080810547, 33.44645309448242]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 5.0, 8.0, 7.0, 3.0, 6.0, 14.0, 16.0, 21.0, 15.0, 19.0, 26.0, 23.0, 22.0, 33.0, 33.0, 27.0, 31.0, 40.0, 37.0, 47.0, 38.0, 38.0, 40.0, 45.0, 32.0, 53.0, 39.0, 36.0, 29.0, 35.0, 32.0, 19.0, 26.0, 17.0, 11.0, 13.0, 17.0, 11.0, 8.0, 6.0, 5.0, 6.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-19.629379272460938, -19.080183029174805, -18.530986785888672, -17.98179054260254, -17.432594299316406, -16.883398056030273, -16.33420181274414, -15.785005569458008, -15.235809326171875, -14.686613082885742, -14.13741683959961, -13.588220596313477, -13.039024353027344, -12.489828109741211, -11.940631866455078, -11.391435623168945, -10.842239379882812, -10.29304313659668, -9.743846893310547, -9.194650650024414, -8.645454406738281, -8.096258163452148, -7.547061920166016, -6.997865676879883, -6.44866943359375, -5.899473190307617, -5.350276947021484, -4.801080703735352, -4.251884460449219, -3.702688217163086, -3.153491973876953, -2.6042957305908203, -2.0550994873046875, -1.5059032440185547, -0.9567070007324219, -0.40751075744628906, 0.14168548583984375, 0.6908817291259766, 1.2400779724121094, 1.7892742156982422, 2.338470458984375, 2.887666702270508, 3.4368629455566406, 3.9860591888427734, 4.535255432128906, 5.084451675415039, 5.633647918701172, 6.182844161987305, 6.7320404052734375, 7.28123664855957, 7.830432891845703, 8.379629135131836, 8.928825378417969, 9.478021621704102, 10.027217864990234, 10.576414108276367, 11.1256103515625, 11.674806594848633, 12.224002838134766, 12.773199081420898, 13.322395324707031, 13.871591567993164, 14.420787811279297, 14.96998405456543, 15.519180297851562]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 5.0, 12.0, 9.0, 13.0, 11.0, 15.0, 22.0, 33.0, 25.0, 31.0, 28.0, 33.0, 39.0, 41.0, 40.0, 37.0, 41.0, 45.0, 34.0, 34.0, 51.0, 36.0, 49.0, 28.0, 32.0, 36.0, 31.0, 23.0, 24.0, 25.0, 22.0, 14.0, 15.0, 14.0, 16.0, 5.0, 7.0, 7.0, 3.0, 5.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0], "bins": [-3.0390625, -2.951690673828125, -2.86431884765625, -2.776947021484375, -2.6895751953125, -2.602203369140625, -2.51483154296875, -2.427459716796875, -2.340087890625, -2.252716064453125, -2.16534423828125, -2.077972412109375, -1.9906005859375, -1.903228759765625, -1.81585693359375, -1.728485107421875, -1.64111328125, -1.553741455078125, -1.46636962890625, -1.378997802734375, -1.2916259765625, -1.204254150390625, -1.11688232421875, -1.029510498046875, -0.942138671875, -0.854766845703125, -0.76739501953125, -0.680023193359375, -0.5926513671875, -0.505279541015625, -0.41790771484375, -0.330535888671875, -0.2431640625, -0.155792236328125, -0.06842041015625, 0.018951416015625, 0.1063232421875, 0.193695068359375, 0.28106689453125, 0.368438720703125, 0.455810546875, 0.543182373046875, 0.63055419921875, 0.717926025390625, 0.8052978515625, 0.892669677734375, 0.98004150390625, 1.067413330078125, 1.15478515625, 1.242156982421875, 1.32952880859375, 1.416900634765625, 1.5042724609375, 1.591644287109375, 1.67901611328125, 1.766387939453125, 1.853759765625, 1.941131591796875, 2.02850341796875, 2.115875244140625, 2.2032470703125, 2.290618896484375, 2.37799072265625, 2.465362548828125, 2.552734375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 0.0, 5.0, 8.0, 14.0, 12.0, 17.0, 26.0, 42.0, 58.0, 85.0, 118.0, 156.0, 257.0, 355.0, 553.0, 742.0, 1073.0, 1571.0, 2442.0, 3791.0, 5622.0, 8773.0, 13626.0, 21272.0, 34674.0, 56110.0, 98145.0, 211623.0, 281311.0, 125339.0, 68021.0, 40994.0, 25447.0, 16158.0, 10361.0, 6662.0, 4387.0, 2944.0, 1817.0, 1275.0, 844.0, 608.0, 387.0, 281.0, 191.0, 116.0, 76.0, 48.0, 46.0, 28.0, 13.0, 15.0, 15.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0203094482421875, -0.01961350440979004, -0.018917560577392578, -0.018221616744995117, -0.017525672912597656, -0.016829729080200195, -0.016133785247802734, -0.015437841415405273, -0.014741897583007812, -0.014045953750610352, -0.01335000991821289, -0.01265406608581543, -0.011958122253417969, -0.011262178421020508, -0.010566234588623047, -0.009870290756225586, -0.009174346923828125, -0.008478403091430664, -0.007782459259033203, -0.007086515426635742, -0.006390571594238281, -0.00569462776184082, -0.004998683929443359, -0.0043027400970458984, -0.0036067962646484375, -0.0029108524322509766, -0.0022149085998535156, -0.0015189647674560547, -0.0008230209350585938, -0.0001270771026611328, 0.0005688667297363281, 0.001264810562133789, 0.00196075439453125, 0.002656698226928711, 0.003352642059326172, 0.004048585891723633, 0.004744529724121094, 0.005440473556518555, 0.006136417388916016, 0.0068323612213134766, 0.0075283050537109375, 0.008224248886108398, 0.00892019271850586, 0.00961613655090332, 0.010312080383300781, 0.011008024215698242, 0.011703968048095703, 0.012399911880493164, 0.013095855712890625, 0.013791799545288086, 0.014487743377685547, 0.015183687210083008, 0.01587963104248047, 0.01657557487487793, 0.01727151870727539, 0.01796746253967285, 0.018663406372070312, 0.019359350204467773, 0.020055294036865234, 0.020751237869262695, 0.021447181701660156, 0.022143125534057617, 0.022839069366455078, 0.02353501319885254, 0.02423095703125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 14.0, 7.0, 6.0, 15.0, 10.0, 11.0, 21.0, 33.0, 19.0, 27.0, 28.0, 43.0, 31.0, 31.0, 36.0, 29.0, 40.0, 54.0, 1066.0, 46.0, 38.0, 32.0, 34.0, 49.0, 37.0, 23.0, 27.0, 27.0, 32.0, 30.0, 23.0, 21.0, 18.0, 16.0, 6.0, 13.0, 7.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.021484375, -1.965301513671875, -1.90911865234375, -1.852935791015625, -1.7967529296875, -1.740570068359375, -1.68438720703125, -1.628204345703125, -1.572021484375, -1.515838623046875, -1.45965576171875, -1.403472900390625, -1.3472900390625, -1.291107177734375, -1.23492431640625, -1.178741455078125, -1.12255859375, -1.066375732421875, -1.01019287109375, -0.954010009765625, -0.8978271484375, -0.841644287109375, -0.78546142578125, -0.729278564453125, -0.673095703125, -0.616912841796875, -0.56072998046875, -0.504547119140625, -0.4483642578125, -0.392181396484375, -0.33599853515625, -0.279815673828125, -0.2236328125, -0.167449951171875, -0.11126708984375, -0.055084228515625, 0.0010986328125, 0.057281494140625, 0.11346435546875, 0.169647216796875, 0.225830078125, 0.282012939453125, 0.33819580078125, 0.394378662109375, 0.4505615234375, 0.506744384765625, 0.56292724609375, 0.619110107421875, 0.67529296875, 0.731475830078125, 0.78765869140625, 0.843841552734375, 0.9000244140625, 0.956207275390625, 1.01239013671875, 1.068572998046875, 1.124755859375, 1.180938720703125, 1.23712158203125, 1.293304443359375, 1.3494873046875, 1.405670166015625, 1.46185302734375, 1.518035888671875, 1.57421875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 10.0, 18.0, 17.0, 35.0, 29.0, 62.0, 88.0, 145.0, 200.0, 295.0, 491.0, 677.0, 1085.0, 1429.0, 2200.0, 3186.0, 4804.0, 7179.0, 10599.0, 15760.0, 24065.0, 37783.0, 61048.0, 105907.0, 237745.0, 1296642.0, 110039.0, 62838.0, 38585.0, 24705.0, 16058.0, 10939.0, 7349.0, 4910.0, 3314.0, 2244.0, 1532.0, 1082.0, 680.0, 473.0, 302.0, 189.0, 147.0, 86.0, 56.0, 38.0, 19.0, 20.0, 7.0, 10.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.013763427734375, -0.013319849967956543, -0.012876272201538086, -0.012432694435119629, -0.011989116668701172, -0.011545538902282715, -0.011101961135864258, -0.0106583833694458, -0.010214805603027344, -0.009771227836608887, -0.00932765007019043, -0.008884072303771973, -0.008440494537353516, -0.007996916770935059, -0.0075533390045166016, -0.0071097612380981445, -0.0066661834716796875, -0.0062226057052612305, -0.0057790279388427734, -0.005335450172424316, -0.004891872406005859, -0.004448294639587402, -0.004004716873168945, -0.0035611391067504883, -0.0031175613403320312, -0.0026739835739135742, -0.002230405807495117, -0.0017868280410766602, -0.0013432502746582031, -0.0008996725082397461, -0.00045609474182128906, -1.2516975402832031e-05, 0.000431060791015625, 0.000874638557434082, 0.001318216323852539, 0.001761794090270996, 0.002205371856689453, 0.00264894962310791, 0.003092527389526367, 0.0035361051559448242, 0.003979682922363281, 0.004423260688781738, 0.004866838455200195, 0.005310416221618652, 0.005753993988037109, 0.006197571754455566, 0.0066411495208740234, 0.0070847272872924805, 0.0075283050537109375, 0.007971882820129395, 0.008415460586547852, 0.008859038352966309, 0.009302616119384766, 0.009746193885803223, 0.01018977165222168, 0.010633349418640137, 0.011076927185058594, 0.01152050495147705, 0.011964082717895508, 0.012407660484313965, 0.012851238250732422, 0.013294816017150879, 0.013738393783569336, 0.014181971549987793, 0.01462554931640625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 39.0, 0.0, 0.0, 0.0, 0.0, 110.0, 0.0, 0.0, 0.0, 0.0, 0.0, 676.0, 0.0, 0.0, 0.0, 0.0, 123.0, 0.0, 0.0, 0.0, 0.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 0.0, 2.0, 5.0, 7.0, 2.0, 0.0, 4.0, 4.0, 23.0, 4.0, 8.0, 4.0, 23.0, 119.0, 46.0, 87.0, 252.0, 3500.0, 117642.0, 922779.0, 3506.0, 227.0, 72.0, 57.0, 107.0, 20.0, 3.0, 3.0, 3.0, 25.0, 7.0, 6.0, 1.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.556510925292969e-06, -6.345100700855255e-06, -6.1336904764175415e-06, -5.922280251979828e-06, -5.710870027542114e-06, -5.499459803104401e-06, -5.288049578666687e-06, -5.076639354228973e-06, -4.86522912979126e-06, -4.653818905353546e-06, -4.4424086809158325e-06, -4.230998456478119e-06, -4.019588232040405e-06, -3.8081780076026917e-06, -3.596767783164978e-06, -3.3853575587272644e-06, -3.1739473342895508e-06, -2.962537109851837e-06, -2.7511268854141235e-06, -2.53971666097641e-06, -2.3283064365386963e-06, -2.1168962121009827e-06, -1.905485987663269e-06, -1.6940757632255554e-06, -1.4826655387878418e-06, -1.2712553143501282e-06, -1.0598450899124146e-06, -8.484348654747009e-07, -6.370246410369873e-07, -4.256144165992737e-07, -2.1420419216156006e-07, -2.7939677238464355e-09, 2.086162567138672e-07, 4.200264811515808e-07, 6.314367055892944e-07, 8.428469300270081e-07, 1.0542571544647217e-06, 1.2656673789024353e-06, 1.477077603340149e-06, 1.6884878277778625e-06, 1.8998980522155762e-06, 2.11130827665329e-06, 2.3227185010910034e-06, 2.534128725528717e-06, 2.7455389499664307e-06, 2.9569491744041443e-06, 3.168359398841858e-06, 3.3797696232795715e-06, 3.591179847717285e-06, 3.8025900721549988e-06, 4.014000296592712e-06, 4.225410521030426e-06, 4.43682074546814e-06, 4.648230969905853e-06, 4.859641194343567e-06, 5.0710514187812805e-06, 5.282461643218994e-06, 5.493871867656708e-06, 5.705282092094421e-06, 5.916692316532135e-06, 6.128102540969849e-06, 6.339512765407562e-06, 6.550922989845276e-06, 6.7623332142829895e-06, 6.973743438720703e-06]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 11.0, 23.0, 36.0, 877.0, 28.0, 12.0, 16.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.128985153784015e-07, -3.890868640610279e-07, -3.6527518432194483e-07, -3.414635330045712e-07, -3.176518816871976e-07, -2.93840230369824e-07, -2.7002855063074094e-07, -2.462168993133673e-07, -2.22405233785139e-07, -1.9859356825691066e-07, -1.7478191693953704e-07, -1.509702514113087e-07, -1.2715858588308038e-07, -1.0334693456570676e-07, -7.953526903747843e-08, -5.572361772010481e-08, -3.191195219187648e-08, -8.100291992718667e-09, 1.5711368206439147e-08, 3.95230301819538e-08, 6.333468860475477e-08, 8.714634702755575e-08, 1.1095801255578408e-07, 1.347696638731577e-07, 1.5858132940138603e-07, 1.8239299492961436e-07, 2.0620464624698798e-07, 2.300163117752163e-07, 2.5382797730344464e-07, 2.7763962862081826e-07, 3.014512799381919e-07, 3.252629312555655e-07, 3.490745825729391e-07, 3.728862338903127e-07, 3.9669791362939577e-07, 4.205095649467694e-07, 4.44321216264143e-07, 4.6813289600322605e-07, 4.919445473205997e-07, 5.157561986379733e-07, 5.395678499553469e-07, 5.633795012727205e-07, 5.871911525900941e-07, 6.110028607508866e-07, 6.348145120682602e-07, 6.586261633856338e-07, 6.824378147030075e-07, 7.062494660203811e-07, 7.300611741811736e-07, 7.538728254985472e-07, 7.776844768159208e-07, 8.014961849767133e-07, 8.253078362940869e-07, 8.491194876114605e-07, 8.729311389288341e-07, 8.967427902462077e-07, 9.205544415635813e-07, 9.44366092880955e-07, 9.681778010417474e-07, 9.919893955157022e-07, 1.0158011036764947e-06, 1.0396126981504494e-06, 1.063424406311242e-06, 1.0872361144720344e-06, 1.1110477089459891e-06]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 859.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 72.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 5.0, 12.0, 9.0, 13.0, 11.0, 15.0, 22.0, 33.0, 25.0, 31.0, 28.0, 33.0, 39.0, 41.0, 40.0, 37.0, 41.0, 45.0, 34.0, 34.0, 51.0, 36.0, 49.0, 28.0, 32.0, 36.0, 31.0, 23.0, 24.0, 25.0, 22.0, 14.0, 15.0, 14.0, 16.0, 5.0, 7.0, 7.0, 3.0, 5.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0], "bins": [-3.0390625, -2.951690673828125, -2.86431884765625, -2.776947021484375, -2.6895751953125, -2.602203369140625, -2.51483154296875, -2.427459716796875, -2.340087890625, -2.252716064453125, -2.16534423828125, -2.077972412109375, -1.9906005859375, -1.903228759765625, -1.81585693359375, -1.728485107421875, -1.64111328125, -1.553741455078125, -1.46636962890625, -1.378997802734375, -1.2916259765625, -1.204254150390625, -1.11688232421875, -1.029510498046875, -0.942138671875, -0.854766845703125, -0.76739501953125, -0.680023193359375, -0.5926513671875, -0.505279541015625, -0.41790771484375, -0.330535888671875, -0.2431640625, -0.155792236328125, -0.06842041015625, 0.018951416015625, 0.1063232421875, 0.193695068359375, 0.28106689453125, 0.368438720703125, 0.455810546875, 0.543182373046875, 0.63055419921875, 0.717926025390625, 0.8052978515625, 0.892669677734375, 0.98004150390625, 1.067413330078125, 1.15478515625, 1.242156982421875, 1.32952880859375, 1.416900634765625, 1.5042724609375, 1.591644287109375, 1.67901611328125, 1.766387939453125, 1.853759765625, 1.941131591796875, 2.02850341796875, 2.115875244140625, 2.2032470703125, 2.290618896484375, 2.37799072265625, 2.465362548828125, 2.552734375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 14.0, 8.0, 19.0, 22.0, 42.0, 38.0, 79.0, 104.0, 163.0, 229.0, 391.0, 587.0, 952.0, 1551.0, 2598.0, 4385.0, 7680.0, 14054.0, 28321.0, 62058.0, 154271.0, 407425.0, 209873.0, 79166.0, 35265.0, 17197.0, 9152.0, 5141.0, 2973.0, 1798.0, 1077.0, 684.0, 400.0, 262.0, 196.0, 116.0, 76.0, 49.0, 42.0, 26.0, 19.0, 10.0, 7.0, 13.0, 5.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.576171875, -2.499603271484375, -2.42303466796875, -2.346466064453125, -2.2698974609375, -2.193328857421875, -2.11676025390625, -2.040191650390625, -1.963623046875, -1.887054443359375, -1.81048583984375, -1.733917236328125, -1.6573486328125, -1.580780029296875, -1.50421142578125, -1.427642822265625, -1.35107421875, -1.274505615234375, -1.19793701171875, -1.121368408203125, -1.0447998046875, -0.968231201171875, -0.89166259765625, -0.815093994140625, -0.738525390625, -0.661956787109375, -0.58538818359375, -0.508819580078125, -0.4322509765625, -0.355682373046875, -0.27911376953125, -0.202545166015625, -0.1259765625, -0.049407958984375, 0.02716064453125, 0.103729248046875, 0.1802978515625, 0.256866455078125, 0.33343505859375, 0.410003662109375, 0.486572265625, 0.563140869140625, 0.63970947265625, 0.716278076171875, 0.7928466796875, 0.869415283203125, 0.94598388671875, 1.022552490234375, 1.09912109375, 1.175689697265625, 1.25225830078125, 1.328826904296875, 1.4053955078125, 1.481964111328125, 1.55853271484375, 1.635101318359375, 1.711669921875, 1.788238525390625, 1.86480712890625, 1.941375732421875, 2.0179443359375, 2.094512939453125, 2.17108154296875, 2.247650146484375, 2.32421875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 7.0, 11.0, 8.0, 11.0, 11.0, 19.0, 21.0, 22.0, 33.0, 23.0, 35.0, 32.0, 46.0, 46.0, 52.0, 95.0, 254.0, 1568.0, 209.0, 90.0, 67.0, 40.0, 43.0, 44.0, 44.0, 34.0, 25.0, 21.0, 21.0, 21.0, 14.0, 8.0, 12.0, 9.0, 9.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.8511962890625, -7.553955078125, -7.2567138671875, -6.95947265625, -6.6622314453125, -6.364990234375, -6.0677490234375, -5.7705078125, -5.4732666015625, -5.176025390625, -4.8787841796875, -4.58154296875, -4.2843017578125, -3.987060546875, -3.6898193359375, -3.392578125, -3.0953369140625, -2.798095703125, -2.5008544921875, -2.20361328125, -1.9063720703125, -1.609130859375, -1.3118896484375, -1.0146484375, -0.7174072265625, -0.420166015625, -0.1229248046875, 0.17431640625, 0.4715576171875, 0.768798828125, 1.0660400390625, 1.36328125, 1.6605224609375, 1.957763671875, 2.2550048828125, 2.55224609375, 2.8494873046875, 3.146728515625, 3.4439697265625, 3.7412109375, 4.0384521484375, 4.335693359375, 4.6329345703125, 4.93017578125, 5.2274169921875, 5.524658203125, 5.8218994140625, 6.119140625, 6.4163818359375, 6.713623046875, 7.0108642578125, 7.30810546875, 7.6053466796875, 7.902587890625, 8.1998291015625, 8.4970703125, 8.7943115234375, 9.091552734375, 9.3887939453125, 9.68603515625, 9.9832763671875, 10.280517578125, 10.5777587890625, 10.875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 4.0, 8.0, 10.0, 14.0, 16.0, 13.0, 25.0, 25.0, 30.0, 49.0, 66.0, 90.0, 121.0, 153.0, 207.0, 384.0, 785.0, 3284.0, 76817.0, 3015867.0, 43447.0, 2500.0, 663.0, 303.0, 212.0, 152.0, 110.0, 74.0, 48.0, 43.0, 41.0, 28.0, 20.0, 19.0, 12.0, 8.0, 11.0, 7.0, 5.0, 6.0, 2.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-20.8125, -20.2413330078125, -19.670166015625, -19.0989990234375, -18.52783203125, -17.9566650390625, -17.385498046875, -16.8143310546875, -16.2431640625, -15.6719970703125, -15.100830078125, -14.5296630859375, -13.95849609375, -13.3873291015625, -12.816162109375, -12.2449951171875, -11.673828125, -11.1026611328125, -10.531494140625, -9.9603271484375, -9.38916015625, -8.8179931640625, -8.246826171875, -7.6756591796875, -7.1044921875, -6.5333251953125, -5.962158203125, -5.3909912109375, -4.81982421875, -4.2486572265625, -3.677490234375, -3.1063232421875, -2.53515625, -1.9639892578125, -1.392822265625, -0.8216552734375, -0.25048828125, 0.3206787109375, 0.891845703125, 1.4630126953125, 2.0341796875, 2.6053466796875, 3.176513671875, 3.7476806640625, 4.31884765625, 4.8900146484375, 5.461181640625, 6.0323486328125, 6.603515625, 7.1746826171875, 7.745849609375, 8.3170166015625, 8.88818359375, 9.4593505859375, 10.030517578125, 10.6016845703125, 11.1728515625, 11.7440185546875, 12.315185546875, 12.8863525390625, 13.45751953125, 14.0286865234375, 14.599853515625, 15.1710205078125, 15.7421875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 22.0, 84.0, 239.0, 387.0, 203.0, 70.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.57625961303711, -46.338165283203125, -45.100067138671875, -43.86197280883789, -42.623878479003906, -41.385780334472656, -40.14768600463867, -38.90959167480469, -37.67149353027344, -36.43339920043945, -35.1953010559082, -33.95720672607422, -32.719112396240234, -31.481014251708984, -30.242919921875, -29.004823684692383, -27.7667293548584, -26.52863311767578, -25.290538787841797, -24.05244255065918, -22.814346313476562, -21.576251983642578, -20.33815574645996, -19.100059509277344, -17.86196517944336, -16.623868942260742, -15.385773658752441, -14.14767837524414, -12.909582138061523, -11.671486854553223, -10.433391571044922, -9.195295333862305, -7.9571990966796875, -6.7191033363342285, -5.4810075759887695, -4.242912292480469, -3.0048165321350098, -1.7667207717895508, -0.52862548828125, 0.7094707489013672, 1.947566032409668, 3.185661792755127, 4.423757553100586, 5.661852836608887, 6.899948596954346, 8.138044357299805, 9.376139640808105, 10.614235877990723, 11.852331161499023, 13.090426445007324, 14.328522682189941, 15.566617965698242, 16.80471420288086, 18.042808532714844, 19.28090476989746, 20.519001007080078, 21.757095336914062, 22.99519157409668, 24.233285903930664, 25.47138214111328, 26.7094783782959, 27.947574615478516, 29.1856689453125, 30.423765182495117, 31.661861419677734]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 7.0, 11.0, 10.0, 13.0, 15.0, 21.0, 18.0, 23.0, 32.0, 27.0, 47.0, 42.0, 44.0, 40.0, 57.0, 42.0, 36.0, 62.0, 57.0, 43.0, 40.0, 44.0, 41.0, 41.0, 29.0, 27.0, 21.0, 19.0, 12.0, 14.0, 15.0, 7.0, 5.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.67438507080078, -30.776508331298828, -29.878633499145508, -28.980756759643555, -28.0828800201416, -27.18500518798828, -26.287128448486328, -25.389251708984375, -24.491374969482422, -23.59349822998047, -22.69562339782715, -21.797746658325195, -20.899869918823242, -20.001995086669922, -19.10411834716797, -18.206241607666016, -17.308364868164062, -16.41048812866211, -15.512612342834473, -14.614736557006836, -13.716859817504883, -12.818984031677246, -11.92110824584961, -11.023231506347656, -10.125356674194336, -9.2274808883667, -8.329604148864746, -7.431728363037109, -6.533851623535156, -5.6359758377075195, -4.738099575042725, -3.8402233123779297, -2.9423465728759766, -2.0444703102111816, -1.1465941667556763, -0.2487180233001709, 0.649158239364624, 1.5470342636108398, 2.4449105262756348, 3.3427867889404297, 4.240663051605225, 5.1385393142700195, 6.0364155769348145, 6.934291839599609, 7.832167625427246, 8.730043411254883, 9.627920150756836, 10.525796890258789, 11.423672676086426, 12.321548461914062, 13.219425201416016, 14.117300987243652, 15.015177726745605, 15.913053512573242, 16.810930252075195, 17.708805084228516, 18.60668182373047, 19.504558563232422, 20.402433395385742, 21.300310134887695, 22.19818687438965, 23.09606170654297, 23.993938446044922, 24.891815185546875, 25.789691925048828]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 7.0, 12.0, 15.0, 14.0, 22.0, 21.0, 36.0, 26.0, 17.0, 23.0, 40.0, 36.0, 40.0, 33.0, 50.0, 40.0, 43.0, 40.0, 27.0, 39.0, 44.0, 35.0, 31.0, 29.0, 27.0, 31.0, 33.0, 14.0, 23.0, 21.0, 21.0, 15.0, 19.0, 10.0, 10.0, 10.0, 4.0, 4.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0], "bins": [-3.0703125, -2.983917236328125, -2.89752197265625, -2.811126708984375, -2.7247314453125, -2.638336181640625, -2.55194091796875, -2.465545654296875, -2.379150390625, -2.292755126953125, -2.20635986328125, -2.119964599609375, -2.0335693359375, -1.947174072265625, -1.86077880859375, -1.774383544921875, -1.68798828125, -1.601593017578125, -1.51519775390625, -1.428802490234375, -1.3424072265625, -1.256011962890625, -1.16961669921875, -1.083221435546875, -0.996826171875, -0.910430908203125, -0.82403564453125, -0.737640380859375, -0.6512451171875, -0.564849853515625, -0.47845458984375, -0.392059326171875, -0.3056640625, -0.219268798828125, -0.13287353515625, -0.046478271484375, 0.0399169921875, 0.126312255859375, 0.21270751953125, 0.299102783203125, 0.385498046875, 0.471893310546875, 0.55828857421875, 0.644683837890625, 0.7310791015625, 0.817474365234375, 0.90386962890625, 0.990264892578125, 1.07666015625, 1.163055419921875, 1.24945068359375, 1.335845947265625, 1.4222412109375, 1.508636474609375, 1.59503173828125, 1.681427001953125, 1.767822265625, 1.854217529296875, 1.94061279296875, 2.027008056640625, 2.1134033203125, 2.199798583984375, 2.28619384765625, 2.372589111328125, 2.458984375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 12.0, 11.0, 14.0, 23.0, 25.0, 31.0, 56.0, 67.0, 86.0, 126.0, 184.0, 315.0, 626.0, 1251.0, 2707.0, 6715.0, 19355.0, 61124.0, 216831.0, 843586.0, 1823245.0, 894222.0, 226273.0, 63715.0, 20367.0, 7213.0, 3037.0, 1310.0, 635.0, 332.0, 232.0, 150.0, 85.0, 77.0, 61.0, 36.0, 33.0, 28.0, 9.0, 11.0, 17.0, 12.0, 8.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.9921875, -4.84326171875, -4.6943359375, -4.54541015625, -4.396484375, -4.24755859375, -4.0986328125, -3.94970703125, -3.80078125, -3.65185546875, -3.5029296875, -3.35400390625, -3.205078125, -3.05615234375, -2.9072265625, -2.75830078125, -2.609375, -2.46044921875, -2.3115234375, -2.16259765625, -2.013671875, -1.86474609375, -1.7158203125, -1.56689453125, -1.41796875, -1.26904296875, -1.1201171875, -0.97119140625, -0.822265625, -0.67333984375, -0.5244140625, -0.37548828125, -0.2265625, -0.07763671875, 0.0712890625, 0.22021484375, 0.369140625, 0.51806640625, 0.6669921875, 0.81591796875, 0.96484375, 1.11376953125, 1.2626953125, 1.41162109375, 1.560546875, 1.70947265625, 1.8583984375, 2.00732421875, 2.15625, 2.30517578125, 2.4541015625, 2.60302734375, 2.751953125, 2.90087890625, 3.0498046875, 3.19873046875, 3.34765625, 3.49658203125, 3.6455078125, 3.79443359375, 3.943359375, 4.09228515625, 4.2412109375, 4.39013671875, 4.5390625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 8.0, 9.0, 13.0, 21.0, 37.0, 41.0, 55.0, 81.0, 126.0, 176.0, 237.0, 300.0, 390.0, 457.0, 479.0, 405.0, 339.0, 268.0, 169.0, 120.0, 91.0, 63.0, 51.0, 38.0, 30.0, 22.0, 15.0, 12.0, 4.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.8046875, -7.6107177734375, -7.416748046875, -7.2227783203125, -7.02880859375, -6.8348388671875, -6.640869140625, -6.4468994140625, -6.2529296875, -6.0589599609375, -5.864990234375, -5.6710205078125, -5.47705078125, -5.2830810546875, -5.089111328125, -4.8951416015625, -4.701171875, -4.5072021484375, -4.313232421875, -4.1192626953125, -3.92529296875, -3.7313232421875, -3.537353515625, -3.3433837890625, -3.1494140625, -2.9554443359375, -2.761474609375, -2.5675048828125, -2.37353515625, -2.1795654296875, -1.985595703125, -1.7916259765625, -1.59765625, -1.4036865234375, -1.209716796875, -1.0157470703125, -0.82177734375, -0.6278076171875, -0.433837890625, -0.2398681640625, -0.0458984375, 0.1480712890625, 0.342041015625, 0.5360107421875, 0.72998046875, 0.9239501953125, 1.117919921875, 1.3118896484375, 1.505859375, 1.6998291015625, 1.893798828125, 2.0877685546875, 2.28173828125, 2.4757080078125, 2.669677734375, 2.8636474609375, 3.0576171875, 3.2515869140625, 3.445556640625, 3.6395263671875, 3.83349609375, 4.0274658203125, 4.221435546875, 4.4154052734375, 4.609375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 11.0, 24.0, 38.0, 34.0, 51.0, 88.0, 117.0, 190.0, 346.0, 672.0, 5799.0, 1378621.0, 2796173.0, 10308.0, 803.0, 372.0, 231.0, 144.0, 74.0, 64.0, 49.0, 18.0, 16.0, 9.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.359375, -22.388916015625, -21.41845703125, -20.447998046875, -19.4775390625, -18.507080078125, -17.53662109375, -16.566162109375, -15.595703125, -14.625244140625, -13.65478515625, -12.684326171875, -11.7138671875, -10.743408203125, -9.77294921875, -8.802490234375, -7.83203125, -6.861572265625, -5.89111328125, -4.920654296875, -3.9501953125, -2.979736328125, -2.00927734375, -1.038818359375, -0.068359375, 0.902099609375, 1.87255859375, 2.843017578125, 3.8134765625, 4.783935546875, 5.75439453125, 6.724853515625, 7.6953125, 8.665771484375, 9.63623046875, 10.606689453125, 11.5771484375, 12.547607421875, 13.51806640625, 14.488525390625, 15.458984375, 16.429443359375, 17.39990234375, 18.370361328125, 19.3408203125, 20.311279296875, 21.28173828125, 22.252197265625, 23.22265625, 24.193115234375, 25.16357421875, 26.134033203125, 27.1044921875, 28.074951171875, 29.04541015625, 30.015869140625, 30.986328125, 31.956787109375, 32.92724609375, 33.897705078125, 34.8681640625, 35.838623046875, 36.80908203125, 37.779541015625, 38.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 53.0, 239.0, 394.0, 242.0, 73.0, 11.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.37049865722656, -140.72056579589844, -137.07064819335938, -133.42071533203125, -129.77078247070312, -126.12085723876953, -122.47093200683594, -118.82099914550781, -115.17107391357422, -111.52114868164062, -107.8712158203125, -104.2212905883789, -100.57136535644531, -96.92143249511719, -93.2715072631836, -89.62158203125, -85.97164916992188, -82.32172393798828, -78.67179107666016, -75.02186584472656, -71.37193298339844, -67.72200775146484, -64.07208251953125, -60.42215347290039, -56.77222442626953, -53.12229537963867, -49.47236633300781, -45.82244110107422, -42.17251205444336, -38.5225830078125, -34.872657775878906, -31.222728729248047, -27.572792053222656, -23.922863006591797, -20.27293586730957, -16.623008728027344, -12.973079681396484, -9.323150634765625, -5.673223495483398, -2.023296356201172, 1.6266326904296875, 5.2765607833862305, 8.926488876342773, 12.576416969299316, 16.22634506225586, 19.87627410888672, 23.526201248168945, 27.176128387451172, 30.82605743408203, 34.47598648071289, 38.12591552734375, 41.775840759277344, 45.4257698059082, 49.07569885253906, 52.725624084472656, 56.375553131103516, 60.025482177734375, 63.675411224365234, 67.3253402709961, 70.97526550292969, 74.62519836425781, 78.2751235961914, 81.925048828125, 85.57498168945312, 89.22490692138672]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 5.0, 5.0, 5.0, 2.0, 12.0, 17.0, 12.0, 19.0, 35.0, 25.0, 28.0, 31.0, 27.0, 29.0, 44.0, 48.0, 45.0, 48.0, 49.0, 45.0, 42.0, 52.0, 55.0, 39.0, 40.0, 38.0, 28.0, 33.0, 28.0, 18.0, 19.0, 22.0, 18.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.5091552734375, -21.86259651184082, -21.21603775024414, -20.569480895996094, -19.922922134399414, -19.276363372802734, -18.629806518554688, -17.983247756958008, -17.336688995361328, -16.69013023376465, -16.04357147216797, -15.397014617919922, -14.750455856323242, -14.103897094726562, -13.4573392868042, -12.810781478881836, -12.164222717285156, -11.517663955688477, -10.871106147766113, -10.22454833984375, -9.57798957824707, -8.93143081665039, -8.284873008728027, -7.638314723968506, -6.991756439208984, -6.345198154449463, -5.698639869689941, -5.05208158493042, -4.405523300170898, -3.758965015411377, -3.1124067306518555, -2.465848445892334, -1.8192882537841797, -1.1727299690246582, -0.5261716842651367, 0.12038660049438477, 0.7669448852539062, 1.4135031700134277, 2.060061454772949, 2.7066197395324707, 3.353178024291992, 3.9997363090515137, 4.646294593811035, 5.292852878570557, 5.939411163330078, 6.5859694480896, 7.232527732849121, 7.879086017608643, 8.525644302368164, 9.172203063964844, 9.818760871887207, 10.46531867980957, 11.11187744140625, 11.75843620300293, 12.404994010925293, 13.051551818847656, 13.698110580444336, 14.344669342041016, 14.991227149963379, 15.637784957885742, 16.284343719482422, 16.9309024810791, 17.57746124267578, 18.224018096923828, 18.870576858520508]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 5.0, 11.0, 7.0, 9.0, 7.0, 10.0, 16.0, 17.0, 25.0, 23.0, 22.0, 26.0, 26.0, 25.0, 38.0, 29.0, 31.0, 37.0, 43.0, 48.0, 36.0, 31.0, 38.0, 32.0, 34.0, 31.0, 46.0, 19.0, 21.0, 33.0, 30.0, 24.0, 16.0, 21.0, 12.0, 14.0, 19.0, 10.0, 14.0, 11.0, 4.0, 9.0, 7.0, 5.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.630859375, -2.552337646484375, -2.47381591796875, -2.395294189453125, -2.3167724609375, -2.238250732421875, -2.15972900390625, -2.081207275390625, -2.002685546875, -1.924163818359375, -1.84564208984375, -1.767120361328125, -1.6885986328125, -1.610076904296875, -1.53155517578125, -1.453033447265625, -1.37451171875, -1.295989990234375, -1.21746826171875, -1.138946533203125, -1.0604248046875, -0.981903076171875, -0.90338134765625, -0.824859619140625, -0.746337890625, -0.667816162109375, -0.58929443359375, -0.510772705078125, -0.4322509765625, -0.353729248046875, -0.27520751953125, -0.196685791015625, -0.1181640625, -0.039642333984375, 0.03887939453125, 0.117401123046875, 0.1959228515625, 0.274444580078125, 0.35296630859375, 0.431488037109375, 0.510009765625, 0.588531494140625, 0.66705322265625, 0.745574951171875, 0.8240966796875, 0.902618408203125, 0.98114013671875, 1.059661865234375, 1.13818359375, 1.216705322265625, 1.29522705078125, 1.373748779296875, 1.4522705078125, 1.530792236328125, 1.60931396484375, 1.687835693359375, 1.766357421875, 1.844879150390625, 1.92340087890625, 2.001922607421875, 2.0804443359375, 2.158966064453125, 2.23748779296875, 2.316009521484375, 2.39453125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 8.0, 7.0, 18.0, 19.0, 26.0, 32.0, 61.0, 72.0, 122.0, 175.0, 260.0, 424.0, 570.0, 826.0, 1161.0, 1624.0, 2358.0, 3354.0, 4592.0, 6653.0, 9737.0, 14222.0, 20659.0, 31014.0, 48199.0, 77689.0, 143855.0, 273162.0, 164632.0, 85109.0, 52233.0, 33804.0, 22451.0, 15187.0, 10327.0, 7177.0, 4963.0, 3494.0, 2380.0, 1784.0, 1255.0, 900.0, 604.0, 421.0, 278.0, 202.0, 149.0, 105.0, 77.0, 45.0, 40.0, 15.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.018798828125, -0.0182037353515625, -0.017608642578125, -0.0170135498046875, -0.01641845703125, -0.0158233642578125, -0.015228271484375, -0.0146331787109375, -0.0140380859375, -0.0134429931640625, -0.012847900390625, -0.0122528076171875, -0.01165771484375, -0.0110626220703125, -0.010467529296875, -0.0098724365234375, -0.00927734375, -0.0086822509765625, -0.008087158203125, -0.0074920654296875, -0.00689697265625, -0.0063018798828125, -0.005706787109375, -0.0051116943359375, -0.0045166015625, -0.0039215087890625, -0.003326416015625, -0.0027313232421875, -0.00213623046875, -0.0015411376953125, -0.000946044921875, -0.0003509521484375, 0.000244140625, 0.0008392333984375, 0.001434326171875, 0.0020294189453125, 0.00262451171875, 0.0032196044921875, 0.003814697265625, 0.0044097900390625, 0.0050048828125, 0.0055999755859375, 0.006195068359375, 0.0067901611328125, 0.00738525390625, 0.0079803466796875, 0.008575439453125, 0.0091705322265625, 0.009765625, 0.0103607177734375, 0.010955810546875, 0.0115509033203125, 0.01214599609375, 0.0127410888671875, 0.013336181640625, 0.0139312744140625, 0.0145263671875, 0.0151214599609375, 0.015716552734375, 0.0163116455078125, 0.01690673828125, 0.0175018310546875, 0.018096923828125, 0.0186920166015625, 0.019287109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 1.0, 3.0, 7.0, 7.0, 8.0, 13.0, 6.0, 10.0, 19.0, 26.0, 15.0, 15.0, 25.0, 25.0, 28.0, 43.0, 25.0, 32.0, 41.0, 38.0, 54.0, 1073.0, 50.0, 42.0, 54.0, 35.0, 38.0, 44.0, 37.0, 25.0, 31.0, 26.0, 12.0, 24.0, 27.0, 18.0, 10.0, 9.0, 7.0, 11.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.943359375, -1.8823394775390625, -1.821319580078125, -1.7602996826171875, -1.69927978515625, -1.6382598876953125, -1.577239990234375, -1.5162200927734375, -1.4552001953125, -1.3941802978515625, -1.333160400390625, -1.2721405029296875, -1.21112060546875, -1.1501007080078125, -1.089080810546875, -1.0280609130859375, -0.967041015625, -0.9060211181640625, -0.845001220703125, -0.7839813232421875, -0.72296142578125, -0.6619415283203125, -0.600921630859375, -0.5399017333984375, -0.4788818359375, -0.4178619384765625, -0.356842041015625, -0.2958221435546875, -0.23480224609375, -0.1737823486328125, -0.112762451171875, -0.0517425537109375, 0.00927734375, 0.0702972412109375, 0.131317138671875, 0.1923370361328125, 0.25335693359375, 0.3143768310546875, 0.375396728515625, 0.4364166259765625, 0.4974365234375, 0.5584564208984375, 0.619476318359375, 0.6804962158203125, 0.74151611328125, 0.8025360107421875, 0.863555908203125, 0.9245758056640625, 0.985595703125, 1.0466156005859375, 1.107635498046875, 1.1686553955078125, 1.22967529296875, 1.2906951904296875, 1.351715087890625, 1.4127349853515625, 1.4737548828125, 1.5347747802734375, 1.595794677734375, 1.6568145751953125, 1.71783447265625, 1.7788543701171875, 1.839874267578125, 1.9008941650390625, 1.9619140625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 16.0, 20.0, 28.0, 51.0, 52.0, 84.0, 118.0, 176.0, 218.0, 325.0, 437.0, 633.0, 879.0, 1257.0, 1802.0, 2558.0, 3526.0, 5113.0, 6975.0, 10028.0, 14439.0, 21713.0, 32285.0, 51183.0, 85902.0, 179429.0, 1336013.0, 135684.0, 71431.0, 43942.0, 28442.0, 19010.0, 12896.0, 8881.0, 6326.0, 4568.0, 3146.0, 2275.0, 1568.0, 1099.0, 735.0, 543.0, 397.0, 264.0, 190.0, 131.0, 94.0, 80.0, 42.0, 41.0, 30.0, 20.0, 14.0, 8.0, 9.0, 2.0, 1.0, 2.0], "bins": [-0.0140380859375, -0.013603925704956055, -0.01316976547241211, -0.012735605239868164, -0.012301445007324219, -0.011867284774780273, -0.011433124542236328, -0.010998964309692383, -0.010564804077148438, -0.010130643844604492, -0.009696483612060547, -0.009262323379516602, -0.008828163146972656, -0.008394002914428711, -0.007959842681884766, -0.00752568244934082, -0.007091522216796875, -0.00665736198425293, -0.006223201751708984, -0.005789041519165039, -0.005354881286621094, -0.0049207210540771484, -0.004486560821533203, -0.004052400588989258, -0.0036182403564453125, -0.003184080123901367, -0.002749919891357422, -0.0023157596588134766, -0.0018815994262695312, -0.001447439193725586, -0.0010132789611816406, -0.0005791187286376953, -0.00014495849609375, 0.0002892017364501953, 0.0007233619689941406, 0.001157522201538086, 0.0015916824340820312, 0.0020258426666259766, 0.002460002899169922, 0.002894163131713867, 0.0033283233642578125, 0.003762483596801758, 0.004196643829345703, 0.0046308040618896484, 0.005064964294433594, 0.005499124526977539, 0.005933284759521484, 0.00636744499206543, 0.006801605224609375, 0.00723576545715332, 0.007669925689697266, 0.008104085922241211, 0.008538246154785156, 0.008972406387329102, 0.009406566619873047, 0.009840726852416992, 0.010274887084960938, 0.010709047317504883, 0.011143207550048828, 0.011577367782592773, 0.012011528015136719, 0.012445688247680664, 0.01287984848022461, 0.013314008712768555, 0.0137481689453125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 0.0, 0.0, 141.0, 0.0, 0.0, 0.0, 0.0, 681.0, 0.0, 0.0, 0.0, 0.0, 0.0, 105.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.473833203315735e-07, -3.371387720108032e-07, -3.2689422369003296e-07, -3.166496753692627e-07, -3.0640512704849243e-07, -2.9616057872772217e-07, -2.859160304069519e-07, -2.7567148208618164e-07, -2.654269337654114e-07, -2.551823854446411e-07, -2.4493783712387085e-07, -2.3469328880310059e-07, -2.2444874048233032e-07, -2.1420419216156006e-07, -2.039596438407898e-07, -1.9371509552001953e-07, -1.8347054719924927e-07, -1.73225998878479e-07, -1.6298145055770874e-07, -1.5273690223693848e-07, -1.424923539161682e-07, -1.3224780559539795e-07, -1.2200325727462769e-07, -1.1175870895385742e-07, -1.0151416063308716e-07, -9.12696123123169e-08, -8.102506399154663e-08, -7.078051567077637e-08, -6.05359673500061e-08, -5.029141902923584e-08, -4.0046870708465576e-08, -2.9802322387695312e-08, -1.955777406692505e-08, -9.313225746154785e-09, 9.313225746154785e-10, 1.1175870895385742e-08, 2.1420419216156006e-08, 3.166496753692627e-08, 4.190951585769653e-08, 5.21540641784668e-08, 6.239861249923706e-08, 7.264316082000732e-08, 8.288770914077759e-08, 9.313225746154785e-08, 1.0337680578231812e-07, 1.1362135410308838e-07, 1.2386590242385864e-07, 1.341104507446289e-07, 1.4435499906539917e-07, 1.5459954738616943e-07, 1.648440957069397e-07, 1.7508864402770996e-07, 1.8533319234848022e-07, 1.955777406692505e-07, 2.0582228899002075e-07, 2.1606683731079102e-07, 2.2631138563156128e-07, 2.3655593395233154e-07, 2.468004822731018e-07, 2.5704503059387207e-07, 2.6728957891464233e-07, 2.775341272354126e-07, 2.8777867555618286e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 21.0, 6.0, 4.0, 4.0, 4.0, 13.0, 93.0, 68.0, 46.0, 204.0, 826.0, 27183.0, 1012015.0, 7221.0, 472.0, 76.0, 41.0, 68.0, 107.0, 21.0, 2.0, 5.0, 4.0, 7.0, 19.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.602836608886719e-06, -5.411915481090546e-06, -5.2209943532943726e-06, -5.0300732254981995e-06, -4.839152097702026e-06, -4.648230969905853e-06, -4.45730984210968e-06, -4.266388714313507e-06, -4.075467586517334e-06, -3.884546458721161e-06, -3.693625330924988e-06, -3.5027042031288147e-06, -3.3117830753326416e-06, -3.1208619475364685e-06, -2.9299408197402954e-06, -2.7390196919441223e-06, -2.5480985641479492e-06, -2.357177436351776e-06, -2.166256308555603e-06, -1.97533518075943e-06, -1.7844140529632568e-06, -1.5934929251670837e-06, -1.4025717973709106e-06, -1.2116506695747375e-06, -1.0207295417785645e-06, -8.298084139823914e-07, -6.388872861862183e-07, -4.4796615839004517e-07, -2.5704503059387207e-07, -6.612390279769897e-08, 1.2479722499847412e-07, 3.157183527946472e-07, 5.066394805908203e-07, 6.975606083869934e-07, 8.884817361831665e-07, 1.0794028639793396e-06, 1.2703239917755127e-06, 1.4612451195716858e-06, 1.6521662473678589e-06, 1.843087375164032e-06, 2.034008502960205e-06, 2.224929630756378e-06, 2.4158507585525513e-06, 2.6067718863487244e-06, 2.7976930141448975e-06, 2.9886141419410706e-06, 3.1795352697372437e-06, 3.3704563975334167e-06, 3.56137752532959e-06, 3.752298653125763e-06, 3.943219780921936e-06, 4.134140908718109e-06, 4.325062036514282e-06, 4.515983164310455e-06, 4.706904292106628e-06, 4.8978254199028015e-06, 5.088746547698975e-06, 5.279667675495148e-06, 5.470588803291321e-06, 5.661509931087494e-06, 5.852431058883667e-06, 6.04335218667984e-06, 6.234273314476013e-06, 6.425194442272186e-06, 6.616115570068359e-06]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 5.0, 11.0, 914.0, 12.0, 8.0, 6.0, 10.0, 8.0, 6.0, 7.0, 1.0, 4.0, 2.0, 1.0], "bins": [-4.322822064750653e-07, -4.240960436163732e-07, -4.159098807576811e-07, -4.07723717898989e-07, -3.9953755504029687e-07, -3.913513637598953e-07, -3.831652009012032e-07, -3.749790380425111e-07, -3.66792875183819e-07, -3.5860671232512686e-07, -3.5042054946643475e-07, -3.4223438660774264e-07, -3.340481953273411e-07, -3.25862032468649e-07, -3.1767586960995686e-07, -3.0948970675126475e-07, -3.0130354389257263e-07, -2.931173810338805e-07, -2.849312181751884e-07, -2.767450553164963e-07, -2.685588924578042e-07, -2.6037270117740263e-07, -2.521865383187105e-07, -2.440003754600184e-07, -2.358142126013263e-07, -2.2762804974263418e-07, -2.1944188688394206e-07, -2.1125570981439523e-07, -2.0306954695570312e-07, -1.94883384097011e-07, -1.8669720702746417e-07, -1.7851104416877206e-07, -1.7032488131007995e-07, -1.6213871845138783e-07, -1.5395255559269572e-07, -1.457663785231489e-07, -1.3758021566445677e-07, -1.2939405280576466e-07, -1.2120787573621783e-07, -1.1302171287752572e-07, -1.048355500188336e-07, -9.664938716014149e-08, -8.846321719602201e-08, -8.027704723190254e-08, -7.209088437321043e-08, -6.390472151451831e-08, -5.571855155039884e-08, -4.753238513899305e-08, -3.9346218727587257e-08, -3.1160052316181464e-08, -2.297388590477567e-08, -1.4787719493369877e-08, -6.601553081964084e-09, 1.5846133294417086e-09, 9.770779740847502e-09, 1.7956946152253295e-08, 2.6143112563659088e-08, 3.432927897506488e-08, 4.2515445386470674e-08, 5.070161179787647e-08, 5.888777820928226e-08, 6.707394106797437e-08, 7.526011103209385e-08, 8.344628099621332e-08, 9.163244385490543e-08]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [60.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 906.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.960464477539063e-08, -5.681067705154419e-08, -5.4016709327697754e-08, -5.122274160385132e-08, -4.842877388000488e-08, -4.563480615615845e-08, -4.284083843231201e-08, -4.0046870708465576e-08, -3.725290298461914e-08, -3.4458935260772705e-08, -3.166496753692627e-08, -2.8870999813079834e-08, -2.60770320892334e-08, -2.3283064365386963e-08, -2.0489096641540527e-08, -1.7695128917694092e-08, -1.4901161193847656e-08, -1.210719347000122e-08, -9.313225746154785e-09, -6.51925802230835e-09, -3.725290298461914e-09, -9.313225746154785e-10, 1.862645149230957e-09, 4.6566128730773926e-09, 7.450580596923828e-09, 1.0244548320770264e-08, 1.30385160446167e-08, 1.5832483768463135e-08, 1.862645149230957e-08, 2.1420419216156006e-08, 2.421438694000244e-08, 2.7008354663848877e-08, 2.9802322387695312e-08, 3.259629011154175e-08, 3.5390257835388184e-08, 3.818422555923462e-08, 4.0978193283081055e-08, 4.377216100692749e-08, 4.6566128730773926e-08, 4.936009645462036e-08, 5.21540641784668e-08, 5.494803190231323e-08, 5.774199962615967e-08, 6.05359673500061e-08, 6.332993507385254e-08, 6.612390279769897e-08, 6.891787052154541e-08, 7.171183824539185e-08, 7.450580596923828e-08, 7.729977369308472e-08, 8.009374141693115e-08, 8.288770914077759e-08, 8.568167686462402e-08, 8.847564458847046e-08, 9.12696123123169e-08, 9.406358003616333e-08, 9.685754776000977e-08, 9.96515154838562e-08, 1.0244548320770264e-07, 1.0523945093154907e-07, 1.0803341865539551e-07, 1.1082738637924194e-07, 1.1362135410308838e-07, 1.1641532182693481e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 5.0, 11.0, 7.0, 9.0, 7.0, 10.0, 16.0, 17.0, 25.0, 23.0, 22.0, 26.0, 26.0, 25.0, 38.0, 29.0, 31.0, 37.0, 43.0, 48.0, 36.0, 31.0, 38.0, 32.0, 34.0, 31.0, 46.0, 19.0, 21.0, 33.0, 30.0, 24.0, 16.0, 21.0, 12.0, 14.0, 19.0, 10.0, 14.0, 11.0, 4.0, 9.0, 7.0, 5.0, 5.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.630859375, -2.552337646484375, -2.47381591796875, -2.395294189453125, -2.3167724609375, -2.238250732421875, -2.15972900390625, -2.081207275390625, -2.002685546875, -1.924163818359375, -1.84564208984375, -1.767120361328125, -1.6885986328125, -1.610076904296875, -1.53155517578125, -1.453033447265625, -1.37451171875, -1.295989990234375, -1.21746826171875, -1.138946533203125, -1.0604248046875, -0.981903076171875, -0.90338134765625, -0.824859619140625, -0.746337890625, -0.667816162109375, -0.58929443359375, -0.510772705078125, -0.4322509765625, -0.353729248046875, -0.27520751953125, -0.196685791015625, -0.1181640625, -0.039642333984375, 0.03887939453125, 0.117401123046875, 0.1959228515625, 0.274444580078125, 0.35296630859375, 0.431488037109375, 0.510009765625, 0.588531494140625, 0.66705322265625, 0.745574951171875, 0.8240966796875, 0.902618408203125, 0.98114013671875, 1.059661865234375, 1.13818359375, 1.216705322265625, 1.29522705078125, 1.373748779296875, 1.4522705078125, 1.530792236328125, 1.60931396484375, 1.687835693359375, 1.766357421875, 1.844879150390625, 1.92340087890625, 2.001922607421875, 2.0804443359375, 2.158966064453125, 2.23748779296875, 2.316009521484375, 2.39453125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 18.0, 13.0, 32.0, 45.0, 57.0, 99.0, 123.0, 223.0, 316.0, 493.0, 810.0, 1207.0, 1974.0, 2950.0, 4602.0, 7560.0, 12170.0, 20493.0, 35209.0, 66165.0, 149280.0, 362964.0, 196915.0, 81504.0, 42071.0, 23750.0, 14225.0, 8418.0, 5389.0, 3365.0, 2196.0, 1363.0, 901.0, 579.0, 386.0, 254.0, 158.0, 105.0, 57.0, 43.0, 30.0, 18.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.599609375, -2.5174560546875, -2.435302734375, -2.3531494140625, -2.27099609375, -2.1888427734375, -2.106689453125, -2.0245361328125, -1.9423828125, -1.8602294921875, -1.778076171875, -1.6959228515625, -1.61376953125, -1.5316162109375, -1.449462890625, -1.3673095703125, -1.28515625, -1.2030029296875, -1.120849609375, -1.0386962890625, -0.95654296875, -0.8743896484375, -0.792236328125, -0.7100830078125, -0.6279296875, -0.5457763671875, -0.463623046875, -0.3814697265625, -0.29931640625, -0.2171630859375, -0.135009765625, -0.0528564453125, 0.029296875, 0.1114501953125, 0.193603515625, 0.2757568359375, 0.35791015625, 0.4400634765625, 0.522216796875, 0.6043701171875, 0.6865234375, 0.7686767578125, 0.850830078125, 0.9329833984375, 1.01513671875, 1.0972900390625, 1.179443359375, 1.2615966796875, 1.34375, 1.4259033203125, 1.508056640625, 1.5902099609375, 1.67236328125, 1.7545166015625, 1.836669921875, 1.9188232421875, 2.0009765625, 2.0831298828125, 2.165283203125, 2.2474365234375, 2.32958984375, 2.4117431640625, 2.493896484375, 2.5760498046875, 2.658203125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 1.0, 7.0, 4.0, 4.0, 10.0, 6.0, 14.0, 11.0, 8.0, 20.0, 24.0, 32.0, 32.0, 41.0, 30.0, 41.0, 39.0, 61.0, 90.0, 163.0, 1495.0, 324.0, 131.0, 64.0, 57.0, 58.0, 41.0, 41.0, 21.0, 22.0, 28.0, 29.0, 19.0, 15.0, 11.0, 8.0, 7.0, 7.0, 4.0, 9.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.0078125, -10.69189453125, -10.3759765625, -10.06005859375, -9.744140625, -9.42822265625, -9.1123046875, -8.79638671875, -8.48046875, -8.16455078125, -7.8486328125, -7.53271484375, -7.216796875, -6.90087890625, -6.5849609375, -6.26904296875, -5.953125, -5.63720703125, -5.3212890625, -5.00537109375, -4.689453125, -4.37353515625, -4.0576171875, -3.74169921875, -3.42578125, -3.10986328125, -2.7939453125, -2.47802734375, -2.162109375, -1.84619140625, -1.5302734375, -1.21435546875, -0.8984375, -0.58251953125, -0.2666015625, 0.04931640625, 0.365234375, 0.68115234375, 0.9970703125, 1.31298828125, 1.62890625, 1.94482421875, 2.2607421875, 2.57666015625, 2.892578125, 3.20849609375, 3.5244140625, 3.84033203125, 4.15625, 4.47216796875, 4.7880859375, 5.10400390625, 5.419921875, 5.73583984375, 6.0517578125, 6.36767578125, 6.68359375, 6.99951171875, 7.3154296875, 7.63134765625, 7.947265625, 8.26318359375, 8.5791015625, 8.89501953125, 9.2109375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 12.0, 4.0, 8.0, 9.0, 10.0, 14.0, 28.0, 42.0, 30.0, 56.0, 70.0, 96.0, 146.0, 191.0, 293.0, 702.0, 3396.0, 158061.0, 2947796.0, 31633.0, 1634.0, 515.0, 290.0, 168.0, 118.0, 79.0, 66.0, 50.0, 46.0, 28.0, 21.0, 15.0, 15.0, 11.0, 13.0, 3.0, 8.0, 5.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.859375, -20.148193359375, -19.43701171875, -18.725830078125, -18.0146484375, -17.303466796875, -16.59228515625, -15.881103515625, -15.169921875, -14.458740234375, -13.74755859375, -13.036376953125, -12.3251953125, -11.614013671875, -10.90283203125, -10.191650390625, -9.48046875, -8.769287109375, -8.05810546875, -7.346923828125, -6.6357421875, -5.924560546875, -5.21337890625, -4.502197265625, -3.791015625, -3.079833984375, -2.36865234375, -1.657470703125, -0.9462890625, -0.235107421875, 0.47607421875, 1.187255859375, 1.8984375, 2.609619140625, 3.32080078125, 4.031982421875, 4.7431640625, 5.454345703125, 6.16552734375, 6.876708984375, 7.587890625, 8.299072265625, 9.01025390625, 9.721435546875, 10.4326171875, 11.143798828125, 11.85498046875, 12.566162109375, 13.27734375, 13.988525390625, 14.69970703125, 15.410888671875, 16.1220703125, 16.833251953125, 17.54443359375, 18.255615234375, 18.966796875, 19.677978515625, 20.38916015625, 21.100341796875, 21.8115234375, 22.522705078125, 23.23388671875, 23.945068359375, 24.65625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 747.0, 265.0], "bins": [-364.1663513183594, -358.36676025390625, -352.5671691894531, -346.7675476074219, -340.96795654296875, -335.1683654785156, -329.3687744140625, -323.5691833496094, -317.76959228515625, -311.9700012207031, -306.17041015625, -300.37078857421875, -294.5711975097656, -288.7716064453125, -282.9720153808594, -277.17242431640625, -271.372802734375, -265.5732116699219, -259.77362060546875, -253.97401428222656, -248.17440795898438, -242.37481689453125, -236.57522583007812, -230.775634765625, -224.9760284423828, -219.1764373779297, -213.3768310546875, -207.57723999023438, -201.77764892578125, -195.97804260253906, -190.17845153808594, -184.37884521484375, -178.57925415039062, -172.7796630859375, -166.9800567626953, -161.1804656982422, -155.380859375, -149.58126831054688, -143.78167724609375, -137.98208618164062, -132.18247985839844, -126.38288116455078, -120.58328247070312, -114.78369140625, -108.98409271240234, -103.18449401855469, -97.38490295410156, -91.5853042602539, -85.78570556640625, -79.9861068725586, -74.18650817871094, -68.38691711425781, -62.587318420410156, -56.7877197265625, -50.98812484741211, -45.18852996826172, -39.3889274597168, -33.589332580566406, -27.78973388671875, -21.990137100219727, -16.190540313720703, -10.39094352722168, -4.591346740722656, 1.2082481384277344, 7.007845878601074]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 3.0, 2.0, 10.0, 5.0, 9.0, 11.0, 12.0, 12.0, 25.0, 19.0, 13.0, 25.0, 24.0, 25.0, 35.0, 36.0, 26.0, 30.0, 31.0, 33.0, 33.0, 49.0, 46.0, 39.0, 36.0, 41.0, 38.0, 38.0, 41.0, 36.0, 32.0, 26.0, 22.0, 23.0, 14.0, 15.0, 12.0, 15.0, 13.0, 4.0, 3.0, 10.0, 4.0, 8.0, 11.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.730037689208984, -20.976560592651367, -20.223081588745117, -19.4696044921875, -18.716127395629883, -17.962650299072266, -17.209171295166016, -16.4556941986084, -15.702217102050781, -14.948739051818848, -14.19526195526123, -13.441783905029297, -12.68830680847168, -11.934828758239746, -11.181350708007812, -10.427873611450195, -9.674395561218262, -8.920917510986328, -8.167440414428711, -7.413962364196777, -6.66048526763916, -5.907007217407227, -5.153529644012451, -4.400052070617676, -3.6465744972229004, -2.893096923828125, -2.1396193504333496, -1.3861415386199951, -0.6326639652252197, 0.12081360816955566, 0.8742914199829102, 1.6277689933776855, 2.381246566772461, 3.1347241401672363, 3.8882017135620117, 4.641679763793945, 5.3951568603515625, 6.148634910583496, 6.9021124839782715, 7.655590057373047, 8.409067153930664, 9.162545204162598, 9.916022300720215, 10.669500350952148, 11.422977447509766, 12.1764554977417, 12.929933547973633, 13.68341064453125, 14.436888694763184, 15.190366744995117, 15.943843841552734, 16.69732093811035, 17.4507999420166, 18.20427703857422, 18.957754135131836, 19.711231231689453, 20.464710235595703, 21.21818733215332, 21.97166633605957, 22.725143432617188, 23.478620529174805, 24.232097625732422, 24.985576629638672, 25.73905372619629, 26.492530822753906]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 3.0, 7.0, 6.0, 12.0, 14.0, 21.0, 17.0, 19.0, 26.0, 26.0, 26.0, 25.0, 29.0, 30.0, 27.0, 37.0, 41.0, 37.0, 40.0, 35.0, 47.0, 36.0, 38.0, 27.0, 37.0, 30.0, 38.0, 23.0, 35.0, 21.0, 30.0, 21.0, 15.0, 17.0, 11.0, 9.0, 14.0, 9.0, 7.0, 10.0, 8.0, 11.0, 9.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.869140625, -2.78338623046875, -2.6976318359375, -2.61187744140625, -2.526123046875, -2.44036865234375, -2.3546142578125, -2.26885986328125, -2.18310546875, -2.09735107421875, -2.0115966796875, -1.92584228515625, -1.840087890625, -1.75433349609375, -1.6685791015625, -1.58282470703125, -1.4970703125, -1.41131591796875, -1.3255615234375, -1.23980712890625, -1.154052734375, -1.06829833984375, -0.9825439453125, -0.89678955078125, -0.81103515625, -0.72528076171875, -0.6395263671875, -0.55377197265625, -0.468017578125, -0.38226318359375, -0.2965087890625, -0.21075439453125, -0.125, -0.03924560546875, 0.0465087890625, 0.13226318359375, 0.218017578125, 0.30377197265625, 0.3895263671875, 0.47528076171875, 0.56103515625, 0.64678955078125, 0.7325439453125, 0.81829833984375, 0.904052734375, 0.98980712890625, 1.0755615234375, 1.16131591796875, 1.2470703125, 1.33282470703125, 1.4185791015625, 1.50433349609375, 1.590087890625, 1.67584228515625, 1.7615966796875, 1.84735107421875, 1.93310546875, 2.01885986328125, 2.1046142578125, 2.19036865234375, 2.276123046875, 2.36187744140625, 2.4476318359375, 2.53338623046875, 2.619140625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 5.0, 7.0, 5.0, 8.0, 14.0, 13.0, 15.0, 27.0, 34.0, 39.0, 51.0, 75.0, 151.0, 281.0, 601.0, 1510.0, 3957.0, 13403.0, 53895.0, 285659.0, 1654466.0, 1786991.0, 312416.0, 58707.0, 14455.0, 4400.0, 1569.0, 680.0, 320.0, 167.0, 102.0, 63.0, 34.0, 33.0, 18.0, 16.0, 9.0, 15.0, 11.0, 16.0, 7.0, 6.0, 8.0, 2.0, 1.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.78125, -6.575927734375, -6.37060546875, -6.165283203125, -5.9599609375, -5.754638671875, -5.54931640625, -5.343994140625, -5.138671875, -4.933349609375, -4.72802734375, -4.522705078125, -4.3173828125, -4.112060546875, -3.90673828125, -3.701416015625, -3.49609375, -3.290771484375, -3.08544921875, -2.880126953125, -2.6748046875, -2.469482421875, -2.26416015625, -2.058837890625, -1.853515625, -1.648193359375, -1.44287109375, -1.237548828125, -1.0322265625, -0.826904296875, -0.62158203125, -0.416259765625, -0.2109375, -0.005615234375, 0.19970703125, 0.405029296875, 0.6103515625, 0.815673828125, 1.02099609375, 1.226318359375, 1.431640625, 1.636962890625, 1.84228515625, 2.047607421875, 2.2529296875, 2.458251953125, 2.66357421875, 2.868896484375, 3.07421875, 3.279541015625, 3.48486328125, 3.690185546875, 3.8955078125, 4.100830078125, 4.30615234375, 4.511474609375, 4.716796875, 4.922119140625, 5.12744140625, 5.332763671875, 5.5380859375, 5.743408203125, 5.94873046875, 6.154052734375, 6.359375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 6.0, 3.0, 7.0, 18.0, 17.0, 32.0, 26.0, 47.0, 46.0, 75.0, 82.0, 112.0, 165.0, 208.0, 292.0, 318.0, 404.0, 435.0, 348.0, 316.0, 261.0, 220.0, 171.0, 104.0, 72.0, 66.0, 53.0, 54.0, 28.0, 31.0, 12.0, 15.0, 8.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.05078125, -5.88055419921875, -5.7103271484375, -5.54010009765625, -5.369873046875, -5.19964599609375, -5.0294189453125, -4.85919189453125, -4.68896484375, -4.51873779296875, -4.3485107421875, -4.17828369140625, -4.008056640625, -3.83782958984375, -3.6676025390625, -3.49737548828125, -3.3271484375, -3.15692138671875, -2.9866943359375, -2.81646728515625, -2.646240234375, -2.47601318359375, -2.3057861328125, -2.13555908203125, -1.96533203125, -1.79510498046875, -1.6248779296875, -1.45465087890625, -1.284423828125, -1.11419677734375, -0.9439697265625, -0.77374267578125, -0.603515625, -0.43328857421875, -0.2630615234375, -0.09283447265625, 0.077392578125, 0.24761962890625, 0.4178466796875, 0.58807373046875, 0.75830078125, 0.92852783203125, 1.0987548828125, 1.26898193359375, 1.439208984375, 1.60943603515625, 1.7796630859375, 1.94989013671875, 2.1201171875, 2.29034423828125, 2.4605712890625, 2.63079833984375, 2.801025390625, 2.97125244140625, 3.1414794921875, 3.31170654296875, 3.48193359375, 3.65216064453125, 3.8223876953125, 3.99261474609375, 4.162841796875, 4.33306884765625, 4.5032958984375, 4.67352294921875, 4.84375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 11.0, 2.0, 9.0, 12.0, 27.0, 26.0, 35.0, 52.0, 59.0, 95.0, 111.0, 150.0, 246.0, 377.0, 805.0, 4715.0, 239412.0, 3787374.0, 155130.0, 3592.0, 757.0, 411.0, 255.0, 162.0, 106.0, 101.0, 61.0, 42.0, 37.0, 36.0, 25.0, 14.0, 6.0, 9.0, 6.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.328125, -19.587646484375, -18.84716796875, -18.106689453125, -17.3662109375, -16.625732421875, -15.88525390625, -15.144775390625, -14.404296875, -13.663818359375, -12.92333984375, -12.182861328125, -11.4423828125, -10.701904296875, -9.96142578125, -9.220947265625, -8.48046875, -7.739990234375, -6.99951171875, -6.259033203125, -5.5185546875, -4.778076171875, -4.03759765625, -3.297119140625, -2.556640625, -1.816162109375, -1.07568359375, -0.335205078125, 0.4052734375, 1.145751953125, 1.88623046875, 2.626708984375, 3.3671875, 4.107666015625, 4.84814453125, 5.588623046875, 6.3291015625, 7.069580078125, 7.81005859375, 8.550537109375, 9.291015625, 10.031494140625, 10.77197265625, 11.512451171875, 12.2529296875, 12.993408203125, 13.73388671875, 14.474365234375, 15.21484375, 15.955322265625, 16.69580078125, 17.436279296875, 18.1767578125, 18.917236328125, 19.65771484375, 20.398193359375, 21.138671875, 21.879150390625, 22.61962890625, 23.360107421875, 24.1005859375, 24.841064453125, 25.58154296875, 26.322021484375, 27.0625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 10.0, 27.0, 79.0, 142.0, 244.0, 226.0, 151.0, 85.0, 36.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.45936965942383, -52.44554138183594, -50.43171310424805, -48.417884826660156, -46.404056549072266, -44.390228271484375, -42.37639617919922, -40.362571716308594, -38.34873962402344, -36.33491134643555, -34.321083068847656, -32.307254791259766, -30.293426513671875, -28.279598236083984, -26.26576805114746, -24.25193977355957, -22.238113403320312, -20.224285125732422, -18.21045684814453, -16.19662857055664, -14.182799339294434, -12.168971061706543, -10.155141830444336, -8.141313552856445, -6.127485275268555, -4.113656997680664, -2.0998282432556152, -0.0859994888305664, 1.9278287887573242, 3.941657066345215, 5.955486297607422, 7.9693145751953125, 9.983139038085938, 11.996967315673828, 14.010795593261719, 16.02462387084961, 18.0384521484375, 20.05228042602539, 22.066110610961914, 24.079938888549805, 26.093767166137695, 28.107595443725586, 30.121423721313477, 32.13525390625, 34.14908218383789, 36.16291046142578, 38.17673873901367, 40.19056701660156, 42.20439529418945, 44.218223571777344, 46.232051849365234, 48.245880126953125, 50.259708404541016, 52.273536682128906, 54.28736877441406, 56.30119323730469, 58.315025329589844, 60.328853607177734, 62.342681884765625, 64.35651397705078, 66.3703384399414, 68.38417053222656, 70.39799499511719, 72.41182708740234, 74.42565155029297]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 5.0, 9.0, 5.0, 8.0, 10.0, 15.0, 13.0, 19.0, 19.0, 23.0, 18.0, 36.0, 30.0, 30.0, 42.0, 33.0, 36.0, 42.0, 39.0, 41.0, 47.0, 37.0, 46.0, 35.0, 40.0, 40.0, 38.0, 33.0, 28.0, 23.0, 28.0, 16.0, 12.0, 13.0, 10.0, 11.0, 16.0, 12.0, 7.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.994049072265625, -18.389142990112305, -17.784236907958984, -17.17932891845703, -16.57442283630371, -15.96951675415039, -15.36461067199707, -14.75970458984375, -14.154797554016113, -13.549891471862793, -12.944984436035156, -12.340078353881836, -11.735172271728516, -11.130265235900879, -10.525359153747559, -9.920452117919922, -9.315546035766602, -8.710639953613281, -8.105732917785645, -7.500826835632324, -6.895920276641846, -6.291013717651367, -5.686107635498047, -5.081201076507568, -4.47629451751709, -3.8713879585266113, -3.266481637954712, -2.6615753173828125, -2.056668758392334, -1.4517621994018555, -0.846855878829956, -0.24194955825805664, 0.36295509338378906, 0.967861533164978, 1.572767972946167, 2.1776742935180664, 2.782580852508545, 3.3874874114990234, 3.992393732070923, 4.597300052642822, 5.202206611633301, 5.807113170623779, 6.412019729614258, 7.016925811767578, 7.621832370758057, 8.226738929748535, 8.831645011901855, 9.436552047729492, 10.041458129882812, 10.646364212036133, 11.25127124786377, 11.85617733001709, 12.461084365844727, 13.065990447998047, 13.670896530151367, 14.275802612304688, 14.880709648132324, 15.485615730285645, 16.09052276611328, 16.6954288482666, 17.300334930419922, 17.905242919921875, 18.510149002075195, 19.115055084228516, 19.719961166381836]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 3.0, 5.0, 10.0, 7.0, 15.0, 23.0, 17.0, 18.0, 12.0, 19.0, 24.0, 23.0, 25.0, 35.0, 27.0, 35.0, 35.0, 45.0, 39.0, 43.0, 45.0, 28.0, 20.0, 41.0, 30.0, 35.0, 31.0, 36.0, 34.0, 28.0, 19.0, 20.0, 19.0, 22.0, 20.0, 13.0, 12.0, 14.0, 16.0, 12.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.6953125, -2.61199951171875, -2.5286865234375, -2.44537353515625, -2.362060546875, -2.27874755859375, -2.1954345703125, -2.11212158203125, -2.02880859375, -1.94549560546875, -1.8621826171875, -1.77886962890625, -1.695556640625, -1.61224365234375, -1.5289306640625, -1.44561767578125, -1.3623046875, -1.27899169921875, -1.1956787109375, -1.11236572265625, -1.029052734375, -0.94573974609375, -0.8624267578125, -0.77911376953125, -0.69580078125, -0.61248779296875, -0.5291748046875, -0.44586181640625, -0.362548828125, -0.27923583984375, -0.1959228515625, -0.11260986328125, -0.029296875, 0.05401611328125, 0.1373291015625, 0.22064208984375, 0.303955078125, 0.38726806640625, 0.4705810546875, 0.55389404296875, 0.63720703125, 0.72052001953125, 0.8038330078125, 0.88714599609375, 0.970458984375, 1.05377197265625, 1.1370849609375, 1.22039794921875, 1.3037109375, 1.38702392578125, 1.4703369140625, 1.55364990234375, 1.636962890625, 1.72027587890625, 1.8035888671875, 1.88690185546875, 1.97021484375, 2.05352783203125, 2.1368408203125, 2.22015380859375, 2.303466796875, 2.38677978515625, 2.4700927734375, 2.55340576171875, 2.63671875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 10.0, 5.0, 12.0, 20.0, 45.0, 52.0, 65.0, 109.0, 131.0, 185.0, 322.0, 515.0, 746.0, 1019.0, 1529.0, 2198.0, 3272.0, 4843.0, 7321.0, 10794.0, 15957.0, 24107.0, 37169.0, 60330.0, 107915.0, 249257.0, 244572.0, 106850.0, 60012.0, 36614.0, 24140.0, 15630.0, 10582.0, 7408.0, 4842.0, 3178.0, 2189.0, 1540.0, 969.0, 639.0, 446.0, 298.0, 244.0, 151.0, 117.0, 63.0, 39.0, 34.0, 24.0, 17.0, 16.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.02203369140625, -0.021344900131225586, -0.020656108856201172, -0.019967317581176758, -0.019278526306152344, -0.01858973503112793, -0.017900943756103516, -0.0172121524810791, -0.016523361206054688, -0.015834569931030273, -0.01514577865600586, -0.014456987380981445, -0.013768196105957031, -0.013079404830932617, -0.012390613555908203, -0.011701822280883789, -0.011013031005859375, -0.010324239730834961, -0.009635448455810547, -0.008946657180786133, -0.008257865905761719, -0.007569074630737305, -0.006880283355712891, -0.0061914920806884766, -0.0055027008056640625, -0.0048139095306396484, -0.004125118255615234, -0.0034363269805908203, -0.0027475357055664062, -0.002058744430541992, -0.0013699531555175781, -0.0006811618804931641, 7.62939453125e-06, 0.0006964206695556641, 0.0013852119445800781, 0.002074003219604492, 0.0027627944946289062, 0.0034515857696533203, 0.004140377044677734, 0.0048291683197021484, 0.0055179595947265625, 0.0062067508697509766, 0.006895542144775391, 0.007584333419799805, 0.008273124694824219, 0.008961915969848633, 0.009650707244873047, 0.010339498519897461, 0.011028289794921875, 0.011717081069946289, 0.012405872344970703, 0.013094663619995117, 0.013783454895019531, 0.014472246170043945, 0.01516103744506836, 0.015849828720092773, 0.016538619995117188, 0.0172274112701416, 0.017916202545166016, 0.01860499382019043, 0.019293785095214844, 0.019982576370239258, 0.020671367645263672, 0.021360158920288086, 0.0220489501953125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 9.0, 7.0, 5.0, 5.0, 10.0, 17.0, 16.0, 17.0, 17.0, 24.0, 11.0, 25.0, 27.0, 30.0, 29.0, 37.0, 38.0, 47.0, 42.0, 38.0, 48.0, 1070.0, 46.0, 42.0, 42.0, 43.0, 48.0, 37.0, 33.0, 26.0, 19.0, 16.0, 20.0, 17.0, 11.0, 15.0, 12.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.986328125, -1.9244384765625, -1.862548828125, -1.8006591796875, -1.73876953125, -1.6768798828125, -1.614990234375, -1.5531005859375, -1.4912109375, -1.4293212890625, -1.367431640625, -1.3055419921875, -1.24365234375, -1.1817626953125, -1.119873046875, -1.0579833984375, -0.99609375, -0.9342041015625, -0.872314453125, -0.8104248046875, -0.74853515625, -0.6866455078125, -0.624755859375, -0.5628662109375, -0.5009765625, -0.4390869140625, -0.377197265625, -0.3153076171875, -0.25341796875, -0.1915283203125, -0.129638671875, -0.0677490234375, -0.005859375, 0.0560302734375, 0.117919921875, 0.1798095703125, 0.24169921875, 0.3035888671875, 0.365478515625, 0.4273681640625, 0.4892578125, 0.5511474609375, 0.613037109375, 0.6749267578125, 0.73681640625, 0.7987060546875, 0.860595703125, 0.9224853515625, 0.984375, 1.0462646484375, 1.108154296875, 1.1700439453125, 1.23193359375, 1.2938232421875, 1.355712890625, 1.4176025390625, 1.4794921875, 1.5413818359375, 1.603271484375, 1.6651611328125, 1.72705078125, 1.7889404296875, 1.850830078125, 1.9127197265625, 1.974609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 5.0, 15.0, 9.0, 14.0, 35.0, 37.0, 64.0, 96.0, 129.0, 194.0, 300.0, 398.0, 528.0, 796.0, 1108.0, 1636.0, 2164.0, 3097.0, 4309.0, 5993.0, 8205.0, 11831.0, 17284.0, 26217.0, 41133.0, 67796.0, 125070.0, 1316977.0, 203589.0, 96217.0, 55483.0, 34406.0, 21950.0, 14904.0, 10144.0, 7122.0, 5104.0, 3740.0, 2659.0, 1831.0, 1355.0, 919.0, 684.0, 458.0, 329.0, 225.0, 183.0, 123.0, 83.0, 69.0, 44.0, 29.0, 28.0, 5.0, 7.0, 8.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.014190673828125, -0.013744473457336426, -0.013298273086547852, -0.012852072715759277, -0.012405872344970703, -0.011959671974182129, -0.011513471603393555, -0.01106727123260498, -0.010621070861816406, -0.010174870491027832, -0.009728670120239258, -0.009282469749450684, -0.00883626937866211, -0.008390069007873535, -0.007943868637084961, -0.007497668266296387, -0.0070514678955078125, -0.006605267524719238, -0.006159067153930664, -0.00571286678314209, -0.005266666412353516, -0.004820466041564941, -0.004374265670776367, -0.003928065299987793, -0.0034818649291992188, -0.0030356645584106445, -0.0025894641876220703, -0.002143263816833496, -0.0016970634460449219, -0.0012508630752563477, -0.0008046627044677734, -0.0003584623336791992, 8.7738037109375e-05, 0.0005339384078979492, 0.0009801387786865234, 0.0014263391494750977, 0.0018725395202636719, 0.002318739891052246, 0.0027649402618408203, 0.0032111406326293945, 0.0036573410034179688, 0.004103541374206543, 0.004549741744995117, 0.004995942115783691, 0.005442142486572266, 0.00588834285736084, 0.006334543228149414, 0.006780743598937988, 0.0072269439697265625, 0.007673144340515137, 0.008119344711303711, 0.008565545082092285, 0.00901174545288086, 0.009457945823669434, 0.009904146194458008, 0.010350346565246582, 0.010796546936035156, 0.01124274730682373, 0.011688947677612305, 0.012135148048400879, 0.012581348419189453, 0.013027548789978027, 0.013473749160766602, 0.013919949531555176, 0.01436614990234375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 0.0, 0.0, 137.0, 0.0, 0.0, 0.0, 624.0, 0.0, 0.0, 0.0, 0.0, 131.0, 0.0, 0.0, 0.0, 44.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.76837158203125e-07, -4.637986421585083e-07, -4.507601261138916e-07, -4.377216100692749e-07, -4.246830940246582e-07, -4.116445779800415e-07, -3.986060619354248e-07, -3.855675458908081e-07, -3.725290298461914e-07, -3.594905138015747e-07, -3.46451997756958e-07, -3.334134817123413e-07, -3.203749656677246e-07, -3.073364496231079e-07, -2.942979335784912e-07, -2.812594175338745e-07, -2.682209014892578e-07, -2.551823854446411e-07, -2.421438694000244e-07, -2.2910535335540771e-07, -2.1606683731079102e-07, -2.0302832126617432e-07, -1.8998980522155762e-07, -1.7695128917694092e-07, -1.6391277313232422e-07, -1.5087425708770752e-07, -1.3783574104309082e-07, -1.2479722499847412e-07, -1.1175870895385742e-07, -9.872019290924072e-08, -8.568167686462402e-08, -7.264316082000732e-08, -5.960464477539063e-08, -4.6566128730773926e-08, -3.3527612686157227e-08, -2.0489096641540527e-08, -7.450580596923828e-09, 5.587935447692871e-09, 1.862645149230957e-08, 3.166496753692627e-08, 4.470348358154297e-08, 5.774199962615967e-08, 7.078051567077637e-08, 8.381903171539307e-08, 9.685754776000977e-08, 1.0989606380462646e-07, 1.2293457984924316e-07, 1.3597309589385986e-07, 1.4901161193847656e-07, 1.6205012798309326e-07, 1.7508864402770996e-07, 1.8812716007232666e-07, 2.0116567611694336e-07, 2.1420419216156006e-07, 2.2724270820617676e-07, 2.4028122425079346e-07, 2.5331974029541016e-07, 2.6635825634002686e-07, 2.7939677238464355e-07, 2.9243528842926025e-07, 3.0547380447387695e-07, 3.1851232051849365e-07, 3.3155083656311035e-07, 3.4458935260772705e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 7.0, 1.0, 1.0, 3.0, 31.0, 13.0, 8.0, 17.0, 120.0, 96.0, 128.0, 647.0, 128280.0, 917517.0, 1261.0, 132.0, 80.0, 113.0, 30.0, 9.0, 5.0, 20.0, 12.0, 2.0, 4.0, 7.0, 7.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.450580596923828e-06, -7.164664566516876e-06, -6.878748536109924e-06, -6.592832505702972e-06, -6.3069164752960205e-06, -6.021000444889069e-06, -5.735084414482117e-06, -5.449168384075165e-06, -5.163252353668213e-06, -4.877336323261261e-06, -4.591420292854309e-06, -4.305504262447357e-06, -4.019588232040405e-06, -3.7336722016334534e-06, -3.4477561712265015e-06, -3.1618401408195496e-06, -2.8759241104125977e-06, -2.5900080800056458e-06, -2.304092049598694e-06, -2.018176019191742e-06, -1.73225998878479e-06, -1.4463439583778381e-06, -1.1604279279708862e-06, -8.745118975639343e-07, -5.885958671569824e-07, -3.026798367500305e-07, -1.6763806343078613e-08, 2.691522240638733e-07, 5.550682544708252e-07, 8.409842848777771e-07, 1.126900315284729e-06, 1.412816345691681e-06, 1.6987323760986328e-06, 1.9846484065055847e-06, 2.2705644369125366e-06, 2.5564804673194885e-06, 2.8423964977264404e-06, 3.1283125281333923e-06, 3.4142285585403442e-06, 3.700144588947296e-06, 3.986060619354248e-06, 4.2719766497612e-06, 4.557892680168152e-06, 4.843808710575104e-06, 5.129724740982056e-06, 5.4156407713890076e-06, 5.7015568017959595e-06, 5.987472832202911e-06, 6.273388862609863e-06, 6.559304893016815e-06, 6.845220923423767e-06, 7.131136953830719e-06, 7.417052984237671e-06, 7.702969014644623e-06, 7.988885045051575e-06, 8.274801075458527e-06, 8.560717105865479e-06, 8.84663313627243e-06, 9.132549166679382e-06, 9.418465197086334e-06, 9.704381227493286e-06, 9.990297257900238e-06, 1.027621328830719e-05, 1.0562129318714142e-05, 1.0848045349121094e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 9.0, 3.0, 14.0, 9.0, 11.0, 15.0, 832.0, 12.0, 10.0, 10.0, 15.0, 5.0, 7.0, 10.0, 7.0, 6.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3872428894501354e-07, -1.3205570326135785e-07, -1.2538713178855687e-07, -1.1871855321032854e-07, -1.120499746321002e-07, -1.0538138894844451e-07, -9.871281747564353e-08, -9.204423179198784e-08, -8.537566031918686e-08, -7.870708174095853e-08, -7.20385031627302e-08, -6.536992458450186e-08, -5.8701346006273525e-08, -5.203276387533151e-08, -4.536418529710318e-08, -3.869560671887484e-08, -3.202702458793283e-08, -2.5358446009704494e-08, -1.868986743147616e-08, -1.2021287076890985e-08, -5.3527084986626505e-09, 1.3158718559225235e-09, 7.984450434150858e-09, 1.4653029012379193e-08, 2.1321607590607528e-08, 2.7990186168835862e-08, 3.46587647470642e-08, 4.132734687800621e-08, 4.7995925456234545e-08, 5.466450403446288e-08, 6.133308261269121e-08, 6.800166119091955e-08, 7.467023976914788e-08, 8.133881834737622e-08, 8.800739692560455e-08, 9.467597550383289e-08, 1.0134455408206122e-07, 1.0801313976571691e-07, 1.1468171123851789e-07, 1.2135029692217358e-07, 1.2801886839497456e-07, 1.3468745407863025e-07, 1.4135602555143123e-07, 1.4802461123508692e-07, 1.546931827078879e-07, 1.613617683915436e-07, 1.6803033986434457e-07, 1.7469892554800026e-07, 1.8136751123165595e-07, 1.8803609691531165e-07, 1.9470466838811262e-07, 2.0137325407176832e-07, 2.080418255445693e-07, 2.1471041122822498e-07, 2.2137898270102596e-07, 2.2804756838468165e-07, 2.3471613985748263e-07, 2.413847255411383e-07, 2.48053311224794e-07, 2.547218684867403e-07, 2.6139045417039597e-07, 2.6805903985405166e-07, 2.7472762553770735e-07, 2.813961827996536e-07, 2.880647684833093e-07]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 92.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 828.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 3.0, 5.0, 10.0, 7.0, 15.0, 23.0, 17.0, 18.0, 12.0, 19.0, 24.0, 23.0, 25.0, 35.0, 27.0, 35.0, 35.0, 45.0, 39.0, 43.0, 45.0, 28.0, 20.0, 41.0, 30.0, 35.0, 31.0, 36.0, 34.0, 28.0, 19.0, 20.0, 19.0, 22.0, 20.0, 13.0, 12.0, 14.0, 16.0, 12.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.6953125, -2.61199951171875, -2.5286865234375, -2.44537353515625, -2.362060546875, -2.27874755859375, -2.1954345703125, -2.11212158203125, -2.02880859375, -1.94549560546875, -1.8621826171875, -1.77886962890625, -1.695556640625, -1.61224365234375, -1.5289306640625, -1.44561767578125, -1.3623046875, -1.27899169921875, -1.1956787109375, -1.11236572265625, -1.029052734375, -0.94573974609375, -0.8624267578125, -0.77911376953125, -0.69580078125, -0.61248779296875, -0.5291748046875, -0.44586181640625, -0.362548828125, -0.27923583984375, -0.1959228515625, -0.11260986328125, -0.029296875, 0.05401611328125, 0.1373291015625, 0.22064208984375, 0.303955078125, 0.38726806640625, 0.4705810546875, 0.55389404296875, 0.63720703125, 0.72052001953125, 0.8038330078125, 0.88714599609375, 0.970458984375, 1.05377197265625, 1.1370849609375, 1.22039794921875, 1.3037109375, 1.38702392578125, 1.4703369140625, 1.55364990234375, 1.636962890625, 1.72027587890625, 1.8035888671875, 1.88690185546875, 1.97021484375, 2.05352783203125, 2.1368408203125, 2.22015380859375, 2.303466796875, 2.38677978515625, 2.4700927734375, 2.55340576171875, 2.63671875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 9.0, 13.0, 20.0, 25.0, 33.0, 41.0, 94.0, 146.0, 240.0, 381.0, 698.0, 1067.0, 1719.0, 2912.0, 4698.0, 7660.0, 12589.0, 20801.0, 35100.0, 62758.0, 128011.0, 343645.0, 213541.0, 92738.0, 48747.0, 28060.0, 16624.0, 10240.0, 6105.0, 3857.0, 2367.0, 1412.0, 789.0, 512.0, 323.0, 192.0, 135.0, 80.0, 46.0, 27.0, 26.0, 16.0, 15.0, 10.0, 12.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.353515625, -2.271759033203125, -2.19000244140625, -2.108245849609375, -2.0264892578125, -1.944732666015625, -1.86297607421875, -1.781219482421875, -1.699462890625, -1.617706298828125, -1.53594970703125, -1.454193115234375, -1.3724365234375, -1.290679931640625, -1.20892333984375, -1.127166748046875, -1.04541015625, -0.963653564453125, -0.88189697265625, -0.800140380859375, -0.7183837890625, -0.636627197265625, -0.55487060546875, -0.473114013671875, -0.391357421875, -0.309600830078125, -0.22784423828125, -0.146087646484375, -0.0643310546875, 0.017425537109375, 0.09918212890625, 0.180938720703125, 0.2626953125, 0.344451904296875, 0.42620849609375, 0.507965087890625, 0.5897216796875, 0.671478271484375, 0.75323486328125, 0.834991455078125, 0.916748046875, 0.998504638671875, 1.08026123046875, 1.162017822265625, 1.2437744140625, 1.325531005859375, 1.40728759765625, 1.489044189453125, 1.57080078125, 1.652557373046875, 1.73431396484375, 1.816070556640625, 1.8978271484375, 1.979583740234375, 2.06134033203125, 2.143096923828125, 2.224853515625, 2.306610107421875, 2.38836669921875, 2.470123291015625, 2.5518798828125, 2.633636474609375, 2.71539306640625, 2.797149658203125, 2.87890625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 3.0, 8.0, 5.0, 9.0, 11.0, 10.0, 15.0, 19.0, 23.0, 18.0, 27.0, 33.0, 29.0, 24.0, 42.0, 38.0, 49.0, 63.0, 129.0, 238.0, 1551.0, 203.0, 93.0, 66.0, 48.0, 45.0, 33.0, 33.0, 18.0, 30.0, 33.0, 17.0, 18.0, 8.0, 11.0, 11.0, 5.0, 12.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.28125, -8.9755859375, -8.669921875, -8.3642578125, -8.05859375, -7.7529296875, -7.447265625, -7.1416015625, -6.8359375, -6.5302734375, -6.224609375, -5.9189453125, -5.61328125, -5.3076171875, -5.001953125, -4.6962890625, -4.390625, -4.0849609375, -3.779296875, -3.4736328125, -3.16796875, -2.8623046875, -2.556640625, -2.2509765625, -1.9453125, -1.6396484375, -1.333984375, -1.0283203125, -0.72265625, -0.4169921875, -0.111328125, 0.1943359375, 0.5, 0.8056640625, 1.111328125, 1.4169921875, 1.72265625, 2.0283203125, 2.333984375, 2.6396484375, 2.9453125, 3.2509765625, 3.556640625, 3.8623046875, 4.16796875, 4.4736328125, 4.779296875, 5.0849609375, 5.390625, 5.6962890625, 6.001953125, 6.3076171875, 6.61328125, 6.9189453125, 7.224609375, 7.5302734375, 7.8359375, 8.1416015625, 8.447265625, 8.7529296875, 9.05859375, 9.3642578125, 9.669921875, 9.9755859375, 10.28125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 12.0, 13.0, 13.0, 18.0, 16.0, 20.0, 31.0, 35.0, 58.0, 57.0, 68.0, 110.0, 138.0, 226.0, 364.0, 678.0, 1716.0, 13658.0, 543879.0, 2545447.0, 33961.0, 2952.0, 840.0, 389.0, 278.0, 173.0, 121.0, 97.0, 59.0, 62.0, 48.0, 28.0, 31.0, 14.0, 21.0, 14.0, 11.0, 10.0, 7.0, 5.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-17.671875, -17.138916015625, -16.60595703125, -16.072998046875, -15.5400390625, -15.007080078125, -14.47412109375, -13.941162109375, -13.408203125, -12.875244140625, -12.34228515625, -11.809326171875, -11.2763671875, -10.743408203125, -10.21044921875, -9.677490234375, -9.14453125, -8.611572265625, -8.07861328125, -7.545654296875, -7.0126953125, -6.479736328125, -5.94677734375, -5.413818359375, -4.880859375, -4.347900390625, -3.81494140625, -3.281982421875, -2.7490234375, -2.216064453125, -1.68310546875, -1.150146484375, -0.6171875, -0.084228515625, 0.44873046875, 0.981689453125, 1.5146484375, 2.047607421875, 2.58056640625, 3.113525390625, 3.646484375, 4.179443359375, 4.71240234375, 5.245361328125, 5.7783203125, 6.311279296875, 6.84423828125, 7.377197265625, 7.91015625, 8.443115234375, 8.97607421875, 9.509033203125, 10.0419921875, 10.574951171875, 11.10791015625, 11.640869140625, 12.173828125, 12.706787109375, 13.23974609375, 13.772705078125, 14.3056640625, 14.838623046875, 15.37158203125, 15.904541015625, 16.4375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 151.0, 724.0, 133.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.312050819396973, -8.086647033691406, -4.861243724822998, -1.6358404159545898, 1.5895633697509766, 4.814967155456543, 8.040369987487793, 11.265774726867676, 14.491177558898926, 17.716581344604492, 20.941984176635742, 24.167388916015625, 27.392791748046875, 30.618194580078125, 33.843597412109375, 37.06900405883789, 40.29440689086914, 43.51980972290039, 46.74521255493164, 49.970619201660156, 53.196022033691406, 56.421424865722656, 59.646827697753906, 62.872230529785156, 66.0976333618164, 69.32303619384766, 72.5484390258789, 75.77384185791016, 78.9992446899414, 82.22465515136719, 85.45005798339844, 88.67546081542969, 91.9008560180664, 95.12625885009766, 98.3516616821289, 101.57706451416016, 104.8024673461914, 108.02787780761719, 111.25328063964844, 114.47868347167969, 117.70408630371094, 120.92948913574219, 124.15489196777344, 127.38029479980469, 130.60569763183594, 133.8311004638672, 137.05650329589844, 140.2819061279297, 143.50730895996094, 146.7327117919922, 149.95811462402344, 153.1835174560547, 156.40892028808594, 159.6343231201172, 162.85972595214844, 166.0851287841797, 169.310546875, 172.53594970703125, 175.7613525390625, 178.98675537109375, 182.212158203125, 185.43756103515625, 188.6629638671875, 191.88836669921875, 195.11376953125]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 5.0, 8.0, 6.0, 4.0, 7.0, 13.0, 14.0, 18.0, 17.0, 19.0, 26.0, 21.0, 33.0, 28.0, 37.0, 40.0, 38.0, 48.0, 43.0, 55.0, 37.0, 46.0, 36.0, 45.0, 39.0, 34.0, 37.0, 23.0, 35.0, 26.0, 20.0, 26.0, 25.0, 16.0, 15.0, 9.0, 12.0, 12.0, 3.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0], "bins": [-28.717435836791992, -27.950998306274414, -27.184560775756836, -26.41812515258789, -25.651687622070312, -24.885250091552734, -24.118812561035156, -23.352375030517578, -22.5859375, -21.819499969482422, -21.053062438964844, -20.286624908447266, -19.52018928527832, -18.753751754760742, -17.987314224243164, -17.220876693725586, -16.45444107055664, -15.688003540039062, -14.9215669631958, -14.155129432678223, -13.388692855834961, -12.622255325317383, -11.855817794799805, -11.089380264282227, -10.322943687438965, -9.556506156921387, -8.790069580078125, -8.023632049560547, -7.257194995880127, -6.490757942199707, -5.724320411682129, -4.957883358001709, -4.191448211669922, -3.425011157989502, -2.658573865890503, -1.892136573791504, -1.125699520111084, -0.35926246643066406, 0.40717506408691406, 1.173612117767334, 1.940049171447754, 2.706486225128174, 3.472923517227173, 4.239360809326172, 5.005797863006592, 5.772234916687012, 6.53867244720459, 7.30510950088501, 8.07154655456543, 8.837984085083008, 9.60442066192627, 10.370858192443848, 11.13729476928711, 11.903732299804688, 12.670169830322266, 13.436607360839844, 14.203043937683105, 14.969481468200684, 15.735918045043945, 16.502355575561523, 17.2687931060791, 18.035228729248047, 18.801666259765625, 19.568103790283203, 20.33454132080078]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 4.0, 9.0, 7.0, 16.0, 12.0, 18.0, 22.0, 10.0, 19.0, 20.0, 26.0, 19.0, 36.0, 33.0, 41.0, 48.0, 33.0, 42.0, 42.0, 43.0, 41.0, 29.0, 40.0, 25.0, 28.0, 29.0, 38.0, 28.0, 19.0, 25.0, 22.0, 27.0, 16.0, 19.0, 15.0, 17.0, 19.0, 10.0, 8.0, 6.0, 8.0, 6.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0], "bins": [-3.06640625, -2.97711181640625, -2.8878173828125, -2.79852294921875, -2.709228515625, -2.61993408203125, -2.5306396484375, -2.44134521484375, -2.35205078125, -2.26275634765625, -2.1734619140625, -2.08416748046875, -1.994873046875, -1.90557861328125, -1.8162841796875, -1.72698974609375, -1.6376953125, -1.54840087890625, -1.4591064453125, -1.36981201171875, -1.280517578125, -1.19122314453125, -1.1019287109375, -1.01263427734375, -0.92333984375, -0.83404541015625, -0.7447509765625, -0.65545654296875, -0.566162109375, -0.47686767578125, -0.3875732421875, -0.29827880859375, -0.208984375, -0.11968994140625, -0.0303955078125, 0.05889892578125, 0.148193359375, 0.23748779296875, 0.3267822265625, 0.41607666015625, 0.50537109375, 0.59466552734375, 0.6839599609375, 0.77325439453125, 0.862548828125, 0.95184326171875, 1.0411376953125, 1.13043212890625, 1.2197265625, 1.30902099609375, 1.3983154296875, 1.48760986328125, 1.576904296875, 1.66619873046875, 1.7554931640625, 1.84478759765625, 1.93408203125, 2.02337646484375, 2.1126708984375, 2.20196533203125, 2.291259765625, 2.38055419921875, 2.4698486328125, 2.55914306640625, 2.6484375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 3.0, 5.0, 9.0, 15.0, 8.0, 10.0, 14.0, 19.0, 21.0, 16.0, 21.0, 32.0, 42.0, 69.0, 140.0, 356.0, 1018.0, 3211.0, 12416.0, 66207.0, 545387.0, 2723610.0, 735907.0, 84539.0, 15361.0, 3813.0, 1131.0, 405.0, 161.0, 80.0, 51.0, 31.0, 26.0, 22.0, 18.0, 19.0, 12.0, 21.0, 10.0, 11.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 2.0], "bins": [-8.84375, -8.587890625, -8.33203125, -8.076171875, -7.8203125, -7.564453125, -7.30859375, -7.052734375, -6.796875, -6.541015625, -6.28515625, -6.029296875, -5.7734375, -5.517578125, -5.26171875, -5.005859375, -4.75, -4.494140625, -4.23828125, -3.982421875, -3.7265625, -3.470703125, -3.21484375, -2.958984375, -2.703125, -2.447265625, -2.19140625, -1.935546875, -1.6796875, -1.423828125, -1.16796875, -0.912109375, -0.65625, -0.400390625, -0.14453125, 0.111328125, 0.3671875, 0.623046875, 0.87890625, 1.134765625, 1.390625, 1.646484375, 1.90234375, 2.158203125, 2.4140625, 2.669921875, 2.92578125, 3.181640625, 3.4375, 3.693359375, 3.94921875, 4.205078125, 4.4609375, 4.716796875, 4.97265625, 5.228515625, 5.484375, 5.740234375, 5.99609375, 6.251953125, 6.5078125, 6.763671875, 7.01953125, 7.275390625, 7.53125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 5.0, 11.0, 21.0, 18.0, 27.0, 42.0, 63.0, 70.0, 112.0, 171.0, 213.0, 274.0, 380.0, 428.0, 463.0, 465.0, 335.0, 262.0, 172.0, 143.0, 113.0, 75.0, 59.0, 41.0, 23.0, 27.0, 19.0, 13.0, 8.0, 3.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.72064208984375, -4.5350341796875, -4.34942626953125, -4.163818359375, -3.97821044921875, -3.7926025390625, -3.60699462890625, -3.42138671875, -3.23577880859375, -3.0501708984375, -2.86456298828125, -2.678955078125, -2.49334716796875, -2.3077392578125, -2.12213134765625, -1.9365234375, -1.75091552734375, -1.5653076171875, -1.37969970703125, -1.194091796875, -1.00848388671875, -0.8228759765625, -0.63726806640625, -0.45166015625, -0.26605224609375, -0.0804443359375, 0.10516357421875, 0.290771484375, 0.47637939453125, 0.6619873046875, 0.84759521484375, 1.033203125, 1.21881103515625, 1.4044189453125, 1.59002685546875, 1.775634765625, 1.96124267578125, 2.1468505859375, 2.33245849609375, 2.51806640625, 2.70367431640625, 2.8892822265625, 3.07489013671875, 3.260498046875, 3.44610595703125, 3.6317138671875, 3.81732177734375, 4.0029296875, 4.18853759765625, 4.3741455078125, 4.55975341796875, 4.745361328125, 4.93096923828125, 5.1165771484375, 5.30218505859375, 5.48779296875, 5.67340087890625, 5.8590087890625, 6.04461669921875, 6.230224609375, 6.41583251953125, 6.6014404296875, 6.78704833984375, 6.97265625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 7.0, 11.0, 14.0, 22.0, 26.0, 37.0, 42.0, 82.0, 108.0, 159.0, 210.0, 316.0, 627.0, 5214.0, 1059260.0, 3113268.0, 12894.0, 790.0, 395.0, 252.0, 184.0, 117.0, 62.0, 51.0, 40.0, 27.0, 18.0, 17.0, 13.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-37.78125, -36.789794921875, -35.79833984375, -34.806884765625, -33.8154296875, -32.823974609375, -31.83251953125, -30.841064453125, -29.849609375, -28.858154296875, -27.86669921875, -26.875244140625, -25.8837890625, -24.892333984375, -23.90087890625, -22.909423828125, -21.91796875, -20.926513671875, -19.93505859375, -18.943603515625, -17.9521484375, -16.960693359375, -15.96923828125, -14.977783203125, -13.986328125, -12.994873046875, -12.00341796875, -11.011962890625, -10.0205078125, -9.029052734375, -8.03759765625, -7.046142578125, -6.0546875, -5.063232421875, -4.07177734375, -3.080322265625, -2.0888671875, -1.097412109375, -0.10595703125, 0.885498046875, 1.876953125, 2.868408203125, 3.85986328125, 4.851318359375, 5.8427734375, 6.834228515625, 7.82568359375, 8.817138671875, 9.80859375, 10.800048828125, 11.79150390625, 12.782958984375, 13.7744140625, 14.765869140625, 15.75732421875, 16.748779296875, 17.740234375, 18.731689453125, 19.72314453125, 20.714599609375, 21.7060546875, 22.697509765625, 23.68896484375, 24.680419921875, 25.671875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 8.0, 13.0, 27.0, 59.0, 126.0, 205.0, 209.0, 170.0, 103.0, 53.0, 28.0, 13.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.92949104309082, -15.289589881896973, -13.649688720703125, -12.009786605834961, -10.36988639831543, -8.729984283447266, -7.090083122253418, -5.45018196105957, -3.8102807998657227, -2.170379638671875, -0.5304782390594482, 1.1094231605529785, 2.749324321746826, 4.389225959777832, 6.02912712097168, 7.669028282165527, 9.308929443359375, 10.948830604553223, 12.58873176574707, 14.228633880615234, 15.868534088134766, 17.50843620300293, 19.148338317871094, 20.788238525390625, 22.428138732910156, 24.06804084777832, 25.70794105529785, 27.347843170166016, 28.987743377685547, 30.62764549255371, 32.267547607421875, 33.907447814941406, 35.5473518371582, 37.187252044677734, 38.82715606689453, 40.46705627441406, 42.106956481933594, 43.746856689453125, 45.38676071166992, 47.02666091918945, 48.666561126708984, 50.306461334228516, 51.94636535644531, 53.586265563964844, 55.226165771484375, 56.866065979003906, 58.5059700012207, 60.145870208740234, 61.78577423095703, 63.42567443847656, 65.0655746459961, 66.70547485351562, 68.34538269042969, 69.98528289794922, 71.62518310546875, 73.26508331298828, 74.90498352050781, 76.54488372802734, 78.18478393554688, 79.8246841430664, 81.46459197998047, 83.1044921875, 84.74439239501953, 86.38429260253906, 88.0241928100586]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 8.0, 4.0, 4.0, 7.0, 12.0, 14.0, 14.0, 17.0, 23.0, 24.0, 34.0, 32.0, 26.0, 45.0, 31.0, 33.0, 47.0, 43.0, 46.0, 45.0, 52.0, 60.0, 44.0, 41.0, 41.0, 36.0, 35.0, 28.0, 22.0, 20.0, 19.0, 10.0, 13.0, 11.0, 14.0, 12.0, 6.0, 5.0, 9.0, 5.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.77593994140625, -18.181564331054688, -17.587188720703125, -16.992813110351562, -16.398439407348633, -15.80406379699707, -15.209688186645508, -14.615312576293945, -14.020936965942383, -13.42656135559082, -12.832186698913574, -12.237811088562012, -11.64343547821045, -11.049060821533203, -10.45468521118164, -9.860309600830078, -9.265934944152832, -8.67155933380127, -8.077184677124023, -7.482809066772461, -6.888433456420898, -6.294058322906494, -5.69968318939209, -5.105307579040527, -4.510932445526123, -3.9165570735931396, -3.3221817016601562, -2.727806568145752, -2.1334311962127686, -1.5390558242797852, -0.9446806907653809, -0.35030508041381836, 0.24407005310058594, 0.8384453654289246, 1.4328206777572632, 2.027195930480957, 2.6215713024139404, 3.215946674346924, 3.810321807861328, 4.404697418212891, 4.999072551727295, 5.593447685241699, 6.187823295593262, 6.782198429107666, 7.37657356262207, 7.970949172973633, 8.565324783325195, 9.159700393676758, 9.754075050354004, 10.348450660705566, 10.942825317382812, 11.537200927734375, 12.131576538085938, 12.7259521484375, 13.320326805114746, 13.914702415466309, 14.509077072143555, 15.103452682495117, 15.697827339172363, 16.29220199584961, 16.886577606201172, 17.480953216552734, 18.075328826904297, 18.66970443725586, 19.264080047607422]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 10.0, 16.0, 18.0, 14.0, 24.0, 23.0, 20.0, 25.0, 25.0, 40.0, 49.0, 37.0, 48.0, 46.0, 44.0, 35.0, 49.0, 46.0, 51.0, 41.0, 30.0, 31.0, 36.0, 23.0, 25.0, 26.0, 28.0, 23.0, 14.0, 20.0, 14.0, 10.0, 12.0, 8.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.494140625, -3.38909912109375, -3.2840576171875, -3.17901611328125, -3.073974609375, -2.96893310546875, -2.8638916015625, -2.75885009765625, -2.65380859375, -2.54876708984375, -2.4437255859375, -2.33868408203125, -2.233642578125, -2.12860107421875, -2.0235595703125, -1.91851806640625, -1.8134765625, -1.70843505859375, -1.6033935546875, -1.49835205078125, -1.393310546875, -1.28826904296875, -1.1832275390625, -1.07818603515625, -0.97314453125, -0.86810302734375, -0.7630615234375, -0.65802001953125, -0.552978515625, -0.44793701171875, -0.3428955078125, -0.23785400390625, -0.1328125, -0.02777099609375, 0.0772705078125, 0.18231201171875, 0.287353515625, 0.39239501953125, 0.4974365234375, 0.60247802734375, 0.70751953125, 0.81256103515625, 0.9176025390625, 1.02264404296875, 1.127685546875, 1.23272705078125, 1.3377685546875, 1.44281005859375, 1.5478515625, 1.65289306640625, 1.7579345703125, 1.86297607421875, 1.968017578125, 2.07305908203125, 2.1781005859375, 2.28314208984375, 2.38818359375, 2.49322509765625, 2.5982666015625, 2.70330810546875, 2.808349609375, 2.91339111328125, 3.0184326171875, 3.12347412109375, 3.228515625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 4.0, 11.0, 15.0, 36.0, 35.0, 56.0, 78.0, 135.0, 190.0, 320.0, 499.0, 772.0, 1229.0, 1962.0, 3074.0, 5085.0, 8158.0, 13279.0, 21587.0, 35844.0, 62975.0, 123749.0, 350660.0, 210339.0, 87723.0, 47854.0, 27914.0, 16968.0, 10619.0, 6466.0, 4064.0, 2507.0, 1536.0, 979.0, 627.0, 415.0, 276.0, 163.0, 119.0, 84.0, 45.0, 31.0, 29.0, 15.0, 9.0, 5.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0288848876953125, -0.027945995330810547, -0.027007102966308594, -0.02606821060180664, -0.025129318237304688, -0.024190425872802734, -0.02325153350830078, -0.022312641143798828, -0.021373748779296875, -0.020434856414794922, -0.01949596405029297, -0.018557071685791016, -0.017618179321289062, -0.01667928695678711, -0.015740394592285156, -0.014801502227783203, -0.01386260986328125, -0.012923717498779297, -0.011984825134277344, -0.01104593276977539, -0.010107040405273438, -0.009168148040771484, -0.008229255676269531, -0.007290363311767578, -0.006351470947265625, -0.005412578582763672, -0.004473686218261719, -0.0035347938537597656, -0.0025959014892578125, -0.0016570091247558594, -0.0007181167602539062, 0.00022077560424804688, 0.00115966796875, 0.002098560333251953, 0.0030374526977539062, 0.003976345062255859, 0.0049152374267578125, 0.005854129791259766, 0.006793022155761719, 0.007731914520263672, 0.008670806884765625, 0.009609699249267578, 0.010548591613769531, 0.011487483978271484, 0.012426376342773438, 0.01336526870727539, 0.014304161071777344, 0.015243053436279297, 0.01618194580078125, 0.017120838165283203, 0.018059730529785156, 0.01899862289428711, 0.019937515258789062, 0.020876407623291016, 0.02181529998779297, 0.022754192352294922, 0.023693084716796875, 0.024631977081298828, 0.02557086944580078, 0.026509761810302734, 0.027448654174804688, 0.02838754653930664, 0.029326438903808594, 0.030265331268310547, 0.0312042236328125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 5.0, 11.0, 11.0, 15.0, 20.0, 21.0, 20.0, 26.0, 29.0, 42.0, 41.0, 41.0, 51.0, 46.0, 44.0, 42.0, 53.0, 1064.0, 46.0, 43.0, 41.0, 46.0, 31.0, 31.0, 28.0, 29.0, 30.0, 17.0, 16.0, 18.0, 17.0, 13.0, 8.0, 5.0, 6.0, 6.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.95050048828125, -1.8756103515625, -1.80072021484375, -1.725830078125, -1.65093994140625, -1.5760498046875, -1.50115966796875, -1.42626953125, -1.35137939453125, -1.2764892578125, -1.20159912109375, -1.126708984375, -1.05181884765625, -0.9769287109375, -0.90203857421875, -0.8271484375, -0.75225830078125, -0.6773681640625, -0.60247802734375, -0.527587890625, -0.45269775390625, -0.3778076171875, -0.30291748046875, -0.22802734375, -0.15313720703125, -0.0782470703125, -0.00335693359375, 0.071533203125, 0.14642333984375, 0.2213134765625, 0.29620361328125, 0.37109375, 0.44598388671875, 0.5208740234375, 0.59576416015625, 0.670654296875, 0.74554443359375, 0.8204345703125, 0.89532470703125, 0.97021484375, 1.04510498046875, 1.1199951171875, 1.19488525390625, 1.269775390625, 1.34466552734375, 1.4195556640625, 1.49444580078125, 1.5693359375, 1.64422607421875, 1.7191162109375, 1.79400634765625, 1.868896484375, 1.94378662109375, 2.0186767578125, 2.09356689453125, 2.16845703125, 2.24334716796875, 2.3182373046875, 2.39312744140625, 2.468017578125, 2.54290771484375, 2.6177978515625, 2.69268798828125, 2.767578125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 11.0, 17.0, 18.0, 36.0, 29.0, 62.0, 106.0, 156.0, 221.0, 350.0, 544.0, 877.0, 1258.0, 2087.0, 3145.0, 4870.0, 7349.0, 11517.0, 18410.0, 30117.0, 51345.0, 92811.0, 202378.0, 1362365.0, 134057.0, 69132.0, 39396.0, 23475.0, 14575.0, 9247.0, 6001.0, 3942.0, 2512.0, 1655.0, 1070.0, 706.0, 444.0, 304.0, 154.0, 128.0, 76.0, 45.0, 38.0, 25.0, 15.0, 13.0, 10.0, 10.0, 9.0, 1.0, 4.0, 4.0, 0.0, 4.0], "bins": [-0.020050048828125, -0.01944732666015625, -0.0188446044921875, -0.01824188232421875, -0.01763916015625, -0.01703643798828125, -0.0164337158203125, -0.01583099365234375, -0.015228271484375, -0.01462554931640625, -0.0140228271484375, -0.01342010498046875, -0.0128173828125, -0.01221466064453125, -0.0116119384765625, -0.01100921630859375, -0.010406494140625, -0.00980377197265625, -0.0092010498046875, -0.00859832763671875, -0.00799560546875, -0.00739288330078125, -0.0067901611328125, -0.00618743896484375, -0.005584716796875, -0.00498199462890625, -0.0043792724609375, -0.00377655029296875, -0.003173828125, -0.00257110595703125, -0.0019683837890625, -0.00136566162109375, -0.000762939453125, -0.00016021728515625, 0.0004425048828125, 0.00104522705078125, 0.00164794921875, 0.00225067138671875, 0.0028533935546875, 0.00345611572265625, 0.004058837890625, 0.00466156005859375, 0.0052642822265625, 0.00586700439453125, 0.0064697265625, 0.00707244873046875, 0.0076751708984375, 0.00827789306640625, 0.008880615234375, 0.00948333740234375, 0.0100860595703125, 0.01068878173828125, 0.01129150390625, 0.01189422607421875, 0.0124969482421875, 0.01309967041015625, 0.013702392578125, 0.01430511474609375, 0.0149078369140625, 0.01551055908203125, 0.01611328125, 0.01671600341796875, 0.0173187255859375, 0.01792144775390625, 0.018524169921875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 55.0, 0.0, 0.0, 0.0, 132.0, 0.0, 0.0, 0.0, 534.0, 0.0, 0.0, 153.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.76837158203125e-07, -4.6100467443466187e-07, -4.4517219066619873e-07, -4.293397068977356e-07, -4.1350722312927246e-07, -3.976747393608093e-07, -3.818422555923462e-07, -3.6600977182388306e-07, -3.501772880554199e-07, -3.343448042869568e-07, -3.1851232051849365e-07, -3.026798367500305e-07, -2.868473529815674e-07, -2.7101486921310425e-07, -2.551823854446411e-07, -2.39349901676178e-07, -2.2351741790771484e-07, -2.076849341392517e-07, -1.9185245037078857e-07, -1.7601996660232544e-07, -1.601874828338623e-07, -1.4435499906539917e-07, -1.2852251529693604e-07, -1.126900315284729e-07, -9.685754776000977e-08, -8.102506399154663e-08, -6.51925802230835e-08, -4.936009645462036e-08, -3.3527612686157227e-08, -1.7695128917694092e-08, -1.862645149230957e-09, 1.3969838619232178e-08, 2.9802322387695312e-08, 4.563480615615845e-08, 6.146728992462158e-08, 7.729977369308472e-08, 9.313225746154785e-08, 1.0896474123001099e-07, 1.2479722499847412e-07, 1.4062970876693726e-07, 1.564621925354004e-07, 1.7229467630386353e-07, 1.8812716007232666e-07, 2.039596438407898e-07, 2.1979212760925293e-07, 2.3562461137771606e-07, 2.514570951461792e-07, 2.6728957891464233e-07, 2.8312206268310547e-07, 2.989545464515686e-07, 3.1478703022003174e-07, 3.3061951398849487e-07, 3.46451997756958e-07, 3.6228448152542114e-07, 3.781169652938843e-07, 3.939494490623474e-07, 4.0978193283081055e-07, 4.256144165992737e-07, 4.414469003677368e-07, 4.5727938413619995e-07, 4.731118679046631e-07, 4.889443516731262e-07, 5.047768354415894e-07, 5.206093192100525e-07, 5.364418029785156e-07]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 3.0, 6.0, 14.0, 6.0, 2.0, 15.0, 46.0, 20.0, 26.0, 47.0, 229.0, 134.0, 2134.0, 1004100.0, 40641.0, 656.0, 124.0, 183.0, 36.0, 8.0, 35.0, 33.0, 8.0, 3.0, 8.0, 11.0, 3.0, 1.0, 6.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1205673217773438e-05, -1.0874122381210327e-05, -1.0542571544647217e-05, -1.0211020708084106e-05, -9.879469871520996e-06, -9.547919034957886e-06, -9.216368198394775e-06, -8.884817361831665e-06, -8.553266525268555e-06, -8.221715688705444e-06, -7.890164852142334e-06, -7.558614015579224e-06, -7.227063179016113e-06, -6.895512342453003e-06, -6.563961505889893e-06, -6.232410669326782e-06, -5.900859832763672e-06, -5.5693089962005615e-06, -5.237758159637451e-06, -4.906207323074341e-06, -4.5746564865112305e-06, -4.24310564994812e-06, -3.91155481338501e-06, -3.5800039768218994e-06, -3.248453140258789e-06, -2.9169023036956787e-06, -2.5853514671325684e-06, -2.253800630569458e-06, -1.9222497940063477e-06, -1.5906989574432373e-06, -1.259148120880127e-06, -9.275972843170166e-07, -5.960464477539062e-07, -2.644956111907959e-07, 6.705522537231445e-08, 3.986060619354248e-07, 7.301568984985352e-07, 1.0617077350616455e-06, 1.3932585716247559e-06, 1.7248094081878662e-06, 2.0563602447509766e-06, 2.387911081314087e-06, 2.7194619178771973e-06, 3.0510127544403076e-06, 3.382563591003418e-06, 3.7141144275665283e-06, 4.045665264129639e-06, 4.377216100692749e-06, 4.708766937255859e-06, 5.04031777381897e-06, 5.37186861038208e-06, 5.7034194469451904e-06, 6.034970283508301e-06, 6.366521120071411e-06, 6.6980719566345215e-06, 7.029622793197632e-06, 7.361173629760742e-06, 7.692724466323853e-06, 8.024275302886963e-06, 8.355826139450073e-06, 8.687376976013184e-06, 9.018927812576294e-06, 9.350478649139404e-06, 9.682029485702515e-06, 1.0013580322265625e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 13.0, 11.0, 10.0, 17.0, 21.0, 19.0, 781.0, 15.0, 15.0, 19.0, 11.0, 10.0, 11.0, 13.0, 8.0, 5.0, 3.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.686910025000543e-07, -1.613263407307386e-07, -1.5396167896142288e-07, -1.4659703140296187e-07, -1.3923236963364616e-07, -1.3186770786433044e-07, -1.2450304609501472e-07, -1.1713839143112637e-07, -1.09773736767238e-07, -1.0240907499792229e-07, -9.504442033403393e-08, -8.767975856471821e-08, -8.031510390082985e-08, -7.295044213151414e-08, -6.558578036219842e-08, -5.822112569831006e-08, -5.0856463928994344e-08, -4.3491805712392306e-08, -3.612714749579027e-08, -2.876248750283139e-08, -2.1397829286229353e-08, -1.4033169293270475e-08, -6.6685110766684375e-09, 6.961471399336006e-10, 8.060805356535639e-09, 1.5425463573137677e-08, 2.2790121789739715e-08, 3.015478000634175e-08, 3.751944177565747e-08, 4.488409999225951e-08, 5.2248758208861545e-08, 5.96134128727499e-08, 6.697807464206562e-08, 7.434273641138134e-08, 8.17073910752697e-08, 8.907205284458541e-08, 9.643670750847377e-08, 1.0380136927778949e-07, 1.1116603104710521e-07, 1.1853068571099357e-07, 1.2589534037488193e-07, 1.3326000214419764e-07, 1.4062466391351336e-07, 1.4798931147197436e-07, 1.5535397324129008e-07, 1.627186350106058e-07, 1.700832967799215e-07, 1.7744795854923723e-07, 1.8481262031855294e-07, 1.9217728208786866e-07, 1.9954194385718438e-07, 2.0690659141564538e-07, 2.142712531849611e-07, 2.2163591495427681e-07, 2.2900057672359253e-07, 2.3636522428205353e-07, 2.4372988605136925e-07, 2.5109454782068497e-07, 2.584592095900007e-07, 2.658238713593164e-07, 2.731885331286321e-07, 2.8055319489794783e-07, 2.879178282455541e-07, 2.9528249001486984e-07, 3.0264715178418555e-07]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 117.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 765.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 122.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1362135410308838e-07, -1.0803341865539551e-07, -1.0244548320770264e-07, -9.685754776000977e-08, -9.12696123123169e-08, -8.568167686462402e-08, -8.009374141693115e-08, -7.450580596923828e-08, -6.891787052154541e-08, -6.332993507385254e-08, -5.774199962615967e-08, -5.21540641784668e-08, -4.6566128730773926e-08, -4.0978193283081055e-08, -3.5390257835388184e-08, -2.9802322387695312e-08, -2.421438694000244e-08, -1.862645149230957e-08, -1.30385160446167e-08, -7.450580596923828e-09, -1.862645149230957e-09, 3.725290298461914e-09, 9.313225746154785e-09, 1.4901161193847656e-08, 2.0489096641540527e-08, 2.60770320892334e-08, 3.166496753692627e-08, 3.725290298461914e-08, 4.284083843231201e-08, 4.842877388000488e-08, 5.4016709327697754e-08, 5.960464477539063e-08, 6.51925802230835e-08, 7.078051567077637e-08, 7.636845111846924e-08, 8.195638656616211e-08, 8.754432201385498e-08, 9.313225746154785e-08, 9.872019290924072e-08, 1.043081283569336e-07, 1.0989606380462646e-07, 1.1548399925231934e-07, 1.210719347000122e-07, 1.2665987014770508e-07, 1.3224780559539795e-07, 1.3783574104309082e-07, 1.434236764907837e-07, 1.4901161193847656e-07, 1.5459954738616943e-07, 1.601874828338623e-07, 1.6577541828155518e-07, 1.7136335372924805e-07, 1.7695128917694092e-07, 1.825392246246338e-07, 1.8812716007232666e-07, 1.9371509552001953e-07, 1.993030309677124e-07, 2.0489096641540527e-07, 2.1047890186309814e-07, 2.1606683731079102e-07, 2.2165477275848389e-07, 2.2724270820617676e-07, 2.3283064365386963e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 10.0, 16.0, 18.0, 14.0, 24.0, 23.0, 20.0, 25.0, 25.0, 40.0, 49.0, 37.0, 48.0, 46.0, 44.0, 35.0, 49.0, 46.0, 51.0, 41.0, 30.0, 31.0, 36.0, 23.0, 25.0, 26.0, 28.0, 23.0, 14.0, 20.0, 14.0, 10.0, 12.0, 8.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.494140625, -3.38909912109375, -3.2840576171875, -3.17901611328125, -3.073974609375, -2.96893310546875, -2.8638916015625, -2.75885009765625, -2.65380859375, -2.54876708984375, -2.4437255859375, -2.33868408203125, -2.233642578125, -2.12860107421875, -2.0235595703125, -1.91851806640625, -1.8134765625, -1.70843505859375, -1.6033935546875, -1.49835205078125, -1.393310546875, -1.28826904296875, -1.1832275390625, -1.07818603515625, -0.97314453125, -0.86810302734375, -0.7630615234375, -0.65802001953125, -0.552978515625, -0.44793701171875, -0.3428955078125, -0.23785400390625, -0.1328125, -0.02777099609375, 0.0772705078125, 0.18231201171875, 0.287353515625, 0.39239501953125, 0.4974365234375, 0.60247802734375, 0.70751953125, 0.81256103515625, 0.9176025390625, 1.02264404296875, 1.127685546875, 1.23272705078125, 1.3377685546875, 1.44281005859375, 1.5478515625, 1.65289306640625, 1.7579345703125, 1.86297607421875, 1.968017578125, 2.07305908203125, 2.1781005859375, 2.28314208984375, 2.38818359375, 2.49322509765625, 2.5982666015625, 2.70330810546875, 2.808349609375, 2.91339111328125, 3.0184326171875, 3.12347412109375, 3.228515625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 14.0, 15.0, 18.0, 28.0, 40.0, 69.0, 99.0, 178.0, 296.0, 543.0, 977.0, 1805.0, 3375.0, 6324.0, 12948.0, 27743.0, 76611.0, 416669.0, 374968.0, 73127.0, 27032.0, 12291.0, 6166.0, 3263.0, 1722.0, 932.0, 488.0, 299.0, 175.0, 109.0, 66.0, 48.0, 29.0, 19.0, 16.0, 11.0, 8.0, 6.0, 5.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.80078125, -4.65521240234375, -4.5096435546875, -4.36407470703125, -4.218505859375, -4.07293701171875, -3.9273681640625, -3.78179931640625, -3.63623046875, -3.49066162109375, -3.3450927734375, -3.19952392578125, -3.053955078125, -2.90838623046875, -2.7628173828125, -2.61724853515625, -2.4716796875, -2.32611083984375, -2.1805419921875, -2.03497314453125, -1.889404296875, -1.74383544921875, -1.5982666015625, -1.45269775390625, -1.30712890625, -1.16156005859375, -1.0159912109375, -0.87042236328125, -0.724853515625, -0.57928466796875, -0.4337158203125, -0.28814697265625, -0.142578125, 0.00299072265625, 0.1485595703125, 0.29412841796875, 0.439697265625, 0.58526611328125, 0.7308349609375, 0.87640380859375, 1.02197265625, 1.16754150390625, 1.3131103515625, 1.45867919921875, 1.604248046875, 1.74981689453125, 1.8953857421875, 2.04095458984375, 2.1865234375, 2.33209228515625, 2.4776611328125, 2.62322998046875, 2.768798828125, 2.91436767578125, 3.0599365234375, 3.20550537109375, 3.35107421875, 3.49664306640625, 3.6422119140625, 3.78778076171875, 3.933349609375, 4.07891845703125, 4.2244873046875, 4.37005615234375, 4.515625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 7.0, 7.0, 13.0, 17.0, 16.0, 25.0, 19.0, 33.0, 32.0, 29.0, 33.0, 35.0, 46.0, 56.0, 65.0, 153.0, 1635.0, 297.0, 98.0, 60.0, 40.0, 34.0, 30.0, 38.0, 30.0, 37.0, 29.0, 24.0, 19.0, 16.0, 13.0, 7.0, 8.0, 12.0, 9.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.2899169921875, -10.923583984375, -10.5572509765625, -10.19091796875, -9.8245849609375, -9.458251953125, -9.0919189453125, -8.7255859375, -8.3592529296875, -7.992919921875, -7.6265869140625, -7.26025390625, -6.8939208984375, -6.527587890625, -6.1612548828125, -5.794921875, -5.4285888671875, -5.062255859375, -4.6959228515625, -4.32958984375, -3.9632568359375, -3.596923828125, -3.2305908203125, -2.8642578125, -2.4979248046875, -2.131591796875, -1.7652587890625, -1.39892578125, -1.0325927734375, -0.666259765625, -0.2999267578125, 0.06640625, 0.4327392578125, 0.799072265625, 1.1654052734375, 1.53173828125, 1.8980712890625, 2.264404296875, 2.6307373046875, 2.9970703125, 3.3634033203125, 3.729736328125, 4.0960693359375, 4.46240234375, 4.8287353515625, 5.195068359375, 5.5614013671875, 5.927734375, 6.2940673828125, 6.660400390625, 7.0267333984375, 7.39306640625, 7.7593994140625, 8.125732421875, 8.4920654296875, 8.8583984375, 9.2247314453125, 9.591064453125, 9.9573974609375, 10.32373046875, 10.6900634765625, 11.056396484375, 11.4227294921875, 11.7890625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 10.0, 10.0, 7.0, 8.0, 10.0, 17.0, 23.0, 23.0, 30.0, 35.0, 54.0, 56.0, 89.0, 105.0, 207.0, 504.0, 3319.0, 284103.0, 2845749.0, 9752.0, 783.0, 256.0, 171.0, 87.0, 51.0, 40.0, 41.0, 40.0, 21.0, 23.0, 17.0, 15.0, 12.0, 9.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-28.875, -27.977294921875, -27.07958984375, -26.181884765625, -25.2841796875, -24.386474609375, -23.48876953125, -22.591064453125, -21.693359375, -20.795654296875, -19.89794921875, -19.000244140625, -18.1025390625, -17.204833984375, -16.30712890625, -15.409423828125, -14.51171875, -13.614013671875, -12.71630859375, -11.818603515625, -10.9208984375, -10.023193359375, -9.12548828125, -8.227783203125, -7.330078125, -6.432373046875, -5.53466796875, -4.636962890625, -3.7392578125, -2.841552734375, -1.94384765625, -1.046142578125, -0.1484375, 0.749267578125, 1.64697265625, 2.544677734375, 3.4423828125, 4.340087890625, 5.23779296875, 6.135498046875, 7.033203125, 7.930908203125, 8.82861328125, 9.726318359375, 10.6240234375, 11.521728515625, 12.41943359375, 13.317138671875, 14.21484375, 15.112548828125, 16.01025390625, 16.907958984375, 17.8056640625, 18.703369140625, 19.60107421875, 20.498779296875, 21.396484375, 22.294189453125, 23.19189453125, 24.089599609375, 24.9873046875, 25.885009765625, 26.78271484375, 27.680419921875, 28.578125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 6.0, 17.0, 20.0, 18.0, 22.0, 36.0, 30.0, 44.0, 51.0, 62.0, 62.0, 54.0, 70.0, 70.0, 69.0, 61.0, 61.0, 59.0, 35.0, 36.0, 27.0, 19.0, 22.0, 12.0, 8.0, 13.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.306954383850098, -6.050226211547852, -5.793498516082764, -5.536770343780518, -5.28004264831543, -5.023314476013184, -4.7665863037109375, -4.509858131408691, -4.2531304359436035, -3.9964025020599365, -3.7396745681762695, -3.4829463958740234, -3.2262184619903564, -2.9694905281066895, -2.7127623558044434, -2.4560344219207764, -2.1993064880371094, -1.9425785541534424, -1.6858505010604858, -1.4291224479675293, -1.1723945140838623, -0.9156665802001953, -0.6589385271072388, -0.4022104740142822, -0.14548254013061523, 0.11124545335769653, 0.3679734468460083, 0.6247014403343201, 0.8814294338226318, 1.1381573677062988, 1.3948854207992554, 1.651613473892212, 1.9083423614501953, 2.1650702953338623, 2.4217982292175293, 2.6785264015197754, 2.9352543354034424, 3.1919822692871094, 3.4487104415893555, 3.7054383754730225, 3.9621663093566895, 4.2188944816589355, 4.475622177124023, 4.7323503494262695, 4.989078521728516, 5.2458062171936035, 5.50253438949585, 5.7592620849609375, 6.015990257263184, 6.27271842956543, 6.529446125030518, 6.786174297332764, 7.042901992797852, 7.299630165100098, 7.556358337402344, 7.81308650970459, 8.069814682006836, 8.326542854309082, 8.583271026611328, 8.839998245239258, 9.096726417541504, 9.35345458984375, 9.610182762145996, 9.866910934448242, 10.123638153076172]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 6.0, 7.0, 6.0, 13.0, 7.0, 16.0, 18.0, 14.0, 8.0, 17.0, 17.0, 24.0, 22.0, 28.0, 33.0, 37.0, 43.0, 36.0, 51.0, 49.0, 43.0, 36.0, 38.0, 43.0, 54.0, 37.0, 29.0, 30.0, 27.0, 28.0, 31.0, 20.0, 19.0, 22.0, 16.0, 10.0, 13.0, 6.0, 4.0, 7.0, 10.0, 2.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.508697509765625, -32.48554229736328, -31.46238899230957, -30.43923568725586, -29.41608238220215, -28.392929077148438, -27.369773864746094, -26.346620559692383, -25.323467254638672, -24.30031394958496, -23.277158737182617, -22.254005432128906, -21.230852127075195, -20.207698822021484, -19.18454360961914, -18.16139030456543, -17.138235092163086, -16.115081787109375, -15.091927528381348, -14.06877326965332, -13.04561996459961, -12.022465705871582, -10.999311447143555, -9.976158142089844, -8.953003883361816, -7.929850101470947, -6.906696319580078, -5.883542060852051, -4.860388278961182, -3.8372344970703125, -2.814080238342285, -1.790926456451416, -0.7677726745605469, 0.2553812265396118, 1.2785351276397705, 2.3016891479492188, 3.324842929840088, 4.347996711730957, 5.371150970458984, 6.3943047523498535, 7.417458534240723, 8.44061279296875, 9.463766098022461, 10.486920356750488, 11.510074615478516, 12.533227920532227, 13.556382179260254, 14.579536437988281, 15.602689743041992, 16.625843048095703, 17.648998260498047, 18.672151565551758, 19.69530487060547, 20.718460083007812, 21.741613388061523, 22.764766693115234, 23.787921905517578, 24.81107521057129, 25.834230422973633, 26.857383728027344, 27.880537033081055, 28.903690338134766, 29.92684555053711, 30.94999885559082, 31.97315216064453]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 14.0, 11.0, 16.0, 17.0, 16.0, 29.0, 15.0, 33.0, 21.0, 20.0, 46.0, 46.0, 48.0, 58.0, 41.0, 37.0, 40.0, 55.0, 45.0, 38.0, 39.0, 40.0, 33.0, 25.0, 37.0, 23.0, 23.0, 19.0, 19.0, 21.0, 13.0, 11.0, 10.0, 3.0, 8.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.689453125, -3.576385498046875, -3.46331787109375, -3.350250244140625, -3.2371826171875, -3.124114990234375, -3.01104736328125, -2.897979736328125, -2.784912109375, -2.671844482421875, -2.55877685546875, -2.445709228515625, -2.3326416015625, -2.219573974609375, -2.10650634765625, -1.993438720703125, -1.88037109375, -1.767303466796875, -1.65423583984375, -1.541168212890625, -1.4281005859375, -1.315032958984375, -1.20196533203125, -1.088897705078125, -0.975830078125, -0.862762451171875, -0.74969482421875, -0.636627197265625, -0.5235595703125, -0.410491943359375, -0.29742431640625, -0.184356689453125, -0.0712890625, 0.041778564453125, 0.15484619140625, 0.267913818359375, 0.3809814453125, 0.494049072265625, 0.60711669921875, 0.720184326171875, 0.833251953125, 0.946319580078125, 1.05938720703125, 1.172454833984375, 1.2855224609375, 1.398590087890625, 1.51165771484375, 1.624725341796875, 1.73779296875, 1.850860595703125, 1.96392822265625, 2.076995849609375, 2.1900634765625, 2.303131103515625, 2.41619873046875, 2.529266357421875, 2.642333984375, 2.755401611328125, 2.86846923828125, 2.981536865234375, 3.0946044921875, 3.207672119140625, 3.32073974609375, 3.433807373046875, 3.546875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 2.0, 6.0, 9.0, 12.0, 19.0, 24.0, 35.0, 50.0, 77.0, 123.0, 195.0, 224.0, 358.0, 554.0, 943.0, 1540.0, 2605.0, 4484.0, 7708.0, 14194.0, 27162.0, 54490.0, 112907.0, 243235.0, 518989.0, 939864.0, 1046830.0, 638078.0, 302231.0, 139106.0, 65797.0, 32727.0, 17128.0, 9361.0, 5122.0, 3052.0, 1831.0, 1096.0, 699.0, 440.0, 295.0, 203.0, 142.0, 99.0, 78.0, 46.0, 35.0, 26.0, 11.0, 18.0, 7.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.759765625, -2.665069580078125, -2.57037353515625, -2.475677490234375, -2.3809814453125, -2.286285400390625, -2.19158935546875, -2.096893310546875, -2.002197265625, -1.907501220703125, -1.81280517578125, -1.718109130859375, -1.6234130859375, -1.528717041015625, -1.43402099609375, -1.339324951171875, -1.24462890625, -1.149932861328125, -1.05523681640625, -0.960540771484375, -0.8658447265625, -0.771148681640625, -0.67645263671875, -0.581756591796875, -0.487060546875, -0.392364501953125, -0.29766845703125, -0.202972412109375, -0.1082763671875, -0.013580322265625, 0.08111572265625, 0.175811767578125, 0.2705078125, 0.365203857421875, 0.45989990234375, 0.554595947265625, 0.6492919921875, 0.743988037109375, 0.83868408203125, 0.933380126953125, 1.028076171875, 1.122772216796875, 1.21746826171875, 1.312164306640625, 1.4068603515625, 1.501556396484375, 1.59625244140625, 1.690948486328125, 1.78564453125, 1.880340576171875, 1.97503662109375, 2.069732666015625, 2.1644287109375, 2.259124755859375, 2.35382080078125, 2.448516845703125, 2.543212890625, 2.637908935546875, 2.73260498046875, 2.827301025390625, 2.9219970703125, 3.016693115234375, 3.11138916015625, 3.206085205078125, 3.30078125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 8.0, 11.0, 13.0, 25.0, 22.0, 36.0, 52.0, 72.0, 80.0, 101.0, 142.0, 161.0, 233.0, 298.0, 368.0, 411.0, 363.0, 381.0, 254.0, 251.0, 188.0, 158.0, 109.0, 76.0, 66.0, 49.0, 35.0, 30.0, 20.0, 16.0, 8.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.287841796875, -6.10302734375, -5.918212890625, -5.7333984375, -5.548583984375, -5.36376953125, -5.178955078125, -4.994140625, -4.809326171875, -4.62451171875, -4.439697265625, -4.2548828125, -4.070068359375, -3.88525390625, -3.700439453125, -3.515625, -3.330810546875, -3.14599609375, -2.961181640625, -2.7763671875, -2.591552734375, -2.40673828125, -2.221923828125, -2.037109375, -1.852294921875, -1.66748046875, -1.482666015625, -1.2978515625, -1.113037109375, -0.92822265625, -0.743408203125, -0.55859375, -0.373779296875, -0.18896484375, -0.004150390625, 0.1806640625, 0.365478515625, 0.55029296875, 0.735107421875, 0.919921875, 1.104736328125, 1.28955078125, 1.474365234375, 1.6591796875, 1.843994140625, 2.02880859375, 2.213623046875, 2.3984375, 2.583251953125, 2.76806640625, 2.952880859375, 3.1376953125, 3.322509765625, 3.50732421875, 3.692138671875, 3.876953125, 4.061767578125, 4.24658203125, 4.431396484375, 4.6162109375, 4.801025390625, 4.98583984375, 5.170654296875, 5.35546875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 14.0, 15.0, 24.0, 29.0, 26.0, 47.0, 71.0, 84.0, 155.0, 199.0, 266.0, 414.0, 847.0, 3799.0, 75856.0, 3071180.0, 1015013.0, 22550.0, 1896.0, 616.0, 328.0, 224.0, 151.0, 113.0, 86.0, 72.0, 59.0, 39.0, 19.0, 18.0, 15.0, 14.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -16.9228515625, -16.267578125, -15.6123046875, -14.95703125, -14.3017578125, -13.646484375, -12.9912109375, -12.3359375, -11.6806640625, -11.025390625, -10.3701171875, -9.71484375, -9.0595703125, -8.404296875, -7.7490234375, -7.09375, -6.4384765625, -5.783203125, -5.1279296875, -4.47265625, -3.8173828125, -3.162109375, -2.5068359375, -1.8515625, -1.1962890625, -0.541015625, 0.1142578125, 0.76953125, 1.4248046875, 2.080078125, 2.7353515625, 3.390625, 4.0458984375, 4.701171875, 5.3564453125, 6.01171875, 6.6669921875, 7.322265625, 7.9775390625, 8.6328125, 9.2880859375, 9.943359375, 10.5986328125, 11.25390625, 11.9091796875, 12.564453125, 13.2197265625, 13.875, 14.5302734375, 15.185546875, 15.8408203125, 16.49609375, 17.1513671875, 17.806640625, 18.4619140625, 19.1171875, 19.7724609375, 20.427734375, 21.0830078125, 21.73828125, 22.3935546875, 23.048828125, 23.7041015625, 24.359375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 46.0, 64.0, 163.0, 291.0, 220.0, 140.0, 58.0, 18.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.3547592163086, -108.04390716552734, -105.73304748535156, -103.42219543457031, -101.11134338378906, -98.80049133300781, -96.48963928222656, -94.17877960205078, -91.86792755126953, -89.55707550048828, -87.2462158203125, -84.93536376953125, -82.62451171875, -80.31365966796875, -78.0028076171875, -75.69194793701172, -73.38109588623047, -71.07024383544922, -68.75938415527344, -66.44853210449219, -64.13768005371094, -61.82682800292969, -59.51597213745117, -57.205116271972656, -54.894264221191406, -52.583412170410156, -50.27255630493164, -47.961700439453125, -45.650848388671875, -43.339996337890625, -41.02914047241211, -38.718284606933594, -36.40742874145508, -34.09657287597656, -31.785720825195312, -29.47486686706543, -27.164012908935547, -24.853158950805664, -22.54230499267578, -20.2314510345459, -17.920597076416016, -15.609743118286133, -13.29888916015625, -10.988035202026367, -8.677181243896484, -6.366327285766602, -4.055473327636719, -1.744619369506836, 0.5662345886230469, 2.8770885467529297, 5.1879425048828125, 7.498796463012695, 9.809650421142578, 12.120504379272461, 14.431358337402344, 16.742212295532227, 19.05306625366211, 21.363920211791992, 23.674774169921875, 25.985628128051758, 28.29648208618164, 30.607336044311523, 32.918190002441406, 35.229042053222656, 37.53989791870117]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 8.0, 7.0, 1.0, 7.0, 9.0, 3.0, 17.0, 21.0, 14.0, 17.0, 30.0, 14.0, 28.0, 40.0, 42.0, 35.0, 36.0, 33.0, 41.0, 62.0, 36.0, 42.0, 32.0, 39.0, 45.0, 38.0, 39.0, 28.0, 38.0, 37.0, 27.0, 23.0, 22.0, 14.0, 15.0, 12.0, 12.0, 13.0, 6.0, 6.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.601394653320312, -20.906360626220703, -20.211326599121094, -19.516292572021484, -18.821258544921875, -18.126224517822266, -17.431190490722656, -16.736156463623047, -16.041122436523438, -15.346088409423828, -14.651054382324219, -13.95602035522461, -13.260986328125, -12.56595230102539, -11.870919227600098, -11.175885200500488, -10.480852127075195, -9.785818099975586, -9.090784072875977, -8.395750045776367, -7.700716495513916, -7.005682468414307, -6.3106489181518555, -5.615614891052246, -4.920580863952637, -4.225546836853027, -3.530513048171997, -2.835479259490967, -2.1404452323913574, -1.445411205291748, -0.7503776550292969, -0.0553436279296875, 0.6396903991699219, 1.3347243070602417, 2.0297582149505615, 2.724792003631592, 3.419826030731201, 4.1148600578308105, 4.809893608093262, 5.504927635192871, 6.1999616622924805, 6.89499568939209, 7.590029716491699, 8.285062789916992, 8.980096817016602, 9.675130844116211, 10.37016487121582, 11.06519889831543, 11.760232925415039, 12.455266952514648, 13.150300979614258, 13.845335006713867, 14.540369033813477, 15.235403060913086, 15.930436134338379, 16.625469207763672, 17.32050323486328, 18.01553726196289, 18.7105712890625, 19.40560531616211, 20.10063934326172, 20.795673370361328, 21.490707397460938, 22.185741424560547, 22.880775451660156]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 10.0, 5.0, 20.0, 17.0, 12.0, 16.0, 27.0, 26.0, 23.0, 30.0, 33.0, 44.0, 43.0, 48.0, 55.0, 43.0, 46.0, 41.0, 49.0, 38.0, 33.0, 28.0, 42.0, 41.0, 23.0, 16.0, 27.0, 22.0, 20.0, 19.0, 16.0, 13.0, 11.0, 11.0, 4.0, 7.0, 8.0, 8.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.453125, -3.34539794921875, -3.2376708984375, -3.12994384765625, -3.022216796875, -2.91448974609375, -2.8067626953125, -2.69903564453125, -2.59130859375, -2.48358154296875, -2.3758544921875, -2.26812744140625, -2.160400390625, -2.05267333984375, -1.9449462890625, -1.83721923828125, -1.7294921875, -1.62176513671875, -1.5140380859375, -1.40631103515625, -1.298583984375, -1.19085693359375, -1.0831298828125, -0.97540283203125, -0.86767578125, -0.75994873046875, -0.6522216796875, -0.54449462890625, -0.436767578125, -0.32904052734375, -0.2213134765625, -0.11358642578125, -0.005859375, 0.10186767578125, 0.2095947265625, 0.31732177734375, 0.425048828125, 0.53277587890625, 0.6405029296875, 0.74822998046875, 0.85595703125, 0.96368408203125, 1.0714111328125, 1.17913818359375, 1.286865234375, 1.39459228515625, 1.5023193359375, 1.61004638671875, 1.7177734375, 1.82550048828125, 1.9332275390625, 2.04095458984375, 2.148681640625, 2.25640869140625, 2.3641357421875, 2.47186279296875, 2.57958984375, 2.68731689453125, 2.7950439453125, 2.90277099609375, 3.010498046875, 3.11822509765625, 3.2259521484375, 3.33367919921875, 3.44140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 6.0, 6.0, 12.0, 7.0, 17.0, 24.0, 40.0, 34.0, 57.0, 70.0, 110.0, 156.0, 235.0, 278.0, 427.0, 571.0, 733.0, 1010.0, 1502.0, 2077.0, 2975.0, 4073.0, 5724.0, 8168.0, 11353.0, 16617.0, 24255.0, 36892.0, 57943.0, 100492.0, 214216.0, 250894.0, 115610.0, 64699.0, 40513.0, 26310.0, 17838.0, 12413.0, 8599.0, 6248.0, 4365.0, 3054.0, 2276.0, 1587.0, 1103.0, 810.0, 616.0, 456.0, 299.0, 234.0, 156.0, 109.0, 79.0, 49.0, 54.0, 44.0, 26.0, 17.0, 13.0, 7.0, 8.0, 3.0, 3.0], "bins": [-0.0232696533203125, -0.02254486083984375, -0.021820068359375, -0.02109527587890625, -0.0203704833984375, -0.01964569091796875, -0.0189208984375, -0.01819610595703125, -0.0174713134765625, -0.01674652099609375, -0.016021728515625, -0.01529693603515625, -0.0145721435546875, -0.01384735107421875, -0.01312255859375, -0.01239776611328125, -0.0116729736328125, -0.01094818115234375, -0.010223388671875, -0.00949859619140625, -0.0087738037109375, -0.00804901123046875, -0.00732421875, -0.00659942626953125, -0.0058746337890625, -0.00514984130859375, -0.004425048828125, -0.00370025634765625, -0.0029754638671875, -0.00225067138671875, -0.00152587890625, -0.00080108642578125, -7.62939453125e-05, 0.00064849853515625, 0.001373291015625, 0.00209808349609375, 0.0028228759765625, 0.00354766845703125, 0.0042724609375, 0.00499725341796875, 0.0057220458984375, 0.00644683837890625, 0.007171630859375, 0.00789642333984375, 0.0086212158203125, 0.00934600830078125, 0.01007080078125, 0.01079559326171875, 0.0115203857421875, 0.01224517822265625, 0.012969970703125, 0.01369476318359375, 0.0144195556640625, 0.01514434814453125, 0.015869140625, 0.01659393310546875, 0.0173187255859375, 0.01804351806640625, 0.018768310546875, 0.01949310302734375, 0.0202178955078125, 0.02094268798828125, 0.02166748046875, 0.02239227294921875, 0.0231170654296875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 4.0, 11.0, 12.0, 4.0, 14.0, 10.0, 14.0, 18.0, 20.0, 25.0, 17.0, 26.0, 25.0, 36.0, 30.0, 38.0, 49.0, 37.0, 37.0, 42.0, 1069.0, 57.0, 41.0, 41.0, 35.0, 46.0, 33.0, 34.0, 18.0, 28.0, 24.0, 16.0, 16.0, 14.0, 7.0, 14.0, 12.0, 10.0, 9.0, 9.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-2.34765625, -2.27972412109375, -2.2117919921875, -2.14385986328125, -2.075927734375, -2.00799560546875, -1.9400634765625, -1.87213134765625, -1.80419921875, -1.73626708984375, -1.6683349609375, -1.60040283203125, -1.532470703125, -1.46453857421875, -1.3966064453125, -1.32867431640625, -1.2607421875, -1.19281005859375, -1.1248779296875, -1.05694580078125, -0.989013671875, -0.92108154296875, -0.8531494140625, -0.78521728515625, -0.71728515625, -0.64935302734375, -0.5814208984375, -0.51348876953125, -0.445556640625, -0.37762451171875, -0.3096923828125, -0.24176025390625, -0.173828125, -0.10589599609375, -0.0379638671875, 0.02996826171875, 0.097900390625, 0.16583251953125, 0.2337646484375, 0.30169677734375, 0.36962890625, 0.43756103515625, 0.5054931640625, 0.57342529296875, 0.641357421875, 0.70928955078125, 0.7772216796875, 0.84515380859375, 0.9130859375, 0.98101806640625, 1.0489501953125, 1.11688232421875, 1.184814453125, 1.25274658203125, 1.3206787109375, 1.38861083984375, 1.45654296875, 1.52447509765625, 1.5924072265625, 1.66033935546875, 1.728271484375, 1.79620361328125, 1.8641357421875, 1.93206787109375, 2.0]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 11.0, 6.0, 17.0, 31.0, 40.0, 59.0, 79.0, 137.0, 180.0, 268.0, 387.0, 499.0, 753.0, 1013.0, 1388.0, 1959.0, 2695.0, 3751.0, 5149.0, 7263.0, 10307.0, 14793.0, 22078.0, 33793.0, 54397.0, 93807.0, 203509.0, 1325036.0, 122802.0, 66465.0, 40933.0, 25820.0, 17161.0, 11837.0, 8150.0, 5807.0, 4179.0, 2995.0, 2136.0, 1589.0, 1164.0, 817.0, 555.0, 410.0, 275.0, 195.0, 151.0, 103.0, 62.0, 48.0, 25.0, 25.0, 14.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01605224609375, -0.015537738800048828, -0.015023231506347656, -0.014508724212646484, -0.013994216918945312, -0.01347970962524414, -0.012965202331542969, -0.012450695037841797, -0.011936187744140625, -0.011421680450439453, -0.010907173156738281, -0.01039266586303711, -0.009878158569335938, -0.009363651275634766, -0.008849143981933594, -0.008334636688232422, -0.00782012939453125, -0.007305622100830078, -0.006791114807128906, -0.006276607513427734, -0.0057621002197265625, -0.005247592926025391, -0.004733085632324219, -0.004218578338623047, -0.003704071044921875, -0.003189563751220703, -0.0026750564575195312, -0.0021605491638183594, -0.0016460418701171875, -0.0011315345764160156, -0.0006170272827148438, -0.00010251998901367188, 0.0004119873046875, 0.0009264945983886719, 0.0014410018920898438, 0.0019555091857910156, 0.0024700164794921875, 0.0029845237731933594, 0.0034990310668945312, 0.004013538360595703, 0.004528045654296875, 0.005042552947998047, 0.005557060241699219, 0.006071567535400391, 0.0065860748291015625, 0.007100582122802734, 0.007615089416503906, 0.008129596710205078, 0.00864410400390625, 0.009158611297607422, 0.009673118591308594, 0.010187625885009766, 0.010702133178710938, 0.01121664047241211, 0.011731147766113281, 0.012245655059814453, 0.012760162353515625, 0.013274669647216797, 0.013789176940917969, 0.01430368423461914, 0.014818191528320312, 0.015332698822021484, 0.015847206115722656, 0.016361713409423828, 0.016876220703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 158.0, 0.0, 0.0, 0.0, 0.0, 499.0, 0.0, 0.0, 0.0, 0.0, 168.0, 0.0, 0.0, 0.0, 0.0, 61.0, 0.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 9.0, 12.0, 2.0, 4.0, 3.0, 10.0, 40.0, 20.0, 6.0, 23.0, 45.0, 124.0, 132.0, 132.0, 598.0, 13189.0, 988374.0, 44684.0, 620.0, 130.0, 69.0, 152.0, 46.0, 24.0, 4.0, 14.0, 22.0, 16.0, 5.0, 4.0, 3.0, 12.0, 9.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.404254913330078e-06, -8.153729140758514e-06, -7.90320336818695e-06, -7.652677595615387e-06, -7.402151823043823e-06, -7.1516260504722595e-06, -6.901100277900696e-06, -6.650574505329132e-06, -6.400048732757568e-06, -6.149522960186005e-06, -5.898997187614441e-06, -5.648471415042877e-06, -5.3979456424713135e-06, -5.14741986989975e-06, -4.896894097328186e-06, -4.646368324756622e-06, -4.395842552185059e-06, -4.145316779613495e-06, -3.894791007041931e-06, -3.6442652344703674e-06, -3.3937394618988037e-06, -3.14321368932724e-06, -2.8926879167556763e-06, -2.6421621441841125e-06, -2.391636371612549e-06, -2.141110599040985e-06, -1.8905848264694214e-06, -1.6400590538978577e-06, -1.389533281326294e-06, -1.1390075087547302e-06, -8.884817361831665e-07, -6.379559636116028e-07, -3.8743019104003906e-07, -1.3690441846847534e-07, 1.1362135410308838e-07, 3.641471266746521e-07, 6.146728992462158e-07, 8.651986718177795e-07, 1.1157244443893433e-06, 1.366250216960907e-06, 1.6167759895324707e-06, 1.8673017621040344e-06, 2.117827534675598e-06, 2.368353307247162e-06, 2.6188790798187256e-06, 2.8694048523902893e-06, 3.119930624961853e-06, 3.3704563975334167e-06, 3.6209821701049805e-06, 3.871507942676544e-06, 4.122033715248108e-06, 4.372559487819672e-06, 4.623085260391235e-06, 4.873611032962799e-06, 5.124136805534363e-06, 5.3746625781059265e-06, 5.62518835067749e-06, 5.875714123249054e-06, 6.126239895820618e-06, 6.376765668392181e-06, 6.627291440963745e-06, 6.877817213535309e-06, 7.1283429861068726e-06, 7.378868758678436e-06, 7.62939453125e-06]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 12.0, 42.0, 59.0, 700.0, 82.0, 61.0, 43.0, 12.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.262035766558256e-06, -1.2390503343340242e-06, -1.2160649021097925e-06, -1.1930795835723984e-06, -1.1700941513481666e-06, -1.1471087191239349e-06, -1.124123286899703e-06, -1.1011378546754713e-06, -1.0781525361380773e-06, -1.0551671039138455e-06, -1.0321816716896137e-06, -1.0091963531522197e-06, -9.86210920927988e-07, -9.632254887037561e-07, -9.402400564795244e-07, -9.172546242552926e-07, -8.942691920310608e-07, -8.71283759806829e-07, -8.482983844260161e-07, -8.253129522017844e-07, -8.023275768209714e-07, -7.793421445967397e-07, -7.563567123725079e-07, -7.333712801482761e-07, -7.103859047674632e-07, -6.874004725432314e-07, -6.644150971624185e-07, -6.414296649381868e-07, -6.18444232713955e-07, -5.954588573331421e-07, -5.724734251089103e-07, -5.494880497280974e-07, -5.265026175038656e-07, -5.035171852796338e-07, -4.805318098988209e-07, -4.5754637767458917e-07, -4.345609738720668e-07, -4.115755700695445e-07, -3.885901378453127e-07, -3.6560473404279037e-07, -3.4261933024026803e-07, -3.196339264377457e-07, -2.9664852263522334e-07, -2.7366309041099157e-07, -2.5067768660846923e-07, -2.276922828059469e-07, -2.0470686479256983e-07, -1.8172144677919277e-07, -1.5873602876581572e-07, -1.3575061075243866e-07, -1.1276520694991632e-07, -8.977979604196662e-08, -6.679438513401692e-08, -4.380897422606722e-08, -2.0823563318117522e-08, 2.1618546952595352e-09, 2.5147258497781877e-08, 4.8132669405731576e-08, 7.111808031368128e-08, 9.410349122163097e-08, 1.1708890212958067e-07, 1.4007432014295773e-07, 1.6305972394548007e-07, 1.8604514195885713e-07, 2.0903054576137947e-07]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 156.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 636.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 180.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 10.0, 5.0, 20.0, 17.0, 12.0, 16.0, 27.0, 26.0, 23.0, 30.0, 33.0, 44.0, 43.0, 48.0, 55.0, 43.0, 46.0, 41.0, 49.0, 38.0, 33.0, 28.0, 42.0, 41.0, 23.0, 16.0, 27.0, 22.0, 20.0, 19.0, 16.0, 13.0, 11.0, 11.0, 4.0, 7.0, 8.0, 8.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.453125, -3.34539794921875, -3.2376708984375, -3.12994384765625, -3.022216796875, -2.91448974609375, -2.8067626953125, -2.69903564453125, -2.59130859375, -2.48358154296875, -2.3758544921875, -2.26812744140625, -2.160400390625, -2.05267333984375, -1.9449462890625, -1.83721923828125, -1.7294921875, -1.62176513671875, -1.5140380859375, -1.40631103515625, -1.298583984375, -1.19085693359375, -1.0831298828125, -0.97540283203125, -0.86767578125, -0.75994873046875, -0.6522216796875, -0.54449462890625, -0.436767578125, -0.32904052734375, -0.2213134765625, -0.11358642578125, -0.005859375, 0.10186767578125, 0.2095947265625, 0.31732177734375, 0.425048828125, 0.53277587890625, 0.6405029296875, 0.74822998046875, 0.85595703125, 0.96368408203125, 1.0714111328125, 1.17913818359375, 1.286865234375, 1.39459228515625, 1.5023193359375, 1.61004638671875, 1.7177734375, 1.82550048828125, 1.9332275390625, 2.04095458984375, 2.148681640625, 2.25640869140625, 2.3641357421875, 2.47186279296875, 2.57958984375, 2.68731689453125, 2.7950439453125, 2.90277099609375, 3.010498046875, 3.11822509765625, 3.2259521484375, 3.33367919921875, 3.44140625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 6.0, 15.0, 7.0, 40.0, 85.0, 157.0, 290.0, 484.0, 930.0, 1699.0, 3107.0, 5510.0, 10207.0, 18712.0, 36349.0, 75511.0, 174490.0, 331406.0, 210514.0, 89286.0, 42161.0, 21824.0, 11637.0, 6482.0, 3438.0, 1928.0, 1116.0, 523.0, 291.0, 173.0, 94.0, 46.0, 16.0, 10.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76953125, -3.6539306640625, -3.538330078125, -3.4227294921875, -3.30712890625, -3.1915283203125, -3.075927734375, -2.9603271484375, -2.8447265625, -2.7291259765625, -2.613525390625, -2.4979248046875, -2.38232421875, -2.2667236328125, -2.151123046875, -2.0355224609375, -1.919921875, -1.8043212890625, -1.688720703125, -1.5731201171875, -1.45751953125, -1.3419189453125, -1.226318359375, -1.1107177734375, -0.9951171875, -0.8795166015625, -0.763916015625, -0.6483154296875, -0.53271484375, -0.4171142578125, -0.301513671875, -0.1859130859375, -0.0703125, 0.0452880859375, 0.160888671875, 0.2764892578125, 0.39208984375, 0.5076904296875, 0.623291015625, 0.7388916015625, 0.8544921875, 0.9700927734375, 1.085693359375, 1.2012939453125, 1.31689453125, 1.4324951171875, 1.548095703125, 1.6636962890625, 1.779296875, 1.8948974609375, 2.010498046875, 2.1260986328125, 2.24169921875, 2.3572998046875, 2.472900390625, 2.5885009765625, 2.7041015625, 2.8197021484375, 2.935302734375, 3.0509033203125, 3.16650390625, 3.2821044921875, 3.397705078125, 3.5133056640625, 3.62890625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 7.0, 4.0, 11.0, 16.0, 8.0, 13.0, 18.0, 22.0, 21.0, 27.0, 34.0, 38.0, 28.0, 43.0, 47.0, 60.0, 76.0, 137.0, 333.0, 1420.0, 187.0, 75.0, 62.0, 47.0, 40.0, 21.0, 34.0, 34.0, 28.0, 19.0, 24.0, 12.0, 14.0, 19.0, 7.0, 11.0, 11.0, 6.0, 7.0, 7.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9375, -10.5867919921875, -10.236083984375, -9.8853759765625, -9.53466796875, -9.1839599609375, -8.833251953125, -8.4825439453125, -8.1318359375, -7.7811279296875, -7.430419921875, -7.0797119140625, -6.72900390625, -6.3782958984375, -6.027587890625, -5.6768798828125, -5.326171875, -4.9754638671875, -4.624755859375, -4.2740478515625, -3.92333984375, -3.5726318359375, -3.221923828125, -2.8712158203125, -2.5205078125, -2.1697998046875, -1.819091796875, -1.4683837890625, -1.11767578125, -0.7669677734375, -0.416259765625, -0.0655517578125, 0.28515625, 0.6358642578125, 0.986572265625, 1.3372802734375, 1.68798828125, 2.0386962890625, 2.389404296875, 2.7401123046875, 3.0908203125, 3.4415283203125, 3.792236328125, 4.1429443359375, 4.49365234375, 4.8443603515625, 5.195068359375, 5.5457763671875, 5.896484375, 6.2471923828125, 6.597900390625, 6.9486083984375, 7.29931640625, 7.6500244140625, 8.000732421875, 8.3514404296875, 8.7021484375, 9.0528564453125, 9.403564453125, 9.7542724609375, 10.10498046875, 10.4556884765625, 10.806396484375, 11.1571044921875, 11.5078125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 10.0, 8.0, 7.0, 11.0, 10.0, 14.0, 18.0, 23.0, 25.0, 39.0, 51.0, 63.0, 73.0, 113.0, 134.0, 186.0, 286.0, 612.0, 3040.0, 26866.0, 566796.0, 2459661.0, 78139.0, 7055.0, 1086.0, 397.0, 266.0, 150.0, 134.0, 107.0, 70.0, 55.0, 37.0, 41.0, 23.0, 20.0, 11.0, 16.0, 15.0, 7.0, 5.0, 5.0, 8.0, 6.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.0078125, -14.5418701171875, -14.075927734375, -13.6099853515625, -13.14404296875, -12.6781005859375, -12.212158203125, -11.7462158203125, -11.2802734375, -10.8143310546875, -10.348388671875, -9.8824462890625, -9.41650390625, -8.9505615234375, -8.484619140625, -8.0186767578125, -7.552734375, -7.0867919921875, -6.620849609375, -6.1549072265625, -5.68896484375, -5.2230224609375, -4.757080078125, -4.2911376953125, -3.8251953125, -3.3592529296875, -2.893310546875, -2.4273681640625, -1.96142578125, -1.4954833984375, -1.029541015625, -0.5635986328125, -0.09765625, 0.3682861328125, 0.834228515625, 1.3001708984375, 1.76611328125, 2.2320556640625, 2.697998046875, 3.1639404296875, 3.6298828125, 4.0958251953125, 4.561767578125, 5.0277099609375, 5.49365234375, 5.9595947265625, 6.425537109375, 6.8914794921875, 7.357421875, 7.8233642578125, 8.289306640625, 8.7552490234375, 9.22119140625, 9.6871337890625, 10.153076171875, 10.6190185546875, 11.0849609375, 11.5509033203125, 12.016845703125, 12.4827880859375, 12.94873046875, 13.4146728515625, 13.880615234375, 14.3465576171875, 14.8125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 424.0, 552.0, 33.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.59344482421875, -66.20903778076172, -61.824623107910156, -57.440216064453125, -53.05580520629883, -48.67139434814453, -44.2869873046875, -39.9025764465332, -35.518165588378906, -31.13375473022461, -26.749345779418945, -22.36493682861328, -17.980525970458984, -13.596115112304688, -9.211706161499023, -4.827297210693359, -0.4428863525390625, 3.941523551940918, 8.325933456420898, 12.710343360900879, 17.09475326538086, 21.479164123535156, 25.86357307434082, 30.247982025146484, 34.63239288330078, 39.01680374145508, 43.401214599609375, 47.785621643066406, 52.1700325012207, 56.554443359375, 60.93885040283203, 65.32325744628906, 69.70768737792969, 74.09209442138672, 78.47650909423828, 82.86091613769531, 87.24533081054688, 91.6297378540039, 96.01414489746094, 100.3985595703125, 104.78296661376953, 109.16737365722656, 113.55178833007812, 117.93619537353516, 122.32060241699219, 126.70501708984375, 131.0894317626953, 135.4738311767578, 139.85824584960938, 144.24266052246094, 148.62705993652344, 153.011474609375, 157.39588928222656, 161.78030395507812, 166.16470336914062, 170.5491180419922, 174.93353271484375, 179.3179473876953, 183.7023468017578, 188.08676147460938, 192.47117614746094, 196.8555908203125, 201.239990234375, 205.62440490722656, 210.00880432128906]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 3.0, 7.0, 3.0, 10.0, 10.0, 8.0, 13.0, 14.0, 16.0, 23.0, 27.0, 25.0, 31.0, 35.0, 33.0, 37.0, 51.0, 31.0, 40.0, 47.0, 37.0, 39.0, 43.0, 41.0, 37.0, 46.0, 38.0, 32.0, 39.0, 22.0, 26.0, 22.0, 17.0, 15.0, 9.0, 9.0, 7.0, 11.0, 8.0, 11.0, 4.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-27.474750518798828, -26.582067489624023, -25.68938446044922, -24.796703338623047, -23.904020309448242, -23.011337280273438, -22.118654251098633, -21.225971221923828, -20.333288192749023, -19.44060516357422, -18.547922134399414, -17.65523910522461, -16.762557983398438, -15.869874954223633, -14.977191925048828, -14.084508895874023, -13.191826820373535, -12.29914379119873, -11.406461715698242, -10.513778686523438, -9.621095657348633, -8.728412628173828, -7.83573055267334, -6.943047523498535, -6.050364971160889, -5.157682418823242, -4.2649993896484375, -3.372316837310791, -2.4796340465545654, -1.5869512557983398, -0.6942687034606934, 0.19841432571411133, 1.0910968780517578, 1.9837796688079834, 2.876462459564209, 3.7691450119018555, 4.66182804107666, 5.554510593414307, 6.447193145751953, 7.339876174926758, 8.232559204101562, 9.125242233276367, 10.017924308776855, 10.91060733795166, 11.803290367126465, 12.695972442626953, 13.588655471801758, 14.481338500976562, 15.37402057647705, 16.26670265197754, 17.159385681152344, 18.05206871032715, 18.944751739501953, 19.837434768676758, 20.730117797851562, 21.622798919677734, 22.51548194885254, 23.408164978027344, 24.30084800720215, 25.193531036376953, 26.086212158203125, 26.97889518737793, 27.871578216552734, 28.76426124572754, 29.656944274902344]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 4.0, 8.0, 9.0, 10.0, 13.0, 9.0, 17.0, 20.0, 21.0, 28.0, 31.0, 26.0, 31.0, 35.0, 23.0, 50.0, 46.0, 45.0, 60.0, 46.0, 34.0, 38.0, 40.0, 46.0, 28.0, 39.0, 33.0, 27.0, 21.0, 15.0, 19.0, 24.0, 16.0, 20.0, 12.0, 10.0, 10.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.458984375, -3.34912109375, -3.2392578125, -3.12939453125, -3.01953125, -2.90966796875, -2.7998046875, -2.68994140625, -2.580078125, -2.47021484375, -2.3603515625, -2.25048828125, -2.140625, -2.03076171875, -1.9208984375, -1.81103515625, -1.701171875, -1.59130859375, -1.4814453125, -1.37158203125, -1.26171875, -1.15185546875, -1.0419921875, -0.93212890625, -0.822265625, -0.71240234375, -0.6025390625, -0.49267578125, -0.3828125, -0.27294921875, -0.1630859375, -0.05322265625, 0.056640625, 0.16650390625, 0.2763671875, 0.38623046875, 0.49609375, 0.60595703125, 0.7158203125, 0.82568359375, 0.935546875, 1.04541015625, 1.1552734375, 1.26513671875, 1.375, 1.48486328125, 1.5947265625, 1.70458984375, 1.814453125, 1.92431640625, 2.0341796875, 2.14404296875, 2.25390625, 2.36376953125, 2.4736328125, 2.58349609375, 2.693359375, 2.80322265625, 2.9130859375, 3.02294921875, 3.1328125, 3.24267578125, 3.3525390625, 3.46240234375, 3.572265625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 0.0, 7.0, 6.0, 10.0, 9.0, 25.0, 12.0, 17.0, 16.0, 19.0, 37.0, 43.0, 87.0, 149.0, 395.0, 1105.0, 3654.0, 15209.0, 78214.0, 572869.0, 2711759.0, 696416.0, 90498.0, 17233.0, 4273.0, 1284.0, 442.0, 196.0, 97.0, 40.0, 34.0, 22.0, 21.0, 10.0, 15.0, 18.0, 11.0, 9.0, 7.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.7197265625, -7.439453125, -7.1591796875, -6.87890625, -6.5986328125, -6.318359375, -6.0380859375, -5.7578125, -5.4775390625, -5.197265625, -4.9169921875, -4.63671875, -4.3564453125, -4.076171875, -3.7958984375, -3.515625, -3.2353515625, -2.955078125, -2.6748046875, -2.39453125, -2.1142578125, -1.833984375, -1.5537109375, -1.2734375, -0.9931640625, -0.712890625, -0.4326171875, -0.15234375, 0.1279296875, 0.408203125, 0.6884765625, 0.96875, 1.2490234375, 1.529296875, 1.8095703125, 2.08984375, 2.3701171875, 2.650390625, 2.9306640625, 3.2109375, 3.4912109375, 3.771484375, 4.0517578125, 4.33203125, 4.6123046875, 4.892578125, 5.1728515625, 5.453125, 5.7333984375, 6.013671875, 6.2939453125, 6.57421875, 6.8544921875, 7.134765625, 7.4150390625, 7.6953125, 7.9755859375, 8.255859375, 8.5361328125, 8.81640625, 9.0966796875, 9.376953125, 9.6572265625, 9.9375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 11.0, 9.0, 11.0, 16.0, 16.0, 32.0, 43.0, 46.0, 70.0, 91.0, 106.0, 154.0, 186.0, 232.0, 311.0, 329.0, 444.0, 419.0, 331.0, 252.0, 222.0, 188.0, 136.0, 105.0, 79.0, 60.0, 39.0, 42.0, 28.0, 17.0, 13.0, 8.0, 7.0, 3.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-6.78125, -6.611083984375, -6.44091796875, -6.270751953125, -6.1005859375, -5.930419921875, -5.76025390625, -5.590087890625, -5.419921875, -5.249755859375, -5.07958984375, -4.909423828125, -4.7392578125, -4.569091796875, -4.39892578125, -4.228759765625, -4.05859375, -3.888427734375, -3.71826171875, -3.548095703125, -3.3779296875, -3.207763671875, -3.03759765625, -2.867431640625, -2.697265625, -2.527099609375, -2.35693359375, -2.186767578125, -2.0166015625, -1.846435546875, -1.67626953125, -1.506103515625, -1.3359375, -1.165771484375, -0.99560546875, -0.825439453125, -0.6552734375, -0.485107421875, -0.31494140625, -0.144775390625, 0.025390625, 0.195556640625, 0.36572265625, 0.535888671875, 0.7060546875, 0.876220703125, 1.04638671875, 1.216552734375, 1.38671875, 1.556884765625, 1.72705078125, 1.897216796875, 2.0673828125, 2.237548828125, 2.40771484375, 2.577880859375, 2.748046875, 2.918212890625, 3.08837890625, 3.258544921875, 3.4287109375, 3.598876953125, 3.76904296875, 3.939208984375, 4.109375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 6.0, 20.0, 19.0, 19.0, 38.0, 56.0, 72.0, 96.0, 132.0, 171.0, 299.0, 475.0, 1766.0, 19556.0, 570671.0, 3429389.0, 161775.0, 7482.0, 996.0, 387.0, 244.0, 155.0, 112.0, 106.0, 80.0, 43.0, 31.0, 26.0, 15.0, 11.0, 12.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.11865234375, -15.4560546875, -14.79345703125, -14.130859375, -13.46826171875, -12.8056640625, -12.14306640625, -11.48046875, -10.81787109375, -10.1552734375, -9.49267578125, -8.830078125, -8.16748046875, -7.5048828125, -6.84228515625, -6.1796875, -5.51708984375, -4.8544921875, -4.19189453125, -3.529296875, -2.86669921875, -2.2041015625, -1.54150390625, -0.87890625, -0.21630859375, 0.4462890625, 1.10888671875, 1.771484375, 2.43408203125, 3.0966796875, 3.75927734375, 4.421875, 5.08447265625, 5.7470703125, 6.40966796875, 7.072265625, 7.73486328125, 8.3974609375, 9.06005859375, 9.72265625, 10.38525390625, 11.0478515625, 11.71044921875, 12.373046875, 13.03564453125, 13.6982421875, 14.36083984375, 15.0234375, 15.68603515625, 16.3486328125, 17.01123046875, 17.673828125, 18.33642578125, 18.9990234375, 19.66162109375, 20.32421875, 20.98681640625, 21.6494140625, 22.31201171875, 22.974609375, 23.63720703125, 24.2998046875, 24.96240234375, 25.625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 19.0, 45.0, 122.0, 175.0, 259.0, 175.0, 128.0, 55.0, 17.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.59611129760742, -47.73607635498047, -45.87604522705078, -44.01601028442383, -42.155975341796875, -40.29594039916992, -38.43590545654297, -36.57587432861328, -34.71583938598633, -32.855804443359375, -30.995771408081055, -29.135738372802734, -27.27570343017578, -25.415668487548828, -23.555635452270508, -21.695602416992188, -19.835567474365234, -17.97553253173828, -16.11549949645996, -14.255465507507324, -12.395431518554688, -10.53539752960205, -8.675363540649414, -6.815329551696777, -4.955295562744141, -3.095261573791504, -1.2352275848388672, 0.6248064041137695, 2.4848403930664062, 4.344874382019043, 6.20490837097168, 8.064942359924316, 9.924980163574219, 11.785014152526855, 13.645048141479492, 15.505082130432129, 17.365116119384766, 19.22515106201172, 21.08518409729004, 22.94521713256836, 24.805252075195312, 26.665287017822266, 28.525320053100586, 30.385353088378906, 32.24538803100586, 34.10542297363281, 35.9654541015625, 37.82548904418945, 39.685523986816406, 41.54555892944336, 43.40559387207031, 45.265625, 47.12565994262695, 48.985694885253906, 50.845726013183594, 52.70576095581055, 54.5657958984375, 56.42583084106445, 58.285865783691406, 60.145896911621094, 62.00593185424805, 63.865966796875, 65.72599792480469, 67.5860366821289, 69.4460678100586]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 4.0, 10.0, 10.0, 12.0, 9.0, 11.0, 14.0, 12.0, 18.0, 22.0, 17.0, 29.0, 24.0, 32.0, 32.0, 33.0, 28.0, 47.0, 37.0, 32.0, 47.0, 40.0, 43.0, 39.0, 27.0, 31.0, 25.0, 31.0, 35.0, 23.0, 26.0, 24.0, 26.0, 20.0, 14.0, 26.0, 14.0, 12.0, 10.0, 10.0, 11.0, 6.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-16.023412704467773, -15.483242988586426, -14.943073272705078, -14.40290355682373, -13.862733840942383, -13.322563171386719, -12.782393455505371, -12.242223739624023, -11.702054023742676, -11.161884307861328, -10.62171459197998, -10.081544876098633, -9.541374206542969, -9.001205444335938, -8.461034774780273, -7.920865058898926, -7.380695343017578, -6.8405256271362305, -6.300355911254883, -5.760185718536377, -5.220016002655029, -4.679846286773682, -4.139676094055176, -3.599506378173828, -3.0593366622924805, -2.519166946411133, -1.978996992111206, -1.4388271570205688, -0.8986573219299316, -0.358487606048584, 0.18168234825134277, 0.7218523025512695, 1.2620220184326172, 1.8021918535232544, 2.3423616886138916, 2.8825316429138184, 3.422701358795166, 3.9628710746765137, 4.5030412673950195, 5.043210983276367, 5.583380699157715, 6.1235504150390625, 6.66372013092041, 7.203890323638916, 7.744060039520264, 8.284229278564453, 8.824399948120117, 9.364569664001465, 9.904739379882812, 10.44490909576416, 10.985078811645508, 11.525248527526855, 12.065418243408203, 12.605588912963867, 13.145758628845215, 13.685928344726562, 14.22609806060791, 14.766267776489258, 15.306437492370605, 15.846607208251953, 16.386777877807617, 16.92694664001465, 17.467117309570312, 18.007286071777344, 18.547456741333008]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 10.0, 6.0, 5.0, 11.0, 13.0, 24.0, 14.0, 22.0, 21.0, 31.0, 27.0, 29.0, 28.0, 42.0, 25.0, 49.0, 41.0, 36.0, 40.0, 35.0, 40.0, 54.0, 40.0, 40.0, 31.0, 34.0, 33.0, 35.0, 29.0, 19.0, 14.0, 18.0, 19.0, 12.0, 12.0, 12.0, 14.0, 10.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.3671875, -3.260406494140625, -3.15362548828125, -3.046844482421875, -2.9400634765625, -2.833282470703125, -2.72650146484375, -2.619720458984375, -2.512939453125, -2.406158447265625, -2.29937744140625, -2.192596435546875, -2.0858154296875, -1.979034423828125, -1.87225341796875, -1.765472412109375, -1.65869140625, -1.551910400390625, -1.44512939453125, -1.338348388671875, -1.2315673828125, -1.124786376953125, -1.01800537109375, -0.911224365234375, -0.804443359375, -0.697662353515625, -0.59088134765625, -0.484100341796875, -0.3773193359375, -0.270538330078125, -0.16375732421875, -0.056976318359375, 0.0498046875, 0.156585693359375, 0.26336669921875, 0.370147705078125, 0.4769287109375, 0.583709716796875, 0.69049072265625, 0.797271728515625, 0.904052734375, 1.010833740234375, 1.11761474609375, 1.224395751953125, 1.3311767578125, 1.437957763671875, 1.54473876953125, 1.651519775390625, 1.75830078125, 1.865081787109375, 1.97186279296875, 2.078643798828125, 2.1854248046875, 2.292205810546875, 2.39898681640625, 2.505767822265625, 2.612548828125, 2.719329833984375, 2.82611083984375, 2.932891845703125, 3.0396728515625, 3.146453857421875, 3.25323486328125, 3.360015869140625, 3.466796875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 10.0, 9.0, 9.0, 18.0, 29.0, 36.0, 64.0, 86.0, 139.0, 178.0, 288.0, 390.0, 664.0, 926.0, 1453.0, 2121.0, 3427.0, 5418.0, 8731.0, 13545.0, 21821.0, 37129.0, 65428.0, 133439.0, 357139.0, 194723.0, 84116.0, 46114.0, 26661.0, 16091.0, 10186.0, 6389.0, 4127.0, 2563.0, 1719.0, 1141.0, 765.0, 449.0, 323.0, 211.0, 154.0, 101.0, 80.0, 51.0, 24.0, 19.0, 18.0, 12.0, 6.0, 9.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0306549072265625, -0.02968764305114746, -0.028720378875732422, -0.027753114700317383, -0.026785850524902344, -0.025818586349487305, -0.024851322174072266, -0.023884057998657227, -0.022916793823242188, -0.02194952964782715, -0.02098226547241211, -0.02001500129699707, -0.01904773712158203, -0.018080472946166992, -0.017113208770751953, -0.016145944595336914, -0.015178680419921875, -0.014211416244506836, -0.013244152069091797, -0.012276887893676758, -0.011309623718261719, -0.01034235954284668, -0.00937509536743164, -0.008407831192016602, -0.0074405670166015625, -0.0064733028411865234, -0.005506038665771484, -0.004538774490356445, -0.0035715103149414062, -0.002604246139526367, -0.0016369819641113281, -0.0006697177886962891, 0.00029754638671875, 0.001264810562133789, 0.002232074737548828, 0.003199338912963867, 0.004166603088378906, 0.005133867263793945, 0.006101131439208984, 0.0070683956146240234, 0.008035659790039062, 0.009002923965454102, 0.00997018814086914, 0.01093745231628418, 0.011904716491699219, 0.012871980667114258, 0.013839244842529297, 0.014806509017944336, 0.015773773193359375, 0.016741037368774414, 0.017708301544189453, 0.018675565719604492, 0.01964282989501953, 0.02061009407043457, 0.02157735824584961, 0.02254462242126465, 0.023511886596679688, 0.024479150772094727, 0.025446414947509766, 0.026413679122924805, 0.027380943298339844, 0.028348207473754883, 0.029315471649169922, 0.03028273582458496, 0.03125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 9.0, 5.0, 11.0, 9.0, 29.0, 12.0, 21.0, 15.0, 28.0, 22.0, 33.0, 37.0, 30.0, 25.0, 38.0, 45.0, 43.0, 29.0, 39.0, 1056.0, 29.0, 35.0, 45.0, 40.0, 25.0, 36.0, 32.0, 29.0, 25.0, 23.0, 26.0, 23.0, 18.0, 17.0, 17.0, 10.0, 14.0, 8.0, 6.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.162109375, -2.096832275390625, -2.03155517578125, -1.966278076171875, -1.9010009765625, -1.835723876953125, -1.77044677734375, -1.705169677734375, -1.639892578125, -1.574615478515625, -1.50933837890625, -1.444061279296875, -1.3787841796875, -1.313507080078125, -1.24822998046875, -1.182952880859375, -1.11767578125, -1.052398681640625, -0.98712158203125, -0.921844482421875, -0.8565673828125, -0.791290283203125, -0.72601318359375, -0.660736083984375, -0.595458984375, -0.530181884765625, -0.46490478515625, -0.399627685546875, -0.3343505859375, -0.269073486328125, -0.20379638671875, -0.138519287109375, -0.0732421875, -0.007965087890625, 0.05731201171875, 0.122589111328125, 0.1878662109375, 0.253143310546875, 0.31842041015625, 0.383697509765625, 0.448974609375, 0.514251708984375, 0.57952880859375, 0.644805908203125, 0.7100830078125, 0.775360107421875, 0.84063720703125, 0.905914306640625, 0.97119140625, 1.036468505859375, 1.10174560546875, 1.167022705078125, 1.2322998046875, 1.297576904296875, 1.36285400390625, 1.428131103515625, 1.493408203125, 1.558685302734375, 1.62396240234375, 1.689239501953125, 1.7545166015625, 1.819793701171875, 1.88507080078125, 1.950347900390625, 2.015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 7.0, 11.0, 11.0, 25.0, 37.0, 37.0, 68.0, 103.0, 135.0, 221.0, 270.0, 446.0, 604.0, 859.0, 1228.0, 1739.0, 2409.0, 3448.0, 4633.0, 6683.0, 9440.0, 13042.0, 19017.0, 27437.0, 41489.0, 64752.0, 108808.0, 210966.0, 1265305.0, 111865.0, 65896.0, 42198.0, 28084.0, 19362.0, 13453.0, 9410.0, 6776.0, 4830.0, 3516.0, 2532.0, 1834.0, 1181.0, 902.0, 648.0, 430.0, 308.0, 206.0, 164.0, 96.0, 80.0, 47.0, 33.0, 24.0, 18.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0147857666015625, -0.014309167861938477, -0.013832569122314453, -0.01335597038269043, -0.012879371643066406, -0.012402772903442383, -0.01192617416381836, -0.011449575424194336, -0.010972976684570312, -0.010496377944946289, -0.010019779205322266, -0.009543180465698242, -0.009066581726074219, -0.008589982986450195, -0.008113384246826172, -0.0076367855072021484, -0.007160186767578125, -0.0066835880279541016, -0.006206989288330078, -0.005730390548706055, -0.005253791809082031, -0.004777193069458008, -0.004300594329833984, -0.003823995590209961, -0.0033473968505859375, -0.002870798110961914, -0.0023941993713378906, -0.0019176006317138672, -0.0014410018920898438, -0.0009644031524658203, -0.0004878044128417969, -1.1205673217773438e-05, 0.00046539306640625, 0.0009419918060302734, 0.0014185905456542969, 0.0018951892852783203, 0.0023717880249023438, 0.002848386764526367, 0.0033249855041503906, 0.003801584243774414, 0.0042781829833984375, 0.004754781723022461, 0.005231380462646484, 0.005707979202270508, 0.006184577941894531, 0.006661176681518555, 0.007137775421142578, 0.0076143741607666016, 0.008090972900390625, 0.008567571640014648, 0.009044170379638672, 0.009520769119262695, 0.009997367858886719, 0.010473966598510742, 0.010950565338134766, 0.011427164077758789, 0.011903762817382812, 0.012380361557006836, 0.01285696029663086, 0.013333559036254883, 0.013810157775878906, 0.01428675651550293, 0.014763355255126953, 0.015239953994750977, 0.015716552734375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 6.0, 0.0, 9.0, 0.0, 0.0, 18.0, 0.0, 0.0, 28.0, 0.0, 59.0, 0.0, 0.0, 141.0, 0.0, 0.0, 443.0, 0.0, 186.0, 0.0, 0.0, 64.0, 0.0, 0.0, 28.0, 0.0, 15.0, 0.0, 0.0, 9.0, 0.0, 0.0, 8.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07, 7.37607479095459e-07, 7.599592208862305e-07, 7.82310962677002e-07, 8.046627044677734e-07, 8.270144462585449e-07, 8.493661880493164e-07, 8.717179298400879e-07, 8.940696716308594e-07]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 4.0, 3.0, 7.0, 2.0, 9.0, 4.0, 4.0, 22.0, 12.0, 32.0, 58.0, 50.0, 287.0, 360.0, 17668.0, 1028464.0, 1023.0, 300.0, 76.0, 30.0, 60.0, 14.0, 18.0, 14.0, 6.0, 12.0, 6.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0205974578857422e-05, -1.970399171113968e-05, -1.9202008843421936e-05, -1.8700025975704193e-05, -1.819804310798645e-05, -1.7696060240268707e-05, -1.7194077372550964e-05, -1.669209450483322e-05, -1.619011163711548e-05, -1.5688128769397736e-05, -1.5186145901679993e-05, -1.468416303396225e-05, -1.4182180166244507e-05, -1.3680197298526764e-05, -1.3178214430809021e-05, -1.2676231563091278e-05, -1.2174248695373535e-05, -1.1672265827655792e-05, -1.117028295993805e-05, -1.0668300092220306e-05, -1.0166317224502563e-05, -9.66433435678482e-06, -9.162351489067078e-06, -8.660368621349335e-06, -8.158385753631592e-06, -7.656402885913849e-06, -7.154420018196106e-06, -6.652437150478363e-06, -6.15045428276062e-06, -5.648471415042877e-06, -5.146488547325134e-06, -4.644505679607391e-06, -4.1425228118896484e-06, -3.6405399441719055e-06, -3.1385570764541626e-06, -2.6365742087364197e-06, -2.1345913410186768e-06, -1.6326084733009338e-06, -1.130625605583191e-06, -6.28642737865448e-07, -1.2665987014770508e-07, 3.7532299757003784e-07, 8.773058652877808e-07, 1.3792887330055237e-06, 1.8812716007232666e-06, 2.3832544684410095e-06, 2.8852373361587524e-06, 3.3872202038764954e-06, 3.889203071594238e-06, 4.391185939311981e-06, 4.893168807029724e-06, 5.395151674747467e-06, 5.89713454246521e-06, 6.399117410182953e-06, 6.901100277900696e-06, 7.403083145618439e-06, 7.905066013336182e-06, 8.407048881053925e-06, 8.909031748771667e-06, 9.41101461648941e-06, 9.912997484207153e-06, 1.0414980351924896e-05, 1.091696321964264e-05, 1.1418946087360382e-05, 1.1920928955078125e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [6.0, 9.0, 43.0, 135.0, 737.0, 73.0, 14.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8116206490503828e-07, -1.3884476857128902e-07, -9.652747934296713e-08, -5.421019011464523e-08, -1.1892893780895974e-08, 3.042440255285328e-08, 7.274168467574782e-08, 1.1505899522035179e-07, 1.5737627734324633e-07, 1.9969357367699558e-07, 2.420108557998901e-07, 2.843281663444941e-07, 3.2664544846738863e-07, 3.6896273059028317e-07, 4.1128004113488714e-07, 4.535973516794911e-07, 4.959146053806762e-07, 5.382319159252802e-07, 5.805491696264653e-07, 6.228664801710693e-07, 6.651837907156732e-07, 7.075010444168583e-07, 7.498183549614623e-07, 7.921356655060663e-07, 8.344529760506703e-07, 8.767702865952742e-07, 9.190875402964593e-07, 9.614047939976444e-07, 1.0037221045422484e-06, 1.0460394150868524e-06, 1.0883567256314564e-06, 1.1306740361760603e-06, 1.1729913467206643e-06, 1.2153086572652683e-06, 1.2576259678098722e-06, 1.2999432783544762e-06, 1.3422604752122425e-06, 1.3845777857568464e-06, 1.4268950963014504e-06, 1.4692124068460544e-06, 1.5115297173906583e-06, 1.5538470279352623e-06, 1.5961643384798663e-06, 1.6384815353376325e-06, 1.6807988458822365e-06, 1.7231161564268405e-06, 1.7654334669714444e-06, 1.8077507775160484e-06, 1.8500679743738146e-06, 1.8923852849184186e-06, 1.9347025954630226e-06, 1.977019792320789e-06, 2.0193372165522305e-06, 2.0616544134099968e-06, 2.1039718376414385e-06, 2.1462890344992047e-06, 2.1886064587306464e-06, 2.2309236555884127e-06, 2.2732410798198543e-06, 2.3155582766776206e-06, 2.3578757009090623e-06, 2.4001928977668285e-06, 2.4425103219982702e-06, 2.4848275188560365e-06, 2.5271447157138027e-06]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 167.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 599.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 172.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 10.0, 6.0, 5.0, 11.0, 13.0, 24.0, 14.0, 22.0, 21.0, 31.0, 27.0, 29.0, 28.0, 42.0, 25.0, 49.0, 41.0, 36.0, 40.0, 35.0, 40.0, 54.0, 40.0, 40.0, 31.0, 34.0, 33.0, 35.0, 29.0, 19.0, 14.0, 18.0, 19.0, 12.0, 12.0, 12.0, 14.0, 10.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.3671875, -3.260406494140625, -3.15362548828125, -3.046844482421875, -2.9400634765625, -2.833282470703125, -2.72650146484375, -2.619720458984375, -2.512939453125, -2.406158447265625, -2.29937744140625, -2.192596435546875, -2.0858154296875, -1.979034423828125, -1.87225341796875, -1.765472412109375, -1.65869140625, -1.551910400390625, -1.44512939453125, -1.338348388671875, -1.2315673828125, -1.124786376953125, -1.01800537109375, -0.911224365234375, -0.804443359375, -0.697662353515625, -0.59088134765625, -0.484100341796875, -0.3773193359375, -0.270538330078125, -0.16375732421875, -0.056976318359375, 0.0498046875, 0.156585693359375, 0.26336669921875, 0.370147705078125, 0.4769287109375, 0.583709716796875, 0.69049072265625, 0.797271728515625, 0.904052734375, 1.010833740234375, 1.11761474609375, 1.224395751953125, 1.3311767578125, 1.437957763671875, 1.54473876953125, 1.651519775390625, 1.75830078125, 1.865081787109375, 1.97186279296875, 2.078643798828125, 2.1854248046875, 2.292205810546875, 2.39898681640625, 2.505767822265625, 2.612548828125, 2.719329833984375, 2.82611083984375, 2.932891845703125, 3.0396728515625, 3.146453857421875, 3.25323486328125, 3.360015869140625, 3.466796875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 15.0, 8.0, 12.0, 14.0, 25.0, 34.0, 32.0, 58.0, 71.0, 111.0, 192.0, 327.0, 658.0, 1438.0, 3129.0, 7314.0, 17893.0, 48706.0, 161579.0, 533461.0, 185315.0, 54168.0, 19442.0, 7963.0, 3358.0, 1509.0, 721.0, 395.0, 192.0, 119.0, 66.0, 44.0, 40.0, 42.0, 18.0, 15.0, 17.0, 16.0, 12.0, 4.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.71484375, -5.53369140625, -5.3525390625, -5.17138671875, -4.990234375, -4.80908203125, -4.6279296875, -4.44677734375, -4.265625, -4.08447265625, -3.9033203125, -3.72216796875, -3.541015625, -3.35986328125, -3.1787109375, -2.99755859375, -2.81640625, -2.63525390625, -2.4541015625, -2.27294921875, -2.091796875, -1.91064453125, -1.7294921875, -1.54833984375, -1.3671875, -1.18603515625, -1.0048828125, -0.82373046875, -0.642578125, -0.46142578125, -0.2802734375, -0.09912109375, 0.08203125, 0.26318359375, 0.4443359375, 0.62548828125, 0.806640625, 0.98779296875, 1.1689453125, 1.35009765625, 1.53125, 1.71240234375, 1.8935546875, 2.07470703125, 2.255859375, 2.43701171875, 2.6181640625, 2.79931640625, 2.98046875, 3.16162109375, 3.3427734375, 3.52392578125, 3.705078125, 3.88623046875, 4.0673828125, 4.24853515625, 4.4296875, 4.61083984375, 4.7919921875, 4.97314453125, 5.154296875, 5.33544921875, 5.5166015625, 5.69775390625, 5.87890625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 4.0, 9.0, 7.0, 9.0, 16.0, 11.0, 15.0, 15.0, 22.0, 23.0, 16.0, 34.0, 31.0, 36.0, 34.0, 40.0, 57.0, 108.0, 194.0, 1486.0, 282.0, 130.0, 86.0, 61.0, 34.0, 52.0, 35.0, 38.0, 20.0, 24.0, 24.0, 16.0, 14.0, 14.0, 15.0, 3.0, 7.0, 4.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7109375, -10.3504638671875, -9.989990234375, -9.6295166015625, -9.26904296875, -8.9085693359375, -8.548095703125, -8.1876220703125, -7.8271484375, -7.4666748046875, -7.106201171875, -6.7457275390625, -6.38525390625, -6.0247802734375, -5.664306640625, -5.3038330078125, -4.943359375, -4.5828857421875, -4.222412109375, -3.8619384765625, -3.50146484375, -3.1409912109375, -2.780517578125, -2.4200439453125, -2.0595703125, -1.6990966796875, -1.338623046875, -0.9781494140625, -0.61767578125, -0.2572021484375, 0.103271484375, 0.4637451171875, 0.82421875, 1.1846923828125, 1.545166015625, 1.9056396484375, 2.26611328125, 2.6265869140625, 2.987060546875, 3.3475341796875, 3.7080078125, 4.0684814453125, 4.428955078125, 4.7894287109375, 5.14990234375, 5.5103759765625, 5.870849609375, 6.2313232421875, 6.591796875, 6.9522705078125, 7.312744140625, 7.6732177734375, 8.03369140625, 8.3941650390625, 8.754638671875, 9.1151123046875, 9.4755859375, 9.8360595703125, 10.196533203125, 10.5570068359375, 10.91748046875, 11.2779541015625, 11.638427734375, 11.9989013671875, 12.359375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 10.0, 5.0, 5.0, 9.0, 12.0, 15.0, 21.0, 28.0, 35.0, 38.0, 47.0, 61.0, 88.0, 169.0, 222.0, 488.0, 1962.0, 20972.0, 1492117.0, 1604432.0, 21753.0, 1938.0, 518.0, 224.0, 131.0, 92.0, 64.0, 49.0, 37.0, 34.0, 29.0, 16.0, 18.0, 13.0, 13.0, 10.0, 8.0, 6.0, 2.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.0, -21.35302734375, -20.7060546875, -20.05908203125, -19.412109375, -18.76513671875, -18.1181640625, -17.47119140625, -16.82421875, -16.17724609375, -15.5302734375, -14.88330078125, -14.236328125, -13.58935546875, -12.9423828125, -12.29541015625, -11.6484375, -11.00146484375, -10.3544921875, -9.70751953125, -9.060546875, -8.41357421875, -7.7666015625, -7.11962890625, -6.47265625, -5.82568359375, -5.1787109375, -4.53173828125, -3.884765625, -3.23779296875, -2.5908203125, -1.94384765625, -1.296875, -0.64990234375, -0.0029296875, 0.64404296875, 1.291015625, 1.93798828125, 2.5849609375, 3.23193359375, 3.87890625, 4.52587890625, 5.1728515625, 5.81982421875, 6.466796875, 7.11376953125, 7.7607421875, 8.40771484375, 9.0546875, 9.70166015625, 10.3486328125, 10.99560546875, 11.642578125, 12.28955078125, 12.9365234375, 13.58349609375, 14.23046875, 14.87744140625, 15.5244140625, 16.17138671875, 16.818359375, 17.46533203125, 18.1123046875, 18.75927734375, 19.40625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 9.0, 22.0, 61.0, 124.0, 204.0, 212.0, 207.0, 103.0, 45.0, 18.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.988393783569336, -21.915363311767578, -20.84233283996582, -19.769302368164062, -18.696271896362305, -17.623241424560547, -16.550212860107422, -15.477181434631348, -14.40415096282959, -13.331120491027832, -12.258090019226074, -11.185060501098633, -10.112030029296875, -9.038999557495117, -7.965969085693359, -6.892938613891602, -5.819908142089844, -4.746877670288086, -3.6738474369049072, -2.6008172035217285, -1.5277867317199707, -0.4547562599182129, 0.6182737350463867, 1.6913042068481445, 2.7643346786499023, 3.83736515045166, 4.910395622253418, 5.983425617218018, 7.056456089019775, 8.129486083984375, 9.202516555786133, 10.27554702758789, 11.348579406738281, 12.421609878540039, 13.494640350341797, 14.567670822143555, 15.640701293945312, 16.71373176574707, 17.786762237548828, 18.859790802001953, 19.932823181152344, 21.0058536529541, 22.07888412475586, 23.151914596557617, 24.224945068359375, 25.297975540161133, 26.37100601196289, 27.444034576416016, 28.517065048217773, 29.59009552001953, 30.66312599182129, 31.736156463623047, 32.80918502807617, 33.88221740722656, 34.95524597167969, 36.02827835083008, 37.1013069152832, 38.17433547973633, 39.24736785888672, 40.320396423339844, 41.393428802490234, 42.46645736694336, 43.53948974609375, 44.612518310546875, 45.685550689697266]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 8.0, 4.0, 9.0, 5.0, 11.0, 11.0, 5.0, 8.0, 15.0, 19.0, 16.0, 20.0, 26.0, 24.0, 24.0, 29.0, 41.0, 42.0, 34.0, 45.0, 42.0, 33.0, 37.0, 37.0, 56.0, 35.0, 46.0, 37.0, 22.0, 27.0, 40.0, 20.0, 22.0, 26.0, 31.0, 15.0, 18.0, 9.0, 10.0, 9.0, 6.0, 4.0, 5.0, 6.0, 3.0, 6.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-30.072677612304688, -29.169567108154297, -28.26645851135254, -27.36334800720215, -26.460237503051758, -25.55712890625, -24.65401840209961, -23.75090789794922, -22.84779930114746, -21.94468879699707, -21.041580200195312, -20.138469696044922, -19.23535919189453, -18.332250595092773, -17.429140090942383, -16.526031494140625, -15.622920036315918, -14.719810485839844, -13.816699981689453, -12.913590431213379, -12.010480880737305, -11.107370376586914, -10.20426082611084, -9.301151275634766, -8.398040771484375, -7.494930744171143, -6.591821193695068, -5.688711166381836, -4.785601615905762, -3.8824915885925293, -2.979381561279297, -2.0762720108032227, -1.1731624603271484, -0.27005261182785034, 0.6330572366714478, 1.5361671447753906, 2.439276933670044, 3.3423867225646973, 4.24549674987793, 5.148606300354004, 6.051716327667236, 6.954826354980469, 7.857935905456543, 8.761045455932617, 9.664155960083008, 10.567265510559082, 11.470375061035156, 12.373485565185547, 13.276595115661621, 14.179704666137695, 15.082815170288086, 15.98592472076416, 16.889034271240234, 17.792144775390625, 18.695255279541016, 19.598363876342773, 20.501474380493164, 21.404584884643555, 22.307693481445312, 23.210803985595703, 24.113914489746094, 25.01702308654785, 25.920133590698242, 26.8232421875, 27.72635269165039]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 10.0, 7.0, 14.0, 11.0, 15.0, 13.0, 22.0, 20.0, 26.0, 29.0, 30.0, 45.0, 39.0, 41.0, 40.0, 43.0, 38.0, 39.0, 44.0, 39.0, 47.0, 45.0, 41.0, 41.0, 40.0, 32.0, 29.0, 21.0, 17.0, 21.0, 16.0, 16.0, 17.0, 10.0, 9.0, 7.0, 5.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.65625, -3.534912109375, -3.41357421875, -3.292236328125, -3.1708984375, -3.049560546875, -2.92822265625, -2.806884765625, -2.685546875, -2.564208984375, -2.44287109375, -2.321533203125, -2.2001953125, -2.078857421875, -1.95751953125, -1.836181640625, -1.71484375, -1.593505859375, -1.47216796875, -1.350830078125, -1.2294921875, -1.108154296875, -0.98681640625, -0.865478515625, -0.744140625, -0.622802734375, -0.50146484375, -0.380126953125, -0.2587890625, -0.137451171875, -0.01611328125, 0.105224609375, 0.2265625, 0.347900390625, 0.46923828125, 0.590576171875, 0.7119140625, 0.833251953125, 0.95458984375, 1.075927734375, 1.197265625, 1.318603515625, 1.43994140625, 1.561279296875, 1.6826171875, 1.803955078125, 1.92529296875, 2.046630859375, 2.16796875, 2.289306640625, 2.41064453125, 2.531982421875, 2.6533203125, 2.774658203125, 2.89599609375, 3.017333984375, 3.138671875, 3.260009765625, 3.38134765625, 3.502685546875, 3.6240234375, 3.745361328125, 3.86669921875, 3.988037109375, 4.109375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 10.0, 10.0, 9.0, 13.0, 20.0, 24.0, 32.0, 47.0, 68.0, 90.0, 201.0, 390.0, 875.0, 2000.0, 5406.0, 17139.0, 62000.0, 288673.0, 1596144.0, 1790431.0, 332453.0, 69618.0, 18540.0, 5982.0, 2194.0, 879.0, 423.0, 224.0, 115.0, 94.0, 50.0, 31.0, 22.0, 15.0, 17.0, 11.0, 8.0, 4.0, 8.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.296875, -7.06915283203125, -6.8414306640625, -6.61370849609375, -6.385986328125, -6.15826416015625, -5.9305419921875, -5.70281982421875, -5.47509765625, -5.24737548828125, -5.0196533203125, -4.79193115234375, -4.564208984375, -4.33648681640625, -4.1087646484375, -3.88104248046875, -3.6533203125, -3.42559814453125, -3.1978759765625, -2.97015380859375, -2.742431640625, -2.51470947265625, -2.2869873046875, -2.05926513671875, -1.83154296875, -1.60382080078125, -1.3760986328125, -1.14837646484375, -0.920654296875, -0.69293212890625, -0.4652099609375, -0.23748779296875, -0.009765625, 0.21795654296875, 0.4456787109375, 0.67340087890625, 0.901123046875, 1.12884521484375, 1.3565673828125, 1.58428955078125, 1.81201171875, 2.03973388671875, 2.2674560546875, 2.49517822265625, 2.722900390625, 2.95062255859375, 3.1783447265625, 3.40606689453125, 3.6337890625, 3.86151123046875, 4.0892333984375, 4.31695556640625, 4.544677734375, 4.77239990234375, 5.0001220703125, 5.22784423828125, 5.45556640625, 5.68328857421875, 5.9110107421875, 6.13873291015625, 6.366455078125, 6.59417724609375, 6.8218994140625, 7.04962158203125, 7.27734375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 9.0, 5.0, 10.0, 13.0, 14.0, 28.0, 28.0, 48.0, 72.0, 92.0, 113.0, 144.0, 171.0, 251.0, 297.0, 362.0, 462.0, 384.0, 359.0, 265.0, 226.0, 177.0, 133.0, 105.0, 65.0, 54.0, 38.0, 31.0, 33.0, 23.0, 15.0, 16.0, 8.0, 15.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.67578125, -5.49786376953125, -5.3199462890625, -5.14202880859375, -4.964111328125, -4.78619384765625, -4.6082763671875, -4.43035888671875, -4.25244140625, -4.07452392578125, -3.8966064453125, -3.71868896484375, -3.540771484375, -3.36285400390625, -3.1849365234375, -3.00701904296875, -2.8291015625, -2.65118408203125, -2.4732666015625, -2.29534912109375, -2.117431640625, -1.93951416015625, -1.7615966796875, -1.58367919921875, -1.40576171875, -1.22784423828125, -1.0499267578125, -0.87200927734375, -0.694091796875, -0.51617431640625, -0.3382568359375, -0.16033935546875, 0.017578125, 0.19549560546875, 0.3734130859375, 0.55133056640625, 0.729248046875, 0.90716552734375, 1.0850830078125, 1.26300048828125, 1.44091796875, 1.61883544921875, 1.7967529296875, 1.97467041015625, 2.152587890625, 2.33050537109375, 2.5084228515625, 2.68634033203125, 2.8642578125, 3.04217529296875, 3.2200927734375, 3.39801025390625, 3.575927734375, 3.75384521484375, 3.9317626953125, 4.10968017578125, 4.28759765625, 4.46551513671875, 4.6434326171875, 4.82135009765625, 4.999267578125, 5.17718505859375, 5.3551025390625, 5.53302001953125, 5.7109375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 8.0, 21.0, 22.0, 25.0, 46.0, 47.0, 70.0, 94.0, 98.0, 177.0, 274.0, 480.0, 1322.0, 5713.0, 45932.0, 646865.0, 3135797.0, 325107.0, 26186.0, 3746.0, 989.0, 412.0, 241.0, 169.0, 124.0, 90.0, 64.0, 45.0, 24.0, 19.0, 14.0, 17.0, 9.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.984375, -15.5054931640625, -15.026611328125, -14.5477294921875, -14.06884765625, -13.5899658203125, -13.111083984375, -12.6322021484375, -12.1533203125, -11.6744384765625, -11.195556640625, -10.7166748046875, -10.23779296875, -9.7589111328125, -9.280029296875, -8.8011474609375, -8.322265625, -7.8433837890625, -7.364501953125, -6.8856201171875, -6.40673828125, -5.9278564453125, -5.448974609375, -4.9700927734375, -4.4912109375, -4.0123291015625, -3.533447265625, -3.0545654296875, -2.57568359375, -2.0968017578125, -1.617919921875, -1.1390380859375, -0.66015625, -0.1812744140625, 0.297607421875, 0.7764892578125, 1.25537109375, 1.7342529296875, 2.213134765625, 2.6920166015625, 3.1708984375, 3.6497802734375, 4.128662109375, 4.6075439453125, 5.08642578125, 5.5653076171875, 6.044189453125, 6.5230712890625, 7.001953125, 7.4808349609375, 7.959716796875, 8.4385986328125, 8.91748046875, 9.3963623046875, 9.875244140625, 10.3541259765625, 10.8330078125, 11.3118896484375, 11.790771484375, 12.2696533203125, 12.74853515625, 13.2274169921875, 13.706298828125, 14.1851806640625, 14.6640625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 19.0, 109.0, 354.0, 375.0, 140.0, 16.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.09521484375, -74.55223846435547, -71.00926208496094, -67.4662857055664, -63.92331314086914, -60.38033676147461, -56.83736038208008, -53.29438781738281, -49.75141143798828, -46.20843505859375, -42.66545867919922, -39.12248229980469, -35.57950973510742, -32.03653335571289, -28.49355697631836, -24.95058250427246, -21.407604217529297, -17.864627838134766, -14.321653366088867, -10.778676986694336, -7.235701560974121, -3.6927261352539062, -0.149749755859375, 3.3932247161865234, 6.936201095581055, 10.47917652130127, 14.022151947021484, 17.565128326416016, 21.108104705810547, 24.651079177856445, 28.194055557250977, 31.737030029296875, 35.280006408691406, 38.82298278808594, 42.36595916748047, 45.908935546875, 49.451908111572266, 52.9948844909668, 56.53786087036133, 60.080833435058594, 63.623809814453125, 67.16678619384766, 70.70976257324219, 74.25273895263672, 77.79571533203125, 81.33868408203125, 84.88166809082031, 88.42463684082031, 91.96762084960938, 95.5105972290039, 99.05357360839844, 102.59654998779297, 106.1395263671875, 109.6824951171875, 113.22547912597656, 116.76844787597656, 120.3114242553711, 123.85440063476562, 127.39737701416016, 130.9403533935547, 134.4833221435547, 138.02630615234375, 141.56927490234375, 145.1122589111328, 148.6552276611328]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 4.0, 4.0, 4.0, 13.0, 6.0, 8.0, 19.0, 20.0, 19.0, 31.0, 28.0, 32.0, 30.0, 38.0, 29.0, 29.0, 29.0, 44.0, 39.0, 40.0, 51.0, 45.0, 51.0, 33.0, 37.0, 38.0, 37.0, 38.0, 23.0, 22.0, 21.0, 16.0, 19.0, 17.0, 16.0, 7.0, 9.0, 10.0, 7.0, 5.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-20.96167755126953, -20.313222885131836, -19.66476821899414, -19.016315460205078, -18.367860794067383, -17.719406127929688, -17.070953369140625, -16.42249870300293, -15.774044036865234, -15.125589370727539, -14.47713565826416, -13.828681945800781, -13.180227279663086, -12.53177261352539, -11.883318901062012, -11.234865188598633, -10.586410522460938, -9.937955856323242, -9.289502143859863, -8.641048431396484, -7.992593765258789, -7.344139575958252, -6.695685386657715, -6.047231197357178, -5.398777008056641, -4.7503228187561035, -4.101868629455566, -3.4534144401550293, -2.804960250854492, -2.156506061553955, -1.508051872253418, -0.8595976829528809, -0.21114349365234375, 0.43731069564819336, 1.0857648849487305, 1.7342190742492676, 2.3826732635498047, 3.031127452850342, 3.679581642150879, 4.328035831451416, 4.976490020751953, 5.62494421005249, 6.273398399353027, 6.9218525886535645, 7.570306777954102, 8.218761444091797, 8.867215156555176, 9.515668869018555, 10.16412353515625, 10.812578201293945, 11.461031913757324, 12.109485626220703, 12.757940292358398, 13.406394958496094, 14.054848670959473, 14.703302383422852, 15.351757049560547, 16.000211715698242, 16.648666381835938, 17.297119140625, 17.945573806762695, 18.59402847290039, 19.242481231689453, 19.89093589782715, 20.539390563964844]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 9.0, 12.0, 15.0, 14.0, 15.0, 18.0, 20.0, 21.0, 33.0, 26.0, 36.0, 35.0, 33.0, 39.0, 47.0, 51.0, 32.0, 47.0, 59.0, 44.0, 41.0, 35.0, 37.0, 50.0, 30.0, 24.0, 30.0, 10.0, 21.0, 24.0, 18.0, 12.0, 12.0, 11.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.760528564453125, -3.63629150390625, -3.512054443359375, -3.3878173828125, -3.263580322265625, -3.13934326171875, -3.015106201171875, -2.890869140625, -2.766632080078125, -2.64239501953125, -2.518157958984375, -2.3939208984375, -2.269683837890625, -2.14544677734375, -2.021209716796875, -1.89697265625, -1.772735595703125, -1.64849853515625, -1.524261474609375, -1.4000244140625, -1.275787353515625, -1.15155029296875, -1.027313232421875, -0.903076171875, -0.778839111328125, -0.65460205078125, -0.530364990234375, -0.4061279296875, -0.281890869140625, -0.15765380859375, -0.033416748046875, 0.0908203125, 0.215057373046875, 0.33929443359375, 0.463531494140625, 0.5877685546875, 0.712005615234375, 0.83624267578125, 0.960479736328125, 1.084716796875, 1.208953857421875, 1.33319091796875, 1.457427978515625, 1.5816650390625, 1.705902099609375, 1.83013916015625, 1.954376220703125, 2.07861328125, 2.202850341796875, 2.32708740234375, 2.451324462890625, 2.5755615234375, 2.699798583984375, 2.82403564453125, 2.948272705078125, 3.072509765625, 3.196746826171875, 3.32098388671875, 3.445220947265625, 3.5694580078125, 3.693695068359375, 3.81793212890625, 3.942169189453125, 4.06640625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 2.0, 7.0, 6.0, 15.0, 18.0, 25.0, 40.0, 49.0, 68.0, 105.0, 130.0, 209.0, 335.0, 429.0, 649.0, 937.0, 1399.0, 2084.0, 3146.0, 4646.0, 6986.0, 10613.0, 16418.0, 25446.0, 42049.0, 72452.0, 146106.0, 338673.0, 169650.0, 80359.0, 45735.0, 27822.0, 17469.0, 11479.0, 7681.0, 5023.0, 3344.0, 2209.0, 1519.0, 970.0, 732.0, 465.0, 334.0, 216.0, 157.0, 116.0, 73.0, 44.0, 43.0, 22.0, 19.0, 12.0, 14.0, 5.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.031402587890625, -0.030408382415771484, -0.02941417694091797, -0.028419971466064453, -0.027425765991210938, -0.026431560516357422, -0.025437355041503906, -0.02444314956665039, -0.023448944091796875, -0.02245473861694336, -0.021460533142089844, -0.020466327667236328, -0.019472122192382812, -0.018477916717529297, -0.01748371124267578, -0.016489505767822266, -0.01549530029296875, -0.014501094818115234, -0.013506889343261719, -0.012512683868408203, -0.011518478393554688, -0.010524272918701172, -0.009530067443847656, -0.00853586196899414, -0.007541656494140625, -0.006547451019287109, -0.005553245544433594, -0.004559040069580078, -0.0035648345947265625, -0.002570629119873047, -0.0015764236450195312, -0.0005822181701660156, 0.0004119873046875, 0.0014061927795410156, 0.0024003982543945312, 0.003394603729248047, 0.0043888092041015625, 0.005383014678955078, 0.006377220153808594, 0.007371425628662109, 0.008365631103515625, 0.00935983657836914, 0.010354042053222656, 0.011348247528076172, 0.012342453002929688, 0.013336658477783203, 0.014330863952636719, 0.015325069427490234, 0.01631927490234375, 0.017313480377197266, 0.01830768585205078, 0.019301891326904297, 0.020296096801757812, 0.021290302276611328, 0.022284507751464844, 0.02327871322631836, 0.024272918701171875, 0.02526712417602539, 0.026261329650878906, 0.027255535125732422, 0.028249740600585938, 0.029243946075439453, 0.03023815155029297, 0.031232357025146484, 0.0322265625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 4.0, 4.0, 4.0, 12.0, 16.0, 18.0, 8.0, 22.0, 26.0, 30.0, 28.0, 26.0, 24.0, 34.0, 46.0, 25.0, 37.0, 32.0, 50.0, 1069.0, 43.0, 38.0, 37.0, 40.0, 39.0, 38.0, 28.0, 33.0, 28.0, 30.0, 20.0, 24.0, 15.0, 21.0, 11.0, 9.0, 12.0, 7.0, 2.0, 5.0, 9.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.392578125, -2.316986083984375, -2.24139404296875, -2.165802001953125, -2.0902099609375, -2.014617919921875, -1.93902587890625, -1.863433837890625, -1.787841796875, -1.712249755859375, -1.63665771484375, -1.561065673828125, -1.4854736328125, -1.409881591796875, -1.33428955078125, -1.258697509765625, -1.18310546875, -1.107513427734375, -1.03192138671875, -0.956329345703125, -0.8807373046875, -0.805145263671875, -0.72955322265625, -0.653961181640625, -0.578369140625, -0.502777099609375, -0.42718505859375, -0.351593017578125, -0.2760009765625, -0.200408935546875, -0.12481689453125, -0.049224853515625, 0.0263671875, 0.101959228515625, 0.17755126953125, 0.253143310546875, 0.3287353515625, 0.404327392578125, 0.47991943359375, 0.555511474609375, 0.631103515625, 0.706695556640625, 0.78228759765625, 0.857879638671875, 0.9334716796875, 1.009063720703125, 1.08465576171875, 1.160247802734375, 1.23583984375, 1.311431884765625, 1.38702392578125, 1.462615966796875, 1.5382080078125, 1.613800048828125, 1.68939208984375, 1.764984130859375, 1.840576171875, 1.916168212890625, 1.99176025390625, 2.067352294921875, 2.1429443359375, 2.218536376953125, 2.29412841796875, 2.369720458984375, 2.4453125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 9.0, 13.0, 22.0, 28.0, 39.0, 60.0, 89.0, 123.0, 165.0, 233.0, 352.0, 484.0, 679.0, 940.0, 1347.0, 1794.0, 2577.0, 3663.0, 5183.0, 7543.0, 10751.0, 15424.0, 22532.0, 34071.0, 52842.0, 87632.0, 170310.0, 1322532.0, 135871.0, 75396.0, 46879.0, 30308.0, 20279.0, 13869.0, 9714.0, 6876.0, 4683.0, 3404.0, 2385.0, 1738.0, 1190.0, 838.0, 677.0, 479.0, 331.0, 237.0, 197.0, 103.0, 81.0, 58.0, 40.0, 21.0, 15.0, 12.0, 10.0, 6.0, 3.0, 2.0, 1.0], "bins": [-0.0179595947265625, -0.017404556274414062, -0.016849517822265625, -0.016294479370117188, -0.01573944091796875, -0.015184402465820312, -0.014629364013671875, -0.014074325561523438, -0.013519287109375, -0.012964248657226562, -0.012409210205078125, -0.011854171752929688, -0.01129913330078125, -0.010744094848632812, -0.010189056396484375, -0.009634017944335938, -0.0090789794921875, -0.008523941040039062, -0.007968902587890625, -0.0074138641357421875, -0.00685882568359375, -0.0063037872314453125, -0.005748748779296875, -0.0051937103271484375, -0.004638671875, -0.0040836334228515625, -0.003528594970703125, -0.0029735565185546875, -0.00241851806640625, -0.0018634796142578125, -0.001308441162109375, -0.0007534027099609375, -0.0001983642578125, 0.0003566741943359375, 0.000911712646484375, 0.0014667510986328125, 0.00202178955078125, 0.0025768280029296875, 0.003131866455078125, 0.0036869049072265625, 0.004241943359375, 0.0047969818115234375, 0.005352020263671875, 0.0059070587158203125, 0.00646209716796875, 0.0070171356201171875, 0.007572174072265625, 0.008127212524414062, 0.0086822509765625, 0.009237289428710938, 0.009792327880859375, 0.010347366333007812, 0.01090240478515625, 0.011457443237304688, 0.012012481689453125, 0.012567520141601562, 0.01312255859375, 0.013677597045898438, 0.014232635498046875, 0.014787673950195312, 0.01534271240234375, 0.015897750854492188, 0.016452789306640625, 0.017007827758789062, 0.0175628662109375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 89.0, 0.0, 0.0, 185.0, 0.0, 0.0, 0.0, 371.0, 0.0, 0.0, 0.0, 194.0, 0.0, 0.0, 58.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.600733518600464e-07, -4.4330954551696777e-07, -4.2654573917388916e-07, -4.0978193283081055e-07, -3.9301812648773193e-07, -3.762543201446533e-07, -3.594905138015747e-07, -3.427267074584961e-07, -3.259629011154175e-07, -3.0919909477233887e-07, -2.9243528842926025e-07, -2.7567148208618164e-07, -2.5890767574310303e-07, -2.421438694000244e-07, -2.253800630569458e-07, -2.086162567138672e-07, -1.9185245037078857e-07, -1.7508864402770996e-07, -1.5832483768463135e-07, -1.4156103134155273e-07, -1.2479722499847412e-07, -1.0803341865539551e-07, -9.12696123123169e-08, -7.450580596923828e-08, -5.774199962615967e-08, -4.0978193283081055e-08, -2.421438694000244e-08, -7.450580596923828e-09, 9.313225746154785e-09, 2.60770320892334e-08, 4.284083843231201e-08, 5.960464477539063e-08, 7.636845111846924e-08, 9.313225746154785e-08, 1.0989606380462646e-07, 1.2665987014770508e-07, 1.434236764907837e-07, 1.601874828338623e-07, 1.7695128917694092e-07, 1.9371509552001953e-07, 2.1047890186309814e-07, 2.2724270820617676e-07, 2.4400651454925537e-07, 2.60770320892334e-07, 2.775341272354126e-07, 2.942979335784912e-07, 3.110617399215698e-07, 3.2782554626464844e-07, 3.4458935260772705e-07, 3.6135315895080566e-07, 3.781169652938843e-07, 3.948807716369629e-07, 4.116445779800415e-07, 4.284083843231201e-07, 4.4517219066619873e-07, 4.6193599700927734e-07, 4.78699803352356e-07, 4.954636096954346e-07, 5.122274160385132e-07, 5.289912223815918e-07, 5.457550287246704e-07, 5.62518835067749e-07, 5.792826414108276e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 3.0, 4.0, 23.0, 8.0, 10.0, 25.0, 45.0, 47.0, 34.0, 287.0, 259.0, 2665.0, 989884.0, 54002.0, 577.0, 238.0, 194.0, 43.0, 35.0, 69.0, 13.0, 9.0, 23.0, 7.0, 2.0, 10.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4007091522216797e-05, -1.361500471830368e-05, -1.3222917914390564e-05, -1.2830831110477448e-05, -1.2438744306564331e-05, -1.2046657502651215e-05, -1.1654570698738098e-05, -1.1262483894824982e-05, -1.0870397090911865e-05, -1.0478310286998749e-05, -1.0086223483085632e-05, -9.694136679172516e-06, -9.3020498752594e-06, -8.909963071346283e-06, -8.517876267433167e-06, -8.12578946352005e-06, -7.733702659606934e-06, -7.341615855693817e-06, -6.949529051780701e-06, -6.557442247867584e-06, -6.165355443954468e-06, -5.773268640041351e-06, -5.381181836128235e-06, -4.989095032215118e-06, -4.597008228302002e-06, -4.2049214243888855e-06, -3.812834620475769e-06, -3.4207478165626526e-06, -3.028661012649536e-06, -2.6365742087364197e-06, -2.2444874048233032e-06, -1.8524006009101868e-06, -1.4603137969970703e-06, -1.0682269930839539e-06, -6.761401891708374e-07, -2.8405338525772095e-07, 1.0803341865539551e-07, 5.00120222568512e-07, 8.922070264816284e-07, 1.2842938303947449e-06, 1.6763806343078613e-06, 2.0684674382209778e-06, 2.4605542421340942e-06, 2.8526410460472107e-06, 3.244727849960327e-06, 3.6368146538734436e-06, 4.02890145778656e-06, 4.4209882616996765e-06, 4.813075065612793e-06, 5.2051618695259094e-06, 5.597248673439026e-06, 5.989335477352142e-06, 6.381422281265259e-06, 6.773509085178375e-06, 7.165595889091492e-06, 7.557682693004608e-06, 7.949769496917725e-06, 8.341856300830841e-06, 8.733943104743958e-06, 9.126029908657074e-06, 9.51811671257019e-06, 9.910203516483307e-06, 1.0302290320396423e-05, 1.069437712430954e-05, 1.1086463928222656e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 21.0, 21.0, 33.0, 50.0, 68.0, 594.0, 70.0, 60.0, 41.0, 22.0, 12.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.893276918162883e-07, -6.754470973646676e-07, -6.615665597564657e-07, -6.47685965304845e-07, -6.338053708532243e-07, -6.199248332450225e-07, -6.060442387934017e-07, -5.921637011851999e-07, -5.782831067335792e-07, -5.644025122819585e-07, -5.505219746737566e-07, -5.366413802221359e-07, -5.227608426139341e-07, -5.088802481623134e-07, -4.949996537106927e-07, -4.811191161024908e-07, -4.672385216508701e-07, -4.533579556209588e-07, -4.3947738959104754e-07, -4.2559679513942683e-07, -4.1171622910951555e-07, -3.978356630796043e-07, -3.8395506862798356e-07, -3.700745025980723e-07, -3.56193936568161e-07, -3.4231337053824973e-07, -3.2843280450833845e-07, -3.1455221005671774e-07, -3.0067164402680646e-07, -2.867910779968952e-07, -2.729104835452745e-07, -2.590299175153632e-07, -2.451493514854519e-07, -2.3126878545554064e-07, -2.1738820521477464e-07, -2.0350762497400865e-07, -1.8962705894409737e-07, -1.757464929141861e-07, -1.618659126734201e-07, -1.479853324326541e-07, -1.3410478061359754e-07, -1.2022420037283155e-07, -1.0634363434292027e-07, -9.246306120758163e-08, -7.8582488072243e-08, -6.470191493690436e-08, -5.082134180156572e-08, -3.6940768666227086e-08, -2.306019553088845e-08, -9.179622395549814e-09, 4.700950739788823e-09, 1.858152387512746e-08, 3.2462097010466096e-08, 4.634267014580473e-08, 6.022324328114337e-08, 7.4103816416482e-08, 8.798438955182064e-08, 1.0186496268715928e-07, 1.1574553582249791e-07, 1.296261018524092e-07, 1.4350668209317519e-07, 1.5738726233394118e-07, 1.7126782836385246e-07, 1.8514839439376374e-07, 1.9902897463452973e-07]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 186.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 572.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 190.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 9.0, 12.0, 15.0, 14.0, 15.0, 18.0, 20.0, 21.0, 33.0, 26.0, 36.0, 35.0, 33.0, 39.0, 47.0, 51.0, 32.0, 47.0, 59.0, 44.0, 41.0, 35.0, 37.0, 50.0, 30.0, 24.0, 30.0, 10.0, 21.0, 24.0, 18.0, 12.0, 12.0, 11.0, 7.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.884765625, -3.760528564453125, -3.63629150390625, -3.512054443359375, -3.3878173828125, -3.263580322265625, -3.13934326171875, -3.015106201171875, -2.890869140625, -2.766632080078125, -2.64239501953125, -2.518157958984375, -2.3939208984375, -2.269683837890625, -2.14544677734375, -2.021209716796875, -1.89697265625, -1.772735595703125, -1.64849853515625, -1.524261474609375, -1.4000244140625, -1.275787353515625, -1.15155029296875, -1.027313232421875, -0.903076171875, -0.778839111328125, -0.65460205078125, -0.530364990234375, -0.4061279296875, -0.281890869140625, -0.15765380859375, -0.033416748046875, 0.0908203125, 0.215057373046875, 0.33929443359375, 0.463531494140625, 0.5877685546875, 0.712005615234375, 0.83624267578125, 0.960479736328125, 1.084716796875, 1.208953857421875, 1.33319091796875, 1.457427978515625, 1.5816650390625, 1.705902099609375, 1.83013916015625, 1.954376220703125, 2.07861328125, 2.202850341796875, 2.32708740234375, 2.451324462890625, 2.5755615234375, 2.699798583984375, 2.82403564453125, 2.948272705078125, 3.072509765625, 3.196746826171875, 3.32098388671875, 3.445220947265625, 3.5694580078125, 3.693695068359375, 3.81793212890625, 3.942169189453125, 4.06640625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 11.0, 10.0, 16.0, 19.0, 27.0, 41.0, 38.0, 54.0, 74.0, 105.0, 123.0, 226.0, 350.0, 683.0, 1487.0, 3238.0, 7883.0, 18599.0, 46185.0, 161873.0, 638676.0, 106292.0, 36010.0, 14859.0, 6214.0, 2710.0, 1198.0, 566.0, 307.0, 177.0, 98.0, 82.0, 88.0, 65.0, 37.0, 32.0, 23.0, 19.0, 14.0, 4.0, 7.0, 3.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.390625, -7.155029296875, -6.91943359375, -6.683837890625, -6.4482421875, -6.212646484375, -5.97705078125, -5.741455078125, -5.505859375, -5.270263671875, -5.03466796875, -4.799072265625, -4.5634765625, -4.327880859375, -4.09228515625, -3.856689453125, -3.62109375, -3.385498046875, -3.14990234375, -2.914306640625, -2.6787109375, -2.443115234375, -2.20751953125, -1.971923828125, -1.736328125, -1.500732421875, -1.26513671875, -1.029541015625, -0.7939453125, -0.558349609375, -0.32275390625, -0.087158203125, 0.1484375, 0.384033203125, 0.61962890625, 0.855224609375, 1.0908203125, 1.326416015625, 1.56201171875, 1.797607421875, 2.033203125, 2.268798828125, 2.50439453125, 2.739990234375, 2.9755859375, 3.211181640625, 3.44677734375, 3.682373046875, 3.91796875, 4.153564453125, 4.38916015625, 4.624755859375, 4.8603515625, 5.095947265625, 5.33154296875, 5.567138671875, 5.802734375, 6.038330078125, 6.27392578125, 6.509521484375, 6.7451171875, 6.980712890625, 7.21630859375, 7.451904296875, 7.6875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 4.0, 5.0, 3.0, 6.0, 6.0, 4.0, 12.0, 14.0, 28.0, 20.0, 21.0, 31.0, 20.0, 38.0, 30.0, 38.0, 36.0, 40.0, 49.0, 74.0, 129.0, 1516.0, 359.0, 111.0, 73.0, 52.0, 46.0, 38.0, 33.0, 29.0, 41.0, 17.0, 33.0, 14.0, 18.0, 13.0, 10.0, 9.0, 5.0, 7.0, 8.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.9609375, -10.606201171875, -10.25146484375, -9.896728515625, -9.5419921875, -9.187255859375, -8.83251953125, -8.477783203125, -8.123046875, -7.768310546875, -7.41357421875, -7.058837890625, -6.7041015625, -6.349365234375, -5.99462890625, -5.639892578125, -5.28515625, -4.930419921875, -4.57568359375, -4.220947265625, -3.8662109375, -3.511474609375, -3.15673828125, -2.802001953125, -2.447265625, -2.092529296875, -1.73779296875, -1.383056640625, -1.0283203125, -0.673583984375, -0.31884765625, 0.035888671875, 0.390625, 0.745361328125, 1.10009765625, 1.454833984375, 1.8095703125, 2.164306640625, 2.51904296875, 2.873779296875, 3.228515625, 3.583251953125, 3.93798828125, 4.292724609375, 4.6474609375, 5.002197265625, 5.35693359375, 5.711669921875, 6.06640625, 6.421142578125, 6.77587890625, 7.130615234375, 7.4853515625, 7.840087890625, 8.19482421875, 8.549560546875, 8.904296875, 9.259033203125, 9.61376953125, 9.968505859375, 10.3232421875, 10.677978515625, 11.03271484375, 11.387451171875, 11.7421875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 6.0, 7.0, 9.0, 15.0, 8.0, 12.0, 16.0, 16.0, 36.0, 32.0, 52.0, 77.0, 74.0, 108.0, 202.0, 400.0, 1324.0, 9886.0, 195569.0, 2872961.0, 58765.0, 4405.0, 807.0, 291.0, 157.0, 104.0, 80.0, 65.0, 25.0, 39.0, 37.0, 25.0, 28.0, 14.0, 9.0, 7.0, 8.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.171875, -22.4765625, -21.78125, -21.0859375, -20.390625, -19.6953125, -19.0, -18.3046875, -17.609375, -16.9140625, -16.21875, -15.5234375, -14.828125, -14.1328125, -13.4375, -12.7421875, -12.046875, -11.3515625, -10.65625, -9.9609375, -9.265625, -8.5703125, -7.875, -7.1796875, -6.484375, -5.7890625, -5.09375, -4.3984375, -3.703125, -3.0078125, -2.3125, -1.6171875, -0.921875, -0.2265625, 0.46875, 1.1640625, 1.859375, 2.5546875, 3.25, 3.9453125, 4.640625, 5.3359375, 6.03125, 6.7265625, 7.421875, 8.1171875, 8.8125, 9.5078125, 10.203125, 10.8984375, 11.59375, 12.2890625, 12.984375, 13.6796875, 14.375, 15.0703125, 15.765625, 16.4609375, 17.15625, 17.8515625, 18.546875, 19.2421875, 19.9375, 20.6328125, 21.328125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 11.0, 292.0, 671.0, 43.0], "bins": [-247.36798095703125, -243.39218139648438, -239.4163818359375, -235.44058227539062, -231.46478271484375, -227.48898315429688, -223.51316833496094, -219.53736877441406, -215.5615692138672, -211.5857696533203, -207.60997009277344, -203.63417053222656, -199.6583709716797, -195.68255615234375, -191.70675659179688, -187.73095703125, -183.75515747070312, -179.77935791015625, -175.80355834960938, -171.8277587890625, -167.85195922851562, -163.87615966796875, -159.9003448486328, -155.92454528808594, -151.94874572753906, -147.9729461669922, -143.9971466064453, -140.02134704589844, -136.04554748535156, -132.06973266601562, -128.09393310546875, -124.11813354492188, -120.142333984375, -116.16653442382812, -112.19073486328125, -108.21492767333984, -104.23912811279297, -100.2633285522461, -96.28752899169922, -92.31172180175781, -88.33592987060547, -84.3601303100586, -80.38433074951172, -76.40852355957031, -72.43272399902344, -68.45692443847656, -64.48112487792969, -60.50532150268555, -56.529518127441406, -52.55371856689453, -48.57791519165039, -44.602115631103516, -40.626312255859375, -36.6505126953125, -32.674713134765625, -28.698909759521484, -24.723108291625977, -20.74730682373047, -16.77150535583496, -12.79570484161377, -8.819903373718262, -4.84410285949707, -0.8683013916015625, 3.1075000762939453, 7.083301544189453]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 2.0, 9.0, 8.0, 13.0, 16.0, 17.0, 15.0, 21.0, 25.0, 26.0, 38.0, 28.0, 31.0, 42.0, 38.0, 30.0, 46.0, 43.0, 41.0, 45.0, 32.0, 27.0, 43.0, 34.0, 46.0, 36.0, 31.0, 23.0, 23.0, 28.0, 23.0, 19.0, 8.0, 19.0, 13.0, 10.0, 11.0, 6.0, 4.0, 2.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-29.287628173828125, -28.375293731689453, -27.46295928955078, -26.55062484741211, -25.638290405273438, -24.725955963134766, -23.813623428344727, -22.901288986206055, -21.988954544067383, -21.07662010192871, -20.16428565979004, -19.251951217651367, -18.339618682861328, -17.427284240722656, -16.514949798583984, -15.602615356445312, -14.69028091430664, -13.777946472167969, -12.865612030029297, -11.953278541564941, -11.04094409942627, -10.128609657287598, -9.216276168823242, -8.30394172668457, -7.391607284545898, -6.479272842407227, -5.566938877105713, -4.654604911804199, -3.7422704696655273, -2.8299360275268555, -1.9176020622253418, -1.0052680969238281, -0.09293365478515625, 0.8194005489349365, 1.7317347526550293, 2.644068956375122, 3.556403160095215, 4.468737602233887, 5.3810715675354, 6.293405532836914, 7.205739974975586, 8.118074417114258, 9.03040885925293, 9.942742347717285, 10.855076789855957, 11.767411231994629, 12.679744720458984, 13.592079162597656, 14.504413604736328, 15.416748046875, 16.329082489013672, 17.241416931152344, 18.153751373291016, 19.066085815429688, 19.978418350219727, 20.8907527923584, 21.80308723449707, 22.715421676635742, 23.627756118774414, 24.540090560913086, 25.452423095703125, 26.364757537841797, 27.27709197998047, 28.18942642211914, 29.101760864257812]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 9.0, 8.0, 11.0, 13.0, 11.0, 15.0, 15.0, 28.0, 23.0, 30.0, 40.0, 21.0, 36.0, 51.0, 51.0, 33.0, 45.0, 39.0, 55.0, 51.0, 58.0, 43.0, 23.0, 28.0, 32.0, 41.0, 26.0, 20.0, 26.0, 18.0, 19.0, 18.0, 14.0, 14.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.98040771484375, -3.8475341796875, -3.71466064453125, -3.581787109375, -3.44891357421875, -3.3160400390625, -3.18316650390625, -3.05029296875, -2.91741943359375, -2.7845458984375, -2.65167236328125, -2.518798828125, -2.38592529296875, -2.2530517578125, -2.12017822265625, -1.9873046875, -1.85443115234375, -1.7215576171875, -1.58868408203125, -1.455810546875, -1.32293701171875, -1.1900634765625, -1.05718994140625, -0.92431640625, -0.79144287109375, -0.6585693359375, -0.52569580078125, -0.392822265625, -0.25994873046875, -0.1270751953125, 0.00579833984375, 0.138671875, 0.27154541015625, 0.4044189453125, 0.53729248046875, 0.670166015625, 0.80303955078125, 0.9359130859375, 1.06878662109375, 1.20166015625, 1.33453369140625, 1.4674072265625, 1.60028076171875, 1.733154296875, 1.86602783203125, 1.9989013671875, 2.13177490234375, 2.2646484375, 2.39752197265625, 2.5303955078125, 2.66326904296875, 2.796142578125, 2.92901611328125, 3.0618896484375, 3.19476318359375, 3.32763671875, 3.46051025390625, 3.5933837890625, 3.72625732421875, 3.859130859375, 3.99200439453125, 4.1248779296875, 4.25775146484375, 4.390625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 6.0, 3.0, 7.0, 4.0, 17.0, 19.0, 18.0, 19.0, 45.0, 53.0, 84.0, 143.0, 221.0, 361.0, 691.0, 1328.0, 2741.0, 6602.0, 16890.0, 51770.0, 195512.0, 959185.0, 2113509.0, 645828.0, 137692.0, 38403.0, 13134.0, 5037.0, 2282.0, 1147.0, 579.0, 357.0, 200.0, 135.0, 68.0, 52.0, 50.0, 27.0, 23.0, 17.0, 8.0, 3.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.2935791015625, -6.079345703125, -5.8651123046875, -5.65087890625, -5.4366455078125, -5.222412109375, -5.0081787109375, -4.7939453125, -4.5797119140625, -4.365478515625, -4.1512451171875, -3.93701171875, -3.7227783203125, -3.508544921875, -3.2943115234375, -3.080078125, -2.8658447265625, -2.651611328125, -2.4373779296875, -2.22314453125, -2.0089111328125, -1.794677734375, -1.5804443359375, -1.3662109375, -1.1519775390625, -0.937744140625, -0.7235107421875, -0.50927734375, -0.2950439453125, -0.080810546875, 0.1334228515625, 0.34765625, 0.5618896484375, 0.776123046875, 0.9903564453125, 1.20458984375, 1.4188232421875, 1.633056640625, 1.8472900390625, 2.0615234375, 2.2757568359375, 2.489990234375, 2.7042236328125, 2.91845703125, 3.1326904296875, 3.346923828125, 3.5611572265625, 3.775390625, 3.9896240234375, 4.203857421875, 4.4180908203125, 4.63232421875, 4.8465576171875, 5.060791015625, 5.2750244140625, 5.4892578125, 5.7034912109375, 5.917724609375, 6.1319580078125, 6.34619140625, 6.5604248046875, 6.774658203125, 6.9888916015625, 7.203125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 6.0, 3.0, 5.0, 12.0, 10.0, 23.0, 22.0, 25.0, 29.0, 31.0, 55.0, 74.0, 87.0, 117.0, 142.0, 195.0, 253.0, 314.0, 411.0, 384.0, 398.0, 333.0, 259.0, 199.0, 151.0, 117.0, 103.0, 79.0, 54.0, 40.0, 32.0, 23.0, 17.0, 13.0, 8.0, 15.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.75390625, -4.5823974609375, -4.410888671875, -4.2393798828125, -4.06787109375, -3.8963623046875, -3.724853515625, -3.5533447265625, -3.3818359375, -3.2103271484375, -3.038818359375, -2.8673095703125, -2.69580078125, -2.5242919921875, -2.352783203125, -2.1812744140625, -2.009765625, -1.8382568359375, -1.666748046875, -1.4952392578125, -1.32373046875, -1.1522216796875, -0.980712890625, -0.8092041015625, -0.6376953125, -0.4661865234375, -0.294677734375, -0.1231689453125, 0.04833984375, 0.2198486328125, 0.391357421875, 0.5628662109375, 0.734375, 0.9058837890625, 1.077392578125, 1.2489013671875, 1.42041015625, 1.5919189453125, 1.763427734375, 1.9349365234375, 2.1064453125, 2.2779541015625, 2.449462890625, 2.6209716796875, 2.79248046875, 2.9639892578125, 3.135498046875, 3.3070068359375, 3.478515625, 3.6500244140625, 3.821533203125, 3.9930419921875, 4.16455078125, 4.3360595703125, 4.507568359375, 4.6790771484375, 4.8505859375, 5.0220947265625, 5.193603515625, 5.3651123046875, 5.53662109375, 5.7081298828125, 5.879638671875, 6.0511474609375, 6.22265625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 4.0, 4.0, 6.0, 9.0, 13.0, 18.0, 15.0, 13.0, 41.0, 28.0, 37.0, 80.0, 97.0, 157.0, 224.0, 390.0, 879.0, 2634.0, 12964.0, 94741.0, 1213580.0, 2631079.0, 206428.0, 23730.0, 4402.0, 1259.0, 513.0, 311.0, 184.0, 122.0, 82.0, 44.0, 40.0, 38.0, 34.0, 23.0, 21.0, 9.0, 10.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-17.25, -16.785888671875, -16.32177734375, -15.857666015625, -15.3935546875, -14.929443359375, -14.46533203125, -14.001220703125, -13.537109375, -13.072998046875, -12.60888671875, -12.144775390625, -11.6806640625, -11.216552734375, -10.75244140625, -10.288330078125, -9.82421875, -9.360107421875, -8.89599609375, -8.431884765625, -7.9677734375, -7.503662109375, -7.03955078125, -6.575439453125, -6.111328125, -5.647216796875, -5.18310546875, -4.718994140625, -4.2548828125, -3.790771484375, -3.32666015625, -2.862548828125, -2.3984375, -1.934326171875, -1.47021484375, -1.006103515625, -0.5419921875, -0.077880859375, 0.38623046875, 0.850341796875, 1.314453125, 1.778564453125, 2.24267578125, 2.706787109375, 3.1708984375, 3.635009765625, 4.09912109375, 4.563232421875, 5.02734375, 5.491455078125, 5.95556640625, 6.419677734375, 6.8837890625, 7.347900390625, 7.81201171875, 8.276123046875, 8.740234375, 9.204345703125, 9.66845703125, 10.132568359375, 10.5966796875, 11.060791015625, 11.52490234375, 11.989013671875, 12.453125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 14.0, 34.0, 59.0, 104.0, 186.0, 192.0, 182.0, 106.0, 75.0, 29.0, 16.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.16059494018555, -33.52985382080078, -31.89911460876465, -30.268373489379883, -28.63763427734375, -27.006893157958984, -25.37615203857422, -23.745410919189453, -22.11467170715332, -20.483930587768555, -18.853191375732422, -17.222450256347656, -15.591710090637207, -13.960969924926758, -12.330228805541992, -10.699488639831543, -9.068748474121094, -7.4380083084106445, -5.807267665863037, -4.17652702331543, -2.5457868576049805, -0.9150466918945312, 0.7156944274902344, 2.3464345932006836, 3.977174758911133, 5.607914924621582, 7.2386555671691895, 8.869396209716797, 10.500136375427246, 12.130876541137695, 13.761617660522461, 15.39235782623291, 17.023094177246094, 18.65383529663086, 20.284574508666992, 21.915315628051758, 23.54605484008789, 25.176795959472656, 26.807537078857422, 28.438278198242188, 30.06901741027832, 31.699758529663086, 33.33049774169922, 34.961238861083984, 36.59197998046875, 38.22271728515625, 39.85346221923828, 41.48419952392578, 43.11494064331055, 44.74568176269531, 46.37642288208008, 48.007164001464844, 49.637901306152344, 51.26864242553711, 52.899383544921875, 54.53012466430664, 56.160865783691406, 57.79160690307617, 59.42234802246094, 61.05308532714844, 62.6838264465332, 64.31456756591797, 65.9453125, 67.5760498046875, 69.206787109375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 8.0, 16.0, 14.0, 13.0, 20.0, 17.0, 22.0, 28.0, 25.0, 34.0, 20.0, 30.0, 28.0, 39.0, 33.0, 56.0, 43.0, 50.0, 38.0, 54.0, 34.0, 26.0, 49.0, 35.0, 33.0, 32.0, 36.0, 28.0, 23.0, 26.0, 12.0, 7.0, 12.0, 10.0, 8.0, 11.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.984542846679688, -22.278053283691406, -21.571561813354492, -20.86507225036621, -20.158580780029297, -19.452091217041016, -18.745601654052734, -18.039112091064453, -17.33262062072754, -16.626131057739258, -15.919639587402344, -15.213150024414062, -14.506659507751465, -13.800168991088867, -13.093679428100586, -12.387188911437988, -11.68069839477539, -10.974207878112793, -10.267717361450195, -9.561227798461914, -8.854737281799316, -8.148246765136719, -7.441756725311279, -6.73526668548584, -6.028776168823242, -5.3222856521606445, -4.615795612335205, -3.9093053340911865, -3.202815055847168, -2.4963247776031494, -1.7898344993591309, -1.0833444595336914, -0.37685585021972656, 0.329634428024292, 1.0361247062683105, 1.742614984512329, 2.4491052627563477, 3.155595541000366, 3.8620858192443848, 4.568575859069824, 5.275066375732422, 5.9815568923950195, 6.688046932220459, 7.394536972045898, 8.101027488708496, 8.807518005371094, 9.514007568359375, 10.220498085021973, 10.92698860168457, 11.633479118347168, 12.339969635009766, 13.046459197998047, 13.752949714660645, 14.459440231323242, 15.165929794311523, 15.872420310974121, 16.57891082763672, 17.285400390625, 17.991891860961914, 18.698381423950195, 19.40487289428711, 20.11136245727539, 20.817852020263672, 21.524341583251953, 22.230833053588867]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 2.0, 8.0, 4.0, 7.0, 6.0, 19.0, 11.0, 14.0, 17.0, 24.0, 18.0, 22.0, 33.0, 44.0, 31.0, 41.0, 31.0, 36.0, 34.0, 39.0, 44.0, 49.0, 42.0, 36.0, 45.0, 39.0, 38.0, 34.0, 37.0, 29.0, 24.0, 23.0, 11.0, 29.0, 18.0, 14.0, 11.0, 10.0, 5.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.45703125, -4.32989501953125, -4.2027587890625, -4.07562255859375, -3.948486328125, -3.82135009765625, -3.6942138671875, -3.56707763671875, -3.43994140625, -3.31280517578125, -3.1856689453125, -3.05853271484375, -2.931396484375, -2.80426025390625, -2.6771240234375, -2.54998779296875, -2.4228515625, -2.29571533203125, -2.1685791015625, -2.04144287109375, -1.914306640625, -1.78717041015625, -1.6600341796875, -1.53289794921875, -1.40576171875, -1.27862548828125, -1.1514892578125, -1.02435302734375, -0.897216796875, -0.77008056640625, -0.6429443359375, -0.51580810546875, -0.388671875, -0.26153564453125, -0.1343994140625, -0.00726318359375, 0.119873046875, 0.24700927734375, 0.3741455078125, 0.50128173828125, 0.62841796875, 0.75555419921875, 0.8826904296875, 1.00982666015625, 1.136962890625, 1.26409912109375, 1.3912353515625, 1.51837158203125, 1.6455078125, 1.77264404296875, 1.8997802734375, 2.02691650390625, 2.154052734375, 2.28118896484375, 2.4083251953125, 2.53546142578125, 2.66259765625, 2.78973388671875, 2.9168701171875, 3.04400634765625, 3.171142578125, 3.29827880859375, 3.4254150390625, 3.55255126953125, 3.6796875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 9.0, 20.0, 41.0, 58.0, 69.0, 119.0, 160.0, 276.0, 379.0, 611.0, 909.0, 1355.0, 2263.0, 3472.0, 5315.0, 8487.0, 13430.0, 21937.0, 36388.0, 62426.0, 116584.0, 300968.0, 234440.0, 99084.0, 54607.0, 32418.0, 19560.0, 12033.0, 7553.0, 4752.0, 3137.0, 1931.0, 1287.0, 844.0, 526.0, 362.0, 241.0, 162.0, 120.0, 66.0, 48.0, 30.0, 22.0, 20.0, 15.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0306854248046875, -0.02965855598449707, -0.02863168716430664, -0.02760481834411621, -0.02657794952392578, -0.02555108070373535, -0.024524211883544922, -0.023497343063354492, -0.022470474243164062, -0.021443605422973633, -0.020416736602783203, -0.019389867782592773, -0.018362998962402344, -0.017336130142211914, -0.016309261322021484, -0.015282392501831055, -0.014255523681640625, -0.013228654861450195, -0.012201786041259766, -0.011174917221069336, -0.010148048400878906, -0.009121179580688477, -0.008094310760498047, -0.007067441940307617, -0.0060405731201171875, -0.005013704299926758, -0.003986835479736328, -0.0029599666595458984, -0.0019330978393554688, -0.0009062290191650391, 0.00012063980102539062, 0.0011475086212158203, 0.00217437744140625, 0.0032012462615966797, 0.004228115081787109, 0.005254983901977539, 0.006281852722167969, 0.0073087215423583984, 0.008335590362548828, 0.009362459182739258, 0.010389328002929688, 0.011416196823120117, 0.012443065643310547, 0.013469934463500977, 0.014496803283691406, 0.015523672103881836, 0.016550540924072266, 0.017577409744262695, 0.018604278564453125, 0.019631147384643555, 0.020658016204833984, 0.021684885025024414, 0.022711753845214844, 0.023738622665405273, 0.024765491485595703, 0.025792360305786133, 0.026819229125976562, 0.027846097946166992, 0.028872966766357422, 0.02989983558654785, 0.03092670440673828, 0.03195357322692871, 0.03298044204711914, 0.03400731086730957, 0.0350341796875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 7.0, 0.0, 4.0, 3.0, 9.0, 5.0, 9.0, 6.0, 16.0, 11.0, 14.0, 17.0, 17.0, 19.0, 29.0, 27.0, 27.0, 26.0, 43.0, 39.0, 21.0, 29.0, 44.0, 49.0, 1057.0, 44.0, 32.0, 44.0, 37.0, 45.0, 37.0, 30.0, 27.0, 32.0, 25.0, 16.0, 29.0, 15.0, 14.0, 13.0, 12.0, 12.0, 11.0, 8.0, 4.0, 3.0, 4.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.108367919921875, -2.03118896484375, -1.954010009765625, -1.8768310546875, -1.799652099609375, -1.72247314453125, -1.645294189453125, -1.568115234375, -1.490936279296875, -1.41375732421875, -1.336578369140625, -1.2593994140625, -1.182220458984375, -1.10504150390625, -1.027862548828125, -0.95068359375, -0.873504638671875, -0.79632568359375, -0.719146728515625, -0.6419677734375, -0.564788818359375, -0.48760986328125, -0.410430908203125, -0.333251953125, -0.256072998046875, -0.17889404296875, -0.101715087890625, -0.0245361328125, 0.052642822265625, 0.12982177734375, 0.207000732421875, 0.2841796875, 0.361358642578125, 0.43853759765625, 0.515716552734375, 0.5928955078125, 0.670074462890625, 0.74725341796875, 0.824432373046875, 0.901611328125, 0.978790283203125, 1.05596923828125, 1.133148193359375, 1.2103271484375, 1.287506103515625, 1.36468505859375, 1.441864013671875, 1.51904296875, 1.596221923828125, 1.67340087890625, 1.750579833984375, 1.8277587890625, 1.904937744140625, 1.98211669921875, 2.059295654296875, 2.136474609375, 2.213653564453125, 2.29083251953125, 2.368011474609375, 2.4451904296875, 2.522369384765625, 2.59954833984375, 2.676727294921875, 2.75390625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 21.0, 17.0, 45.0, 60.0, 85.0, 147.0, 194.0, 296.0, 424.0, 589.0, 898.0, 1217.0, 1732.0, 2387.0, 3419.0, 4681.0, 6831.0, 9736.0, 14229.0, 20977.0, 32485.0, 51195.0, 85447.0, 168180.0, 1329394.0, 143936.0, 77236.0, 47174.0, 29835.0, 19655.0, 13288.0, 9297.0, 6366.0, 4508.0, 3287.0, 2290.0, 1612.0, 1214.0, 818.0, 609.0, 420.0, 278.0, 210.0, 135.0, 97.0, 59.0, 37.0, 31.0, 15.0, 15.0, 9.0, 5.0, 3.0, 1.0, 3.0], "bins": [-0.0203399658203125, -0.01973104476928711, -0.01912212371826172, -0.018513202667236328, -0.017904281616210938, -0.017295360565185547, -0.016686439514160156, -0.016077518463134766, -0.015468597412109375, -0.014859676361083984, -0.014250755310058594, -0.013641834259033203, -0.013032913208007812, -0.012423992156982422, -0.011815071105957031, -0.01120615005493164, -0.01059722900390625, -0.00998830795288086, -0.009379386901855469, -0.008770465850830078, -0.008161544799804688, -0.007552623748779297, -0.006943702697753906, -0.006334781646728516, -0.005725860595703125, -0.005116939544677734, -0.004508018493652344, -0.003899097442626953, -0.0032901763916015625, -0.002681255340576172, -0.0020723342895507812, -0.0014634132385253906, -0.0008544921875, -0.0002455711364746094, 0.00036334991455078125, 0.0009722709655761719, 0.0015811920166015625, 0.002190113067626953, 0.0027990341186523438, 0.0034079551696777344, 0.004016876220703125, 0.004625797271728516, 0.005234718322753906, 0.005843639373779297, 0.0064525604248046875, 0.007061481475830078, 0.007670402526855469, 0.00827932357788086, 0.00888824462890625, 0.00949716567993164, 0.010106086730957031, 0.010715007781982422, 0.011323928833007812, 0.011932849884033203, 0.012541770935058594, 0.013150691986083984, 0.013759613037109375, 0.014368534088134766, 0.014977455139160156, 0.015586376190185547, 0.016195297241210938, 0.016804218292236328, 0.01741313934326172, 0.01802206039428711, 0.0186309814453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 83.0, 0.0, 0.0, 0.0, 189.0, 0.0, 0.0, 0.0, 404.0, 0.0, 0.0, 183.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-07, -5.19677996635437e-07, -5.029141902923584e-07, -4.861503839492798e-07, -4.6938657760620117e-07, -4.5262277126312256e-07, -4.3585896492004395e-07, -4.1909515857696533e-07, -4.023313522338867e-07, -3.855675458908081e-07, -3.688037395477295e-07, -3.520399332046509e-07, -3.3527612686157227e-07, -3.1851232051849365e-07, -3.0174851417541504e-07, -2.849847078323364e-07, -2.682209014892578e-07, -2.514570951461792e-07, -2.3469328880310059e-07, -2.1792948246002197e-07, -2.0116567611694336e-07, -1.8440186977386475e-07, -1.6763806343078613e-07, -1.5087425708770752e-07, -1.341104507446289e-07, -1.1734664440155029e-07, -1.0058283805847168e-07, -8.381903171539307e-08, -6.705522537231445e-08, -5.029141902923584e-08, -3.3527612686157227e-08, -1.6763806343078613e-08, 0.0, 1.6763806343078613e-08, 3.3527612686157227e-08, 5.029141902923584e-08, 6.705522537231445e-08, 8.381903171539307e-08, 1.0058283805847168e-07, 1.1734664440155029e-07, 1.341104507446289e-07, 1.5087425708770752e-07, 1.6763806343078613e-07, 1.8440186977386475e-07, 2.0116567611694336e-07, 2.1792948246002197e-07, 2.3469328880310059e-07, 2.514570951461792e-07, 2.682209014892578e-07, 2.849847078323364e-07, 3.0174851417541504e-07, 3.1851232051849365e-07, 3.3527612686157227e-07, 3.520399332046509e-07, 3.688037395477295e-07, 3.855675458908081e-07, 4.023313522338867e-07, 4.1909515857696533e-07, 4.3585896492004395e-07, 4.5262277126312256e-07, 4.6938657760620117e-07, 4.861503839492798e-07, 5.029141902923584e-07, 5.19677996635437e-07, 5.364418029785156e-07]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 16.0, 15.0, 6.0, 15.0, 52.0, 54.0, 29.0, 176.0, 131.0, 462.0, 5122.0, 1036174.0, 5329.0, 456.0, 144.0, 185.0, 24.0, 38.0, 64.0, 12.0, 4.0, 16.0, 9.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1682510375976562e-05, -1.1323019862174988e-05, -1.0963529348373413e-05, -1.0604038834571838e-05, -1.0244548320770264e-05, -9.885057806968689e-06, -9.525567293167114e-06, -9.16607677936554e-06, -8.806586265563965e-06, -8.44709575176239e-06, -8.087605237960815e-06, -7.72811472415924e-06, -7.368624210357666e-06, -7.009133696556091e-06, -6.649643182754517e-06, -6.290152668952942e-06, -5.930662155151367e-06, -5.5711716413497925e-06, -5.211681127548218e-06, -4.852190613746643e-06, -4.492700099945068e-06, -4.133209586143494e-06, -3.773719072341919e-06, -3.4142285585403442e-06, -3.0547380447387695e-06, -2.695247530937195e-06, -2.33575701713562e-06, -1.9762665033340454e-06, -1.6167759895324707e-06, -1.257285475730896e-06, -8.977949619293213e-07, -5.383044481277466e-07, -1.7881393432617188e-07, 1.8067657947540283e-07, 5.401670932769775e-07, 8.996576070785522e-07, 1.259148120880127e-06, 1.6186386346817017e-06, 1.9781291484832764e-06, 2.337619662284851e-06, 2.6971101760864258e-06, 3.0566006898880005e-06, 3.416091203689575e-06, 3.77558171749115e-06, 4.135072231292725e-06, 4.494562745094299e-06, 4.854053258895874e-06, 5.213543772697449e-06, 5.5730342864990234e-06, 5.932524800300598e-06, 6.292015314102173e-06, 6.6515058279037476e-06, 7.010996341705322e-06, 7.370486855506897e-06, 7.729977369308472e-06, 8.089467883110046e-06, 8.448958396911621e-06, 8.808448910713196e-06, 9.16793942451477e-06, 9.527429938316345e-06, 9.88692045211792e-06, 1.0246410965919495e-05, 1.060590147972107e-05, 1.0965391993522644e-05, 1.1324882507324219e-05]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 16.0, 25.0, 50.0, 45.0, 92.0, 546.0, 88.0, 59.0, 39.0, 20.0, 14.0, 12.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701017564926588e-07, -1.22701564464478e-07, -1.083929390688354e-07, -9.408432788404753e-08, -7.977570959383229e-08, -6.546709130361705e-08, -5.1158480118829175e-08, -3.684986182861394e-08, -2.2541243538398703e-08, -8.232627024540307e-09, 6.07598948931809e-09, 2.0384604226819647e-08, 3.469322251703488e-08, 4.900184080725012e-08, 6.3310451992038e-08, 7.761907028225323e-08, 9.192768857246847e-08, 1.062363068626837e-07, 1.2054492515289894e-07, 1.3485353633768682e-07, 1.491621617333294e-07, 1.634707729181173e-07, 1.7777938410290517e-07, 1.9208800949854776e-07, 2.0639662068333564e-07, 2.2070523186812352e-07, 2.350138572637661e-07, 2.493224542376993e-07, 2.6363107963334187e-07, 2.7793970502898446e-07, 2.9224833042462706e-07, 3.065569273985602e-07, 3.2086558121591224e-07, 3.3517420661155484e-07, 3.49482803585488e-07, 3.637914289811306e-07, 3.781000543767732e-07, 3.9240865135070635e-07, 4.0671727674634894e-07, 4.2102590214199154e-07, 4.3533452753763413e-07, 4.496431529332767e-07, 4.639517499072099e-07, 4.782604037245619e-07, 4.925689722767856e-07, 5.068775976724282e-07, 5.211862230680708e-07, 5.354948484637134e-07, 5.498034170159372e-07, 5.641120424115798e-07, 5.784206678072223e-07, 5.927292932028649e-07, 6.070378617550887e-07, 6.213464871507313e-07, 6.356551125463739e-07, 6.499637379420165e-07, 6.64272363337659e-07, 6.785809887333016e-07, 6.928896141289442e-07, 7.07198182681168e-07, 7.215068080768106e-07, 7.358154334724532e-07, 7.501240588680957e-07, 7.644326842637383e-07, 7.787413096593809e-07]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 210.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 513.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 206.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 2.0, 8.0, 4.0, 7.0, 6.0, 19.0, 11.0, 14.0, 17.0, 24.0, 18.0, 22.0, 33.0, 44.0, 31.0, 41.0, 31.0, 36.0, 34.0, 39.0, 44.0, 49.0, 42.0, 36.0, 45.0, 39.0, 38.0, 34.0, 37.0, 29.0, 24.0, 23.0, 11.0, 29.0, 18.0, 14.0, 11.0, 10.0, 5.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.45703125, -4.32989501953125, -4.2027587890625, -4.07562255859375, -3.948486328125, -3.82135009765625, -3.6942138671875, -3.56707763671875, -3.43994140625, -3.31280517578125, -3.1856689453125, -3.05853271484375, -2.931396484375, -2.80426025390625, -2.6771240234375, -2.54998779296875, -2.4228515625, -2.29571533203125, -2.1685791015625, -2.04144287109375, -1.914306640625, -1.78717041015625, -1.6600341796875, -1.53289794921875, -1.40576171875, -1.27862548828125, -1.1514892578125, -1.02435302734375, -0.897216796875, -0.77008056640625, -0.6429443359375, -0.51580810546875, -0.388671875, -0.26153564453125, -0.1343994140625, -0.00726318359375, 0.119873046875, 0.24700927734375, 0.3741455078125, 0.50128173828125, 0.62841796875, 0.75555419921875, 0.8826904296875, 1.00982666015625, 1.136962890625, 1.26409912109375, 1.3912353515625, 1.51837158203125, 1.6455078125, 1.77264404296875, 1.8997802734375, 2.02691650390625, 2.154052734375, 2.28118896484375, 2.4083251953125, 2.53546142578125, 2.66259765625, 2.78973388671875, 2.9168701171875, 3.04400634765625, 3.171142578125, 3.29827880859375, 3.4254150390625, 3.55255126953125, 3.6796875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 12.0, 9.0, 24.0, 21.0, 30.0, 58.0, 49.0, 97.0, 173.0, 234.0, 413.0, 663.0, 1087.0, 1747.0, 3041.0, 5320.0, 9579.0, 17566.0, 32201.0, 61096.0, 127786.0, 293483.0, 261810.0, 111587.0, 55197.0, 28676.0, 15848.0, 8784.0, 4943.0, 2744.0, 1554.0, 1026.0, 610.0, 380.0, 228.0, 172.0, 97.0, 62.0, 48.0, 33.0, 20.0, 13.0, 13.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0, 5.0], "bins": [-5.05859375, -4.917755126953125, -4.77691650390625, -4.636077880859375, -4.4952392578125, -4.354400634765625, -4.21356201171875, -4.072723388671875, -3.931884765625, -3.791046142578125, -3.65020751953125, -3.509368896484375, -3.3685302734375, -3.227691650390625, -3.08685302734375, -2.946014404296875, -2.80517578125, -2.664337158203125, -2.52349853515625, -2.382659912109375, -2.2418212890625, -2.100982666015625, -1.96014404296875, -1.819305419921875, -1.678466796875, -1.537628173828125, -1.39678955078125, -1.255950927734375, -1.1151123046875, -0.974273681640625, -0.83343505859375, -0.692596435546875, -0.5517578125, -0.410919189453125, -0.27008056640625, -0.129241943359375, 0.0115966796875, 0.152435302734375, 0.29327392578125, 0.434112548828125, 0.574951171875, 0.715789794921875, 0.85662841796875, 0.997467041015625, 1.1383056640625, 1.279144287109375, 1.41998291015625, 1.560821533203125, 1.70166015625, 1.842498779296875, 1.98333740234375, 2.124176025390625, 2.2650146484375, 2.405853271484375, 2.54669189453125, 2.687530517578125, 2.828369140625, 2.969207763671875, 3.11004638671875, 3.250885009765625, 3.3917236328125, 3.532562255859375, 3.67340087890625, 3.814239501953125, 3.955078125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 11.0, 13.0, 19.0, 17.0, 19.0, 20.0, 13.0, 21.0, 23.0, 34.0, 32.0, 21.0, 53.0, 32.0, 48.0, 72.0, 111.0, 168.0, 1364.0, 281.0, 140.0, 83.0, 67.0, 45.0, 28.0, 28.0, 40.0, 28.0, 24.0, 27.0, 24.0, 23.0, 11.0, 16.0, 7.0, 14.0, 7.0, 4.0, 4.0, 8.0, 5.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.953125, -9.6397705078125, -9.326416015625, -9.0130615234375, -8.69970703125, -8.3863525390625, -8.072998046875, -7.7596435546875, -7.4462890625, -7.1329345703125, -6.819580078125, -6.5062255859375, -6.19287109375, -5.8795166015625, -5.566162109375, -5.2528076171875, -4.939453125, -4.6260986328125, -4.312744140625, -3.9993896484375, -3.68603515625, -3.3726806640625, -3.059326171875, -2.7459716796875, -2.4326171875, -2.1192626953125, -1.805908203125, -1.4925537109375, -1.17919921875, -0.8658447265625, -0.552490234375, -0.2391357421875, 0.07421875, 0.3875732421875, 0.700927734375, 1.0142822265625, 1.32763671875, 1.6409912109375, 1.954345703125, 2.2677001953125, 2.5810546875, 2.8944091796875, 3.207763671875, 3.5211181640625, 3.83447265625, 4.1478271484375, 4.461181640625, 4.7745361328125, 5.087890625, 5.4012451171875, 5.714599609375, 6.0279541015625, 6.34130859375, 6.6546630859375, 6.968017578125, 7.2813720703125, 7.5947265625, 7.9080810546875, 8.221435546875, 8.5347900390625, 8.84814453125, 9.1614990234375, 9.474853515625, 9.7882080078125, 10.1015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 8.0, 7.0, 6.0, 9.0, 9.0, 16.0, 26.0, 52.0, 74.0, 79.0, 136.0, 283.0, 650.0, 1900.0, 8966.0, 74472.0, 2212358.0, 797381.0, 40934.0, 5732.0, 1429.0, 516.0, 263.0, 137.0, 84.0, 56.0, 28.0, 33.0, 14.0, 16.0, 10.0, 6.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.671875, -17.13427734375, -16.5966796875, -16.05908203125, -15.521484375, -14.98388671875, -14.4462890625, -13.90869140625, -13.37109375, -12.83349609375, -12.2958984375, -11.75830078125, -11.220703125, -10.68310546875, -10.1455078125, -9.60791015625, -9.0703125, -8.53271484375, -7.9951171875, -7.45751953125, -6.919921875, -6.38232421875, -5.8447265625, -5.30712890625, -4.76953125, -4.23193359375, -3.6943359375, -3.15673828125, -2.619140625, -2.08154296875, -1.5439453125, -1.00634765625, -0.46875, 0.06884765625, 0.6064453125, 1.14404296875, 1.681640625, 2.21923828125, 2.7568359375, 3.29443359375, 3.83203125, 4.36962890625, 4.9072265625, 5.44482421875, 5.982421875, 6.52001953125, 7.0576171875, 7.59521484375, 8.1328125, 8.67041015625, 9.2080078125, 9.74560546875, 10.283203125, 10.82080078125, 11.3583984375, 11.89599609375, 12.43359375, 12.97119140625, 13.5087890625, 14.04638671875, 14.583984375, 15.12158203125, 15.6591796875, 16.19677734375, 16.734375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 372.0, 631.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-313.49932861328125, -306.0535888671875, -298.60784912109375, -291.1621398925781, -283.7164001464844, -276.2706604003906, -268.8249206542969, -261.37921142578125, -253.9334716796875, -246.48773193359375, -239.04200744628906, -231.5962677001953, -224.15054321289062, -216.70480346679688, -209.25906372070312, -201.81333923339844, -194.3675994873047, -186.92185974121094, -179.47613525390625, -172.0303955078125, -164.5846710205078, -157.13893127441406, -149.69320678710938, -142.24746704101562, -134.80172729492188, -127.35599517822266, -119.91026306152344, -112.46452331542969, -105.018798828125, -97.57305908203125, -90.12732696533203, -82.68159484863281, -75.23588562011719, -67.79015350341797, -60.34442138671875, -52.898685455322266, -45.45295333862305, -38.00722122192383, -30.561485290527344, -23.115753173828125, -15.670021057128906, -8.224287986755371, -0.7785549163818359, 6.667179107666016, 14.112911224365234, 21.558643341064453, 29.004379272460938, 36.450111389160156, 43.895843505859375, 51.341575622558594, 58.78730773925781, 66.23304748535156, 73.67877197265625, 81.12451171875, 88.57024383544922, 96.01597595214844, 103.46170806884766, 110.90744018554688, 118.3531723022461, 125.79890441894531, 133.24464416503906, 140.69036865234375, 148.1361083984375, 155.58184814453125, 163.02757263183594]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 7.0, 5.0, 6.0, 4.0, 4.0, 9.0, 13.0, 7.0, 23.0, 18.0, 19.0, 27.0, 16.0, 24.0, 22.0, 29.0, 38.0, 27.0, 17.0, 38.0, 32.0, 36.0, 35.0, 42.0, 32.0, 40.0, 49.0, 35.0, 36.0, 40.0, 30.0, 26.0, 27.0, 18.0, 21.0, 24.0, 15.0, 25.0, 8.0, 15.0, 8.0, 11.0, 7.0, 8.0, 8.0, 5.0, 5.0, 1.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-25.123313903808594, -24.28046417236328, -23.43761444091797, -22.594764709472656, -21.751914978027344, -20.90906524658203, -20.06621742248535, -19.22336769104004, -18.380517959594727, -17.537668228149414, -16.6948184967041, -15.851969718933105, -15.009119987487793, -14.16627025604248, -13.323421478271484, -12.480571746826172, -11.63772201538086, -10.794872283935547, -9.952022552490234, -9.109173774719238, -8.266324043273926, -7.423474311828613, -6.580625057220459, -5.737775802612305, -4.894926071166992, -4.05207633972168, -3.2092270851135254, -2.366377592086792, -1.5235280990600586, -0.6806783676147461, 0.1621708869934082, 1.0050201416015625, 1.8478717803955078, 2.690721273422241, 3.5335707664489746, 4.376420021057129, 5.219269752502441, 6.062119483947754, 6.904968738555908, 7.7478179931640625, 8.590667724609375, 9.433517456054688, 10.2763671875, 11.119215965270996, 11.962065696716309, 12.804915428161621, 13.647764205932617, 14.49061393737793, 15.333463668823242, 16.176313400268555, 17.019163131713867, 17.86201286315918, 18.70486068725586, 19.547710418701172, 20.390560150146484, 21.233409881591797, 22.07625961303711, 22.919109344482422, 23.761959075927734, 24.604808807373047, 25.44765853881836, 26.290508270263672, 27.13335609436035, 27.976205825805664, 28.819055557250977]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 2.0, 5.0, 12.0, 4.0, 11.0, 15.0, 8.0, 22.0, 35.0, 23.0, 30.0, 41.0, 37.0, 32.0, 42.0, 39.0, 38.0, 51.0, 37.0, 44.0, 50.0, 50.0, 42.0, 41.0, 40.0, 39.0, 28.0, 41.0, 24.0, 27.0, 15.0, 15.0, 17.0, 4.0, 7.0, 5.0, 7.0, 3.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.359375, -4.21771240234375, -4.0760498046875, -3.93438720703125, -3.792724609375, -3.65106201171875, -3.5093994140625, -3.36773681640625, -3.22607421875, -3.08441162109375, -2.9427490234375, -2.80108642578125, -2.659423828125, -2.51776123046875, -2.3760986328125, -2.23443603515625, -2.0927734375, -1.95111083984375, -1.8094482421875, -1.66778564453125, -1.526123046875, -1.38446044921875, -1.2427978515625, -1.10113525390625, -0.95947265625, -0.81781005859375, -0.6761474609375, -0.53448486328125, -0.392822265625, -0.25115966796875, -0.1094970703125, 0.03216552734375, 0.173828125, 0.31549072265625, 0.4571533203125, 0.59881591796875, 0.740478515625, 0.88214111328125, 1.0238037109375, 1.16546630859375, 1.30712890625, 1.44879150390625, 1.5904541015625, 1.73211669921875, 1.873779296875, 2.01544189453125, 2.1571044921875, 2.29876708984375, 2.4404296875, 2.58209228515625, 2.7237548828125, 2.86541748046875, 3.007080078125, 3.14874267578125, 3.2904052734375, 3.43206787109375, 3.57373046875, 3.71539306640625, 3.8570556640625, 3.99871826171875, 4.140380859375, 4.28204345703125, 4.4237060546875, 4.56536865234375, 4.70703125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 15.0, 8.0, 18.0, 16.0, 25.0, 33.0, 41.0, 77.0, 117.0, 208.0, 355.0, 826.0, 1753.0, 3763.0, 9224.0, 25273.0, 81691.0, 351133.0, 1683012.0, 1591082.0, 328251.0, 77283.0, 24034.0, 8979.0, 3735.0, 1592.0, 776.0, 386.0, 186.0, 107.0, 82.0, 50.0, 42.0, 25.0, 20.0, 15.0, 10.0, 7.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-7.8203125, -7.60882568359375, -7.3973388671875, -7.18585205078125, -6.974365234375, -6.76287841796875, -6.5513916015625, -6.33990478515625, -6.12841796875, -5.91693115234375, -5.7054443359375, -5.49395751953125, -5.282470703125, -5.07098388671875, -4.8594970703125, -4.64801025390625, -4.4365234375, -4.22503662109375, -4.0135498046875, -3.80206298828125, -3.590576171875, -3.37908935546875, -3.1676025390625, -2.95611572265625, -2.74462890625, -2.53314208984375, -2.3216552734375, -2.11016845703125, -1.898681640625, -1.68719482421875, -1.4757080078125, -1.26422119140625, -1.052734375, -0.84124755859375, -0.6297607421875, -0.41827392578125, -0.206787109375, 0.00469970703125, 0.2161865234375, 0.42767333984375, 0.63916015625, 0.85064697265625, 1.0621337890625, 1.27362060546875, 1.485107421875, 1.69659423828125, 1.9080810546875, 2.11956787109375, 2.3310546875, 2.54254150390625, 2.7540283203125, 2.96551513671875, 3.177001953125, 3.38848876953125, 3.5999755859375, 3.81146240234375, 4.02294921875, 4.23443603515625, 4.4459228515625, 4.65740966796875, 4.868896484375, 5.08038330078125, 5.2918701171875, 5.50335693359375, 5.71484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 7.0, 4.0, 10.0, 6.0, 9.0, 13.0, 25.0, 32.0, 30.0, 47.0, 53.0, 94.0, 105.0, 144.0, 198.0, 253.0, 349.0, 402.0, 460.0, 456.0, 336.0, 230.0, 222.0, 142.0, 118.0, 68.0, 83.0, 32.0, 34.0, 34.0, 14.0, 22.0, 7.0, 13.0, 7.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.9140625, -6.73529052734375, -6.5565185546875, -6.37774658203125, -6.198974609375, -6.02020263671875, -5.8414306640625, -5.66265869140625, -5.48388671875, -5.30511474609375, -5.1263427734375, -4.94757080078125, -4.768798828125, -4.59002685546875, -4.4112548828125, -4.23248291015625, -4.0537109375, -3.87493896484375, -3.6961669921875, -3.51739501953125, -3.338623046875, -3.15985107421875, -2.9810791015625, -2.80230712890625, -2.62353515625, -2.44476318359375, -2.2659912109375, -2.08721923828125, -1.908447265625, -1.72967529296875, -1.5509033203125, -1.37213134765625, -1.193359375, -1.01458740234375, -0.8358154296875, -0.65704345703125, -0.478271484375, -0.29949951171875, -0.1207275390625, 0.05804443359375, 0.23681640625, 0.41558837890625, 0.5943603515625, 0.77313232421875, 0.951904296875, 1.13067626953125, 1.3094482421875, 1.48822021484375, 1.6669921875, 1.84576416015625, 2.0245361328125, 2.20330810546875, 2.382080078125, 2.56085205078125, 2.7396240234375, 2.91839599609375, 3.09716796875, 3.27593994140625, 3.4547119140625, 3.63348388671875, 3.812255859375, 3.99102783203125, 4.1697998046875, 4.34857177734375, 4.52734375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 13.0, 11.0, 31.0, 39.0, 54.0, 78.0, 118.0, 207.0, 417.0, 932.0, 2482.0, 7798.0, 29577.0, 133964.0, 819511.0, 2597459.0, 484084.0, 88327.0, 20217.0, 5494.0, 1874.0, 738.0, 330.0, 172.0, 120.0, 80.0, 36.0, 36.0, 22.0, 13.0, 21.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.53955078125, -8.2275390625, -7.91552734375, -7.603515625, -7.29150390625, -6.9794921875, -6.66748046875, -6.35546875, -6.04345703125, -5.7314453125, -5.41943359375, -5.107421875, -4.79541015625, -4.4833984375, -4.17138671875, -3.859375, -3.54736328125, -3.2353515625, -2.92333984375, -2.611328125, -2.29931640625, -1.9873046875, -1.67529296875, -1.36328125, -1.05126953125, -0.7392578125, -0.42724609375, -0.115234375, 0.19677734375, 0.5087890625, 0.82080078125, 1.1328125, 1.44482421875, 1.7568359375, 2.06884765625, 2.380859375, 2.69287109375, 3.0048828125, 3.31689453125, 3.62890625, 3.94091796875, 4.2529296875, 4.56494140625, 4.876953125, 5.18896484375, 5.5009765625, 5.81298828125, 6.125, 6.43701171875, 6.7490234375, 7.06103515625, 7.373046875, 7.68505859375, 7.9970703125, 8.30908203125, 8.62109375, 8.93310546875, 9.2451171875, 9.55712890625, 9.869140625, 10.18115234375, 10.4931640625, 10.80517578125, 11.1171875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 9.0, 39.0, 140.0, 268.0, 300.0, 180.0, 61.0, 18.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.183257102966309, -12.715012550354004, -10.246768951416016, -7.778524398803711, -5.310279846191406, -2.8420352935791016, -0.3737916946411133, 2.0944528579711914, 4.562697410583496, 7.030941963195801, 9.499185562133789, 11.967430114746094, 14.435674667358398, 16.903919219970703, 19.372161865234375, 21.840408325195312, 24.308650970458984, 26.77689552307129, 29.245140075683594, 31.713382720947266, 34.1816291809082, 36.649871826171875, 39.11811828613281, 41.586360931396484, 44.05460739135742, 46.522850036621094, 48.99109649658203, 51.4593391418457, 53.92758560180664, 56.39582824707031, 58.86407470703125, 61.33231735229492, 63.800559997558594, 66.26880645751953, 68.73704528808594, 71.20529174804688, 73.67353820800781, 76.14178466796875, 78.61002349853516, 81.0782699584961, 83.54651641845703, 86.01476287841797, 88.48300170898438, 90.95124816894531, 93.41949462890625, 95.88774108886719, 98.3559799194336, 100.82422637939453, 103.29246520996094, 105.76071166992188, 108.22895050048828, 110.69719696044922, 113.16544342041016, 115.6336898803711, 118.1019287109375, 120.57017517089844, 123.03842163085938, 125.50666809082031, 127.97490692138672, 130.4431610107422, 132.91139221191406, 135.379638671875, 137.84788513183594, 140.31613159179688, 142.7843780517578]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 3.0, 13.0, 10.0, 9.0, 8.0, 15.0, 11.0, 18.0, 20.0, 21.0, 27.0, 31.0, 39.0, 37.0, 28.0, 38.0, 46.0, 36.0, 35.0, 37.0, 38.0, 47.0, 36.0, 46.0, 30.0, 39.0, 35.0, 37.0, 36.0, 24.0, 22.0, 26.0, 17.0, 13.0, 15.0, 15.0, 8.0, 9.0, 6.0, 9.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.587005615234375, -21.898597717285156, -21.210189819335938, -20.521780014038086, -19.833372116088867, -19.14496421813965, -18.456554412841797, -17.768146514892578, -17.07973861694336, -16.39133071899414, -15.702921867370605, -15.01451301574707, -14.326105117797852, -13.637697219848633, -12.949288368225098, -12.260879516601562, -11.572471618652344, -10.884063720703125, -10.19565486907959, -9.507246017456055, -8.818838119506836, -8.130430221557617, -7.442021369934082, -6.753612995147705, -6.065204620361328, -5.376796245574951, -4.688387870788574, -3.9999794960021973, -3.3115711212158203, -2.6231627464294434, -1.9347543716430664, -1.2463459968566895, -0.5579376220703125, 0.13047075271606445, 0.8188791275024414, 1.5072875022888184, 2.1956958770751953, 2.8841042518615723, 3.572512626647949, 4.260921001434326, 4.949329376220703, 5.63773775100708, 6.326146125793457, 7.014554500579834, 7.702962875366211, 8.39137077331543, 9.079779624938965, 9.7681884765625, 10.456596374511719, 11.145004272460938, 11.833413124084473, 12.521821975708008, 13.210229873657227, 13.898637771606445, 14.58704662322998, 15.275455474853516, 15.963863372802734, 16.652271270751953, 17.340679168701172, 18.029088973999023, 18.717496871948242, 19.40590476989746, 20.094314575195312, 20.78272247314453, 21.47113037109375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 11.0, 10.0, 10.0, 10.0, 17.0, 11.0, 17.0, 20.0, 20.0, 35.0, 25.0, 32.0, 28.0, 43.0, 40.0, 47.0, 35.0, 38.0, 29.0, 48.0, 43.0, 34.0, 30.0, 43.0, 43.0, 30.0, 23.0, 33.0, 25.0, 26.0, 17.0, 17.0, 20.0, 17.0, 14.0, 11.0, 10.0, 3.0, 10.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.1796875, -4.053131103515625, -3.92657470703125, -3.800018310546875, -3.6734619140625, -3.546905517578125, -3.42034912109375, -3.293792724609375, -3.167236328125, -3.040679931640625, -2.91412353515625, -2.787567138671875, -2.6610107421875, -2.534454345703125, -2.40789794921875, -2.281341552734375, -2.15478515625, -2.028228759765625, -1.90167236328125, -1.775115966796875, -1.6485595703125, -1.522003173828125, -1.39544677734375, -1.268890380859375, -1.142333984375, -1.015777587890625, -0.88922119140625, -0.762664794921875, -0.6361083984375, -0.509552001953125, -0.38299560546875, -0.256439208984375, -0.1298828125, -0.003326416015625, 0.12322998046875, 0.249786376953125, 0.3763427734375, 0.502899169921875, 0.62945556640625, 0.756011962890625, 0.882568359375, 1.009124755859375, 1.13568115234375, 1.262237548828125, 1.3887939453125, 1.515350341796875, 1.64190673828125, 1.768463134765625, 1.89501953125, 2.021575927734375, 2.14813232421875, 2.274688720703125, 2.4012451171875, 2.527801513671875, 2.65435791015625, 2.780914306640625, 2.907470703125, 3.034027099609375, 3.16058349609375, 3.287139892578125, 3.4136962890625, 3.540252685546875, 3.66680908203125, 3.793365478515625, 3.919921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 6.0, 13.0, 16.0, 26.0, 38.0, 60.0, 87.0, 125.0, 146.0, 248.0, 377.0, 491.0, 705.0, 967.0, 1375.0, 2073.0, 2790.0, 4038.0, 5676.0, 8261.0, 11843.0, 17278.0, 25465.0, 39294.0, 63338.0, 108492.0, 242773.0, 228988.0, 104197.0, 61344.0, 38121.0, 24658.0, 16814.0, 11521.0, 8012.0, 5657.0, 3923.0, 2772.0, 1927.0, 1403.0, 962.0, 691.0, 444.0, 331.0, 228.0, 180.0, 127.0, 81.0, 53.0, 36.0, 32.0, 26.0, 11.0, 13.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.028778076171875, -0.02784872055053711, -0.02691936492919922, -0.025990009307861328, -0.025060653686523438, -0.024131298065185547, -0.023201942443847656, -0.022272586822509766, -0.021343231201171875, -0.020413875579833984, -0.019484519958496094, -0.018555164337158203, -0.017625808715820312, -0.016696453094482422, -0.01576709747314453, -0.01483774185180664, -0.01390838623046875, -0.01297903060913086, -0.012049674987792969, -0.011120319366455078, -0.010190963745117188, -0.009261608123779297, -0.008332252502441406, -0.007402896881103516, -0.006473541259765625, -0.005544185638427734, -0.004614830017089844, -0.003685474395751953, -0.0027561187744140625, -0.0018267631530761719, -0.0008974075317382812, 3.1948089599609375e-05, 0.0009613037109375, 0.0018906593322753906, 0.0028200149536132812, 0.003749370574951172, 0.0046787261962890625, 0.005608081817626953, 0.006537437438964844, 0.007466793060302734, 0.008396148681640625, 0.009325504302978516, 0.010254859924316406, 0.011184215545654297, 0.012113571166992188, 0.013042926788330078, 0.013972282409667969, 0.01490163803100586, 0.01583099365234375, 0.01676034927368164, 0.01768970489501953, 0.018619060516357422, 0.019548416137695312, 0.020477771759033203, 0.021407127380371094, 0.022336483001708984, 0.023265838623046875, 0.024195194244384766, 0.025124549865722656, 0.026053905487060547, 0.026983261108398438, 0.027912616729736328, 0.02884197235107422, 0.02977132797241211, 0.03070068359375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 10.0, 4.0, 12.0, 9.0, 8.0, 8.0, 19.0, 22.0, 20.0, 23.0, 20.0, 21.0, 24.0, 26.0, 36.0, 42.0, 33.0, 35.0, 39.0, 31.0, 1070.0, 37.0, 35.0, 40.0, 41.0, 35.0, 42.0, 32.0, 31.0, 27.0, 25.0, 29.0, 17.0, 26.0, 9.0, 18.0, 14.0, 13.0, 9.0, 6.0, 10.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.37890625, -2.3016357421875, -2.224365234375, -2.1470947265625, -2.06982421875, -1.9925537109375, -1.915283203125, -1.8380126953125, -1.7607421875, -1.6834716796875, -1.606201171875, -1.5289306640625, -1.45166015625, -1.3743896484375, -1.297119140625, -1.2198486328125, -1.142578125, -1.0653076171875, -0.988037109375, -0.9107666015625, -0.83349609375, -0.7562255859375, -0.678955078125, -0.6016845703125, -0.5244140625, -0.4471435546875, -0.369873046875, -0.2926025390625, -0.21533203125, -0.1380615234375, -0.060791015625, 0.0164794921875, 0.09375, 0.1710205078125, 0.248291015625, 0.3255615234375, 0.40283203125, 0.4801025390625, 0.557373046875, 0.6346435546875, 0.7119140625, 0.7891845703125, 0.866455078125, 0.9437255859375, 1.02099609375, 1.0982666015625, 1.175537109375, 1.2528076171875, 1.330078125, 1.4073486328125, 1.484619140625, 1.5618896484375, 1.63916015625, 1.7164306640625, 1.793701171875, 1.8709716796875, 1.9482421875, 2.0255126953125, 2.102783203125, 2.1800537109375, 2.25732421875, 2.3345947265625, 2.411865234375, 2.4891357421875, 2.56640625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 6.0, 6.0, 7.0, 9.0, 28.0, 26.0, 43.0, 52.0, 95.0, 112.0, 179.0, 258.0, 339.0, 467.0, 740.0, 1046.0, 1386.0, 1929.0, 2709.0, 3727.0, 5126.0, 7288.0, 9998.0, 14120.0, 20488.0, 30583.0, 46520.0, 74535.0, 132154.0, 1299114.0, 177698.0, 92493.0, 55990.0, 36219.0, 24275.0, 16649.0, 11326.0, 8372.0, 5985.0, 4235.0, 3088.0, 2232.0, 1602.0, 1152.0, 831.0, 604.0, 396.0, 292.0, 186.0, 132.0, 102.0, 57.0, 46.0, 34.0, 24.0, 16.0, 8.0, 9.0, 2.0, 3.0, 3.0], "bins": [-0.0184478759765625, -0.017883777618408203, -0.017319679260253906, -0.01675558090209961, -0.016191482543945312, -0.015627384185791016, -0.015063285827636719, -0.014499187469482422, -0.013935089111328125, -0.013370990753173828, -0.012806892395019531, -0.012242794036865234, -0.011678695678710938, -0.01111459732055664, -0.010550498962402344, -0.009986400604248047, -0.00942230224609375, -0.008858203887939453, -0.008294105529785156, -0.007730007171630859, -0.0071659088134765625, -0.006601810455322266, -0.006037712097167969, -0.005473613739013672, -0.004909515380859375, -0.004345417022705078, -0.0037813186645507812, -0.0032172203063964844, -0.0026531219482421875, -0.0020890235900878906, -0.0015249252319335938, -0.0009608268737792969, -0.000396728515625, 0.00016736984252929688, 0.0007314682006835938, 0.0012955665588378906, 0.0018596649169921875, 0.0024237632751464844, 0.0029878616333007812, 0.003551959991455078, 0.004116058349609375, 0.004680156707763672, 0.005244255065917969, 0.005808353424072266, 0.0063724517822265625, 0.006936550140380859, 0.007500648498535156, 0.008064746856689453, 0.00862884521484375, 0.009192943572998047, 0.009757041931152344, 0.01032114028930664, 0.010885238647460938, 0.011449337005615234, 0.012013435363769531, 0.012577533721923828, 0.013141632080078125, 0.013705730438232422, 0.014269828796386719, 0.014833927154541016, 0.015398025512695312, 0.01596212387084961, 0.016526222229003906, 0.017090320587158203, 0.0176544189453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 0.0, 70.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 0.0, 0.0, 353.0, 0.0, 0.0, 0.0, 0.0, 185.0, 0.0, 0.0, 0.0, 103.0, 0.0, 0.0, 0.0, 0.0, 37.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4458935260772705e-07, -3.3155083656311035e-07, -3.1851232051849365e-07, -3.0547380447387695e-07, -2.9243528842926025e-07, -2.7939677238464355e-07, -2.6635825634002686e-07, -2.5331974029541016e-07, -2.4028122425079346e-07, -2.2724270820617676e-07, -2.1420419216156006e-07, -2.0116567611694336e-07, -1.8812716007232666e-07, -1.7508864402770996e-07, -1.6205012798309326e-07, -1.4901161193847656e-07, -1.3597309589385986e-07, -1.2293457984924316e-07, -1.0989606380462646e-07, -9.685754776000977e-08, -8.381903171539307e-08, -7.078051567077637e-08, -5.774199962615967e-08, -4.470348358154297e-08, -3.166496753692627e-08, -1.862645149230957e-08, -5.587935447692871e-09, 7.450580596923828e-09, 2.0489096641540527e-08, 3.3527612686157227e-08, 4.6566128730773926e-08, 5.960464477539063e-08, 7.264316082000732e-08, 8.568167686462402e-08, 9.872019290924072e-08, 1.1175870895385742e-07, 1.2479722499847412e-07, 1.3783574104309082e-07, 1.5087425708770752e-07, 1.6391277313232422e-07, 1.7695128917694092e-07, 1.8998980522155762e-07, 2.0302832126617432e-07, 2.1606683731079102e-07, 2.2910535335540771e-07, 2.421438694000244e-07, 2.551823854446411e-07, 2.682209014892578e-07, 2.812594175338745e-07, 2.942979335784912e-07, 3.073364496231079e-07, 3.203749656677246e-07, 3.334134817123413e-07, 3.46451997756958e-07, 3.594905138015747e-07, 3.725290298461914e-07, 3.855675458908081e-07, 3.986060619354248e-07, 4.116445779800415e-07, 4.246830940246582e-07, 4.377216100692749e-07, 4.507601261138916e-07, 4.637986421585083e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 4.0, 3.0, 12.0, 22.0, 8.0, 12.0, 14.0, 57.0, 52.0, 36.0, 51.0, 91.0, 201.0, 169.0, 460.0, 2119.0, 216756.0, 825135.0, 2222.0, 360.0, 260.0, 192.0, 82.0, 32.0, 20.0, 37.0, 41.0, 13.0, 13.0, 8.0, 19.0, 9.0, 4.0, 3.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.715557098388672e-06, -9.43802297115326e-06, -9.160488843917847e-06, -8.882954716682434e-06, -8.605420589447021e-06, -8.327886462211609e-06, -8.050352334976196e-06, -7.772818207740784e-06, -7.495284080505371e-06, -7.2177499532699585e-06, -6.940215826034546e-06, -6.662681698799133e-06, -6.385147571563721e-06, -6.107613444328308e-06, -5.8300793170928955e-06, -5.552545189857483e-06, -5.27501106262207e-06, -4.997476935386658e-06, -4.719942808151245e-06, -4.4424086809158325e-06, -4.16487455368042e-06, -3.887340426445007e-06, -3.6098062992095947e-06, -3.332272171974182e-06, -3.0547380447387695e-06, -2.777203917503357e-06, -2.4996697902679443e-06, -2.2221356630325317e-06, -1.944601535797119e-06, -1.6670674085617065e-06, -1.389533281326294e-06, -1.1119991540908813e-06, -8.344650268554688e-07, -5.569308996200562e-07, -2.7939677238464355e-07, -1.862645149230957e-09, 2.7567148208618164e-07, 5.532056093215942e-07, 8.307397365570068e-07, 1.1082738637924194e-06, 1.385807991027832e-06, 1.6633421182632446e-06, 1.9408762454986572e-06, 2.21841037273407e-06, 2.4959444999694824e-06, 2.773478627204895e-06, 3.0510127544403076e-06, 3.3285468816757202e-06, 3.606081008911133e-06, 3.883615136146545e-06, 4.161149263381958e-06, 4.438683390617371e-06, 4.716217517852783e-06, 4.993751645088196e-06, 5.271285772323608e-06, 5.548819899559021e-06, 5.826354026794434e-06, 6.103888154029846e-06, 6.381422281265259e-06, 6.658956408500671e-06, 6.936490535736084e-06, 7.214024662971497e-06, 7.491558790206909e-06, 7.769092917442322e-06, 8.046627044677734e-06]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 24.0, 83.0, 156.0, 620.0, 86.0, 25.0, 11.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2872408206021646e-06, -1.2604533594640088e-06, -1.233665898325853e-06, -1.2068784371876973e-06, -1.1800909760495415e-06, -1.1533035149113857e-06, -1.12651605377323e-06, -1.0997287063219119e-06, -1.0729412451837561e-06, -1.0461537840456003e-06, -1.0193663229074446e-06, -9.925788617692888e-07, -9.65791400631133e-07, -9.390039963363961e-07, -9.122165351982403e-07, -8.854290740600845e-07, -8.586415560785099e-07, -8.318540949403541e-07, -8.050666338021983e-07, -7.782791726640426e-07, -7.514917683693056e-07, -7.247043072311499e-07, -6.979168460929941e-07, -6.711293849548383e-07, -6.443419806601014e-07, -6.175545195219456e-07, -5.907670583837898e-07, -5.639795972456341e-07, -5.371921929508972e-07, -5.104047318127414e-07, -4.836172706745856e-07, -4.568298095364298e-07, -4.3004234839827404e-07, -4.0325488726011827e-07, -3.764674545436719e-07, -3.4967999340551614e-07, -3.2289253226736037e-07, -2.96105099550914e-07, -2.6931763841275824e-07, -2.4253017727460247e-07, -2.157427303473014e-07, -1.8895528342000034e-07, -1.6216782228184456e-07, -1.353803753545435e-07, -1.0859292132181508e-07, -8.180546728908666e-08, -5.50180203617856e-08, -2.8230559223629825e-08, -1.4431122963287635e-09, 2.5344339960042817e-08, 5.2131792216414397e-08, 7.891924269642914e-08, 1.0570669672915756e-07, 1.3249415076188598e-07, 1.5928159768918704e-07, 1.8606905882734281e-07, 2.1285650575464388e-07, 2.3964395268194494e-07, 2.664314138201007e-07, 2.932188749582565e-07, 3.2000630767470284e-07, 3.467937688128586e-07, 3.7358120152930496e-07, 4.0036866266746074e-07, 4.271561238056165e-07]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 202.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 530.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 220.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 11.0, 10.0, 10.0, 10.0, 17.0, 11.0, 17.0, 20.0, 20.0, 35.0, 25.0, 32.0, 28.0, 43.0, 40.0, 47.0, 35.0, 38.0, 29.0, 48.0, 43.0, 34.0, 30.0, 43.0, 43.0, 30.0, 23.0, 33.0, 25.0, 26.0, 17.0, 17.0, 20.0, 17.0, 14.0, 11.0, 10.0, 3.0, 10.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.1796875, -4.053131103515625, -3.92657470703125, -3.800018310546875, -3.6734619140625, -3.546905517578125, -3.42034912109375, -3.293792724609375, -3.167236328125, -3.040679931640625, -2.91412353515625, -2.787567138671875, -2.6610107421875, -2.534454345703125, -2.40789794921875, -2.281341552734375, -2.15478515625, -2.028228759765625, -1.90167236328125, -1.775115966796875, -1.6485595703125, -1.522003173828125, -1.39544677734375, -1.268890380859375, -1.142333984375, -1.015777587890625, -0.88922119140625, -0.762664794921875, -0.6361083984375, -0.509552001953125, -0.38299560546875, -0.256439208984375, -0.1298828125, -0.003326416015625, 0.12322998046875, 0.249786376953125, 0.3763427734375, 0.502899169921875, 0.62945556640625, 0.756011962890625, 0.882568359375, 1.009124755859375, 1.13568115234375, 1.262237548828125, 1.3887939453125, 1.515350341796875, 1.64190673828125, 1.768463134765625, 1.89501953125, 2.021575927734375, 2.14813232421875, 2.274688720703125, 2.4012451171875, 2.527801513671875, 2.65435791015625, 2.780914306640625, 2.907470703125, 3.034027099609375, 3.16058349609375, 3.287139892578125, 3.4136962890625, 3.540252685546875, 3.66680908203125, 3.793365478515625, 3.919921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 7.0, 12.0, 25.0, 34.0, 45.0, 60.0, 71.0, 135.0, 185.0, 337.0, 551.0, 902.0, 1626.0, 2686.0, 4888.0, 8688.0, 14945.0, 26603.0, 47953.0, 90558.0, 200414.0, 318255.0, 159319.0, 76087.0, 40768.0, 22919.0, 12959.0, 7334.0, 4254.0, 2426.0, 1364.0, 772.0, 485.0, 306.0, 182.0, 118.0, 70.0, 50.0, 33.0, 16.0, 21.0, 19.0, 16.0, 16.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0], "bins": [-5.1484375, -4.9893798828125, -4.830322265625, -4.6712646484375, -4.51220703125, -4.3531494140625, -4.194091796875, -4.0350341796875, -3.8759765625, -3.7169189453125, -3.557861328125, -3.3988037109375, -3.23974609375, -3.0806884765625, -2.921630859375, -2.7625732421875, -2.603515625, -2.4444580078125, -2.285400390625, -2.1263427734375, -1.96728515625, -1.8082275390625, -1.649169921875, -1.4901123046875, -1.3310546875, -1.1719970703125, -1.012939453125, -0.8538818359375, -0.69482421875, -0.5357666015625, -0.376708984375, -0.2176513671875, -0.05859375, 0.1004638671875, 0.259521484375, 0.4185791015625, 0.57763671875, 0.7366943359375, 0.895751953125, 1.0548095703125, 1.2138671875, 1.3729248046875, 1.531982421875, 1.6910400390625, 1.85009765625, 2.0091552734375, 2.168212890625, 2.3272705078125, 2.486328125, 2.6453857421875, 2.804443359375, 2.9635009765625, 3.12255859375, 3.2816162109375, 3.440673828125, 3.5997314453125, 3.7587890625, 3.9178466796875, 4.076904296875, 4.2359619140625, 4.39501953125, 4.5540771484375, 4.713134765625, 4.8721923828125, 5.03125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 4.0, 1.0, 12.0, 9.0, 7.0, 8.0, 24.0, 21.0, 27.0, 35.0, 47.0, 46.0, 41.0, 71.0, 70.0, 85.0, 196.0, 1401.0, 328.0, 150.0, 90.0, 70.0, 56.0, 51.0, 40.0, 33.0, 23.0, 20.0, 20.0, 24.0, 8.0, 13.0, 12.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-15.7421875, -15.3270263671875, -14.911865234375, -14.4967041015625, -14.08154296875, -13.6663818359375, -13.251220703125, -12.8360595703125, -12.4208984375, -12.0057373046875, -11.590576171875, -11.1754150390625, -10.76025390625, -10.3450927734375, -9.929931640625, -9.5147705078125, -9.099609375, -8.6844482421875, -8.269287109375, -7.8541259765625, -7.43896484375, -7.0238037109375, -6.608642578125, -6.1934814453125, -5.7783203125, -5.3631591796875, -4.947998046875, -4.5328369140625, -4.11767578125, -3.7025146484375, -3.287353515625, -2.8721923828125, -2.45703125, -2.0418701171875, -1.626708984375, -1.2115478515625, -0.79638671875, -0.3812255859375, 0.033935546875, 0.4490966796875, 0.8642578125, 1.2794189453125, 1.694580078125, 2.1097412109375, 2.52490234375, 2.9400634765625, 3.355224609375, 3.7703857421875, 4.185546875, 4.6007080078125, 5.015869140625, 5.4310302734375, 5.84619140625, 6.2613525390625, 6.676513671875, 7.0916748046875, 7.5068359375, 7.9219970703125, 8.337158203125, 8.7523193359375, 9.16748046875, 9.5826416015625, 9.997802734375, 10.4129638671875, 10.828125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 10.0, 13.0, 13.0, 14.0, 28.0, 38.0, 31.0, 68.0, 84.0, 118.0, 171.0, 329.0, 841.0, 3531.0, 23201.0, 231027.0, 2651640.0, 208032.0, 21431.0, 3271.0, 774.0, 336.0, 197.0, 131.0, 73.0, 62.0, 55.0, 44.0, 21.0, 26.0, 13.0, 16.0, 13.0, 4.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-17.390625, -16.855224609375, -16.31982421875, -15.784423828125, -15.2490234375, -14.713623046875, -14.17822265625, -13.642822265625, -13.107421875, -12.572021484375, -12.03662109375, -11.501220703125, -10.9658203125, -10.430419921875, -9.89501953125, -9.359619140625, -8.82421875, -8.288818359375, -7.75341796875, -7.218017578125, -6.6826171875, -6.147216796875, -5.61181640625, -5.076416015625, -4.541015625, -4.005615234375, -3.47021484375, -2.934814453125, -2.3994140625, -1.864013671875, -1.32861328125, -0.793212890625, -0.2578125, 0.277587890625, 0.81298828125, 1.348388671875, 1.8837890625, 2.419189453125, 2.95458984375, 3.489990234375, 4.025390625, 4.560791015625, 5.09619140625, 5.631591796875, 6.1669921875, 6.702392578125, 7.23779296875, 7.773193359375, 8.30859375, 8.843994140625, 9.37939453125, 9.914794921875, 10.4501953125, 10.985595703125, 11.52099609375, 12.056396484375, 12.591796875, 13.127197265625, 13.66259765625, 14.197998046875, 14.7333984375, 15.268798828125, 15.80419921875, 16.339599609375, 16.875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 23.0, 90.0, 230.0, 372.0, 198.0, 83.0, 15.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.21612548828125, -117.83573913574219, -115.45536041259766, -113.0749740600586, -110.69458770751953, -108.314208984375, -105.93382263183594, -103.55343627929688, -101.17305755615234, -98.79267120361328, -96.41229248046875, -94.03190612792969, -91.65151977539062, -89.2711410522461, -86.89075469970703, -84.5103759765625, -82.12998962402344, -79.74960327148438, -77.36922454833984, -74.98883819580078, -72.60845184326172, -70.22807312011719, -67.84768676757812, -65.46730041503906, -63.0869140625, -60.7065315246582, -58.32614517211914, -55.945762634277344, -53.56538009643555, -51.18499755859375, -48.80461120605469, -46.42422866821289, -44.04384994506836, -41.66346740722656, -39.2830810546875, -36.9026985168457, -34.522315979003906, -32.141929626464844, -29.761547088623047, -27.38116455078125, -25.00078010559082, -22.62039566040039, -20.240013122558594, -17.859628677368164, -15.47924518585205, -13.098861694335938, -10.718477249145508, -8.338094711303711, -5.957710266113281, -3.577326536178589, -1.1969428062438965, 1.183441162109375, 3.5638246536254883, 5.944208145141602, 8.324592590332031, 10.704975128173828, 13.085359573364258, 15.465743064880371, 17.846126556396484, 20.226511001586914, 22.606895446777344, 24.98727798461914, 27.36766242980957, 29.748044967651367, 32.1284294128418]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 9.0, 8.0, 13.0, 19.0, 15.0, 21.0, 21.0, 19.0, 33.0, 30.0, 40.0, 38.0, 34.0, 46.0, 40.0, 42.0, 50.0, 47.0, 39.0, 59.0, 36.0, 40.0, 51.0, 35.0, 30.0, 36.0, 30.0, 22.0, 25.0, 15.0, 13.0, 12.0, 10.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.5267333984375, -35.580589294433594, -34.63444519042969, -33.68830108642578, -32.742156982421875, -31.79601287841797, -30.849868774414062, -29.903724670410156, -28.95758056640625, -28.011436462402344, -27.065292358398438, -26.11914825439453, -25.173004150390625, -24.22686004638672, -23.280715942382812, -22.334571838378906, -21.388427734375, -20.442283630371094, -19.496139526367188, -18.54999542236328, -17.603851318359375, -16.65770721435547, -15.711563110351562, -14.765419006347656, -13.81927490234375, -12.873130798339844, -11.926986694335938, -10.980842590332031, -10.034698486328125, -9.088554382324219, -8.142410278320312, -7.196266174316406, -6.2501220703125, -5.303977966308594, -4.3578338623046875, -3.4116897583007812, -2.465545654296875, -1.5194015502929688, -0.5732574462890625, 0.37288665771484375, 1.31903076171875, 2.2651748657226562, 3.2113189697265625, 4.157463073730469, 5.103607177734375, 6.049751281738281, 6.9958953857421875, 7.942039489746094, 8.88818359375, 9.834327697753906, 10.780471801757812, 11.726615905761719, 12.672760009765625, 13.618904113769531, 14.565048217773438, 15.511192321777344, 16.45733642578125, 17.403480529785156, 18.349624633789062, 19.29576873779297, 20.241912841796875, 21.18805694580078, 22.134201049804688, 23.080345153808594, 24.0264892578125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 3.0, 16.0, 11.0, 7.0, 19.0, 15.0, 17.0, 20.0, 24.0, 37.0, 30.0, 31.0, 40.0, 45.0, 32.0, 33.0, 43.0, 47.0, 39.0, 40.0, 49.0, 42.0, 43.0, 46.0, 33.0, 33.0, 26.0, 19.0, 29.0, 21.0, 18.0, 14.0, 17.0, 8.0, 13.0, 11.0, 6.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.59375, -4.45587158203125, -4.3179931640625, -4.18011474609375, -4.042236328125, -3.90435791015625, -3.7664794921875, -3.62860107421875, -3.49072265625, -3.35284423828125, -3.2149658203125, -3.07708740234375, -2.939208984375, -2.80133056640625, -2.6634521484375, -2.52557373046875, -2.3876953125, -2.24981689453125, -2.1119384765625, -1.97406005859375, -1.836181640625, -1.69830322265625, -1.5604248046875, -1.42254638671875, -1.28466796875, -1.14678955078125, -1.0089111328125, -0.87103271484375, -0.733154296875, -0.59527587890625, -0.4573974609375, -0.31951904296875, -0.181640625, -0.04376220703125, 0.0941162109375, 0.23199462890625, 0.369873046875, 0.50775146484375, 0.6456298828125, 0.78350830078125, 0.92138671875, 1.05926513671875, 1.1971435546875, 1.33502197265625, 1.472900390625, 1.61077880859375, 1.7486572265625, 1.88653564453125, 2.0244140625, 2.16229248046875, 2.3001708984375, 2.43804931640625, 2.575927734375, 2.71380615234375, 2.8516845703125, 2.98956298828125, 3.12744140625, 3.26531982421875, 3.4031982421875, 3.54107666015625, 3.678955078125, 3.81683349609375, 3.9547119140625, 4.09259033203125, 4.23046875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 9.0, 17.0, 26.0, 17.0, 23.0, 31.0, 38.0, 59.0, 69.0, 94.0, 150.0, 210.0, 316.0, 458.0, 2540.0, 4015533.0, 172382.0, 918.0, 405.0, 296.0, 170.0, 128.0, 88.0, 60.0, 47.0, 41.0, 36.0, 28.0, 18.0, 15.0, 11.0, 7.0, 8.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-68.25, -66.44482421875, -64.6396484375, -62.83447265625, -61.029296875, -59.22412109375, -57.4189453125, -55.61376953125, -53.80859375, -52.00341796875, -50.1982421875, -48.39306640625, -46.587890625, -44.78271484375, -42.9775390625, -41.17236328125, -39.3671875, -37.56201171875, -35.7568359375, -33.95166015625, -32.146484375, -30.34130859375, -28.5361328125, -26.73095703125, -24.92578125, -23.12060546875, -21.3154296875, -19.51025390625, -17.705078125, -15.89990234375, -14.0947265625, -12.28955078125, -10.484375, -8.67919921875, -6.8740234375, -5.06884765625, -3.263671875, -1.45849609375, 0.3466796875, 2.15185546875, 3.95703125, 5.76220703125, 7.5673828125, 9.37255859375, 11.177734375, 12.98291015625, 14.7880859375, 16.59326171875, 18.3984375, 20.20361328125, 22.0087890625, 23.81396484375, 25.619140625, 27.42431640625, 29.2294921875, 31.03466796875, 32.83984375, 34.64501953125, 36.4501953125, 38.25537109375, 40.060546875, 41.86572265625, 43.6708984375, 45.47607421875, 47.28125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 11.0, 9.0, 17.0, 16.0, 26.0, 38.0, 41.0, 67.0, 87.0, 128.0, 212.0, 259.0, 418.0, 571.0, 574.0, 482.0, 334.0, 224.0, 153.0, 114.0, 82.0, 58.0, 40.0, 23.0, 22.0, 20.0, 14.0, 9.0, 5.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.0859375, -6.87933349609375, -6.6727294921875, -6.46612548828125, -6.259521484375, -6.05291748046875, -5.8463134765625, -5.63970947265625, -5.43310546875, -5.22650146484375, -5.0198974609375, -4.81329345703125, -4.606689453125, -4.40008544921875, -4.1934814453125, -3.98687744140625, -3.7802734375, -3.57366943359375, -3.3670654296875, -3.16046142578125, -2.953857421875, -2.74725341796875, -2.5406494140625, -2.33404541015625, -2.12744140625, -1.92083740234375, -1.7142333984375, -1.50762939453125, -1.301025390625, -1.09442138671875, -0.8878173828125, -0.68121337890625, -0.474609375, -0.26800537109375, -0.0614013671875, 0.14520263671875, 0.351806640625, 0.55841064453125, 0.7650146484375, 0.97161865234375, 1.17822265625, 1.38482666015625, 1.5914306640625, 1.79803466796875, 2.004638671875, 2.21124267578125, 2.4178466796875, 2.62445068359375, 2.8310546875, 3.03765869140625, 3.2442626953125, 3.45086669921875, 3.657470703125, 3.86407470703125, 4.0706787109375, 4.27728271484375, 4.48388671875, 4.69049072265625, 4.8970947265625, 5.10369873046875, 5.310302734375, 5.51690673828125, 5.7235107421875, 5.93011474609375, 6.13671875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 8.0, 6.0, 16.0, 6.0, 20.0, 27.0, 29.0, 25.0, 61.0, 59.0, 85.0, 156.0, 354.0, 1727.0, 20529.0, 523786.0, 3521184.0, 117907.0, 6744.0, 828.0, 271.0, 110.0, 86.0, 50.0, 34.0, 34.0, 25.0, 20.0, 16.0, 14.0, 8.0, 10.0, 4.0, 13.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -15.982666015625, -15.32470703125, -14.666748046875, -14.0087890625, -13.350830078125, -12.69287109375, -12.034912109375, -11.376953125, -10.718994140625, -10.06103515625, -9.403076171875, -8.7451171875, -8.087158203125, -7.42919921875, -6.771240234375, -6.11328125, -5.455322265625, -4.79736328125, -4.139404296875, -3.4814453125, -2.823486328125, -2.16552734375, -1.507568359375, -0.849609375, -0.191650390625, 0.46630859375, 1.124267578125, 1.7822265625, 2.440185546875, 3.09814453125, 3.756103515625, 4.4140625, 5.072021484375, 5.72998046875, 6.387939453125, 7.0458984375, 7.703857421875, 8.36181640625, 9.019775390625, 9.677734375, 10.335693359375, 10.99365234375, 11.651611328125, 12.3095703125, 12.967529296875, 13.62548828125, 14.283447265625, 14.94140625, 15.599365234375, 16.25732421875, 16.915283203125, 17.5732421875, 18.231201171875, 18.88916015625, 19.547119140625, 20.205078125, 20.863037109375, 21.52099609375, 22.178955078125, 22.8369140625, 23.494873046875, 24.15283203125, 24.810791015625, 25.46875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 10.0, 16.0, 31.0, 36.0, 52.0, 102.0, 124.0, 134.0, 150.0, 132.0, 80.0, 63.0, 36.0, 14.0, 16.0, 6.0, 10.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.466529846191406, -35.505558013916016, -34.54458999633789, -33.5836181640625, -32.622650146484375, -31.661678314208984, -30.700706481933594, -29.739736557006836, -28.778766632080078, -27.81779670715332, -26.856826782226562, -25.895854949951172, -24.934885025024414, -23.973915100097656, -23.012943267822266, -22.051973342895508, -21.09100341796875, -20.130033493041992, -19.169063568115234, -18.208091735839844, -17.247121810913086, -16.286151885986328, -15.325181007385254, -14.36421012878418, -13.403240203857422, -12.442270278930664, -11.48129940032959, -10.520328521728516, -9.559358596801758, -8.598388671875, -7.637417793273926, -6.67644739151001, -5.715475082397461, -4.754504680633545, -3.793534278869629, -2.832563877105713, -1.8715934753417969, -0.9106230735778809, 0.050347328186035156, 1.0113177299499512, 1.9722881317138672, 2.933258533477783, 3.894228935241699, 4.855199337005615, 5.816169738769531, 6.777140140533447, 7.738110542297363, 8.699081420898438, 9.660051345825195, 10.621021270751953, 11.581992149353027, 12.542963027954102, 13.50393295288086, 14.464902877807617, 15.425873756408691, 16.386844635009766, 17.347814559936523, 18.30878448486328, 19.269756317138672, 20.23072624206543, 21.191696166992188, 22.152666091918945, 23.113636016845703, 24.074607849121094, 25.03557777404785]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 8.0, 9.0, 12.0, 13.0, 16.0, 11.0, 23.0, 27.0, 25.0, 23.0, 25.0, 40.0, 40.0, 37.0, 42.0, 38.0, 45.0, 50.0, 46.0, 41.0, 36.0, 40.0, 44.0, 37.0, 24.0, 25.0, 31.0, 19.0, 16.0, 22.0, 26.0, 12.0, 15.0, 13.0, 16.0, 6.0, 7.0, 7.0, 4.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-20.051612854003906, -19.437625885009766, -18.823638916015625, -18.209651947021484, -17.595666885375977, -16.981679916381836, -16.367692947387695, -15.753705978393555, -15.139719009399414, -14.525732040405273, -13.91174602508545, -13.297759056091309, -12.683772087097168, -12.069786071777344, -11.455799102783203, -10.841812133789062, -10.227826118469238, -9.613839149475098, -8.999853134155273, -8.385866165161133, -7.771879196166992, -7.15789270401001, -6.543906211853027, -5.929919242858887, -5.315932750701904, -4.701946258544922, -4.087959289550781, -3.473972797393799, -2.8599860668182373, -2.245999336242676, -1.6320128440856934, -1.0180258750915527, -0.4040393829345703, 0.20994728803634644, 0.8239339590072632, 1.4379205703735352, 2.0519073009490967, 2.665894031524658, 3.2798805236816406, 3.8938674926757812, 4.507853984832764, 5.121840476989746, 5.735827445983887, 6.349813938140869, 6.963800430297852, 7.577787399291992, 8.191774368286133, 8.805761337280273, 9.419747352600098, 10.033734321594238, 10.647720336914062, 11.261707305908203, 11.875694274902344, 12.489681243896484, 13.103667259216309, 13.71765422821045, 14.331640243530273, 14.945627212524414, 15.559613227844238, 16.173599243164062, 16.787586212158203, 17.401573181152344, 18.015560150146484, 18.629547119140625, 19.243534088134766]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 13.0, 9.0, 12.0, 16.0, 13.0, 14.0, 22.0, 26.0, 39.0, 36.0, 36.0, 37.0, 42.0, 52.0, 49.0, 52.0, 36.0, 48.0, 36.0, 49.0, 30.0, 42.0, 39.0, 32.0, 24.0, 28.0, 19.0, 28.0, 20.0, 20.0, 11.0, 17.0, 9.0, 9.0, 12.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.23016357421875, -4.0931396484375, -3.95611572265625, -3.819091796875, -3.68206787109375, -3.5450439453125, -3.40802001953125, -3.27099609375, -3.13397216796875, -2.9969482421875, -2.85992431640625, -2.722900390625, -2.58587646484375, -2.4488525390625, -2.31182861328125, -2.1748046875, -2.03778076171875, -1.9007568359375, -1.76373291015625, -1.626708984375, -1.48968505859375, -1.3526611328125, -1.21563720703125, -1.07861328125, -0.94158935546875, -0.8045654296875, -0.66754150390625, -0.530517578125, -0.39349365234375, -0.2564697265625, -0.11944580078125, 0.017578125, 0.15460205078125, 0.2916259765625, 0.42864990234375, 0.565673828125, 0.70269775390625, 0.8397216796875, 0.97674560546875, 1.11376953125, 1.25079345703125, 1.3878173828125, 1.52484130859375, 1.661865234375, 1.79888916015625, 1.9359130859375, 2.07293701171875, 2.2099609375, 2.34698486328125, 2.4840087890625, 2.62103271484375, 2.758056640625, 2.89508056640625, 3.0321044921875, 3.16912841796875, 3.30615234375, 3.44317626953125, 3.5802001953125, 3.71722412109375, 3.854248046875, 3.99127197265625, 4.1282958984375, 4.26531982421875, 4.40234375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 11.0, 17.0, 24.0, 31.0, 51.0, 78.0, 107.0, 142.0, 195.0, 308.0, 468.0, 710.0, 1141.0, 1752.0, 2680.0, 4200.0, 6410.0, 10080.0, 16154.0, 26423.0, 46099.0, 85426.0, 192067.0, 340511.0, 143473.0, 69797.0, 38500.0, 23222.0, 14001.0, 8810.0, 5464.0, 3495.0, 2334.0, 1466.0, 953.0, 608.0, 424.0, 278.0, 187.0, 132.0, 109.0, 66.0, 47.0, 30.0, 19.0, 15.0, 15.0, 3.0, 3.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0], "bins": [-0.040130615234375, -0.03888988494873047, -0.03764915466308594, -0.036408424377441406, -0.035167694091796875, -0.033926963806152344, -0.03268623352050781, -0.03144550323486328, -0.03020477294921875, -0.02896404266357422, -0.027723312377929688, -0.026482582092285156, -0.025241851806640625, -0.024001121520996094, -0.022760391235351562, -0.02151966094970703, -0.0202789306640625, -0.01903820037841797, -0.017797470092773438, -0.016556739807128906, -0.015316009521484375, -0.014075279235839844, -0.012834548950195312, -0.011593818664550781, -0.01035308837890625, -0.009112358093261719, -0.007871627807617188, -0.006630897521972656, -0.005390167236328125, -0.004149436950683594, -0.0029087066650390625, -0.0016679763793945312, -0.00042724609375, 0.0008134841918945312, 0.0020542144775390625, 0.0032949447631835938, 0.004535675048828125, 0.005776405334472656, 0.0070171356201171875, 0.008257865905761719, 0.00949859619140625, 0.010739326477050781, 0.011980056762695312, 0.013220787048339844, 0.014461517333984375, 0.015702247619628906, 0.016942977905273438, 0.01818370819091797, 0.0194244384765625, 0.02066516876220703, 0.021905899047851562, 0.023146629333496094, 0.024387359619140625, 0.025628089904785156, 0.026868820190429688, 0.02810955047607422, 0.02935028076171875, 0.03059101104736328, 0.03183174133300781, 0.033072471618652344, 0.034313201904296875, 0.035553932189941406, 0.03679466247558594, 0.03803539276123047, 0.039276123046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 4.0, 14.0, 8.0, 12.0, 13.0, 19.0, 19.0, 20.0, 23.0, 25.0, 36.0, 35.0, 27.0, 26.0, 35.0, 38.0, 34.0, 44.0, 1069.0, 35.0, 52.0, 47.0, 38.0, 49.0, 39.0, 28.0, 30.0, 36.0, 32.0, 17.0, 11.0, 19.0, 11.0, 15.0, 7.0, 16.0, 5.0, 4.0, 6.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.6171875, -2.5367431640625, -2.456298828125, -2.3758544921875, -2.29541015625, -2.2149658203125, -2.134521484375, -2.0540771484375, -1.9736328125, -1.8931884765625, -1.812744140625, -1.7322998046875, -1.65185546875, -1.5714111328125, -1.490966796875, -1.4105224609375, -1.330078125, -1.2496337890625, -1.169189453125, -1.0887451171875, -1.00830078125, -0.9278564453125, -0.847412109375, -0.7669677734375, -0.6865234375, -0.6060791015625, -0.525634765625, -0.4451904296875, -0.36474609375, -0.2843017578125, -0.203857421875, -0.1234130859375, -0.04296875, 0.0374755859375, 0.117919921875, 0.1983642578125, 0.27880859375, 0.3592529296875, 0.439697265625, 0.5201416015625, 0.6005859375, 0.6810302734375, 0.761474609375, 0.8419189453125, 0.92236328125, 1.0028076171875, 1.083251953125, 1.1636962890625, 1.244140625, 1.3245849609375, 1.405029296875, 1.4854736328125, 1.56591796875, 1.6463623046875, 1.726806640625, 1.8072509765625, 1.8876953125, 1.9681396484375, 2.048583984375, 2.1290283203125, 2.20947265625, 2.2899169921875, 2.370361328125, 2.4508056640625, 2.53125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 6.0, 8.0, 5.0, 17.0, 26.0, 26.0, 50.0, 67.0, 109.0, 165.0, 255.0, 354.0, 522.0, 764.0, 1011.0, 1431.0, 2012.0, 2819.0, 3915.0, 5399.0, 7694.0, 11306.0, 16184.0, 24184.0, 36631.0, 57649.0, 99260.0, 207892.0, 1301118.0, 119986.0, 66708.0, 42221.0, 27071.0, 18267.0, 12468.0, 8621.0, 6019.0, 4213.0, 3088.0, 2182.0, 1612.0, 1136.0, 820.0, 584.0, 395.0, 293.0, 195.0, 110.0, 106.0, 58.0, 41.0, 29.0, 15.0, 8.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0182647705078125, -0.017678260803222656, -0.017091751098632812, -0.01650524139404297, -0.015918731689453125, -0.015332221984863281, -0.014745712280273438, -0.014159202575683594, -0.01357269287109375, -0.012986183166503906, -0.012399673461914062, -0.011813163757324219, -0.011226654052734375, -0.010640144348144531, -0.010053634643554688, -0.009467124938964844, -0.008880615234375, -0.008294105529785156, -0.0077075958251953125, -0.007121086120605469, -0.006534576416015625, -0.005948066711425781, -0.0053615570068359375, -0.004775047302246094, -0.00418853759765625, -0.0036020278930664062, -0.0030155181884765625, -0.0024290084838867188, -0.001842498779296875, -0.0012559890747070312, -0.0006694793701171875, -8.296966552734375e-05, 0.0005035400390625, 0.0010900497436523438, 0.0016765594482421875, 0.0022630691528320312, 0.002849578857421875, 0.0034360885620117188, 0.0040225982666015625, 0.004609107971191406, 0.00519561767578125, 0.005782127380371094, 0.0063686370849609375, 0.006955146789550781, 0.007541656494140625, 0.008128166198730469, 0.008714675903320312, 0.009301185607910156, 0.0098876953125, 0.010474205017089844, 0.011060714721679688, 0.011647224426269531, 0.012233734130859375, 0.012820243835449219, 0.013406753540039062, 0.013993263244628906, 0.01457977294921875, 0.015166282653808594, 0.015752792358398438, 0.01633930206298828, 0.016925811767578125, 0.01751232147216797, 0.018098831176757812, 0.018685340881347656, 0.0192718505859375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 96.0, 0.0, 0.0, 195.0, 0.0, 0.0, 0.0, 317.0, 0.0, 0.0, 0.0, 193.0, 0.0, 0.0, 91.0, 0.0, 0.0, 0.0, 44.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.600733518600464e-07, -4.4330954551696777e-07, -4.2654573917388916e-07, -4.0978193283081055e-07, -3.9301812648773193e-07, -3.762543201446533e-07, -3.594905138015747e-07, -3.427267074584961e-07, -3.259629011154175e-07, -3.0919909477233887e-07, -2.9243528842926025e-07, -2.7567148208618164e-07, -2.5890767574310303e-07, -2.421438694000244e-07, -2.253800630569458e-07, -2.086162567138672e-07, -1.9185245037078857e-07, -1.7508864402770996e-07, -1.5832483768463135e-07, -1.4156103134155273e-07, -1.2479722499847412e-07, -1.0803341865539551e-07, -9.12696123123169e-08, -7.450580596923828e-08, -5.774199962615967e-08, -4.0978193283081055e-08, -2.421438694000244e-08, -7.450580596923828e-09, 9.313225746154785e-09, 2.60770320892334e-08, 4.284083843231201e-08, 5.960464477539063e-08, 7.636845111846924e-08, 9.313225746154785e-08, 1.0989606380462646e-07, 1.2665987014770508e-07, 1.434236764907837e-07, 1.601874828338623e-07, 1.7695128917694092e-07, 1.9371509552001953e-07, 2.1047890186309814e-07, 2.2724270820617676e-07, 2.4400651454925537e-07, 2.60770320892334e-07, 2.775341272354126e-07, 2.942979335784912e-07, 3.110617399215698e-07, 3.2782554626464844e-07, 3.4458935260772705e-07, 3.6135315895080566e-07, 3.781169652938843e-07, 3.948807716369629e-07, 4.116445779800415e-07, 4.284083843231201e-07, 4.4517219066619873e-07, 4.6193599700927734e-07, 4.78699803352356e-07, 4.954636096954346e-07, 5.122274160385132e-07, 5.289912223815918e-07, 5.457550287246704e-07, 5.62518835067749e-07, 5.792826414108276e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 3.0, 10.0, 23.0, 21.0, 12.0, 26.0, 83.0, 43.0, 76.0, 185.0, 353.0, 644.0, 56333.0, 987140.0, 2437.0, 510.0, 220.0, 150.0, 50.0, 51.0, 71.0, 14.0, 20.0, 17.0, 11.0, 7.0, 13.0, 7.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.2755393981933594e-05, -1.2394040822982788e-05, -1.2032687664031982e-05, -1.1671334505081177e-05, -1.1309981346130371e-05, -1.0948628187179565e-05, -1.058727502822876e-05, -1.0225921869277954e-05, -9.864568710327148e-06, -9.503215551376343e-06, -9.141862392425537e-06, -8.780509233474731e-06, -8.419156074523926e-06, -8.05780291557312e-06, -7.696449756622314e-06, -7.335096597671509e-06, -6.973743438720703e-06, -6.6123902797698975e-06, -6.251037120819092e-06, -5.889683961868286e-06, -5.5283308029174805e-06, -5.166977643966675e-06, -4.805624485015869e-06, -4.4442713260650635e-06, -4.082918167114258e-06, -3.721565008163452e-06, -3.3602118492126465e-06, -2.998858690261841e-06, -2.637505531311035e-06, -2.2761523723602295e-06, -1.914799213409424e-06, -1.5534460544586182e-06, -1.1920928955078125e-06, -8.307397365570068e-07, -4.6938657760620117e-07, -1.0803341865539551e-07, 2.5331974029541016e-07, 6.146728992462158e-07, 9.760260581970215e-07, 1.3373792171478271e-06, 1.6987323760986328e-06, 2.0600855350494385e-06, 2.421438694000244e-06, 2.78279185295105e-06, 3.1441450119018555e-06, 3.505498170852661e-06, 3.866851329803467e-06, 4.2282044887542725e-06, 4.589557647705078e-06, 4.950910806655884e-06, 5.3122639656066895e-06, 5.673617124557495e-06, 6.034970283508301e-06, 6.3963234424591064e-06, 6.757676601409912e-06, 7.119029760360718e-06, 7.4803829193115234e-06, 7.841736078262329e-06, 8.203089237213135e-06, 8.56444239616394e-06, 8.925795555114746e-06, 9.287148714065552e-06, 9.648501873016357e-06, 1.0009855031967163e-05, 1.0371208190917969e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 13.0, 33.0, 70.0, 131.0, 513.0, 110.0, 69.0, 42.0, 12.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.924813871795777e-07, -7.729202593509399e-07, -7.533591883657209e-07, -7.337980605370831e-07, -7.142369895518641e-07, -6.946758617232263e-07, -6.751147907380073e-07, -6.555536629093695e-07, -6.359925919241505e-07, -6.164314640955126e-07, -5.968703931102937e-07, -5.773092652816558e-07, -5.577481942964368e-07, -5.38187066467799e-07, -5.1862599548258e-07, -4.990648676539422e-07, -4.795037398253044e-07, -4.5994264041837596e-07, -4.4038154101144755e-07, -4.2082044160451915e-07, -4.0125934219759074e-07, -3.816982143689529e-07, -3.621371149620245e-07, -3.425760155550961e-07, -3.230149161481677e-07, -3.034538167412393e-07, -2.8389271733431087e-07, -2.6433161792738247e-07, -2.4477049009874463e-07, -2.2520940490267094e-07, -2.0564829128488782e-07, -1.860871918779594e-07, -1.6652614931444987e-07, -1.4696504990752146e-07, -1.2740395050059306e-07, -1.0784283688280993e-07, -8.828173747588153e-08, -6.872063806895312e-08, -4.915953155659736e-08, -2.9598425044241594e-08, -1.0037325637313188e-08, 9.523777322328897e-09, 2.9084880281970982e-08, 4.8645983241613067e-08, 6.820708620125515e-08, 8.776818560818356e-08, 1.0732929212053932e-07, 1.2689039863289509e-07, 1.464514980398235e-07, 1.660125974467519e-07, 1.855736968536803e-07, 2.0513481047146342e-07, 2.2469590987839183e-07, 2.4425702349617495e-07, 2.6381812290310336e-07, 2.8337922231003176e-07, 3.0294032171696017e-07, 3.225014211238886e-07, 3.42062520530817e-07, 3.616236199377454e-07, 3.811847477663832e-07, 4.007458187516022e-07, 4.2030694658024004e-07, 4.3986804598716844e-07, 4.5942914539409685e-07]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 209.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 474.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 221.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 13.0, 9.0, 12.0, 16.0, 13.0, 14.0, 22.0, 26.0, 39.0, 36.0, 36.0, 37.0, 42.0, 52.0, 49.0, 52.0, 36.0, 48.0, 36.0, 49.0, 30.0, 42.0, 39.0, 32.0, 24.0, 28.0, 19.0, 28.0, 20.0, 20.0, 11.0, 17.0, 9.0, 9.0, 12.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.23016357421875, -4.0931396484375, -3.95611572265625, -3.819091796875, -3.68206787109375, -3.5450439453125, -3.40802001953125, -3.27099609375, -3.13397216796875, -2.9969482421875, -2.85992431640625, -2.722900390625, -2.58587646484375, -2.4488525390625, -2.31182861328125, -2.1748046875, -2.03778076171875, -1.9007568359375, -1.76373291015625, -1.626708984375, -1.48968505859375, -1.3526611328125, -1.21563720703125, -1.07861328125, -0.94158935546875, -0.8045654296875, -0.66754150390625, -0.530517578125, -0.39349365234375, -0.2564697265625, -0.11944580078125, 0.017578125, 0.15460205078125, 0.2916259765625, 0.42864990234375, 0.565673828125, 0.70269775390625, 0.8397216796875, 0.97674560546875, 1.11376953125, 1.25079345703125, 1.3878173828125, 1.52484130859375, 1.661865234375, 1.79888916015625, 1.9359130859375, 2.07293701171875, 2.2099609375, 2.34698486328125, 2.4840087890625, 2.62103271484375, 2.758056640625, 2.89508056640625, 3.0321044921875, 3.16912841796875, 3.30615234375, 3.44317626953125, 3.5802001953125, 3.71722412109375, 3.854248046875, 3.99127197265625, 4.1282958984375, 4.26531982421875, 4.40234375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 9.0, 12.0, 14.0, 23.0, 40.0, 62.0, 58.0, 97.0, 127.0, 190.0, 255.0, 397.0, 558.0, 862.0, 1285.0, 2188.0, 3837.0, 6871.0, 13214.0, 25638.0, 52307.0, 115167.0, 265342.0, 298567.0, 136533.0, 61237.0, 29489.0, 15169.0, 7842.0, 4418.0, 2408.0, 1468.0, 903.0, 575.0, 370.0, 271.0, 189.0, 163.0, 118.0, 74.0, 63.0, 34.0, 32.0, 22.0, 14.0, 6.0, 10.0, 2.0, 0.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0], "bins": [-4.9375, -4.78369140625, -4.6298828125, -4.47607421875, -4.322265625, -4.16845703125, -4.0146484375, -3.86083984375, -3.70703125, -3.55322265625, -3.3994140625, -3.24560546875, -3.091796875, -2.93798828125, -2.7841796875, -2.63037109375, -2.4765625, -2.32275390625, -2.1689453125, -2.01513671875, -1.861328125, -1.70751953125, -1.5537109375, -1.39990234375, -1.24609375, -1.09228515625, -0.9384765625, -0.78466796875, -0.630859375, -0.47705078125, -0.3232421875, -0.16943359375, -0.015625, 0.13818359375, 0.2919921875, 0.44580078125, 0.599609375, 0.75341796875, 0.9072265625, 1.06103515625, 1.21484375, 1.36865234375, 1.5224609375, 1.67626953125, 1.830078125, 1.98388671875, 2.1376953125, 2.29150390625, 2.4453125, 2.59912109375, 2.7529296875, 2.90673828125, 3.060546875, 3.21435546875, 3.3681640625, 3.52197265625, 3.67578125, 3.82958984375, 3.9833984375, 4.13720703125, 4.291015625, 4.44482421875, 4.5986328125, 4.75244140625, 4.90625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 12.0, 11.0, 13.0, 20.0, 19.0, 24.0, 30.0, 30.0, 48.0, 39.0, 61.0, 89.0, 129.0, 203.0, 1515.0, 266.0, 127.0, 87.0, 61.0, 51.0, 42.0, 33.0, 29.0, 29.0, 12.0, 17.0, 18.0, 11.0, 5.0, 3.0, 3.0, 4.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8046875, -12.4229736328125, -12.041259765625, -11.6595458984375, -11.27783203125, -10.8961181640625, -10.514404296875, -10.1326904296875, -9.7509765625, -9.3692626953125, -8.987548828125, -8.6058349609375, -8.22412109375, -7.8424072265625, -7.460693359375, -7.0789794921875, -6.697265625, -6.3155517578125, -5.933837890625, -5.5521240234375, -5.17041015625, -4.7886962890625, -4.406982421875, -4.0252685546875, -3.6435546875, -3.2618408203125, -2.880126953125, -2.4984130859375, -2.11669921875, -1.7349853515625, -1.353271484375, -0.9715576171875, -0.58984375, -0.2081298828125, 0.173583984375, 0.5552978515625, 0.93701171875, 1.3187255859375, 1.700439453125, 2.0821533203125, 2.4638671875, 2.8455810546875, 3.227294921875, 3.6090087890625, 3.99072265625, 4.3724365234375, 4.754150390625, 5.1358642578125, 5.517578125, 5.8992919921875, 6.281005859375, 6.6627197265625, 7.04443359375, 7.4261474609375, 7.807861328125, 8.1895751953125, 8.5712890625, 8.9530029296875, 9.334716796875, 9.7164306640625, 10.09814453125, 10.4798583984375, 10.861572265625, 11.2432861328125, 11.625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 9.0, 12.0, 18.0, 17.0, 23.0, 41.0, 53.0, 96.0, 162.0, 278.0, 566.0, 1486.0, 55374.0, 3071892.0, 13446.0, 1090.0, 461.0, 241.0, 144.0, 72.0, 46.0, 37.0, 27.0, 25.0, 21.0, 7.0, 7.0, 2.0, 6.0, 6.0, 2.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.1875, -37.10791015625, -36.0283203125, -34.94873046875, -33.869140625, -32.78955078125, -31.7099609375, -30.63037109375, -29.55078125, -28.47119140625, -27.3916015625, -26.31201171875, -25.232421875, -24.15283203125, -23.0732421875, -21.99365234375, -20.9140625, -19.83447265625, -18.7548828125, -17.67529296875, -16.595703125, -15.51611328125, -14.4365234375, -13.35693359375, -12.27734375, -11.19775390625, -10.1181640625, -9.03857421875, -7.958984375, -6.87939453125, -5.7998046875, -4.72021484375, -3.640625, -2.56103515625, -1.4814453125, -0.40185546875, 0.677734375, 1.75732421875, 2.8369140625, 3.91650390625, 4.99609375, 6.07568359375, 7.1552734375, 8.23486328125, 9.314453125, 10.39404296875, 11.4736328125, 12.55322265625, 13.6328125, 14.71240234375, 15.7919921875, 16.87158203125, 17.951171875, 19.03076171875, 20.1103515625, 21.18994140625, 22.26953125, 23.34912109375, 24.4287109375, 25.50830078125, 26.587890625, 27.66748046875, 28.7470703125, 29.82666015625, 30.90625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 34.0, 487.0, 480.0, 14.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.8851318359375, -138.35284423828125, -132.820556640625, -127.28828430175781, -121.75599670410156, -116.22370910644531, -110.6914291381836, -105.15914916992188, -99.62686157226562, -94.09457397460938, -88.56229400634766, -83.03001403808594, -77.49772644042969, -71.96543884277344, -66.43315887451172, -60.900875091552734, -55.36859130859375, -49.836307525634766, -44.30402374267578, -38.7717399597168, -33.23945617675781, -27.707172393798828, -22.174888610839844, -16.64260482788086, -11.110321044921875, -5.578037261962891, -0.04575347900390625, 5.486530303955078, 11.018814086914062, 16.551097869873047, 22.08338165283203, 27.615665435791016, 33.14796447753906, 38.68024826049805, 44.21253204345703, 49.744815826416016, 55.277099609375, 60.809383392333984, 66.34166717529297, 71.87394714355469, 77.40623474121094, 82.93852233886719, 88.4708023071289, 94.00308227539062, 99.53536987304688, 105.06765747070312, 110.59993743896484, 116.13221740722656, 121.66450500488281, 127.19679260253906, 132.72906494140625, 138.2613525390625, 143.79364013671875, 149.325927734375, 154.85821533203125, 160.39048767089844, 165.9227752685547, 171.45506286621094, 176.98733520507812, 182.51962280273438, 188.05191040039062, 193.58419799804688, 199.11648559570312, 204.6487579345703, 210.18104553222656]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 5.0, 3.0, 7.0, 12.0, 10.0, 15.0, 20.0, 24.0, 24.0, 16.0, 20.0, 25.0, 26.0, 21.0, 37.0, 27.0, 43.0, 40.0, 42.0, 39.0, 34.0, 44.0, 42.0, 62.0, 39.0, 41.0, 35.0, 25.0, 27.0, 27.0, 13.0, 23.0, 13.0, 24.0, 12.0, 16.0, 11.0, 10.0, 7.0, 8.0, 4.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-32.734901428222656, -31.840923309326172, -30.946943283081055, -30.05296516418457, -29.158985137939453, -28.26500701904297, -27.371028900146484, -26.47705078125, -25.583070755004883, -24.6890926361084, -23.79511260986328, -22.901134490966797, -22.007156372070312, -21.113176345825195, -20.21919822692871, -19.325218200683594, -18.43124008178711, -17.537261962890625, -16.643281936645508, -15.749303817749023, -14.855324745178223, -13.961345672607422, -13.067367553710938, -12.173388481140137, -11.279409408569336, -10.385430335998535, -9.491451263427734, -8.59747314453125, -7.703494071960449, -6.809514999389648, -5.915536403656006, -5.021557807922363, -4.1275787353515625, -3.233599901199341, -2.339621067047119, -1.4456422328948975, -0.5516633987426758, 0.342315673828125, 1.2362942695617676, 2.13027286529541, 3.024251937866211, 3.9182307720184326, 4.812209606170654, 5.706188201904297, 6.600167274475098, 7.494146347045898, 8.388124465942383, 9.282103538513184, 10.176082611083984, 11.070061683654785, 11.964040756225586, 12.85801887512207, 13.751997947692871, 14.645977020263672, 15.539955139160156, 16.43393325805664, 17.327913284301758, 18.221891403198242, 19.11587142944336, 20.009849548339844, 20.903827667236328, 21.797807693481445, 22.69178581237793, 23.585765838623047, 24.47974395751953]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 10.0, 13.0, 9.0, 10.0, 16.0, 15.0, 15.0, 28.0, 26.0, 29.0, 44.0, 34.0, 38.0, 31.0, 53.0, 40.0, 44.0, 36.0, 42.0, 45.0, 60.0, 41.0, 49.0, 37.0, 30.0, 28.0, 23.0, 21.0, 25.0, 16.0, 19.0, 13.0, 14.0, 10.0, 11.0, 12.0, 7.0, 5.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.383056640625, -4.24267578125, -4.102294921875, -3.9619140625, -3.821533203125, -3.68115234375, -3.540771484375, -3.400390625, -3.260009765625, -3.11962890625, -2.979248046875, -2.8388671875, -2.698486328125, -2.55810546875, -2.417724609375, -2.27734375, -2.136962890625, -1.99658203125, -1.856201171875, -1.7158203125, -1.575439453125, -1.43505859375, -1.294677734375, -1.154296875, -1.013916015625, -0.87353515625, -0.733154296875, -0.5927734375, -0.452392578125, -0.31201171875, -0.171630859375, -0.03125, 0.109130859375, 0.24951171875, 0.389892578125, 0.5302734375, 0.670654296875, 0.81103515625, 0.951416015625, 1.091796875, 1.232177734375, 1.37255859375, 1.512939453125, 1.6533203125, 1.793701171875, 1.93408203125, 2.074462890625, 2.21484375, 2.355224609375, 2.49560546875, 2.635986328125, 2.7763671875, 2.916748046875, 3.05712890625, 3.197509765625, 3.337890625, 3.478271484375, 3.61865234375, 3.759033203125, 3.8994140625, 4.039794921875, 4.18017578125, 4.320556640625, 4.4609375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 8.0, 17.0, 21.0, 40.0, 57.0, 81.0, 106.0, 181.0, 282.0, 441.0, 675.0, 1155.0, 1955.0, 3714.0, 7610.0, 18244.0, 59337.0, 284439.0, 1295845.0, 1885282.0, 492292.0, 95436.0, 25825.0, 10113.0, 4803.0, 2507.0, 1407.0, 852.0, 509.0, 368.0, 205.0, 140.0, 115.0, 61.0, 51.0, 41.0, 17.0, 12.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0], "bins": [-7.76953125, -7.56597900390625, -7.3624267578125, -7.15887451171875, -6.955322265625, -6.75177001953125, -6.5482177734375, -6.34466552734375, -6.14111328125, -5.93756103515625, -5.7340087890625, -5.53045654296875, -5.326904296875, -5.12335205078125, -4.9197998046875, -4.71624755859375, -4.5126953125, -4.30914306640625, -4.1055908203125, -3.90203857421875, -3.698486328125, -3.49493408203125, -3.2913818359375, -3.08782958984375, -2.88427734375, -2.68072509765625, -2.4771728515625, -2.27362060546875, -2.070068359375, -1.86651611328125, -1.6629638671875, -1.45941162109375, -1.255859375, -1.05230712890625, -0.8487548828125, -0.64520263671875, -0.441650390625, -0.23809814453125, -0.0345458984375, 0.16900634765625, 0.37255859375, 0.57611083984375, 0.7796630859375, 0.98321533203125, 1.186767578125, 1.39031982421875, 1.5938720703125, 1.79742431640625, 2.0009765625, 2.20452880859375, 2.4080810546875, 2.61163330078125, 2.815185546875, 3.01873779296875, 3.2222900390625, 3.42584228515625, 3.62939453125, 3.83294677734375, 4.0364990234375, 4.24005126953125, 4.443603515625, 4.64715576171875, 4.8507080078125, 5.05426025390625, 5.2578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 8.0, 15.0, 26.0, 37.0, 40.0, 58.0, 50.0, 66.0, 115.0, 156.0, 211.0, 281.0, 358.0, 465.0, 537.0, 410.0, 306.0, 210.0, 169.0, 121.0, 99.0, 89.0, 68.0, 44.0, 35.0, 25.0, 14.0, 14.0, 12.0, 5.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8515625, -6.6383056640625, -6.425048828125, -6.2117919921875, -5.99853515625, -5.7852783203125, -5.572021484375, -5.3587646484375, -5.1455078125, -4.9322509765625, -4.718994140625, -4.5057373046875, -4.29248046875, -4.0792236328125, -3.865966796875, -3.6527099609375, -3.439453125, -3.2261962890625, -3.012939453125, -2.7996826171875, -2.58642578125, -2.3731689453125, -2.159912109375, -1.9466552734375, -1.7333984375, -1.5201416015625, -1.306884765625, -1.0936279296875, -0.88037109375, -0.6671142578125, -0.453857421875, -0.2406005859375, -0.02734375, 0.1859130859375, 0.399169921875, 0.6124267578125, 0.82568359375, 1.0389404296875, 1.252197265625, 1.4654541015625, 1.6787109375, 1.8919677734375, 2.105224609375, 2.3184814453125, 2.53173828125, 2.7449951171875, 2.958251953125, 3.1715087890625, 3.384765625, 3.5980224609375, 3.811279296875, 4.0245361328125, 4.23779296875, 4.4510498046875, 4.664306640625, 4.8775634765625, 5.0908203125, 5.3040771484375, 5.517333984375, 5.7305908203125, 5.94384765625, 6.1571044921875, 6.370361328125, 6.5836181640625, 6.796875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 13.0, 8.0, 12.0, 22.0, 42.0, 67.0, 113.0, 215.0, 332.0, 611.0, 1126.0, 2640.0, 8409.0, 42362.0, 324340.0, 2749485.0, 934757.0, 105379.0, 16719.0, 4214.0, 1592.0, 790.0, 413.0, 232.0, 139.0, 88.0, 65.0, 35.0, 20.0, 9.0, 8.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4921875, -11.1514892578125, -10.810791015625, -10.4700927734375, -10.12939453125, -9.7886962890625, -9.447998046875, -9.1072998046875, -8.7666015625, -8.4259033203125, -8.085205078125, -7.7445068359375, -7.40380859375, -7.0631103515625, -6.722412109375, -6.3817138671875, -6.041015625, -5.7003173828125, -5.359619140625, -5.0189208984375, -4.67822265625, -4.3375244140625, -3.996826171875, -3.6561279296875, -3.3154296875, -2.9747314453125, -2.634033203125, -2.2933349609375, -1.95263671875, -1.6119384765625, -1.271240234375, -0.9305419921875, -0.58984375, -0.2491455078125, 0.091552734375, 0.4322509765625, 0.77294921875, 1.1136474609375, 1.454345703125, 1.7950439453125, 2.1357421875, 2.4764404296875, 2.817138671875, 3.1578369140625, 3.49853515625, 3.8392333984375, 4.179931640625, 4.5206298828125, 4.861328125, 5.2020263671875, 5.542724609375, 5.8834228515625, 6.22412109375, 6.5648193359375, 6.905517578125, 7.2462158203125, 7.5869140625, 7.9276123046875, 8.268310546875, 8.6090087890625, 8.94970703125, 9.2904052734375, 9.631103515625, 9.9718017578125, 10.3125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 414.0, 591.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-351.9768981933594, -340.64019775390625, -329.3034973144531, -317.966796875, -306.6300964355469, -295.29339599609375, -283.9566955566406, -272.6199951171875, -261.2832946777344, -249.94659423828125, -238.60989379882812, -227.273193359375, -215.93649291992188, -204.59979248046875, -193.26309204101562, -181.9263916015625, -170.58969116210938, -159.25299072265625, -147.91629028320312, -136.57958984375, -125.24288940429688, -113.90618896484375, -102.56948852539062, -91.2327880859375, -79.89608764648438, -68.55938720703125, -57.222686767578125, -45.885986328125, -34.549285888671875, -23.21258544921875, -11.875885009765625, -0.5391845703125, 10.79754638671875, 22.134246826171875, 33.470947265625, 44.807647705078125, 56.14434814453125, 67.48104858398438, 78.8177490234375, 90.15444946289062, 101.49114990234375, 112.82785034179688, 124.16455078125, 135.50125122070312, 146.83795166015625, 158.17465209960938, 169.5113525390625, 180.84805297851562, 192.18475341796875, 203.52145385742188, 214.858154296875, 226.19485473632812, 237.53155517578125, 248.86825561523438, 260.2049560546875, 271.5416564941406, 282.87835693359375, 294.2150573730469, 305.5517578125, 316.8884582519531, 328.22515869140625, 339.5618591308594, 350.8985595703125, 362.2352600097656, 373.57196044921875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 8.0, 10.0, 12.0, 15.0, 13.0, 8.0, 16.0, 20.0, 28.0, 27.0, 38.0, 34.0, 36.0, 38.0, 38.0, 38.0, 45.0, 42.0, 53.0, 38.0, 49.0, 40.0, 34.0, 34.0, 49.0, 31.0, 23.0, 36.0, 15.0, 20.0, 14.0, 12.0, 11.0, 15.0, 9.0, 10.0, 8.0, 5.0, 4.0, 8.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0], "bins": [-29.10305404663086, -28.261837005615234, -27.420618057250977, -26.57940101623535, -25.738183975219727, -24.89696502685547, -24.055747985839844, -23.21453094482422, -22.373313903808594, -21.53209686279297, -20.69087791442871, -19.849660873413086, -19.00844383239746, -18.167224884033203, -17.326007843017578, -16.484790802001953, -15.643572807312012, -14.80235481262207, -13.961137771606445, -13.119919776916504, -12.278702735900879, -11.437484741210938, -10.596267700195312, -9.755049705505371, -8.91383171081543, -8.072613716125488, -7.231396675109863, -6.390178680419922, -5.548961639404297, -4.7077436447143555, -3.8665261268615723, -3.025308609008789, -2.184091567993164, -1.3428740501403809, -0.5016564130783081, 0.33956122398376465, 1.1807787418365479, 2.02199649810791, 2.8632140159606934, 3.7044315338134766, 4.54564905166626, 5.386866569519043, 6.228084087371826, 7.069301605224609, 7.910519599914551, 8.751737594604492, 9.592954635620117, 10.434171676635742, 11.275389671325684, 12.116607666015625, 12.95782470703125, 13.799042701721191, 14.640259742736816, 15.481477737426758, 16.322694778442383, 17.16391372680664, 18.005130767822266, 18.84634780883789, 19.68756675720215, 20.528783798217773, 21.3700008392334, 22.211219787597656, 23.05243682861328, 23.893653869628906, 24.73487091064453]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 5.0, 1.0, 8.0, 12.0, 14.0, 20.0, 16.0, 19.0, 33.0, 23.0, 19.0, 30.0, 37.0, 35.0, 48.0, 48.0, 46.0, 48.0, 36.0, 51.0, 36.0, 48.0, 36.0, 37.0, 36.0, 31.0, 31.0, 23.0, 23.0, 25.0, 13.0, 12.0, 24.0, 16.0, 7.0, 10.0, 13.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.32421875, -3.20916748046875, -3.0941162109375, -2.97906494140625, -2.864013671875, -2.74896240234375, -2.6339111328125, -2.51885986328125, -2.40380859375, -2.28875732421875, -2.1737060546875, -2.05865478515625, -1.943603515625, -1.82855224609375, -1.7135009765625, -1.59844970703125, -1.4833984375, -1.36834716796875, -1.2532958984375, -1.13824462890625, -1.023193359375, -0.90814208984375, -0.7930908203125, -0.67803955078125, -0.56298828125, -0.44793701171875, -0.3328857421875, -0.21783447265625, -0.102783203125, 0.01226806640625, 0.1273193359375, 0.24237060546875, 0.357421875, 0.47247314453125, 0.5875244140625, 0.70257568359375, 0.817626953125, 0.93267822265625, 1.0477294921875, 1.16278076171875, 1.27783203125, 1.39288330078125, 1.5079345703125, 1.62298583984375, 1.738037109375, 1.85308837890625, 1.9681396484375, 2.08319091796875, 2.1982421875, 2.31329345703125, 2.4283447265625, 2.54339599609375, 2.658447265625, 2.77349853515625, 2.8885498046875, 3.00360107421875, 3.11865234375, 3.23370361328125, 3.3487548828125, 3.46380615234375, 3.578857421875, 3.69390869140625, 3.8089599609375, 3.92401123046875, 4.0390625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 11.0, 10.0, 18.0, 34.0, 39.0, 73.0, 105.0, 125.0, 220.0, 334.0, 481.0, 754.0, 1142.0, 1723.0, 2795.0, 4327.0, 6881.0, 11192.0, 18016.0, 30833.0, 53462.0, 100998.0, 247624.0, 303517.0, 116597.0, 59837.0, 34309.0, 20116.0, 12253.0, 7431.0, 4764.0, 2975.0, 1909.0, 1222.0, 840.0, 531.0, 357.0, 228.0, 169.0, 93.0, 70.0, 45.0, 33.0, 23.0, 11.0, 6.0, 12.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035186767578125, -0.034090518951416016, -0.03299427032470703, -0.03189802169799805, -0.030801773071289062, -0.029705524444580078, -0.028609275817871094, -0.02751302719116211, -0.026416778564453125, -0.02532052993774414, -0.024224281311035156, -0.023128032684326172, -0.022031784057617188, -0.020935535430908203, -0.01983928680419922, -0.018743038177490234, -0.01764678955078125, -0.016550540924072266, -0.015454292297363281, -0.014358043670654297, -0.013261795043945312, -0.012165546417236328, -0.011069297790527344, -0.00997304916381836, -0.008876800537109375, -0.007780551910400391, -0.006684303283691406, -0.005588054656982422, -0.0044918060302734375, -0.003395557403564453, -0.0022993087768554688, -0.0012030601501464844, -0.0001068115234375, 0.0009894371032714844, 0.0020856857299804688, 0.003181934356689453, 0.0042781829833984375, 0.005374431610107422, 0.006470680236816406, 0.007566928863525391, 0.008663177490234375, 0.00975942611694336, 0.010855674743652344, 0.011951923370361328, 0.013048171997070312, 0.014144420623779297, 0.015240669250488281, 0.016336917877197266, 0.01743316650390625, 0.018529415130615234, 0.01962566375732422, 0.020721912384033203, 0.021818161010742188, 0.022914409637451172, 0.024010658264160156, 0.02510690689086914, 0.026203155517578125, 0.02729940414428711, 0.028395652770996094, 0.029491901397705078, 0.030588150024414062, 0.03168439865112305, 0.03278064727783203, 0.033876895904541016, 0.03497314453125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 12.0, 7.0, 12.0, 22.0, 14.0, 14.0, 17.0, 23.0, 28.0, 24.0, 31.0, 34.0, 30.0, 28.0, 28.0, 33.0, 34.0, 30.0, 1075.0, 40.0, 32.0, 41.0, 31.0, 29.0, 34.0, 27.0, 39.0, 33.0, 20.0, 29.0, 16.0, 26.0, 19.0, 10.0, 11.0, 12.0, 16.0, 7.0, 10.0, 5.0, 4.0, 7.0, 1.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.193359375, -2.124267578125, -2.05517578125, -1.986083984375, -1.9169921875, -1.847900390625, -1.77880859375, -1.709716796875, -1.640625, -1.571533203125, -1.50244140625, -1.433349609375, -1.3642578125, -1.295166015625, -1.22607421875, -1.156982421875, -1.087890625, -1.018798828125, -0.94970703125, -0.880615234375, -0.8115234375, -0.742431640625, -0.67333984375, -0.604248046875, -0.53515625, -0.466064453125, -0.39697265625, -0.327880859375, -0.2587890625, -0.189697265625, -0.12060546875, -0.051513671875, 0.017578125, 0.086669921875, 0.15576171875, 0.224853515625, 0.2939453125, 0.363037109375, 0.43212890625, 0.501220703125, 0.5703125, 0.639404296875, 0.70849609375, 0.777587890625, 0.8466796875, 0.915771484375, 0.98486328125, 1.053955078125, 1.123046875, 1.192138671875, 1.26123046875, 1.330322265625, 1.3994140625, 1.468505859375, 1.53759765625, 1.606689453125, 1.67578125, 1.744873046875, 1.81396484375, 1.883056640625, 1.9521484375, 2.021240234375, 2.09033203125, 2.159423828125, 2.228515625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 3.0, 16.0, 27.0, 39.0, 50.0, 70.0, 117.0, 158.0, 243.0, 281.0, 378.0, 520.0, 675.0, 922.0, 1211.0, 1623.0, 2232.0, 3002.0, 4072.0, 5503.0, 7434.0, 10302.0, 14585.0, 20499.0, 29210.0, 43093.0, 65108.0, 107638.0, 1265666.0, 205241.0, 102166.0, 62509.0, 41325.0, 28537.0, 20102.0, 14065.0, 10171.0, 7288.0, 5414.0, 4113.0, 2916.0, 2225.0, 1606.0, 1252.0, 906.0, 702.0, 544.0, 392.0, 289.0, 216.0, 163.0, 109.0, 86.0, 59.0, 20.0, 22.0, 12.0, 8.0, 4.0, 1.0, 2.0], "bins": [-0.0159149169921875, -0.015416860580444336, -0.014918804168701172, -0.014420747756958008, -0.013922691345214844, -0.01342463493347168, -0.012926578521728516, -0.012428522109985352, -0.011930465698242188, -0.011432409286499023, -0.01093435287475586, -0.010436296463012695, -0.009938240051269531, -0.009440183639526367, -0.008942127227783203, -0.008444070816040039, -0.007946014404296875, -0.007447957992553711, -0.006949901580810547, -0.006451845169067383, -0.005953788757324219, -0.005455732345581055, -0.004957675933837891, -0.0044596195220947266, -0.0039615631103515625, -0.0034635066986083984, -0.0029654502868652344, -0.0024673938751220703, -0.0019693374633789062, -0.0014712810516357422, -0.0009732246398925781, -0.00047516822814941406, 2.288818359375e-05, 0.0005209445953369141, 0.0010190010070800781, 0.0015170574188232422, 0.0020151138305664062, 0.0025131702423095703, 0.0030112266540527344, 0.0035092830657958984, 0.0040073394775390625, 0.0045053958892822266, 0.005003452301025391, 0.005501508712768555, 0.005999565124511719, 0.006497621536254883, 0.006995677947998047, 0.007493734359741211, 0.007991790771484375, 0.008489847183227539, 0.008987903594970703, 0.009485960006713867, 0.009984016418457031, 0.010482072830200195, 0.01098012924194336, 0.011478185653686523, 0.011976242065429688, 0.012474298477172852, 0.012972354888916016, 0.01347041130065918, 0.013968467712402344, 0.014466524124145508, 0.014964580535888672, 0.015462636947631836, 0.015960693359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 86.0, 0.0, 0.0, 0.0, 223.0, 0.0, 0.0, 0.0, 333.0, 0.0, 0.0, 187.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.6100467443466187e-07, -4.4517219066619873e-07, -4.293397068977356e-07, -4.1350722312927246e-07, -3.976747393608093e-07, -3.818422555923462e-07, -3.6600977182388306e-07, -3.501772880554199e-07, -3.343448042869568e-07, -3.1851232051849365e-07, -3.026798367500305e-07, -2.868473529815674e-07, -2.7101486921310425e-07, -2.551823854446411e-07, -2.39349901676178e-07, -2.2351741790771484e-07, -2.076849341392517e-07, -1.9185245037078857e-07, -1.7601996660232544e-07, -1.601874828338623e-07, -1.4435499906539917e-07, -1.2852251529693604e-07, -1.126900315284729e-07, -9.685754776000977e-08, -8.102506399154663e-08, -6.51925802230835e-08, -4.936009645462036e-08, -3.3527612686157227e-08, -1.7695128917694092e-08, -1.862645149230957e-09, 1.3969838619232178e-08, 2.9802322387695312e-08, 4.563480615615845e-08, 6.146728992462158e-08, 7.729977369308472e-08, 9.313225746154785e-08, 1.0896474123001099e-07, 1.2479722499847412e-07, 1.4062970876693726e-07, 1.564621925354004e-07, 1.7229467630386353e-07, 1.8812716007232666e-07, 2.039596438407898e-07, 2.1979212760925293e-07, 2.3562461137771606e-07, 2.514570951461792e-07, 2.6728957891464233e-07, 2.8312206268310547e-07, 2.989545464515686e-07, 3.1478703022003174e-07, 3.3061951398849487e-07, 3.46451997756958e-07, 3.6228448152542114e-07, 3.781169652938843e-07, 3.939494490623474e-07, 4.0978193283081055e-07, 4.256144165992737e-07, 4.414469003677368e-07, 4.5727938413619995e-07, 4.731118679046631e-07, 4.889443516731262e-07, 5.047768354415894e-07, 5.206093192100525e-07, 5.364418029785156e-07]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 5.0, 6.0, 4.0, 0.0, 10.0, 27.0, 4.0, 25.0, 67.0, 41.0, 65.0, 92.0, 232.0, 342.0, 1138.0, 830968.0, 213870.0, 584.0, 426.0, 269.0, 97.0, 62.0, 52.0, 64.0, 18.0, 4.0, 25.0, 16.0, 3.0, 7.0, 9.0, 3.0, 2.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-1.2278556823730469e-05, -1.1936761438846588e-05, -1.1594966053962708e-05, -1.1253170669078827e-05, -1.0911375284194946e-05, -1.0569579899311066e-05, -1.0227784514427185e-05, -9.885989129543304e-06, -9.544193744659424e-06, -9.202398359775543e-06, -8.860602974891663e-06, -8.518807590007782e-06, -8.177012205123901e-06, -7.83521682024002e-06, -7.49342143535614e-06, -7.1516260504722595e-06, -6.809830665588379e-06, -6.468035280704498e-06, -6.126239895820618e-06, -5.784444510936737e-06, -5.4426491260528564e-06, -5.100853741168976e-06, -4.759058356285095e-06, -4.417262971401215e-06, -4.075467586517334e-06, -3.7336722016334534e-06, -3.3918768167495728e-06, -3.050081431865692e-06, -2.7082860469818115e-06, -2.366490662097931e-06, -2.0246952772140503e-06, -1.6828998923301697e-06, -1.341104507446289e-06, -9.993091225624084e-07, -6.575137376785278e-07, -3.157183527946472e-07, 2.60770320892334e-08, 3.67872416973114e-07, 7.096678018569946e-07, 1.0514631867408752e-06, 1.3932585716247559e-06, 1.7350539565086365e-06, 2.076849341392517e-06, 2.4186447262763977e-06, 2.7604401111602783e-06, 3.102235496044159e-06, 3.4440308809280396e-06, 3.78582626581192e-06, 4.127621650695801e-06, 4.469417035579681e-06, 4.811212420463562e-06, 5.153007805347443e-06, 5.494803190231323e-06, 5.836598575115204e-06, 6.1783939599990845e-06, 6.520189344882965e-06, 6.861984729766846e-06, 7.203780114650726e-06, 7.545575499534607e-06, 7.887370884418488e-06, 8.229166269302368e-06, 8.570961654186249e-06, 8.91275703907013e-06, 9.25455242395401e-06, 9.59634780883789e-06]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 13.0, 10.0, 20.0, 23.0, 32.0, 39.0, 38.0, 49.0, 483.0, 58.0, 56.0, 46.0, 44.0, 25.0, 26.0, 15.0, 10.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.488965774067765e-07, -3.403834227810876e-07, -3.3187026815539866e-07, -3.233570851080003e-07, -3.148439304823114e-07, -3.063307758566225e-07, -2.978176212309336e-07, -2.8930446660524467e-07, -2.8079131197955576e-07, -2.7227815735386685e-07, -2.6376500272817793e-07, -2.552518196807796e-07, -2.467386650550907e-07, -2.3822551042940177e-07, -2.2971235580371285e-07, -2.2119920117802394e-07, -2.126860181306256e-07, -2.0417286350493669e-07, -1.9565969466839306e-07, -1.8714654004270415e-07, -1.7863337120616052e-07, -1.701202165804716e-07, -1.616070619547827e-07, -1.5309390732909378e-07, -1.4458073849255015e-07, -1.3606758386686124e-07, -1.2755441503031761e-07, -1.190412604046287e-07, -1.1052809867351243e-07, -1.0201493694239616e-07, -9.350178231670725e-08, -8.498862058559098e-08, -7.647543043276528e-08, -6.796226870164901e-08, -5.944911052324642e-08, -5.093595234484383e-08, -4.242279061372756e-08, -3.390962888261129e-08, -2.5396470704208696e-08, -1.6883312525806105e-08, -8.370150794689835e-09, 1.4300916006959596e-10, 8.656169114829027e-09, 1.7169329069588457e-08, 2.5682489024347888e-08, 3.419565075546416e-08, 4.270880893386675e-08, 5.122196711226934e-08, 5.973512884338561e-08, 6.824829057450188e-08, 7.676145230561815e-08, 8.527460693130706e-08, 9.378776866242333e-08, 1.023009303935396e-07, 1.1081408501922851e-07, 1.1932723964491743e-07, 1.2784040848146105e-07, 1.3635356310714997e-07, 1.448667319436936e-07, 1.533798865693825e-07, 1.6189304119507142e-07, 1.7040621003161505e-07, 1.7891936465730396e-07, 1.8743253349384759e-07, 1.959456881195365e-07]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 191.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 533.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 203.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 5.0, 1.0, 8.0, 12.0, 14.0, 20.0, 16.0, 19.0, 33.0, 23.0, 19.0, 30.0, 37.0, 35.0, 48.0, 48.0, 46.0, 48.0, 36.0, 51.0, 36.0, 48.0, 36.0, 37.0, 36.0, 31.0, 31.0, 23.0, 23.0, 25.0, 13.0, 12.0, 24.0, 16.0, 7.0, 10.0, 13.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.32421875, -3.20916748046875, -3.0941162109375, -2.97906494140625, -2.864013671875, -2.74896240234375, -2.6339111328125, -2.51885986328125, -2.40380859375, -2.28875732421875, -2.1737060546875, -2.05865478515625, -1.943603515625, -1.82855224609375, -1.7135009765625, -1.59844970703125, -1.4833984375, -1.36834716796875, -1.2532958984375, -1.13824462890625, -1.023193359375, -0.90814208984375, -0.7930908203125, -0.67803955078125, -0.56298828125, -0.44793701171875, -0.3328857421875, -0.21783447265625, -0.102783203125, 0.01226806640625, 0.1273193359375, 0.24237060546875, 0.357421875, 0.47247314453125, 0.5875244140625, 0.70257568359375, 0.817626953125, 0.93267822265625, 1.0477294921875, 1.16278076171875, 1.27783203125, 1.39288330078125, 1.5079345703125, 1.62298583984375, 1.738037109375, 1.85308837890625, 1.9681396484375, 2.08319091796875, 2.1982421875, 2.31329345703125, 2.4283447265625, 2.54339599609375, 2.658447265625, 2.77349853515625, 2.8885498046875, 3.00360107421875, 3.11865234375, 3.23370361328125, 3.3487548828125, 3.46380615234375, 3.578857421875, 3.69390869140625, 3.8089599609375, 3.92401123046875, 4.0390625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 7.0, 3.0, 7.0, 9.0, 16.0, 9.0, 25.0, 40.0, 39.0, 44.0, 94.0, 108.0, 155.0, 269.0, 372.0, 590.0, 915.0, 1585.0, 3280.0, 8553.0, 29166.0, 141133.0, 606590.0, 198429.0, 38004.0, 10577.0, 3771.0, 1853.0, 1038.0, 604.0, 399.0, 262.0, 191.0, 125.0, 77.0, 68.0, 38.0, 32.0, 23.0, 18.0, 13.0, 4.0, 7.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.8046875, -8.55731201171875, -8.3099365234375, -8.06256103515625, -7.815185546875, -7.56781005859375, -7.3204345703125, -7.07305908203125, -6.82568359375, -6.57830810546875, -6.3309326171875, -6.08355712890625, -5.836181640625, -5.58880615234375, -5.3414306640625, -5.09405517578125, -4.8466796875, -4.59930419921875, -4.3519287109375, -4.10455322265625, -3.857177734375, -3.60980224609375, -3.3624267578125, -3.11505126953125, -2.86767578125, -2.62030029296875, -2.3729248046875, -2.12554931640625, -1.878173828125, -1.63079833984375, -1.3834228515625, -1.13604736328125, -0.888671875, -0.64129638671875, -0.3939208984375, -0.14654541015625, 0.100830078125, 0.34820556640625, 0.5955810546875, 0.84295654296875, 1.09033203125, 1.33770751953125, 1.5850830078125, 1.83245849609375, 2.079833984375, 2.32720947265625, 2.5745849609375, 2.82196044921875, 3.0693359375, 3.31671142578125, 3.5640869140625, 3.81146240234375, 4.058837890625, 4.30621337890625, 4.5535888671875, 4.80096435546875, 5.04833984375, 5.29571533203125, 5.5430908203125, 5.79046630859375, 6.037841796875, 6.28521728515625, 6.5325927734375, 6.77996826171875, 7.02734375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 5.0, 5.0, 7.0, 10.0, 9.0, 13.0, 11.0, 17.0, 30.0, 20.0, 35.0, 29.0, 38.0, 43.0, 49.0, 82.0, 138.0, 273.0, 1522.0, 227.0, 104.0, 59.0, 55.0, 44.0, 31.0, 24.0, 36.0, 23.0, 17.0, 18.0, 14.0, 7.0, 13.0, 9.0, 7.0, 11.0, 4.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.765625, -10.4696044921875, -10.173583984375, -9.8775634765625, -9.58154296875, -9.2855224609375, -8.989501953125, -8.6934814453125, -8.3974609375, -8.1014404296875, -7.805419921875, -7.5093994140625, -7.21337890625, -6.9173583984375, -6.621337890625, -6.3253173828125, -6.029296875, -5.7332763671875, -5.437255859375, -5.1412353515625, -4.84521484375, -4.5491943359375, -4.253173828125, -3.9571533203125, -3.6611328125, -3.3651123046875, -3.069091796875, -2.7730712890625, -2.47705078125, -2.1810302734375, -1.885009765625, -1.5889892578125, -1.29296875, -0.9969482421875, -0.700927734375, -0.4049072265625, -0.10888671875, 0.1871337890625, 0.483154296875, 0.7791748046875, 1.0751953125, 1.3712158203125, 1.667236328125, 1.9632568359375, 2.25927734375, 2.5552978515625, 2.851318359375, 3.1473388671875, 3.443359375, 3.7393798828125, 4.035400390625, 4.3314208984375, 4.62744140625, 4.9234619140625, 5.219482421875, 5.5155029296875, 5.8115234375, 6.1075439453125, 6.403564453125, 6.6995849609375, 6.99560546875, 7.2916259765625, 7.587646484375, 7.8836669921875, 8.1796875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 17.0, 17.0, 19.0, 21.0, 26.0, 32.0, 50.0, 78.0, 137.0, 198.0, 305.0, 667.0, 2184.0, 203671.0, 2931162.0, 5094.0, 893.0, 391.0, 258.0, 129.0, 94.0, 71.0, 46.0, 32.0, 24.0, 12.0, 13.0, 12.0, 8.0, 14.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.046875, -26.255126953125, -25.46337890625, -24.671630859375, -23.8798828125, -23.088134765625, -22.29638671875, -21.504638671875, -20.712890625, -19.921142578125, -19.12939453125, -18.337646484375, -17.5458984375, -16.754150390625, -15.96240234375, -15.170654296875, -14.37890625, -13.587158203125, -12.79541015625, -12.003662109375, -11.2119140625, -10.420166015625, -9.62841796875, -8.836669921875, -8.044921875, -7.253173828125, -6.46142578125, -5.669677734375, -4.8779296875, -4.086181640625, -3.29443359375, -2.502685546875, -1.7109375, -0.919189453125, -0.12744140625, 0.664306640625, 1.4560546875, 2.247802734375, 3.03955078125, 3.831298828125, 4.623046875, 5.414794921875, 6.20654296875, 6.998291015625, 7.7900390625, 8.581787109375, 9.37353515625, 10.165283203125, 10.95703125, 11.748779296875, 12.54052734375, 13.332275390625, 14.1240234375, 14.915771484375, 15.70751953125, 16.499267578125, 17.291015625, 18.082763671875, 18.87451171875, 19.666259765625, 20.4580078125, 21.249755859375, 22.04150390625, 22.833251953125, 23.625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 15.0, 34.0, 58.0, 123.0, 150.0, 179.0, 151.0, 131.0, 93.0, 36.0, 22.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.391426086425781, -13.234977722167969, -12.078530311584473, -10.92208194732666, -9.765634536743164, -8.609186172485352, -7.452737808227539, -6.296290397644043, -5.1398420333862305, -3.983394145965576, -2.8269460201263428, -1.6704978942871094, -0.5140500068664551, 0.6423978805541992, 1.7988462448120117, 2.955293655395508, 4.11174201965332, 5.268189907073975, 6.424637794494629, 7.581086158752441, 8.737533569335938, 9.89398193359375, 11.050430297851562, 12.206877708435059, 13.363326072692871, 14.519774436950684, 15.67622184753418, 16.832670211791992, 17.989118576049805, 19.145565032958984, 20.302013397216797, 21.45846176147461, 22.614910125732422, 23.771358489990234, 24.927806854248047, 26.08425521850586, 27.24070167541504, 28.39715003967285, 29.553598403930664, 30.710044860839844, 31.866493225097656, 33.02294158935547, 34.17938995361328, 35.335838317871094, 36.492286682128906, 37.64873504638672, 38.80518341064453, 39.96162796020508, 41.118080139160156, 42.27452850341797, 43.43097686767578, 44.587425231933594, 45.743873596191406, 46.90032196044922, 48.05677032470703, 49.21321487426758, 50.36966323852539, 51.5261116027832, 52.682559967041016, 53.83900833129883, 54.99545669555664, 56.15190124511719, 57.308349609375, 58.46479797363281, 59.621246337890625]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 13.0, 4.0, 14.0, 12.0, 16.0, 28.0, 19.0, 15.0, 20.0, 23.0, 17.0, 35.0, 25.0, 42.0, 37.0, 41.0, 39.0, 38.0, 51.0, 45.0, 38.0, 36.0, 34.0, 40.0, 38.0, 38.0, 31.0, 32.0, 31.0, 22.0, 16.0, 22.0, 16.0, 12.0, 5.0, 8.0, 10.0, 10.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-26.74481201171875, -25.981050491333008, -25.217288970947266, -24.453527450561523, -23.68976593017578, -22.926002502441406, -22.162240982055664, -21.398479461669922, -20.63471794128418, -19.870956420898438, -19.107194900512695, -18.343433380126953, -17.579669952392578, -16.815908432006836, -16.052146911621094, -15.288385391235352, -14.52462387084961, -13.760862350463867, -12.997100830078125, -12.233338356018066, -11.469576835632324, -10.705815315246582, -9.942052841186523, -9.178291320800781, -8.414529800415039, -7.650768280029297, -6.8870062828063965, -6.123244285583496, -5.359482765197754, -4.595721244812012, -3.8319592475891113, -3.068197250366211, -2.3044357299804688, -1.5406739711761475, -0.7769122123718262, -0.013150453567504883, 0.7506113052368164, 1.5143730640411377, 2.278134822845459, 3.0418968200683594, 3.8056583404541016, 4.569419860839844, 5.333181858062744, 6.0969438552856445, 6.860705375671387, 7.624466896057129, 8.388229370117188, 9.15199089050293, 9.915752410888672, 10.679513931274414, 11.443275451660156, 12.207037925720215, 12.970799446105957, 13.7345609664917, 14.498323440551758, 15.2620849609375, 16.025846481323242, 16.789608001708984, 17.553369522094727, 18.31713104248047, 19.080894470214844, 19.844655990600586, 20.608417510986328, 21.37217903137207, 22.135940551757812]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 9.0, 9.0, 7.0, 13.0, 8.0, 20.0, 22.0, 23.0, 29.0, 32.0, 24.0, 26.0, 32.0, 47.0, 38.0, 40.0, 41.0, 52.0, 52.0, 42.0, 39.0, 40.0, 39.0, 32.0, 36.0, 27.0, 29.0, 35.0, 21.0, 14.0, 15.0, 15.0, 18.0, 12.0, 11.0, 10.0, 7.0, 10.0, 7.0, 2.0, 7.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.427734375, -3.312347412109375, -3.19696044921875, -3.081573486328125, -2.9661865234375, -2.850799560546875, -2.73541259765625, -2.620025634765625, -2.504638671875, -2.389251708984375, -2.27386474609375, -2.158477783203125, -2.0430908203125, -1.927703857421875, -1.81231689453125, -1.696929931640625, -1.58154296875, -1.466156005859375, -1.35076904296875, -1.235382080078125, -1.1199951171875, -1.004608154296875, -0.88922119140625, -0.773834228515625, -0.658447265625, -0.543060302734375, -0.42767333984375, -0.312286376953125, -0.1968994140625, -0.081512451171875, 0.03387451171875, 0.149261474609375, 0.2646484375, 0.380035400390625, 0.49542236328125, 0.610809326171875, 0.7261962890625, 0.841583251953125, 0.95697021484375, 1.072357177734375, 1.187744140625, 1.303131103515625, 1.41851806640625, 1.533905029296875, 1.6492919921875, 1.764678955078125, 1.88006591796875, 1.995452880859375, 2.11083984375, 2.226226806640625, 2.34161376953125, 2.457000732421875, 2.5723876953125, 2.687774658203125, 2.80316162109375, 2.918548583984375, 3.033935546875, 3.149322509765625, 3.26470947265625, 3.380096435546875, 3.4954833984375, 3.610870361328125, 3.72625732421875, 3.841644287109375, 3.95703125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 7.0, 12.0, 11.0, 18.0, 21.0, 31.0, 41.0, 54.0, 91.0, 109.0, 165.0, 199.0, 312.0, 436.0, 646.0, 921.0, 1478.0, 2165.0, 3380.0, 5317.0, 9354.0, 16677.0, 40087.0, 158097.0, 753864.0, 1972492.0, 935928.0, 199684.0, 47059.0, 18821.0, 9961.0, 5863.0, 3687.0, 2362.0, 1466.0, 1004.0, 735.0, 511.0, 368.0, 234.0, 164.0, 123.0, 99.0, 56.0, 47.0, 29.0, 30.0, 19.0, 12.0, 11.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.40234375, -5.23126220703125, -5.0601806640625, -4.88909912109375, -4.718017578125, -4.54693603515625, -4.3758544921875, -4.20477294921875, -4.03369140625, -3.86260986328125, -3.6915283203125, -3.52044677734375, -3.349365234375, -3.17828369140625, -3.0072021484375, -2.83612060546875, -2.6650390625, -2.49395751953125, -2.3228759765625, -2.15179443359375, -1.980712890625, -1.80963134765625, -1.6385498046875, -1.46746826171875, -1.29638671875, -1.12530517578125, -0.9542236328125, -0.78314208984375, -0.612060546875, -0.44097900390625, -0.2698974609375, -0.09881591796875, 0.072265625, 0.24334716796875, 0.4144287109375, 0.58551025390625, 0.756591796875, 0.92767333984375, 1.0987548828125, 1.26983642578125, 1.44091796875, 1.61199951171875, 1.7830810546875, 1.95416259765625, 2.125244140625, 2.29632568359375, 2.4674072265625, 2.63848876953125, 2.8095703125, 2.98065185546875, 3.1517333984375, 3.32281494140625, 3.493896484375, 3.66497802734375, 3.8360595703125, 4.00714111328125, 4.17822265625, 4.34930419921875, 4.5203857421875, 4.69146728515625, 4.862548828125, 5.03363037109375, 5.2047119140625, 5.37579345703125, 5.546875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 2.0, 7.0, 14.0, 27.0, 36.0, 62.0, 91.0, 119.0, 176.0, 216.0, 317.0, 477.0, 580.0, 570.0, 405.0, 303.0, 207.0, 159.0, 112.0, 74.0, 39.0, 21.0, 16.0, 23.0, 9.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6328125, -8.4107666015625, -8.188720703125, -7.9666748046875, -7.74462890625, -7.5225830078125, -7.300537109375, -7.0784912109375, -6.8564453125, -6.6343994140625, -6.412353515625, -6.1903076171875, -5.96826171875, -5.7462158203125, -5.524169921875, -5.3021240234375, -5.080078125, -4.8580322265625, -4.635986328125, -4.4139404296875, -4.19189453125, -3.9698486328125, -3.747802734375, -3.5257568359375, -3.3037109375, -3.0816650390625, -2.859619140625, -2.6375732421875, -2.41552734375, -2.1934814453125, -1.971435546875, -1.7493896484375, -1.52734375, -1.3052978515625, -1.083251953125, -0.8612060546875, -0.63916015625, -0.4171142578125, -0.195068359375, 0.0269775390625, 0.2490234375, 0.4710693359375, 0.693115234375, 0.9151611328125, 1.13720703125, 1.3592529296875, 1.581298828125, 1.8033447265625, 2.025390625, 2.2474365234375, 2.469482421875, 2.6915283203125, 2.91357421875, 3.1356201171875, 3.357666015625, 3.5797119140625, 3.8017578125, 4.0238037109375, 4.245849609375, 4.4678955078125, 4.68994140625, 4.9119873046875, 5.134033203125, 5.3560791015625, 5.578125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 16.0, 10.0, 27.0, 32.0, 49.0, 85.0, 115.0, 213.0, 350.0, 608.0, 1266.0, 3352.0, 16112.0, 251130.0, 3408350.0, 480449.0, 24567.0, 4286.0, 1479.0, 730.0, 383.0, 249.0, 163.0, 83.0, 47.0, 44.0, 24.0, 16.0, 11.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6328125, -9.2564697265625, -8.880126953125, -8.5037841796875, -8.12744140625, -7.7510986328125, -7.374755859375, -6.9984130859375, -6.6220703125, -6.2457275390625, -5.869384765625, -5.4930419921875, -5.11669921875, -4.7403564453125, -4.364013671875, -3.9876708984375, -3.611328125, -3.2349853515625, -2.858642578125, -2.4822998046875, -2.10595703125, -1.7296142578125, -1.353271484375, -0.9769287109375, -0.6005859375, -0.2242431640625, 0.152099609375, 0.5284423828125, 0.90478515625, 1.2811279296875, 1.657470703125, 2.0338134765625, 2.41015625, 2.7864990234375, 3.162841796875, 3.5391845703125, 3.91552734375, 4.2918701171875, 4.668212890625, 5.0445556640625, 5.4208984375, 5.7972412109375, 6.173583984375, 6.5499267578125, 6.92626953125, 7.3026123046875, 7.678955078125, 8.0552978515625, 8.431640625, 8.8079833984375, 9.184326171875, 9.5606689453125, 9.93701171875, 10.3133544921875, 10.689697265625, 11.0660400390625, 11.4423828125, 11.8187255859375, 12.195068359375, 12.5714111328125, 12.94775390625, 13.3240966796875, 13.700439453125, 14.0767822265625, 14.453125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 11.0, 33.0, 287.0, 478.0, 176.0, 27.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.482261657714844, -39.63793182373047, -35.793601989746094, -31.949270248413086, -28.10494041442871, -24.260610580444336, -20.416278839111328, -16.571949005126953, -12.727619171142578, -8.883289337158203, -5.038958549499512, -1.1946277618408203, 2.6497020721435547, 6.49403190612793, 10.338363647460938, 14.182693481445312, 18.027023315429688, 21.871353149414062, 25.715682983398438, 29.560014724731445, 33.40434265136719, 37.24867248535156, 41.0930061340332, 44.93733596801758, 48.78166580200195, 52.62599563598633, 56.4703254699707, 60.314659118652344, 64.15898895263672, 68.0033187866211, 71.84764862060547, 75.69197845458984, 79.53630065917969, 83.38063049316406, 87.22496032714844, 91.06929016113281, 94.91361999511719, 98.75794982910156, 102.60227966308594, 106.44660949707031, 110.29093933105469, 114.13526916503906, 117.97959899902344, 121.82392883300781, 125.66825866699219, 129.51258850097656, 133.35691833496094, 137.2012481689453, 141.04559326171875, 144.88992309570312, 148.7342529296875, 152.57858276367188, 156.42291259765625, 160.26724243164062, 164.111572265625, 167.95590209960938, 171.80023193359375, 175.64456176757812, 179.4888916015625, 183.33322143554688, 187.17755126953125, 191.02188110351562, 194.8662109375, 198.71054077148438, 202.55487060546875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 8.0, 2.0, 8.0, 7.0, 11.0, 10.0, 15.0, 14.0, 20.0, 16.0, 15.0, 31.0, 20.0, 33.0, 29.0, 43.0, 36.0, 26.0, 34.0, 49.0, 52.0, 51.0, 36.0, 37.0, 31.0, 34.0, 40.0, 42.0, 34.0, 29.0, 19.0, 33.0, 25.0, 20.0, 17.0, 18.0, 13.0, 13.0, 10.0, 3.0, 3.0, 1.0, 6.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.77295684814453, -17.137928009033203, -16.502899169921875, -15.86786937713623, -15.232839584350586, -14.597810745239258, -13.96278190612793, -13.327753067016602, -12.692723274230957, -12.057694435119629, -11.422664642333984, -10.787635803222656, -10.152606964111328, -9.517577171325684, -8.882548332214355, -8.247518539428711, -7.612489700317383, -6.9774603843688965, -6.34243106842041, -5.707402229309082, -5.072372913360596, -4.437343597412109, -3.802314519882202, -3.167285442352295, -2.5322561264038086, -1.8972269296646118, -1.262197732925415, -0.6271685361862183, 0.007860660552978516, 0.6428899765014648, 1.277919054031372, 1.9129481315612793, 2.5479774475097656, 3.183006763458252, 3.818035840988159, 4.453064918518066, 5.088094234466553, 5.723123550415039, 6.358152389526367, 6.9931817054748535, 7.62821102142334, 8.263239860534668, 8.898269653320312, 9.53329849243164, 10.168327331542969, 10.803357124328613, 11.438385963439941, 12.073415756225586, 12.708444595336914, 13.343473434448242, 13.978503227233887, 14.613532066345215, 15.24856185913086, 15.883590698242188, 16.518619537353516, 17.153648376464844, 17.788677215576172, 18.4237060546875, 19.058734893798828, 19.69376564025879, 20.328794479370117, 20.963823318481445, 21.598852157592773, 22.2338809967041, 22.868911743164062]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 4.0, 5.0, 4.0, 7.0, 10.0, 11.0, 8.0, 16.0, 25.0, 20.0, 31.0, 28.0, 24.0, 17.0, 28.0, 34.0, 44.0, 41.0, 46.0, 36.0, 29.0, 33.0, 44.0, 40.0, 38.0, 42.0, 36.0, 31.0, 38.0, 34.0, 21.0, 21.0, 18.0, 18.0, 11.0, 21.0, 16.0, 13.0, 5.0, 8.0, 15.0, 3.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.796875, -2.70208740234375, -2.6072998046875, -2.51251220703125, -2.417724609375, -2.32293701171875, -2.2281494140625, -2.13336181640625, -2.03857421875, -1.94378662109375, -1.8489990234375, -1.75421142578125, -1.659423828125, -1.56463623046875, -1.4698486328125, -1.37506103515625, -1.2802734375, -1.18548583984375, -1.0906982421875, -0.99591064453125, -0.901123046875, -0.80633544921875, -0.7115478515625, -0.61676025390625, -0.52197265625, -0.42718505859375, -0.3323974609375, -0.23760986328125, -0.142822265625, -0.04803466796875, 0.0467529296875, 0.14154052734375, 0.236328125, 0.33111572265625, 0.4259033203125, 0.52069091796875, 0.615478515625, 0.71026611328125, 0.8050537109375, 0.89984130859375, 0.99462890625, 1.08941650390625, 1.1842041015625, 1.27899169921875, 1.373779296875, 1.46856689453125, 1.5633544921875, 1.65814208984375, 1.7529296875, 1.84771728515625, 1.9425048828125, 2.03729248046875, 2.132080078125, 2.22686767578125, 2.3216552734375, 2.41644287109375, 2.51123046875, 2.60601806640625, 2.7008056640625, 2.79559326171875, 2.890380859375, 2.98516845703125, 3.0799560546875, 3.17474365234375, 3.26953125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 8.0, 14.0, 19.0, 59.0, 46.0, 73.0, 115.0, 170.0, 217.0, 332.0, 515.0, 668.0, 870.0, 1221.0, 1765.0, 2385.0, 3530.0, 5096.0, 7189.0, 10164.0, 15018.0, 22548.0, 34477.0, 55089.0, 96704.0, 212761.0, 274636.0, 118017.0, 64856.0, 39402.0, 25183.0, 16911.0, 11705.0, 7990.0, 5427.0, 3858.0, 2760.0, 1937.0, 1462.0, 975.0, 696.0, 507.0, 347.0, 278.0, 173.0, 131.0, 75.0, 63.0, 38.0, 32.0, 24.0, 9.0, 5.0, 3.0, 2.0, 4.0], "bins": [-0.0242462158203125, -0.023536205291748047, -0.022826194763183594, -0.02211618423461914, -0.021406173706054688, -0.020696163177490234, -0.01998615264892578, -0.019276142120361328, -0.018566131591796875, -0.017856121063232422, -0.01714611053466797, -0.016436100006103516, -0.015726089477539062, -0.01501607894897461, -0.014306068420410156, -0.013596057891845703, -0.01288604736328125, -0.012176036834716797, -0.011466026306152344, -0.01075601577758789, -0.010046005249023438, -0.009335994720458984, -0.008625984191894531, -0.007915973663330078, -0.007205963134765625, -0.006495952606201172, -0.005785942077636719, -0.005075931549072266, -0.0043659210205078125, -0.0036559104919433594, -0.0029458999633789062, -0.002235889434814453, -0.00152587890625, -0.0008158683776855469, -0.00010585784912109375, 0.0006041526794433594, 0.0013141632080078125, 0.0020241737365722656, 0.0027341842651367188, 0.003444194793701172, 0.004154205322265625, 0.004864215850830078, 0.005574226379394531, 0.006284236907958984, 0.0069942474365234375, 0.007704257965087891, 0.008414268493652344, 0.009124279022216797, 0.00983428955078125, 0.010544300079345703, 0.011254310607910156, 0.01196432113647461, 0.012674331665039062, 0.013384342193603516, 0.014094352722167969, 0.014804363250732422, 0.015514373779296875, 0.016224384307861328, 0.01693439483642578, 0.017644405364990234, 0.018354415893554688, 0.01906442642211914, 0.019774436950683594, 0.020484447479248047, 0.0211944580078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 4.0, 9.0, 6.0, 4.0, 9.0, 7.0, 12.0, 14.0, 28.0, 35.0, 24.0, 27.0, 26.0, 29.0, 47.0, 33.0, 42.0, 58.0, 44.0, 1067.0, 46.0, 41.0, 45.0, 41.0, 49.0, 27.0, 34.0, 22.0, 34.0, 26.0, 17.0, 26.0, 16.0, 16.0, 8.0, 11.0, 8.0, 9.0, 6.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.23150634765625, -2.1544189453125, -2.07733154296875, -2.000244140625, -1.92315673828125, -1.8460693359375, -1.76898193359375, -1.69189453125, -1.61480712890625, -1.5377197265625, -1.46063232421875, -1.383544921875, -1.30645751953125, -1.2293701171875, -1.15228271484375, -1.0751953125, -0.99810791015625, -0.9210205078125, -0.84393310546875, -0.766845703125, -0.68975830078125, -0.6126708984375, -0.53558349609375, -0.45849609375, -0.38140869140625, -0.3043212890625, -0.22723388671875, -0.150146484375, -0.07305908203125, 0.0040283203125, 0.08111572265625, 0.158203125, 0.23529052734375, 0.3123779296875, 0.38946533203125, 0.466552734375, 0.54364013671875, 0.6207275390625, 0.69781494140625, 0.77490234375, 0.85198974609375, 0.9290771484375, 1.00616455078125, 1.083251953125, 1.16033935546875, 1.2374267578125, 1.31451416015625, 1.3916015625, 1.46868896484375, 1.5457763671875, 1.62286376953125, 1.699951171875, 1.77703857421875, 1.8541259765625, 1.93121337890625, 2.00830078125, 2.08538818359375, 2.1624755859375, 2.23956298828125, 2.316650390625, 2.39373779296875, 2.4708251953125, 2.54791259765625, 2.625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 11.0, 19.0, 24.0, 39.0, 75.0, 93.0, 140.0, 213.0, 313.0, 472.0, 629.0, 909.0, 1240.0, 1735.0, 2497.0, 3596.0, 5338.0, 7755.0, 11439.0, 16779.0, 25717.0, 40598.0, 67664.0, 126228.0, 1334940.0, 201794.0, 94192.0, 53140.0, 32976.0, 21175.0, 14095.0, 9733.0, 6604.0, 4491.0, 3103.0, 2151.0, 1537.0, 1113.0, 783.0, 584.0, 371.0, 292.0, 166.0, 133.0, 78.0, 50.0, 41.0, 16.0, 16.0, 13.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0], "bins": [-0.0189056396484375, -0.01832890510559082, -0.01775217056274414, -0.01717543601989746, -0.01659870147705078, -0.0160219669342041, -0.015445232391357422, -0.014868497848510742, -0.014291763305664062, -0.013715028762817383, -0.013138294219970703, -0.012561559677124023, -0.011984825134277344, -0.011408090591430664, -0.010831356048583984, -0.010254621505737305, -0.009677886962890625, -0.009101152420043945, -0.008524417877197266, -0.007947683334350586, -0.007370948791503906, -0.0067942142486572266, -0.006217479705810547, -0.005640745162963867, -0.0050640106201171875, -0.004487276077270508, -0.003910541534423828, -0.0033338069915771484, -0.0027570724487304688, -0.002180337905883789, -0.0016036033630371094, -0.0010268688201904297, -0.00045013427734375, 0.0001266002655029297, 0.0007033348083496094, 0.001280069351196289, 0.0018568038940429688, 0.0024335384368896484, 0.003010272979736328, 0.003587007522583008, 0.0041637420654296875, 0.004740476608276367, 0.005317211151123047, 0.0058939456939697266, 0.006470680236816406, 0.007047414779663086, 0.007624149322509766, 0.008200883865356445, 0.008777618408203125, 0.009354352951049805, 0.009931087493896484, 0.010507822036743164, 0.011084556579589844, 0.011661291122436523, 0.012238025665283203, 0.012814760208129883, 0.013391494750976562, 0.013968229293823242, 0.014544963836669922, 0.015121698379516602, 0.01569843292236328, 0.01627516746520996, 0.01685190200805664, 0.01742863655090332, 0.01800537109375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 11.0, 0.0, 0.0, 29.0, 0.0, 0.0, 80.0, 0.0, 0.0, 197.0, 0.0, 0.0, 402.0, 0.0, 0.0, 174.0, 0.0, 0.0, 82.0, 0.0, 0.0, 22.0, 0.0, 0.0, 12.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.764886736869812e-07, -5.569308996200562e-07, -5.373731255531311e-07, -5.178153514862061e-07, -4.98257577419281e-07, -4.78699803352356e-07, -4.591420292854309e-07, -4.3958425521850586e-07, -4.200264811515808e-07, -4.0046870708465576e-07, -3.809109330177307e-07, -3.6135315895080566e-07, -3.417953848838806e-07, -3.2223761081695557e-07, -3.026798367500305e-07, -2.8312206268310547e-07, -2.635642886161804e-07, -2.4400651454925537e-07, -2.2444874048233032e-07, -2.0489096641540527e-07, -1.8533319234848022e-07, -1.6577541828155518e-07, -1.4621764421463013e-07, -1.2665987014770508e-07, -1.0710209608078003e-07, -8.754432201385498e-08, -6.798654794692993e-08, -4.842877388000488e-08, -2.8870999813079834e-08, -9.313225746154785e-09, 1.0244548320770264e-08, 2.9802322387695312e-08, 4.936009645462036e-08, 6.891787052154541e-08, 8.847564458847046e-08, 1.0803341865539551e-07, 1.2759119272232056e-07, 1.471489667892456e-07, 1.6670674085617065e-07, 1.862645149230957e-07, 2.0582228899002075e-07, 2.253800630569458e-07, 2.4493783712387085e-07, 2.644956111907959e-07, 2.8405338525772095e-07, 3.03611159324646e-07, 3.2316893339157104e-07, 3.427267074584961e-07, 3.6228448152542114e-07, 3.818422555923462e-07, 4.0140002965927124e-07, 4.209578037261963e-07, 4.4051557779312134e-07, 4.600733518600464e-07, 4.796311259269714e-07, 4.991888999938965e-07, 5.187466740608215e-07, 5.383044481277466e-07, 5.578622221946716e-07, 5.774199962615967e-07, 5.969777703285217e-07, 6.165355443954468e-07, 6.360933184623718e-07, 6.556510925292969e-07]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 8.0, 8.0, 10.0, 26.0, 18.0, 30.0, 79.0, 91.0, 99.0, 390.0, 369.0, 11644.0, 1031092.0, 3622.0, 375.0, 337.0, 66.0, 91.0, 85.0, 25.0, 26.0, 21.0, 14.0, 4.0, 9.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2278556823730469e-05, -1.1910684406757355e-05, -1.154281198978424e-05, -1.1174939572811127e-05, -1.0807067155838013e-05, -1.0439194738864899e-05, -1.0071322321891785e-05, -9.70344990491867e-06, -9.335577487945557e-06, -8.967705070972443e-06, -8.599832653999329e-06, -8.231960237026215e-06, -7.8640878200531e-06, -7.4962154030799866e-06, -7.1283429861068726e-06, -6.7604705691337585e-06, -6.3925981521606445e-06, -6.0247257351875305e-06, -5.6568533182144165e-06, -5.2889809012413025e-06, -4.9211084842681885e-06, -4.5532360672950745e-06, -4.1853636503219604e-06, -3.8174912333488464e-06, -3.4496188163757324e-06, -3.0817463994026184e-06, -2.7138739824295044e-06, -2.3460015654563904e-06, -1.9781291484832764e-06, -1.6102567315101624e-06, -1.2423843145370483e-06, -8.745118975639343e-07, -5.066394805908203e-07, -1.387670636177063e-07, 2.2910535335540771e-07, 5.969777703285217e-07, 9.648501873016357e-07, 1.3327226042747498e-06, 1.7005950212478638e-06, 2.0684674382209778e-06, 2.436339855194092e-06, 2.804212272167206e-06, 3.17208468914032e-06, 3.539957106113434e-06, 3.907829523086548e-06, 4.275701940059662e-06, 4.643574357032776e-06, 5.01144677400589e-06, 5.379319190979004e-06, 5.747191607952118e-06, 6.115064024925232e-06, 6.482936441898346e-06, 6.85080885887146e-06, 7.218681275844574e-06, 7.586553692817688e-06, 7.954426109790802e-06, 8.322298526763916e-06, 8.69017094373703e-06, 9.058043360710144e-06, 9.425915777683258e-06, 9.793788194656372e-06, 1.0161660611629486e-05, 1.05295330286026e-05, 1.0897405445575714e-05, 1.1265277862548828e-05]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 17.0, 27.0, 68.0, 94.0, 527.0, 115.0, 79.0, 52.0, 25.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.867767746778554e-07, -8.681673762112041e-07, -8.495580345879716e-07, -8.309486361213203e-07, -8.123392944980878e-07, -7.937298960314365e-07, -7.75120554408204e-07, -7.565111559415527e-07, -7.379018143183202e-07, -7.192924158516689e-07, -7.006830742284365e-07, -6.820736757617851e-07, -6.634643341385527e-07, -6.448549356719013e-07, -6.262455940486689e-07, -6.076361955820175e-07, -5.890268539587851e-07, -5.704174554921337e-07, -5.518081138689013e-07, -5.331987154022499e-07, -5.145893737790175e-07, -4.959799753123662e-07, -4.773706336891337e-07, -4.5876123522248236e-07, -4.4015183675583103e-07, -4.2154246671088913e-07, -4.0293309666594723e-07, -3.8432372662100533e-07, -3.6571435657606344e-07, -3.4710498653112154e-07, -3.2849561648617964e-07, -3.098862180195283e-07, -2.9127687639629585e-07, -2.7266750635135395e-07, -2.5405813630641205e-07, -2.3544876626147015e-07, -2.1683939621652826e-07, -1.9823002617158636e-07, -1.7962064191578975e-07, -1.6101127187084785e-07, -1.4240190182590595e-07, -1.2379253178096405e-07, -1.0518316173602216e-07, -8.65737845856529e-08, -6.7964414540711e-08, -4.935504449576911e-08, -3.074566734539985e-08, -1.2136297300457954e-08, 6.473072744483943e-09, 2.508244456578268e-08, 4.369181638708142e-08, 6.230118998473699e-08, 8.091056002967889e-08, 9.951993007462079e-08, 1.1812930722499004e-07, 1.3673867726993194e-07, 1.5534804731487384e-07, 1.7395741735981574e-07, 1.9256678740475763e-07, 2.1117617166055425e-07, 2.2978554170549614e-07, 2.4839491175043804e-07, 2.6700428179537994e-07, 2.8561365184032184e-07, 3.0422302188526373e-07]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 226.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 511.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 199.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 4.0, 5.0, 4.0, 7.0, 10.0, 11.0, 8.0, 16.0, 25.0, 20.0, 31.0, 28.0, 24.0, 17.0, 28.0, 34.0, 44.0, 41.0, 46.0, 36.0, 29.0, 33.0, 44.0, 40.0, 38.0, 42.0, 36.0, 31.0, 38.0, 34.0, 21.0, 21.0, 18.0, 18.0, 11.0, 21.0, 16.0, 13.0, 5.0, 8.0, 15.0, 3.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.796875, -2.70208740234375, -2.6072998046875, -2.51251220703125, -2.417724609375, -2.32293701171875, -2.2281494140625, -2.13336181640625, -2.03857421875, -1.94378662109375, -1.8489990234375, -1.75421142578125, -1.659423828125, -1.56463623046875, -1.4698486328125, -1.37506103515625, -1.2802734375, -1.18548583984375, -1.0906982421875, -0.99591064453125, -0.901123046875, -0.80633544921875, -0.7115478515625, -0.61676025390625, -0.52197265625, -0.42718505859375, -0.3323974609375, -0.23760986328125, -0.142822265625, -0.04803466796875, 0.0467529296875, 0.14154052734375, 0.236328125, 0.33111572265625, 0.4259033203125, 0.52069091796875, 0.615478515625, 0.71026611328125, 0.8050537109375, 0.89984130859375, 0.99462890625, 1.08941650390625, 1.1842041015625, 1.27899169921875, 1.373779296875, 1.46856689453125, 1.5633544921875, 1.65814208984375, 1.7529296875, 1.84771728515625, 1.9425048828125, 2.03729248046875, 2.132080078125, 2.22686767578125, 2.3216552734375, 2.41644287109375, 2.51123046875, 2.60601806640625, 2.7008056640625, 2.79559326171875, 2.890380859375, 2.98516845703125, 3.0799560546875, 3.17474365234375, 3.26953125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 9.0, 9.0, 6.0, 9.0, 9.0, 22.0, 30.0, 26.0, 38.0, 54.0, 57.0, 86.0, 127.0, 223.0, 332.0, 637.0, 1226.0, 2699.0, 8084.0, 31060.0, 160777.0, 566520.0, 219684.0, 40227.0, 10112.0, 3326.0, 1359.0, 690.0, 373.0, 241.0, 129.0, 81.0, 68.0, 47.0, 28.0, 33.0, 29.0, 20.0, 17.0, 18.0, 8.0, 9.0, 8.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.55523681640625, -4.3839111328125, -4.21258544921875, -4.041259765625, -3.86993408203125, -3.6986083984375, -3.52728271484375, -3.35595703125, -3.18463134765625, -3.0133056640625, -2.84197998046875, -2.670654296875, -2.49932861328125, -2.3280029296875, -2.15667724609375, -1.9853515625, -1.81402587890625, -1.6427001953125, -1.47137451171875, -1.300048828125, -1.12872314453125, -0.9573974609375, -0.78607177734375, -0.61474609375, -0.44342041015625, -0.2720947265625, -0.10076904296875, 0.070556640625, 0.24188232421875, 0.4132080078125, 0.58453369140625, 0.755859375, 0.92718505859375, 1.0985107421875, 1.26983642578125, 1.441162109375, 1.61248779296875, 1.7838134765625, 1.95513916015625, 2.12646484375, 2.29779052734375, 2.4691162109375, 2.64044189453125, 2.811767578125, 2.98309326171875, 3.1544189453125, 3.32574462890625, 3.4970703125, 3.66839599609375, 3.8397216796875, 4.01104736328125, 4.182373046875, 4.35369873046875, 4.5250244140625, 4.69635009765625, 4.86767578125, 5.03900146484375, 5.2103271484375, 5.38165283203125, 5.552978515625, 5.72430419921875, 5.8956298828125, 6.06695556640625, 6.23828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 13.0, 11.0, 19.0, 16.0, 21.0, 41.0, 43.0, 37.0, 44.0, 53.0, 67.0, 90.0, 183.0, 1446.0, 343.0, 155.0, 79.0, 48.0, 54.0, 48.0, 42.0, 32.0, 23.0, 21.0, 14.0, 24.0, 13.0, 8.0, 10.0, 6.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.74609375, -7.47784423828125, -7.2095947265625, -6.94134521484375, -6.673095703125, -6.40484619140625, -6.1365966796875, -5.86834716796875, -5.60009765625, -5.33184814453125, -5.0635986328125, -4.79534912109375, -4.527099609375, -4.25885009765625, -3.9906005859375, -3.72235107421875, -3.4541015625, -3.18585205078125, -2.9176025390625, -2.64935302734375, -2.381103515625, -2.11285400390625, -1.8446044921875, -1.57635498046875, -1.30810546875, -1.03985595703125, -0.7716064453125, -0.50335693359375, -0.235107421875, 0.03314208984375, 0.3013916015625, 0.56964111328125, 0.837890625, 1.10614013671875, 1.3743896484375, 1.64263916015625, 1.910888671875, 2.17913818359375, 2.4473876953125, 2.71563720703125, 2.98388671875, 3.25213623046875, 3.5203857421875, 3.78863525390625, 4.056884765625, 4.32513427734375, 4.5933837890625, 4.86163330078125, 5.1298828125, 5.39813232421875, 5.6663818359375, 5.93463134765625, 6.202880859375, 6.47113037109375, 6.7393798828125, 7.00762939453125, 7.27587890625, 7.54412841796875, 7.8123779296875, 8.08062744140625, 8.348876953125, 8.61712646484375, 8.8853759765625, 9.15362548828125, 9.421875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 4.0, 6.0, 4.0, 10.0, 8.0, 9.0, 11.0, 18.0, 20.0, 47.0, 39.0, 67.0, 83.0, 173.0, 289.0, 511.0, 1446.0, 63090.0, 3070156.0, 7732.0, 900.0, 428.0, 215.0, 126.0, 91.0, 58.0, 46.0, 23.0, 25.0, 17.0, 15.0, 8.0, 9.0, 9.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-23.46875, -22.822265625, -22.17578125, -21.529296875, -20.8828125, -20.236328125, -19.58984375, -18.943359375, -18.296875, -17.650390625, -17.00390625, -16.357421875, -15.7109375, -15.064453125, -14.41796875, -13.771484375, -13.125, -12.478515625, -11.83203125, -11.185546875, -10.5390625, -9.892578125, -9.24609375, -8.599609375, -7.953125, -7.306640625, -6.66015625, -6.013671875, -5.3671875, -4.720703125, -4.07421875, -3.427734375, -2.78125, -2.134765625, -1.48828125, -0.841796875, -0.1953125, 0.451171875, 1.09765625, 1.744140625, 2.390625, 3.037109375, 3.68359375, 4.330078125, 4.9765625, 5.623046875, 6.26953125, 6.916015625, 7.5625, 8.208984375, 8.85546875, 9.501953125, 10.1484375, 10.794921875, 11.44140625, 12.087890625, 12.734375, 13.380859375, 14.02734375, 14.673828125, 15.3203125, 15.966796875, 16.61328125, 17.259765625, 17.90625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 54.0, 891.0, 68.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.42054748535156, -71.49449920654297, -66.56844329833984, -61.64239501953125, -56.71634292602539, -51.79029083251953, -46.86424255371094, -41.93819046020508, -37.01213836669922, -32.08608627319336, -27.160036087036133, -22.233985900878906, -17.307933807373047, -12.381881713867188, -7.455831527709961, -2.5297813415527344, 2.396270751953125, 7.322321891784668, 12.248373031616211, 17.174423217773438, 22.100475311279297, 27.026527404785156, 31.952577590942383, 36.87862777709961, 41.80467987060547, 46.73073196411133, 51.65678405761719, 56.58283233642578, 61.50888442993164, 66.4349365234375, 71.3609848022461, 76.28703308105469, 81.21308898925781, 86.1391372680664, 91.06519317626953, 95.99124145507812, 100.91729736328125, 105.84334564208984, 110.76939392089844, 115.69544982910156, 120.62149810791016, 125.54754638671875, 130.47360229492188, 135.399658203125, 140.32569885253906, 145.2517547607422, 150.1778106689453, 155.10385131835938, 160.0299072265625, 164.95596313476562, 169.8820037841797, 174.8080596923828, 179.73411560058594, 184.66015625, 189.58621215820312, 194.51226806640625, 199.43832397460938, 204.3643798828125, 209.29042053222656, 214.2164764404297, 219.1425323486328, 224.06857299804688, 228.99462890625, 233.92068481445312, 238.8467254638672]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 6.0, 3.0, 5.0, 7.0, 13.0, 12.0, 18.0, 17.0, 21.0, 15.0, 25.0, 28.0, 29.0, 17.0, 33.0, 40.0, 26.0, 56.0, 51.0, 40.0, 36.0, 54.0, 38.0, 32.0, 45.0, 47.0, 37.0, 29.0, 31.0, 27.0, 24.0, 17.0, 15.0, 25.0, 9.0, 10.0, 17.0, 13.0, 4.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.779748916625977, -15.178143501281738, -14.5765380859375, -13.974933624267578, -13.37332820892334, -12.771722793579102, -12.17011833190918, -11.568512916564941, -10.966907501220703, -10.365302085876465, -9.763696670532227, -9.162092208862305, -8.560486793518066, -7.958881378173828, -7.357276439666748, -6.755671501159668, -6.15406608581543, -5.552460670471191, -4.950855731964111, -4.349250793457031, -3.747645378112793, -3.146040201187134, -2.5444350242614746, -1.9428300857543945, -1.3412246704101562, -0.7396194934844971, -0.1380143165588379, 0.4635908603668213, 1.0651960372924805, 1.6668012142181396, 2.268406391143799, 2.870011329650879, 3.4716148376464844, 4.073220252990723, 4.674825191497803, 5.276430130004883, 5.878035545349121, 6.479640960693359, 7.0812458992004395, 7.6828508377075195, 8.284456253051758, 8.886061668395996, 9.487667083740234, 10.089271545410156, 10.690876960754395, 11.292482376098633, 11.894086837768555, 12.495692253112793, 13.097297668457031, 13.69890308380127, 14.300508499145508, 14.90211296081543, 15.503718376159668, 16.105323791503906, 16.706928253173828, 17.30853271484375, 17.910139083862305, 18.511743545532227, 19.11334991455078, 19.714954376220703, 20.316558837890625, 20.91816520690918, 21.5197696685791, 22.121376037597656, 22.722980499267578]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 5.0, 9.0, 12.0, 11.0, 10.0, 13.0, 17.0, 21.0, 29.0, 24.0, 31.0, 26.0, 33.0, 36.0, 43.0, 40.0, 48.0, 42.0, 33.0, 37.0, 51.0, 38.0, 49.0, 33.0, 44.0, 34.0, 18.0, 24.0, 28.0, 26.0, 22.0, 24.0, 20.0, 6.0, 13.0, 6.0, 7.0, 6.0, 9.0, 6.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01953125, -2.908447265625, -2.79736328125, -2.686279296875, -2.5751953125, -2.464111328125, -2.35302734375, -2.241943359375, -2.130859375, -2.019775390625, -1.90869140625, -1.797607421875, -1.6865234375, -1.575439453125, -1.46435546875, -1.353271484375, -1.2421875, -1.131103515625, -1.02001953125, -0.908935546875, -0.7978515625, -0.686767578125, -0.57568359375, -0.464599609375, -0.353515625, -0.242431640625, -0.13134765625, -0.020263671875, 0.0908203125, 0.201904296875, 0.31298828125, 0.424072265625, 0.53515625, 0.646240234375, 0.75732421875, 0.868408203125, 0.9794921875, 1.090576171875, 1.20166015625, 1.312744140625, 1.423828125, 1.534912109375, 1.64599609375, 1.757080078125, 1.8681640625, 1.979248046875, 2.09033203125, 2.201416015625, 2.3125, 2.423583984375, 2.53466796875, 2.645751953125, 2.7568359375, 2.867919921875, 2.97900390625, 3.090087890625, 3.201171875, 3.312255859375, 3.42333984375, 3.534423828125, 3.6455078125, 3.756591796875, 3.86767578125, 3.978759765625, 4.08984375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 9.0, 14.0, 20.0, 19.0, 29.0, 41.0, 44.0, 67.0, 84.0, 118.0, 127.0, 153.0, 260.0, 338.0, 489.0, 717.0, 1223.0, 2951.0, 12837.0, 118828.0, 2296306.0, 1662550.0, 81184.0, 9888.0, 2454.0, 1076.0, 671.0, 443.0, 323.0, 229.0, 192.0, 145.0, 98.0, 83.0, 61.0, 46.0, 40.0, 30.0, 19.0, 16.0, 20.0, 8.0, 11.0, 3.0, 2.0, 5.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6328125, -15.1104736328125, -14.588134765625, -14.0657958984375, -13.54345703125, -13.0211181640625, -12.498779296875, -11.9764404296875, -11.4541015625, -10.9317626953125, -10.409423828125, -9.8870849609375, -9.36474609375, -8.8424072265625, -8.320068359375, -7.7977294921875, -7.275390625, -6.7530517578125, -6.230712890625, -5.7083740234375, -5.18603515625, -4.6636962890625, -4.141357421875, -3.6190185546875, -3.0966796875, -2.5743408203125, -2.052001953125, -1.5296630859375, -1.00732421875, -0.4849853515625, 0.037353515625, 0.5596923828125, 1.08203125, 1.6043701171875, 2.126708984375, 2.6490478515625, 3.17138671875, 3.6937255859375, 4.216064453125, 4.7384033203125, 5.2607421875, 5.7830810546875, 6.305419921875, 6.8277587890625, 7.35009765625, 7.8724365234375, 8.394775390625, 8.9171142578125, 9.439453125, 9.9617919921875, 10.484130859375, 11.0064697265625, 11.52880859375, 12.0511474609375, 12.573486328125, 13.0958251953125, 13.6181640625, 14.1405029296875, 14.662841796875, 15.1851806640625, 15.70751953125, 16.2298583984375, 16.752197265625, 17.2745361328125, 17.796875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 10.0, 9.0, 19.0, 28.0, 27.0, 41.0, 59.0, 84.0, 105.0, 155.0, 224.0, 285.0, 368.0, 452.0, 501.0, 432.0, 345.0, 250.0, 194.0, 148.0, 102.0, 56.0, 60.0, 37.0, 26.0, 13.0, 13.0, 8.0, 14.0, 2.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.625, -8.38079833984375, -8.1365966796875, -7.89239501953125, -7.648193359375, -7.40399169921875, -7.1597900390625, -6.91558837890625, -6.67138671875, -6.42718505859375, -6.1829833984375, -5.93878173828125, -5.694580078125, -5.45037841796875, -5.2061767578125, -4.96197509765625, -4.7177734375, -4.47357177734375, -4.2293701171875, -3.98516845703125, -3.740966796875, -3.49676513671875, -3.2525634765625, -3.00836181640625, -2.76416015625, -2.51995849609375, -2.2757568359375, -2.03155517578125, -1.787353515625, -1.54315185546875, -1.2989501953125, -1.05474853515625, -0.810546875, -0.56634521484375, -0.3221435546875, -0.07794189453125, 0.166259765625, 0.41046142578125, 0.6546630859375, 0.89886474609375, 1.14306640625, 1.38726806640625, 1.6314697265625, 1.87567138671875, 2.119873046875, 2.36407470703125, 2.6082763671875, 2.85247802734375, 3.0966796875, 3.34088134765625, 3.5850830078125, 3.82928466796875, 4.073486328125, 4.31768798828125, 4.5618896484375, 4.80609130859375, 5.05029296875, 5.29449462890625, 5.5386962890625, 5.78289794921875, 6.027099609375, 6.27130126953125, 6.5155029296875, 6.75970458984375, 7.00390625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 4.0, 5.0, 15.0, 24.0, 26.0, 57.0, 73.0, 131.0, 322.0, 626.0, 1523.0, 4287.0, 14616.0, 66739.0, 382275.0, 2105575.0, 1347150.0, 215871.0, 40053.0, 9653.0, 3037.0, 1132.0, 513.0, 257.0, 121.0, 65.0, 33.0, 30.0, 20.0, 7.0, 5.0, 9.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.808837890625, -6.55517578125, -6.301513671875, -6.0478515625, -5.794189453125, -5.54052734375, -5.286865234375, -5.033203125, -4.779541015625, -4.52587890625, -4.272216796875, -4.0185546875, -3.764892578125, -3.51123046875, -3.257568359375, -3.00390625, -2.750244140625, -2.49658203125, -2.242919921875, -1.9892578125, -1.735595703125, -1.48193359375, -1.228271484375, -0.974609375, -0.720947265625, -0.46728515625, -0.213623046875, 0.0400390625, 0.293701171875, 0.54736328125, 0.801025390625, 1.0546875, 1.308349609375, 1.56201171875, 1.815673828125, 2.0693359375, 2.322998046875, 2.57666015625, 2.830322265625, 3.083984375, 3.337646484375, 3.59130859375, 3.844970703125, 4.0986328125, 4.352294921875, 4.60595703125, 4.859619140625, 5.11328125, 5.366943359375, 5.62060546875, 5.874267578125, 6.1279296875, 6.381591796875, 6.63525390625, 6.888916015625, 7.142578125, 7.396240234375, 7.64990234375, 7.903564453125, 8.1572265625, 8.410888671875, 8.66455078125, 8.918212890625, 9.171875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 10.0, 15.0, 23.0, 12.0, 34.0, 28.0, 39.0, 54.0, 45.0, 52.0, 61.0, 88.0, 79.0, 81.0, 81.0, 57.0, 49.0, 53.0, 32.0, 25.0, 20.0, 15.0, 14.0, 5.0, 4.0, 7.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.447107315063477, -24.990333557128906, -23.533557891845703, -22.076784133911133, -20.620010375976562, -19.163236618041992, -17.706462860107422, -16.24968719482422, -14.792913436889648, -13.336139678955078, -11.879364967346191, -10.422590255737305, -8.965816497802734, -7.509042263031006, -6.052268028259277, -4.595493316650391, -3.1387195587158203, -1.6819453239440918, -0.22517108917236328, 1.2316031455993652, 2.6883773803710938, 4.145151615142822, 5.601925849914551, 7.0587005615234375, 8.515474319458008, 9.972248077392578, 11.429022789001465, 12.885797500610352, 14.342571258544922, 15.799345016479492, 17.256118774414062, 18.712894439697266, 20.16967010498047, 21.62644386291504, 23.08321762084961, 24.539993286132812, 25.996767044067383, 27.453540802001953, 28.910316467285156, 30.367090225219727, 31.823863983154297, 33.2806396484375, 34.73741149902344, 36.19418716430664, 37.650962829589844, 39.10773468017578, 40.564510345458984, 42.02128601074219, 43.478057861328125, 44.93483352661133, 46.391605377197266, 47.84838104248047, 49.305152893066406, 50.76192855834961, 52.21870422363281, 53.67547607421875, 55.13225173950195, 56.589027404785156, 58.045799255371094, 59.5025749206543, 60.9593505859375, 62.41612243652344, 63.87289810180664, 65.32967376708984, 66.78644561767578]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 3.0, 7.0, 8.0, 3.0, 6.0, 14.0, 7.0, 14.0, 18.0, 10.0, 15.0, 21.0, 24.0, 21.0, 25.0, 32.0, 23.0, 35.0, 27.0, 35.0, 31.0, 30.0, 30.0, 32.0, 39.0, 41.0, 34.0, 28.0, 41.0, 34.0, 34.0, 18.0, 39.0, 31.0, 19.0, 15.0, 29.0, 23.0, 21.0, 17.0, 9.0, 12.0, 11.0, 7.0, 4.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.17131805419922, -23.375730514526367, -22.580142974853516, -21.784555435180664, -20.988967895507812, -20.19338035583496, -19.39779281616211, -18.602203369140625, -17.806617736816406, -17.011030197143555, -16.215442657470703, -15.419855117797852, -14.624267578125, -13.828680038452148, -13.03309154510498, -12.237504005432129, -11.441915512084961, -10.64632797241211, -9.850740432739258, -9.055152893066406, -8.259565353393555, -7.463977336883545, -6.668389320373535, -5.872801780700684, -5.077214241027832, -4.2816267013549805, -3.48603892326355, -2.690451145172119, -1.8948636054992676, -1.099276065826416, -0.30368804931640625, 0.4918994903564453, 1.2874889373779297, 2.0830764770507812, 2.878664255142212, 3.6742520332336426, 4.469839572906494, 5.265427112579346, 6.0610151290893555, 6.856602668762207, 7.652190208435059, 8.44777774810791, 9.243365287780762, 10.03895378112793, 10.834541320800781, 11.630128860473633, 12.425716400146484, 13.221303939819336, 14.016891479492188, 14.812479019165039, 15.60806655883789, 16.403654098510742, 17.199241638183594, 17.994829177856445, 18.790416717529297, 19.58600616455078, 20.381591796875, 21.17717933654785, 21.972766876220703, 22.768354415893555, 23.563941955566406, 24.359529495239258, 25.15511703491211, 25.950706481933594, 26.746294021606445]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 5.0, 1.0, 4.0, 6.0, 7.0, 13.0, 11.0, 16.0, 9.0, 21.0, 26.0, 21.0, 24.0, 20.0, 30.0, 34.0, 27.0, 41.0, 44.0, 39.0, 35.0, 34.0, 45.0, 44.0, 40.0, 46.0, 30.0, 34.0, 24.0, 24.0, 36.0, 34.0, 29.0, 24.0, 19.0, 17.0, 19.0, 11.0, 11.0, 10.0, 6.0, 8.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.90625, -51.224609375, -49.54296875, -47.861328125, -46.1796875, -44.498046875, -42.81640625, -41.134765625, -39.453125, -37.771484375, -36.08984375, -34.408203125, -32.7265625, -31.044921875, -29.36328125, -27.681640625, -26.0, -24.318359375, -22.63671875, -20.955078125, -19.2734375, -17.591796875, -15.91015625, -14.228515625, -12.546875, -10.865234375, -9.18359375, -7.501953125, -5.8203125, -4.138671875, -2.45703125, -0.775390625, 0.90625, 2.587890625, 4.26953125, 5.951171875, 7.6328125, 9.314453125, 10.99609375, 12.677734375, 14.359375, 16.041015625, 17.72265625, 19.404296875, 21.0859375, 22.767578125, 24.44921875, 26.130859375, 27.8125, 29.494140625, 31.17578125, 32.857421875, 34.5390625, 36.220703125, 37.90234375, 39.583984375, 41.265625, 42.947265625, 44.62890625, 46.310546875, 47.9921875, 49.673828125, 51.35546875, 53.037109375, 54.71875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 7.0, 7.0, 8.0, 12.0, 24.0, 50.0, 87.0, 121.0, 167.0, 294.0, 413.0, 638.0, 1044.0, 1545.0, 2278.0, 3567.0, 5310.0, 8099.0, 12586.0, 19291.0, 30505.0, 48636.0, 83710.0, 167648.0, 328298.0, 139496.0, 72888.0, 43664.0, 27578.0, 17715.0, 11495.0, 7378.0, 4782.0, 3263.0, 2006.0, 1370.0, 927.0, 580.0, 383.0, 253.0, 141.0, 113.0, 72.0, 46.0, 22.0, 13.0, 10.0, 9.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5749435424804688, -0.5566253662109375, -0.5383071899414062, -0.519989013671875, -0.5016708374023438, -0.4833526611328125, -0.46503448486328125, -0.44671630859375, -0.42839813232421875, -0.4100799560546875, -0.39176177978515625, -0.373443603515625, -0.35512542724609375, -0.3368072509765625, -0.31848907470703125, -0.3001708984375, -0.28185272216796875, -0.2635345458984375, -0.24521636962890625, -0.226898193359375, -0.20858001708984375, -0.1902618408203125, -0.17194366455078125, -0.15362548828125, -0.13530731201171875, -0.1169891357421875, -0.09867095947265625, -0.080352783203125, -0.06203460693359375, -0.0437164306640625, -0.02539825439453125, -0.007080078125, 0.01123809814453125, 0.0295562744140625, 0.04787445068359375, 0.066192626953125, 0.08451080322265625, 0.1028289794921875, 0.12114715576171875, 0.13946533203125, 0.15778350830078125, 0.1761016845703125, 0.19441986083984375, 0.212738037109375, 0.23105621337890625, 0.2493743896484375, 0.26769256591796875, 0.2860107421875, 0.30432891845703125, 0.3226470947265625, 0.34096527099609375, 0.359283447265625, 0.37760162353515625, 0.3959197998046875, 0.41423797607421875, 0.43255615234375, 0.45087432861328125, 0.4691925048828125, 0.48751068115234375, 0.505828857421875, 0.5241470336914062, 0.5424652099609375, 0.5607833862304688, 0.5791015625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 5.0, 6.0, 8.0, 10.0, 10.0, 18.0, 23.0, 14.0, 32.0, 26.0, 33.0, 21.0, 27.0, 41.0, 30.0, 31.0, 35.0, 42.0, 37.0, 34.0, 1057.0, 33.0, 47.0, 40.0, 44.0, 32.0, 36.0, 35.0, 30.0, 33.0, 19.0, 16.0, 23.0, 20.0, 14.0, 9.0, 12.0, 5.0, 12.0, 9.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.25, -41.0576171875, -39.865234375, -38.6728515625, -37.48046875, -36.2880859375, -35.095703125, -33.9033203125, -32.7109375, -31.5185546875, -30.326171875, -29.1337890625, -27.94140625, -26.7490234375, -25.556640625, -24.3642578125, -23.171875, -21.9794921875, -20.787109375, -19.5947265625, -18.40234375, -17.2099609375, -16.017578125, -14.8251953125, -13.6328125, -12.4404296875, -11.248046875, -10.0556640625, -8.86328125, -7.6708984375, -6.478515625, -5.2861328125, -4.09375, -2.9013671875, -1.708984375, -0.5166015625, 0.67578125, 1.8681640625, 3.060546875, 4.2529296875, 5.4453125, 6.6376953125, 7.830078125, 9.0224609375, 10.21484375, 11.4072265625, 12.599609375, 13.7919921875, 14.984375, 16.1767578125, 17.369140625, 18.5615234375, 19.75390625, 20.9462890625, 22.138671875, 23.3310546875, 24.5234375, 25.7158203125, 26.908203125, 28.1005859375, 29.29296875, 30.4853515625, 31.677734375, 32.8701171875, 34.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 6.0, 15.0, 26.0, 29.0, 45.0, 64.0, 97.0, 167.0, 251.0, 364.0, 554.0, 815.0, 1192.0, 1697.0, 2471.0, 3563.0, 5261.0, 7694.0, 11178.0, 16283.0, 24684.0, 37716.0, 60179.0, 103386.0, 214492.0, 1296672.0, 118180.0, 67044.0, 41431.0, 26785.0, 17457.0, 11820.0, 8112.0, 5520.0, 3800.0, 2558.0, 1770.0, 1262.0, 825.0, 590.0, 390.0, 232.0, 162.0, 99.0, 56.0, 41.0, 30.0, 20.0, 14.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29150390625, -0.2821311950683594, -0.27275848388671875, -0.2633857727050781, -0.2540130615234375, -0.24464035034179688, -0.23526763916015625, -0.22589492797851562, -0.216522216796875, -0.20714950561523438, -0.19777679443359375, -0.18840408325195312, -0.1790313720703125, -0.16965866088867188, -0.16028594970703125, -0.15091323852539062, -0.14154052734375, -0.13216781616210938, -0.12279510498046875, -0.11342239379882812, -0.1040496826171875, -0.09467697143554688, -0.08530426025390625, -0.07593154907226562, -0.066558837890625, -0.057186126708984375, -0.04781341552734375, -0.038440704345703125, -0.0290679931640625, -0.019695281982421875, -0.01032257080078125, -0.000949859619140625, 0.0084228515625, 0.017795562744140625, 0.02716827392578125, 0.036540985107421875, 0.0459136962890625, 0.055286407470703125, 0.06465911865234375, 0.07403182983398438, 0.083404541015625, 0.09277725219726562, 0.10214996337890625, 0.11152267456054688, 0.1208953857421875, 0.13026809692382812, 0.13964080810546875, 0.14901351928710938, 0.15838623046875, 0.16775894165039062, 0.17713165283203125, 0.18650436401367188, 0.1958770751953125, 0.20524978637695312, 0.21462249755859375, 0.22399520874023438, 0.233367919921875, 0.24274063110351562, 0.25211334228515625, 0.2614860534667969, 0.2708587646484375, 0.2802314758300781, 0.28960418701171875, 0.2989768981933594, 0.308349609375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 9.0, 6.0, 13.0, 12.0, 18.0, 9.0, 20.0, 15.0, 22.0, 21.0, 39.0, 35.0, 35.0, 42.0, 50.0, 42.0, 48.0, 38.0, 56.0, 72.0, 46.0, 53.0, 41.0, 33.0, 30.0, 39.0, 17.0, 31.0, 11.0, 30.0, 13.0, 14.0, 7.0, 12.0, 5.0, 7.0, 2.0, 2.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.496906280517578e-06, -6.2873587012290955e-06, -6.077811121940613e-06, -5.86826354265213e-06, -5.6587159633636475e-06, -5.449168384075165e-06, -5.239620804786682e-06, -5.0300732254981995e-06, -4.820525646209717e-06, -4.610978066921234e-06, -4.4014304876327515e-06, -4.191882908344269e-06, -3.982335329055786e-06, -3.7727877497673035e-06, -3.563240170478821e-06, -3.353692591190338e-06, -3.1441450119018555e-06, -2.934597432613373e-06, -2.72504985332489e-06, -2.5155022740364075e-06, -2.305954694747925e-06, -2.096407115459442e-06, -1.8868595361709595e-06, -1.6773119568824768e-06, -1.4677643775939941e-06, -1.2582167983055115e-06, -1.0486692190170288e-06, -8.391216397285461e-07, -6.295740604400635e-07, -4.200264811515808e-07, -2.1047890186309814e-07, -9.313225746154785e-10, 2.086162567138672e-07, 4.1816383600234985e-07, 6.277114152908325e-07, 8.372589945793152e-07, 1.0468065738677979e-06, 1.2563541531562805e-06, 1.4659017324447632e-06, 1.6754493117332458e-06, 1.8849968910217285e-06, 2.094544470310211e-06, 2.304092049598694e-06, 2.5136396288871765e-06, 2.723187208175659e-06, 2.932734787464142e-06, 3.1422823667526245e-06, 3.351829946041107e-06, 3.56137752532959e-06, 3.7709251046180725e-06, 3.980472683906555e-06, 4.190020263195038e-06, 4.3995678424835205e-06, 4.609115421772003e-06, 4.818663001060486e-06, 5.0282105803489685e-06, 5.237758159637451e-06, 5.447305738925934e-06, 5.6568533182144165e-06, 5.866400897502899e-06, 6.075948476791382e-06, 6.2854960560798645e-06, 6.495043635368347e-06, 6.70459121465683e-06, 6.9141387939453125e-06]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 14.0, 15.0, 18.0, 39.0, 47.0, 74.0, 83.0, 165.0, 267.0, 357.0, 584.0, 915.0, 1558.0, 2887.0, 5612.0, 10983.0, 26459.0, 57241.0, 130559.0, 242017.0, 266356.0, 164480.0, 74909.0, 32354.0, 15320.0, 6813.0, 3486.0, 1977.0, 1100.0, 643.0, 433.0, 246.0, 196.0, 97.0, 77.0, 55.0, 34.0, 18.0, 18.0, 16.0, 8.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7060508728027344e-05, -2.609938383102417e-05, -2.5138258934020996e-05, -2.4177134037017822e-05, -2.321600914001465e-05, -2.2254884243011475e-05, -2.12937593460083e-05, -2.0332634449005127e-05, -1.9371509552001953e-05, -1.841038465499878e-05, -1.7449259757995605e-05, -1.648813486099243e-05, -1.5527009963989258e-05, -1.4565885066986084e-05, -1.360476016998291e-05, -1.2643635272979736e-05, -1.1682510375976562e-05, -1.0721385478973389e-05, -9.760260581970215e-06, -8.799135684967041e-06, -7.838010787963867e-06, -6.876885890960693e-06, -5.9157609939575195e-06, -4.954636096954346e-06, -3.993511199951172e-06, -3.032386302947998e-06, -2.0712614059448242e-06, -1.1101365089416504e-06, -1.4901161193847656e-07, 8.121132850646973e-07, 1.773238182067871e-06, 2.734363079071045e-06, 3.6954879760742188e-06, 4.656612873077393e-06, 5.617737770080566e-06, 6.57886266708374e-06, 7.539987564086914e-06, 8.501112461090088e-06, 9.462237358093262e-06, 1.0423362255096436e-05, 1.138448715209961e-05, 1.2345612049102783e-05, 1.3306736946105957e-05, 1.4267861843109131e-05, 1.5228986740112305e-05, 1.619011163711548e-05, 1.7151236534118652e-05, 1.8112361431121826e-05, 1.9073486328125e-05, 2.0034611225128174e-05, 2.0995736122131348e-05, 2.195686101913452e-05, 2.2917985916137695e-05, 2.387911081314087e-05, 2.4840235710144043e-05, 2.5801360607147217e-05, 2.676248550415039e-05, 2.7723610401153564e-05, 2.8684735298156738e-05, 2.9645860195159912e-05, 3.0606985092163086e-05, 3.156810998916626e-05, 3.2529234886169434e-05, 3.349035978317261e-05, 3.445148468017578e-05]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 10.0, 17.0, 20.0, 25.0, 38.0, 50.0, 62.0, 59.0, 83.0, 93.0, 88.0, 69.0, 58.0, 65.0, 59.0, 57.0, 37.0, 33.0, 18.0, 13.0, 14.0, 5.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.063694622251205e-06, -7.842925697332248e-06, -7.62215631766594e-06, -7.401387392746983e-06, -7.180618467828026e-06, -6.959849088161718e-06, -6.739080163242761e-06, -6.518311238323804e-06, -6.297542313404847e-06, -6.07677338848589e-06, -5.856004008819582e-06, -5.635235083900625e-06, -5.414466158981668e-06, -5.19369677931536e-06, -4.972927854396403e-06, -4.752158929477446e-06, -4.531390004558489e-06, -4.310621079639532e-06, -4.089851699973224e-06, -3.869082775054267e-06, -3.6483138501353096e-06, -3.427544697842677e-06, -3.2067755455500446e-06, -2.9860066206310876e-06, -2.7652372409647796e-06, -2.544468088672147e-06, -2.32369916375319e-06, -2.1029300114605576e-06, -1.8821610865416005e-06, -1.661391934248968e-06, -1.4406228956431733e-06, -1.2198538570373785e-06, -9.990849321184214e-07, -7.783158935126266e-07, -5.575468549068319e-07, -3.3677775945761823e-07, -1.1600872085182345e-07, 1.0476037459739018e-07, 3.2552941320318496e-07, 5.462984518089797e-07, 7.670674904147745e-07, 9.878365290205693e-07, 1.208605567626364e-06, 1.4293746062321588e-06, 1.6501437585247913e-06, 1.8709127971305861e-06, 2.091681835736381e-06, 2.312450760655338e-06, 2.5332199129479704e-06, 2.753989065240603e-06, 2.97475799015956e-06, 3.1955271424521925e-06, 3.4162960673711495e-06, 3.637065219663782e-06, 3.857834144582739e-06, 4.078603524249047e-06, 4.299372449168004e-06, 4.520141374086961e-06, 4.740910753753269e-06, 4.961679678672226e-06, 5.182448603591183e-06, 5.403217983257491e-06, 5.623986908176448e-06, 5.844755833095405e-06, 6.065524758014362e-06]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 8.0, 7.0, 6.0, 12.0, 8.0, 8.0, 15.0, 22.0, 27.0, 17.0, 27.0, 31.0, 22.0, 15.0, 38.0, 33.0, 42.0, 39.0, 42.0, 30.0, 40.0, 22.0, 53.0, 50.0, 47.0, 33.0, 28.0, 47.0, 12.0, 16.0, 20.0, 28.0, 28.0, 31.0, 15.0, 10.0, 17.0, 4.0, 18.0, 7.0, 4.0, 12.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.516674041748047e-06, -3.4049153327941895e-06, -3.293156623840332e-06, -3.1813979148864746e-06, -3.069639205932617e-06, -2.9578804969787598e-06, -2.8461217880249023e-06, -2.734363079071045e-06, -2.6226043701171875e-06, -2.51084566116333e-06, -2.3990869522094727e-06, -2.2873282432556152e-06, -2.175569534301758e-06, -2.0638108253479004e-06, -1.952052116394043e-06, -1.8402934074401855e-06, -1.7285346984863281e-06, -1.6167759895324707e-06, -1.5050172805786133e-06, -1.3932585716247559e-06, -1.2814998626708984e-06, -1.169741153717041e-06, -1.0579824447631836e-06, -9.462237358093262e-07, -8.344650268554688e-07, -7.227063179016113e-07, -6.109476089477539e-07, -4.991888999938965e-07, -3.8743019104003906e-07, -2.7567148208618164e-07, -1.6391277313232422e-07, -5.21540641784668e-08, 5.960464477539063e-08, 1.7136335372924805e-07, 2.8312206268310547e-07, 3.948807716369629e-07, 5.066394805908203e-07, 6.183981895446777e-07, 7.301568984985352e-07, 8.419156074523926e-07, 9.5367431640625e-07, 1.0654330253601074e-06, 1.1771917343139648e-06, 1.2889504432678223e-06, 1.4007091522216797e-06, 1.5124678611755371e-06, 1.6242265701293945e-06, 1.735985279083252e-06, 1.8477439880371094e-06, 1.959502696990967e-06, 2.0712614059448242e-06, 2.1830201148986816e-06, 2.294778823852539e-06, 2.4065375328063965e-06, 2.518296241760254e-06, 2.6300549507141113e-06, 2.7418136596679688e-06, 2.853572368621826e-06, 2.9653310775756836e-06, 3.077089786529541e-06, 3.1888484954833984e-06, 3.300607204437256e-06, 3.4123659133911133e-06, 3.5241246223449707e-06, 3.635883331298828e-06]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 5.0, 1.0, 4.0, 6.0, 7.0, 13.0, 11.0, 16.0, 9.0, 21.0, 26.0, 21.0, 24.0, 20.0, 30.0, 34.0, 27.0, 41.0, 44.0, 39.0, 35.0, 34.0, 45.0, 44.0, 40.0, 46.0, 30.0, 34.0, 24.0, 24.0, 36.0, 34.0, 29.0, 24.0, 19.0, 17.0, 19.0, 11.0, 11.0, 10.0, 6.0, 8.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.90625, -51.224609375, -49.54296875, -47.861328125, -46.1796875, -44.498046875, -42.81640625, -41.134765625, -39.453125, -37.771484375, -36.08984375, -34.408203125, -32.7265625, -31.044921875, -29.36328125, -27.681640625, -26.0, -24.318359375, -22.63671875, -20.955078125, -19.2734375, -17.591796875, -15.91015625, -14.228515625, -12.546875, -10.865234375, -9.18359375, -7.501953125, -5.8203125, -4.138671875, -2.45703125, -0.775390625, 0.90625, 2.587890625, 4.26953125, 5.951171875, 7.6328125, 9.314453125, 10.99609375, 12.677734375, 14.359375, 16.041015625, 17.72265625, 19.404296875, 21.0859375, 22.767578125, 24.44921875, 26.130859375, 27.8125, 29.494140625, 31.17578125, 32.857421875, 34.5390625, 36.220703125, 37.90234375, 39.583984375, 41.265625, 42.947265625, 44.62890625, 46.310546875, 47.9921875, 49.673828125, 51.35546875, 53.037109375, 54.71875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 9.0, 6.0, 5.0, 7.0, 9.0, 16.0, 15.0, 18.0, 29.0, 35.0, 53.0, 63.0, 68.0, 100.0, 153.0, 240.0, 384.0, 822.0, 1809.0, 5863.0, 21949.0, 90920.0, 312146.0, 408016.0, 153457.0, 37603.0, 9498.0, 2707.0, 1118.0, 523.0, 261.0, 177.0, 97.0, 93.0, 69.0, 47.0, 46.0, 34.0, 30.0, 12.0, 12.0, 12.0, 12.0, 5.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.159423828125, -7.88916015625, -7.618896484375, -7.3486328125, -7.078369140625, -6.80810546875, -6.537841796875, -6.267578125, -5.997314453125, -5.72705078125, -5.456787109375, -5.1865234375, -4.916259765625, -4.64599609375, -4.375732421875, -4.10546875, -3.835205078125, -3.56494140625, -3.294677734375, -3.0244140625, -2.754150390625, -2.48388671875, -2.213623046875, -1.943359375, -1.673095703125, -1.40283203125, -1.132568359375, -0.8623046875, -0.592041015625, -0.32177734375, -0.051513671875, 0.21875, 0.489013671875, 0.75927734375, 1.029541015625, 1.2998046875, 1.570068359375, 1.84033203125, 2.110595703125, 2.380859375, 2.651123046875, 2.92138671875, 3.191650390625, 3.4619140625, 3.732177734375, 4.00244140625, 4.272705078125, 4.54296875, 4.813232421875, 5.08349609375, 5.353759765625, 5.6240234375, 5.894287109375, 6.16455078125, 6.434814453125, 6.705078125, 6.975341796875, 7.24560546875, 7.515869140625, 7.7861328125, 8.056396484375, 8.32666015625, 8.596923828125, 8.8671875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 11.0, 14.0, 5.0, 15.0, 20.0, 32.0, 38.0, 46.0, 37.0, 52.0, 68.0, 66.0, 68.0, 2113.0, 72.0, 65.0, 51.0, 63.0, 44.0, 37.0, 23.0, 29.0, 25.0, 12.0, 10.0, 6.0, 3.0, 3.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.5625, -106.9296875, -103.296875, -99.6640625, -96.03125, -92.3984375, -88.765625, -85.1328125, -81.5, -77.8671875, -74.234375, -70.6015625, -66.96875, -63.3359375, -59.703125, -56.0703125, -52.4375, -48.8046875, -45.171875, -41.5390625, -37.90625, -34.2734375, -30.640625, -27.0078125, -23.375, -19.7421875, -16.109375, -12.4765625, -8.84375, -5.2109375, -1.578125, 2.0546875, 5.6875, 9.3203125, 12.953125, 16.5859375, 20.21875, 23.8515625, 27.484375, 31.1171875, 34.75, 38.3828125, 42.015625, 45.6484375, 49.28125, 52.9140625, 56.546875, 60.1796875, 63.8125, 67.4453125, 71.078125, 74.7109375, 78.34375, 81.9765625, 85.609375, 89.2421875, 92.875, 96.5078125, 100.140625, 103.7734375, 107.40625, 111.0390625, 114.671875, 118.3046875, 121.9375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 12.0, 8.0, 22.0, 27.0, 30.0, 46.0, 49.0, 95.0, 138.0, 208.0, 330.0, 568.0, 1295.0, 4400.0, 47585.0, 2831129.0, 243544.0, 11987.0, 2179.0, 816.0, 430.0, 255.0, 178.0, 94.0, 74.0, 70.0, 36.0, 32.0, 25.0, 10.0, 10.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.40625, -15.854736328125, -15.30322265625, -14.751708984375, -14.2001953125, -13.648681640625, -13.09716796875, -12.545654296875, -11.994140625, -11.442626953125, -10.89111328125, -10.339599609375, -9.7880859375, -9.236572265625, -8.68505859375, -8.133544921875, -7.58203125, -7.030517578125, -6.47900390625, -5.927490234375, -5.3759765625, -4.824462890625, -4.27294921875, -3.721435546875, -3.169921875, -2.618408203125, -2.06689453125, -1.515380859375, -0.9638671875, -0.412353515625, 0.13916015625, 0.690673828125, 1.2421875, 1.793701171875, 2.34521484375, 2.896728515625, 3.4482421875, 3.999755859375, 4.55126953125, 5.102783203125, 5.654296875, 6.205810546875, 6.75732421875, 7.308837890625, 7.8603515625, 8.411865234375, 8.96337890625, 9.514892578125, 10.06640625, 10.617919921875, 11.16943359375, 11.720947265625, 12.2724609375, 12.823974609375, 13.37548828125, 13.927001953125, 14.478515625, 15.030029296875, 15.58154296875, 16.133056640625, 16.6845703125, 17.236083984375, 17.78759765625, 18.339111328125, 18.890625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 11.0, 19.0, 19.0, 54.0, 70.0, 106.0, 124.0, 144.0, 109.0, 97.0, 85.0, 42.0, 25.0, 25.0, 18.0, 5.0, 7.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.08516693115234, -114.35338592529297, -110.6216049194336, -106.88983154296875, -103.15805053710938, -99.42626953125, -95.69448852539062, -91.96270751953125, -88.23092651367188, -84.4991455078125, -80.76736450195312, -77.03558349609375, -73.3038101196289, -69.57202911376953, -65.84024810791016, -62.10846710205078, -58.37669372558594, -54.64491271972656, -50.91313552856445, -47.18135452270508, -43.44957733154297, -39.717796325683594, -35.98601531982422, -32.254234313964844, -28.522457122802734, -24.790678024291992, -21.05889892578125, -17.327117919921875, -13.595338821411133, -9.86355972290039, -6.131778717041016, -2.3999996185302734, 1.3317794799804688, 5.063559055328369, 8.79533863067627, 12.527118682861328, 16.25889778137207, 19.990676879882812, 23.722457885742188, 27.45423698425293, 31.186016082763672, 34.91779708862305, 38.649574279785156, 42.38135528564453, 46.113136291503906, 49.844913482666016, 53.57669448852539, 57.3084716796875, 61.040252685546875, 64.77203369140625, 68.50381469726562, 72.235595703125, 75.96736907958984, 79.69915008544922, 83.4309310913086, 87.16271209716797, 90.89448547363281, 94.62626647949219, 98.35804748535156, 102.08982849121094, 105.82160186767578, 109.55338287353516, 113.28516387939453, 117.0169448852539, 120.74872589111328]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 2.0, 3.0, 6.0, 6.0, 8.0, 10.0, 11.0, 11.0, 19.0, 9.0, 17.0, 22.0, 25.0, 19.0, 35.0, 29.0, 32.0, 42.0, 35.0, 38.0, 49.0, 45.0, 36.0, 41.0, 43.0, 39.0, 38.0, 36.0, 26.0, 34.0, 28.0, 30.0, 21.0, 19.0, 15.0, 22.0, 14.0, 14.0, 11.0, 6.0, 12.0, 7.0, 9.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-105.35623168945312, -101.88427734375, -98.4123306274414, -94.94037628173828, -91.46842956542969, -87.99647521972656, -84.52452850341797, -81.05257415771484, -77.58062744140625, -74.10867309570312, -70.63672637939453, -67.1647720336914, -63.69282531738281, -60.22087097167969, -56.748924255371094, -53.27696990966797, -49.80501937866211, -46.33306884765625, -42.86111831665039, -39.38916778564453, -35.91721725463867, -32.44526672363281, -28.97331428527832, -25.50136375427246, -22.0294132232666, -18.557462692260742, -15.085512161254883, -11.613560676574707, -8.141610145568848, -4.669658660888672, -1.1977081298828125, 2.274242401123047, 5.746192932128906, 9.218143463134766, 12.690093994140625, 16.162044525146484, 19.633995056152344, 23.105947494506836, 26.577898025512695, 30.049848556518555, 33.52179718017578, 36.99374771118164, 40.4656982421875, 43.93764877319336, 47.40959930419922, 50.881553649902344, 54.35350036621094, 57.82545471191406, 61.29740524291992, 64.76935577392578, 68.2413101196289, 71.7132568359375, 75.18521118164062, 78.65715789794922, 82.12911224365234, 85.60105895996094, 89.07301330566406, 92.54496765136719, 96.01691436767578, 99.4888687133789, 102.9608154296875, 106.43276977539062, 109.90471649169922, 113.37667083740234, 116.84861755371094]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 11.0, 16.0, 20.0, 22.0, 21.0, 36.0, 37.0, 54.0, 72.0, 69.0, 108.0, 158.0, 168.0, 232.0, 275.0, 290.0, 427.0, 514.0, 610.0, 722.0, 1178.0, 1039573.0, 789.0, 597.0, 512.0, 414.0, 306.0, 259.0, 231.0, 160.0, 134.0, 118.0, 75.0, 83.0, 64.0, 61.0, 30.0, 26.0, 25.0, 12.0, 6.0, 11.0, 8.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.267873764038086, -30.29191017150879, -29.31594467163086, -28.339981079101562, -27.364017486572266, -26.38805389404297, -25.412090301513672, -24.436124801635742, -23.460161209106445, -22.48419761657715, -21.50823211669922, -20.532268524169922, -19.556304931640625, -18.580341339111328, -17.60437774658203, -16.6284122467041, -15.652448654174805, -14.676485061645508, -13.700520515441895, -12.724555969238281, -11.748592376708984, -10.772628784179688, -9.796664237976074, -8.820699691772461, -7.844736099243164, -6.868772029876709, -5.892807960510254, -4.916843891143799, -3.9408798217773438, -2.9649157524108887, -1.9889516830444336, -1.0129876136779785, -0.03702354431152344, 0.9389405250549316, 1.9149045944213867, 2.890868663787842, 3.866832733154297, 4.842796802520752, 5.818760871887207, 6.794724941253662, 7.770689010620117, 8.746652603149414, 9.722617149353027, 10.69858169555664, 11.674545288085938, 12.650508880615234, 13.626473426818848, 14.602437973022461, 15.578401565551758, 16.554365158081055, 17.530330657958984, 18.50629425048828, 19.482257843017578, 20.458221435546875, 21.434185028076172, 22.4101505279541, 23.3861141204834, 24.362077713012695, 25.338043212890625, 26.314006805419922, 27.28997039794922, 28.265933990478516, 29.241897583007812, 30.217863082885742, 31.19382667541504]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 4.0, 9.0, 5.0, 12.0, 24.0, 46.0, 58.0, 149.0, 7815.0, 51454584.0, 286.0, 43.0, 22.0, 21.0, 27.0, 14.0, 6.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1564.4718017578125, -1514.3001708984375, -1464.128662109375, -1413.95703125, -1363.7855224609375, -1313.6138916015625, -1263.4423828125, -1213.270751953125, -1163.09912109375, -1112.927490234375, -1062.7559814453125, -1012.5843505859375, -962.412841796875, -912.2412109375, -862.0696411132812, -811.8980712890625, -761.7265625, -711.5549926757812, -661.3834228515625, -611.2117919921875, -561.040283203125, -510.8686828613281, -460.69708251953125, -410.5255126953125, -360.35394287109375, -310.182373046875, -260.01080322265625, -209.83920288085938, -159.66763305664062, -109.49606323242188, -59.324462890625, -9.15289306640625, 41.0186767578125, 91.19025421142578, 141.36183166503906, 191.53341674804688, 241.70498657226562, 291.8765563964844, 342.04815673828125, 392.2197265625, 442.39129638671875, 492.5628662109375, 542.7344360351562, 592.906005859375, 643.07763671875, 693.2491455078125, 743.4207763671875, 793.5923461914062, 843.763916015625, 893.9354858398438, 944.1070556640625, 994.2786865234375, 1044.4501953125, 1094.621826171875, 1144.79345703125, 1194.9649658203125, 1245.136474609375, 1295.30810546875, 1345.4796142578125, 1395.6512451171875, 1445.82275390625, 1495.994384765625, 1546.166015625, 1596.3375244140625, 1646.5091552734375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 20.0, 33.0, 68.0, 92.0, 142.0, 213.0, 241.0, 347.0, 528.0, 690.0, 912.0, 1269.0, 1878.0, 2666.0, 3686.0, 5203.0, 7160.0, 10027.0, 14067.0, 19960.0, 28022.0, 39929.0, 57893.0, 83852.0, 125163.0, 188280.0, 309452.0, 625274.0, 3809746.0, 331782.0, 198973.0, 130506.0, 89335.0, 61382.0, 42315.0, 29376.0, 20441.0, 14358.0, 10090.0, 7275.0, 5354.0, 3747.0, 2729.0, 1945.0, 1361.0, 1029.0, 792.0, 497.0, 404.0, 307.0, 209.0, 141.0, 103.0, 73.0, 49.0, 26.0, 12.0, 7.0, 4.0, 2.0, 2.0], "bins": [-0.125244140625, -0.12121200561523438, -0.11717987060546875, -0.11314773559570312, -0.1091156005859375, -0.10508346557617188, -0.10105133056640625, -0.09701919555664062, -0.092987060546875, -0.08895492553710938, -0.08492279052734375, -0.08089065551757812, -0.0768585205078125, -0.07282638549804688, -0.06879425048828125, -0.06476211547851562, -0.06072998046875, -0.056697845458984375, -0.05266571044921875, -0.048633575439453125, -0.0446014404296875, -0.040569305419921875, -0.03653717041015625, -0.032505035400390625, -0.028472900390625, -0.024440765380859375, -0.02040863037109375, -0.016376495361328125, -0.0123443603515625, -0.008312225341796875, -0.00428009033203125, -0.000247955322265625, 0.0037841796875, 0.007816314697265625, 0.01184844970703125, 0.015880584716796875, 0.0199127197265625, 0.023944854736328125, 0.02797698974609375, 0.032009124755859375, 0.036041259765625, 0.040073394775390625, 0.04410552978515625, 0.048137664794921875, 0.0521697998046875, 0.056201934814453125, 0.06023406982421875, 0.06426620483398438, 0.06829833984375, 0.07233047485351562, 0.07636260986328125, 0.08039474487304688, 0.0844268798828125, 0.08845901489257812, 0.09249114990234375, 0.09652328491210938, 0.100555419921875, 0.10458755493164062, 0.10861968994140625, 0.11265182495117188, 0.1166839599609375, 0.12071609497070312, 0.12474822998046875, 0.12878036499023438, 0.1328125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 10.0, 10.0, 20.0, 14.0, 15.0, 25.0, 25.0, 31.0, 34.0, 26.0, 30.0, 35.0, 24.0, 29.0, 32.0, 28.0, 40.0, 1071.0, 38.0, 41.0, 39.0, 42.0, 38.0, 38.0, 36.0, 26.0, 32.0, 28.0, 22.0, 16.0, 11.0, 14.0, 15.0, 7.0, 12.0, 9.0, 6.0, 8.0, 4.0, 7.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-15.25, -14.7684326171875, -14.286865234375, -13.8052978515625, -13.32373046875, -12.8421630859375, -12.360595703125, -11.8790283203125, -11.3974609375, -10.9158935546875, -10.434326171875, -9.9527587890625, -9.47119140625, -8.9896240234375, -8.508056640625, -8.0264892578125, -7.544921875, -7.0633544921875, -6.581787109375, -6.1002197265625, -5.61865234375, -5.1370849609375, -4.655517578125, -4.1739501953125, -3.6923828125, -3.2108154296875, -2.729248046875, -2.2476806640625, -1.76611328125, -1.2845458984375, -0.802978515625, -0.3214111328125, 0.16015625, 0.6417236328125, 1.123291015625, 1.6048583984375, 2.08642578125, 2.5679931640625, 3.049560546875, 3.5311279296875, 4.0126953125, 4.4942626953125, 4.975830078125, 5.4573974609375, 5.93896484375, 6.4205322265625, 6.902099609375, 7.3836669921875, 7.865234375, 8.3468017578125, 8.828369140625, 9.3099365234375, 9.79150390625, 10.2730712890625, 10.754638671875, 11.2362060546875, 11.7177734375, 12.1993408203125, 12.680908203125, 13.1624755859375, 13.64404296875, 14.1256103515625, 14.607177734375, 15.0887451171875, 15.5703125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 1.0, 4.0, 1.0, 5.0, 14.0, 19.0, 28.0, 23.0, 39.0, 49.0, 62.0, 107.0, 174.0, 292.0, 409.0, 642.0, 932.0, 1523.0, 2427.0, 4122.0, 6288.0, 10257.0, 16683.0, 27674.0, 45562.0, 77337.0, 132803.0, 241392.0, 500195.0, 4044664.0, 560217.0, 263235.0, 144212.0, 83933.0, 48733.0, 29394.0, 18386.0, 11279.0, 6865.0, 4338.0, 2551.0, 1635.0, 995.0, 639.0, 449.0, 280.0, 199.0, 114.0, 68.0, 48.0, 39.0, 28.0, 27.0, 19.0, 10.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1212158203125, -0.11725044250488281, -0.11328506469726562, -0.10931968688964844, -0.10535430908203125, -0.10138893127441406, -0.09742355346679688, -0.09345817565917969, -0.0894927978515625, -0.08552742004394531, -0.08156204223632812, -0.07759666442871094, -0.07363128662109375, -0.06966590881347656, -0.06570053100585938, -0.06173515319824219, -0.057769775390625, -0.05380439758300781, -0.049839019775390625, -0.04587364196777344, -0.04190826416015625, -0.03794288635253906, -0.033977508544921875, -0.030012130737304688, -0.0260467529296875, -0.022081375122070312, -0.018115997314453125, -0.014150619506835938, -0.01018524169921875, -0.0062198638916015625, -0.002254486083984375, 0.0017108917236328125, 0.00567626953125, 0.009641647338867188, 0.013607025146484375, 0.017572402954101562, 0.02153778076171875, 0.025503158569335938, 0.029468536376953125, 0.03343391418457031, 0.0373992919921875, 0.04136466979980469, 0.045330047607421875, 0.04929542541503906, 0.05326080322265625, 0.05722618103027344, 0.061191558837890625, 0.06515693664550781, 0.069122314453125, 0.07308769226074219, 0.07705307006835938, 0.08101844787597656, 0.08498382568359375, 0.08894920349121094, 0.09291458129882812, 0.09687995910644531, 0.1008453369140625, 0.10481071472167969, 0.10877609252929688, 0.11274147033691406, 0.11670684814453125, 0.12067222595214844, 0.12463760375976562, 0.1286029815673828, 0.132568359375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 7.0, 8.0, 15.0, 10.0, 13.0, 19.0, 18.0, 25.0, 27.0, 15.0, 34.0, 36.0, 27.0, 35.0, 40.0, 46.0, 36.0, 41.0, 1064.0, 43.0, 31.0, 37.0, 41.0, 34.0, 36.0, 33.0, 29.0, 38.0, 31.0, 21.0, 27.0, 14.0, 9.0, 15.0, 9.0, 13.0, 14.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.875, -12.457763671875, -12.04052734375, -11.623291015625, -11.2060546875, -10.788818359375, -10.37158203125, -9.954345703125, -9.537109375, -9.119873046875, -8.70263671875, -8.285400390625, -7.8681640625, -7.450927734375, -7.03369140625, -6.616455078125, -6.19921875, -5.781982421875, -5.36474609375, -4.947509765625, -4.5302734375, -4.113037109375, -3.69580078125, -3.278564453125, -2.861328125, -2.444091796875, -2.02685546875, -1.609619140625, -1.1923828125, -0.775146484375, -0.35791015625, 0.059326171875, 0.4765625, 0.893798828125, 1.31103515625, 1.728271484375, 2.1455078125, 2.562744140625, 2.97998046875, 3.397216796875, 3.814453125, 4.231689453125, 4.64892578125, 5.066162109375, 5.4833984375, 5.900634765625, 6.31787109375, 6.735107421875, 7.15234375, 7.569580078125, 7.98681640625, 8.404052734375, 8.8212890625, 9.238525390625, 9.65576171875, 10.072998046875, 10.490234375, 10.907470703125, 11.32470703125, 11.741943359375, 12.1591796875, 12.576416015625, 12.99365234375, 13.410888671875, 13.828125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 6.0, 11.0, 19.0, 14.0, 19.0, 14.0, 29.0, 45.0, 63.0, 68.0, 84.0, 90.0, 134.0, 192.0, 289.0, 362.0, 689.0, 1489.0, 3934.0, 11960.0, 50091.0, 5974630.0, 204342.0, 28877.0, 8220.0, 2884.0, 1110.0, 594.0, 326.0, 204.0, 172.0, 116.0, 74.0, 57.0, 53.0, 54.0, 32.0, 26.0, 11.0, 14.0, 12.0, 5.0, 9.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7216796875, -0.6966400146484375, -0.671600341796875, -0.6465606689453125, -0.62152099609375, -0.5964813232421875, -0.571441650390625, -0.5464019775390625, -0.5213623046875, -0.4963226318359375, -0.471282958984375, -0.4462432861328125, -0.42120361328125, -0.3961639404296875, -0.371124267578125, -0.3460845947265625, -0.321044921875, -0.2960052490234375, -0.270965576171875, -0.2459259033203125, -0.22088623046875, -0.1958465576171875, -0.170806884765625, -0.1457672119140625, -0.1207275390625, -0.0956878662109375, -0.070648193359375, -0.0456085205078125, -0.02056884765625, 0.0044708251953125, 0.029510498046875, 0.0545501708984375, 0.07958984375, 0.1046295166015625, 0.129669189453125, 0.1547088623046875, 0.17974853515625, 0.2047882080078125, 0.229827880859375, 0.2548675537109375, 0.2799072265625, 0.3049468994140625, 0.329986572265625, 0.3550262451171875, 0.38006591796875, 0.4051055908203125, 0.430145263671875, 0.4551849365234375, 0.480224609375, 0.5052642822265625, 0.530303955078125, 0.5553436279296875, 0.58038330078125, 0.6054229736328125, 0.630462646484375, 0.6555023193359375, 0.6805419921875, 0.7055816650390625, 0.730621337890625, 0.7556610107421875, 0.78070068359375, 0.8057403564453125, 0.830780029296875, 0.8558197021484375, 0.880859375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 5.0, 5.0, 8.0, 13.0, 13.0, 17.0, 20.0, 14.0, 25.0, 36.0, 37.0, 35.0, 38.0, 47.0, 45.0, 34.0, 47.0, 1073.0, 67.0, 51.0, 48.0, 42.0, 49.0, 45.0, 35.0, 26.0, 30.0, 26.0, 18.0, 11.0, 13.0, 13.0, 10.0, 10.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -11.992431640625, -11.56298828125, -11.133544921875, -10.7041015625, -10.274658203125, -9.84521484375, -9.415771484375, -8.986328125, -8.556884765625, -8.12744140625, -7.697998046875, -7.2685546875, -6.839111328125, -6.40966796875, -5.980224609375, -5.55078125, -5.121337890625, -4.69189453125, -4.262451171875, -3.8330078125, -3.403564453125, -2.97412109375, -2.544677734375, -2.115234375, -1.685791015625, -1.25634765625, -0.826904296875, -0.3974609375, 0.031982421875, 0.46142578125, 0.890869140625, 1.3203125, 1.749755859375, 2.17919921875, 2.608642578125, 3.0380859375, 3.467529296875, 3.89697265625, 4.326416015625, 4.755859375, 5.185302734375, 5.61474609375, 6.044189453125, 6.4736328125, 6.903076171875, 7.33251953125, 7.761962890625, 8.19140625, 8.620849609375, 9.05029296875, 9.479736328125, 9.9091796875, 10.338623046875, 10.76806640625, 11.197509765625, 11.626953125, 12.056396484375, 12.48583984375, 12.915283203125, 13.3447265625, 13.774169921875, 14.20361328125, 14.633056640625, 15.0625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 16.0, 964.0, 33.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.80882263183594, -76.42049407958984, -73.03216552734375, -69.64382934570312, -66.25550079345703, -62.86717224121094, -59.478843688964844, -56.09051513671875, -52.702186584472656, -49.31385803222656, -45.9255256652832, -42.53719711303711, -39.148868560791016, -35.760536193847656, -32.37220764160156, -28.98387908935547, -25.59554672241211, -22.207216262817383, -18.81888771057129, -15.430557250976562, -12.042227745056152, -8.653898239135742, -5.265567779541016, -1.8772392272949219, 1.5110912322998047, 4.899420738220215, 8.287750244140625, 11.676080703735352, 15.064410209655762, 18.452739715576172, 21.8410701751709, 25.229398727416992, 28.61772918701172, 32.00605773925781, 35.39439010620117, 38.782718658447266, 42.17104721069336, 45.55937957763672, 48.94770812988281, 52.336036682128906, 55.724365234375, 59.112693786621094, 62.50102615356445, 65.88935852050781, 69.2776870727539, 72.666015625, 76.0543441772461, 79.44267272949219, 82.83100891113281, 86.2193374633789, 89.607666015625, 92.99600219726562, 96.38433074951172, 99.77265930175781, 103.1609878540039, 106.54931640625, 109.9376449584961, 113.32597351074219, 116.71430206298828, 120.10263061523438, 123.490966796875, 126.8792953491211, 130.2676239013672, 133.65594482421875, 137.04428100585938]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 3.0, 6.0, 3.0, 8.0, 17.0, 15.0, 15.0, 20.0, 15.0, 22.0, 19.0, 25.0, 24.0, 30.0, 29.0, 32.0, 36.0, 47.0, 38.0, 44.0, 33.0, 30.0, 39.0, 37.0, 38.0, 32.0, 30.0, 38.0, 26.0, 36.0, 31.0, 37.0, 22.0, 15.0, 14.0, 17.0, 16.0, 9.0, 13.0, 6.0, 9.0, 7.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.41275978088379, -24.678314208984375, -23.94386863708496, -23.209423065185547, -22.4749755859375, -21.740530014038086, -21.006084442138672, -20.271638870239258, -19.537193298339844, -18.80274772644043, -18.068302154541016, -17.3338565826416, -16.599411010742188, -15.864964485168457, -15.130517959594727, -14.396072387695312, -13.661626815795898, -12.927181243896484, -12.19273567199707, -11.45828914642334, -10.723843574523926, -9.989398002624512, -9.254951477050781, -8.520505905151367, -7.786060333251953, -7.051614761352539, -6.317168712615967, -5.5827226638793945, -4.8482770919799805, -4.113831520080566, -3.379385471343994, -2.644939422607422, -1.9104957580566406, -1.1760499477386475, -0.4416041374206543, 0.29284167289733887, 1.027287483215332, 1.7617332935333252, 2.4961791038513184, 3.2306251525878906, 3.9650707244873047, 4.699516296386719, 5.433962345123291, 6.168408393859863, 6.902853965759277, 7.637299537658691, 8.371746063232422, 9.106191635131836, 9.84063720703125, 10.575082778930664, 11.309528350830078, 12.043974876403809, 12.778420448303223, 13.512866020202637, 14.247312545776367, 14.981758117675781, 15.716203689575195, 16.45064926147461, 17.185094833374023, 17.919540405273438, 18.653987884521484, 19.3884334564209, 20.122879028320312, 20.857324600219727, 21.59177017211914]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 8.0, 5.0, 7.0, 13.0, 14.0, 19.0, 21.0, 43.0, 42.0, 51.0, 103.0, 94.0, 147.0, 201.0, 285.0, 463.0, 810.0, 1728.0, 6969.0, 187180.0, 3980253.0, 11540.0, 2294.0, 719.0, 407.0, 259.0, 202.0, 105.0, 91.0, 44.0, 33.0, 42.0, 22.0, 14.0, 14.0, 13.0, 2.0, 3.0, 2.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.058135986328125, -0.05606412887573242, -0.053992271423339844, -0.051920413970947266, -0.04984855651855469, -0.04777669906616211, -0.04570484161376953, -0.04363298416137695, -0.041561126708984375, -0.0394892692565918, -0.03741741180419922, -0.03534555435180664, -0.03327369689941406, -0.031201839447021484, -0.029129981994628906, -0.027058124542236328, -0.02498626708984375, -0.022914409637451172, -0.020842552185058594, -0.018770694732666016, -0.016698837280273438, -0.01462697982788086, -0.012555122375488281, -0.010483264923095703, -0.008411407470703125, -0.006339550018310547, -0.004267692565917969, -0.0021958351135253906, -0.0001239776611328125, 0.0019478797912597656, 0.004019737243652344, 0.006091594696044922, 0.0081634521484375, 0.010235309600830078, 0.012307167053222656, 0.014379024505615234, 0.016450881958007812, 0.01852273941040039, 0.02059459686279297, 0.022666454315185547, 0.024738311767578125, 0.026810169219970703, 0.02888202667236328, 0.03095388412475586, 0.03302574157714844, 0.035097599029541016, 0.037169456481933594, 0.03924131393432617, 0.04131317138671875, 0.04338502883911133, 0.045456886291503906, 0.047528743743896484, 0.04960060119628906, 0.05167245864868164, 0.05374431610107422, 0.0558161735534668, 0.057888031005859375, 0.05995988845825195, 0.06203174591064453, 0.06410360336303711, 0.06617546081542969, 0.06824731826782227, 0.07031917572021484, 0.07239103317260742, 0.074462890625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 4.0, 5.0, 9.0, 5.0, 8.0, 15.0, 19.0, 23.0, 21.0, 778.0, 21.0, 18.0, 12.0, 12.0, 7.0, 6.0, 8.0, 6.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0299072265625, -0.02884531021118164, -0.02778339385986328, -0.026721477508544922, -0.025659561157226562, -0.024597644805908203, -0.023535728454589844, -0.022473812103271484, -0.021411895751953125, -0.020349979400634766, -0.019288063049316406, -0.018226146697998047, -0.017164230346679688, -0.016102313995361328, -0.015040397644042969, -0.01397848129272461, -0.01291656494140625, -0.01185464859008789, -0.010792732238769531, -0.009730815887451172, -0.008668899536132812, -0.007606983184814453, -0.006545066833496094, -0.005483150482177734, -0.004421234130859375, -0.0033593177795410156, -0.0022974014282226562, -0.0012354850769042969, -0.0001735687255859375, 0.0008883476257324219, 0.0019502639770507812, 0.0030121803283691406, 0.0040740966796875, 0.005136013031005859, 0.006197929382324219, 0.007259845733642578, 0.008321762084960938, 0.009383678436279297, 0.010445594787597656, 0.011507511138916016, 0.012569427490234375, 0.013631343841552734, 0.014693260192871094, 0.015755176544189453, 0.016817092895507812, 0.017879009246826172, 0.01894092559814453, 0.02000284194946289, 0.02106475830078125, 0.02212667465209961, 0.02318859100341797, 0.024250507354736328, 0.025312423706054688, 0.026374340057373047, 0.027436256408691406, 0.028498172760009766, 0.029560089111328125, 0.030622005462646484, 0.031683921813964844, 0.0327458381652832, 0.03380775451660156, 0.03486967086791992, 0.03593158721923828, 0.03699350357055664, 0.038055419921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 10.0, 22.0, 30.0, 47.0, 76.0, 198.0, 703.0, 3926.0, 4107751.0, 78162.0, 2659.0, 383.0, 125.0, 49.0, 33.0, 19.0, 17.0, 12.0, 6.0, 7.0, 4.0, 4.0, 0.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.182373046875, -0.17647171020507812, -0.17057037353515625, -0.16466903686523438, -0.1587677001953125, -0.15286636352539062, -0.14696502685546875, -0.14106369018554688, -0.135162353515625, -0.12926101684570312, -0.12335968017578125, -0.11745834350585938, -0.1115570068359375, -0.10565567016601562, -0.09975433349609375, -0.09385299682617188, -0.08795166015625, -0.08205032348632812, -0.07614898681640625, -0.07024765014648438, -0.0643463134765625, -0.058444976806640625, -0.05254364013671875, -0.046642303466796875, -0.040740966796875, -0.034839630126953125, -0.02893829345703125, -0.023036956787109375, -0.0171356201171875, -0.011234283447265625, -0.00533294677734375, 0.000568389892578125, 0.0064697265625, 0.012371063232421875, 0.01827239990234375, 0.024173736572265625, 0.0300750732421875, 0.035976409912109375, 0.04187774658203125, 0.047779083251953125, 0.053680419921875, 0.059581756591796875, 0.06548309326171875, 0.07138442993164062, 0.0772857666015625, 0.08318710327148438, 0.08908843994140625, 0.09498977661132812, 0.10089111328125, 0.10679244995117188, 0.11269378662109375, 0.11859512329101562, 0.1244964599609375, 0.13039779663085938, 0.13629913330078125, 0.14220046997070312, 0.148101806640625, 0.15400314331054688, 0.15990447998046875, 0.16580581665039062, 0.1717071533203125, 0.17760848999023438, 0.18350982666015625, 0.18941116333007812, 0.1953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 5.0, 3.0, 10.0, 7.0, 6.0, 14.0, 26.0, 179.0, 1540.0, 2046.0, 145.0, 26.0, 6.0, 7.0, 12.0, 5.0, 7.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0694580078125, -0.0675816535949707, -0.0657052993774414, -0.06382894515991211, -0.06195259094238281, -0.060076236724853516, -0.05819988250732422, -0.05632352828979492, -0.054447174072265625, -0.05257081985473633, -0.05069446563720703, -0.048818111419677734, -0.04694175720214844, -0.04506540298461914, -0.043189048767089844, -0.04131269454956055, -0.03943634033203125, -0.03755998611450195, -0.035683631896972656, -0.03380727767944336, -0.03193092346191406, -0.030054569244384766, -0.02817821502685547, -0.026301860809326172, -0.024425506591796875, -0.022549152374267578, -0.02067279815673828, -0.018796443939208984, -0.016920089721679688, -0.01504373550415039, -0.013167381286621094, -0.011291027069091797, -0.0094146728515625, -0.007538318634033203, -0.005661964416503906, -0.0037856101989746094, -0.0019092559814453125, -3.2901763916015625e-05, 0.0018434524536132812, 0.003719806671142578, 0.005596160888671875, 0.007472515106201172, 0.009348869323730469, 0.011225223541259766, 0.013101577758789062, 0.01497793197631836, 0.016854286193847656, 0.018730640411376953, 0.02060699462890625, 0.022483348846435547, 0.024359703063964844, 0.02623605728149414, 0.028112411499023438, 0.029988765716552734, 0.03186511993408203, 0.03374147415161133, 0.035617828369140625, 0.03749418258666992, 0.03937053680419922, 0.041246891021728516, 0.04312324523925781, 0.04499959945678711, 0.046875953674316406, 0.0487523078918457, 0.050628662109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 971.0, 45.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3632950186729431, -0.3417055606842041, -0.3201160728931427, -0.2985265851020813, -0.2769371271133423, -0.25534766912460327, -0.23375818133354187, -0.21216870844364166, -0.19057923555374146, -0.16898976266384125, -0.14740028977394104, -0.12581081688404083, -0.10422134399414062, -0.08263187110424042, -0.06104239821434021, -0.03945292532444, -0.017863452434539795, 0.0037260204553604126, 0.02531549334526062, 0.04690496623516083, 0.06849443912506104, 0.09008391201496124, 0.11167338490486145, 0.13326285779476166, 0.15485233068466187, 0.17644180357456207, 0.19803127646446228, 0.2196207493543625, 0.2412102222442627, 0.2627996802330017, 0.2843891680240631, 0.3059786558151245, 0.3275681734085083, 0.3491576313972473, 0.3707471191883087, 0.3923366069793701, 0.41392606496810913, 0.43551552295684814, 0.45710501074790955, 0.47869449853897095, 0.50028395652771, 0.521873414516449, 0.543462872505188, 0.5650523900985718, 0.5866418480873108, 0.6082313060760498, 0.6298208236694336, 0.6514102816581726, 0.6729997396469116, 0.6945891976356506, 0.7161786556243896, 0.7377681732177734, 0.7593576312065125, 0.7809470891952515, 0.8025366067886353, 0.8241260647773743, 0.8457155227661133, 0.8673049807548523, 0.8888944387435913, 0.9104839563369751, 0.9320734143257141, 0.9536628723144531, 0.9752523899078369, 0.9968418478965759, 1.018431305885315]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 9.0, 7.0, 10.0, 16.0, 17.0, 21.0, 50.0, 48.0, 74.0, 93.0, 107.0, 105.0, 106.0, 89.0, 77.0, 35.0, 39.0, 22.0, 18.0, 9.0, 7.0, 14.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.21257835626602173, -0.2066056877374649, -0.20063303411006927, -0.19466036558151245, -0.18868769705295563, -0.1827150285243988, -0.17674237489700317, -0.17076970636844635, -0.16479703783988953, -0.1588243693113327, -0.15285171568393707, -0.14687904715538025, -0.14090637862682343, -0.1349337100982666, -0.12896105647087097, -0.12298838794231415, -0.11701573431491852, -0.11104307323694229, -0.10507040470838547, -0.09909774363040924, -0.09312507510185242, -0.08715241402387619, -0.08117975294589996, -0.07520708441734314, -0.06923442333936691, -0.06326176226139069, -0.05728909373283386, -0.051316432654857635, -0.04534376785159111, -0.039371103048324585, -0.03339844197034836, -0.027425777167081833, -0.021453112363815308, -0.015480448491871357, -0.009507784619927406, -0.0035351216793060303, 0.002437543123960495, 0.00841020792722702, 0.014382869005203247, 0.020355533808469772, 0.026328198611736298, 0.03230086341500282, 0.03827352821826935, 0.044246189296245575, 0.0502188540995121, 0.056191518902778625, 0.06216417998075485, 0.06813684105873108, 0.0741095095872879, 0.08008217066526413, 0.08605483919382095, 0.09202750027179718, 0.098000168800354, 0.10397282987833023, 0.10994549095630646, 0.11591815948486328, 0.12189082056283951, 0.12786348164081573, 0.13383615016937256, 0.1398088037967682, 0.145781472325325, 0.15175414085388184, 0.15772679448127747, 0.1636994630098343, 0.1696721315383911]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 4.0, 13.0, 15.0, 30.0, 34.0, 38.0, 71.0, 94.0, 121.0, 184.0, 238.0, 397.0, 641.0, 1074.0, 1665.0, 3017.0, 5457.0, 11324.0, 31011.0, 915595.0, 47132.0, 14660.0, 6602.0, 3718.0, 2026.0, 1209.0, 760.0, 501.0, 279.0, 211.0, 134.0, 83.0, 58.0, 47.0, 25.0, 25.0, 15.0, 16.0, 6.0, 6.0, 9.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0340576171875, -0.03286886215209961, -0.03168010711669922, -0.030491352081298828, -0.029302597045898438, -0.028113842010498047, -0.026925086975097656, -0.025736331939697266, -0.024547576904296875, -0.023358821868896484, -0.022170066833496094, -0.020981311798095703, -0.019792556762695312, -0.018603801727294922, -0.01741504669189453, -0.01622629165649414, -0.01503753662109375, -0.01384878158569336, -0.012660026550292969, -0.011471271514892578, -0.010282516479492188, -0.009093761444091797, -0.007905006408691406, -0.006716251373291016, -0.005527496337890625, -0.004338741302490234, -0.0031499862670898438, -0.001961231231689453, -0.0007724761962890625, 0.0004162788391113281, 0.0016050338745117188, 0.0027937889099121094, 0.0039825439453125, 0.005171298980712891, 0.006360054016113281, 0.007548809051513672, 0.008737564086914062, 0.009926319122314453, 0.011115074157714844, 0.012303829193115234, 0.013492584228515625, 0.014681339263916016, 0.015870094299316406, 0.017058849334716797, 0.018247604370117188, 0.019436359405517578, 0.02062511444091797, 0.02181386947631836, 0.02300262451171875, 0.02419137954711914, 0.02538013458251953, 0.026568889617919922, 0.027757644653320312, 0.028946399688720703, 0.030135154724121094, 0.031323909759521484, 0.032512664794921875, 0.033701419830322266, 0.034890174865722656, 0.03607892990112305, 0.03726768493652344, 0.03845643997192383, 0.03964519500732422, 0.04083395004272461, 0.042022705078125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 7.0, 4.0, 8.0, 5.0, 16.0, 17.0, 21.0, 21.0, 766.0, 33.0, 19.0, 18.0, 10.0, 7.0, 6.0, 7.0, 8.0, 5.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029632568359375, -0.028595447540283203, -0.027558326721191406, -0.02652120590209961, -0.025484085083007812, -0.024446964263916016, -0.02340984344482422, -0.022372722625732422, -0.021335601806640625, -0.020298480987548828, -0.01926136016845703, -0.018224239349365234, -0.017187118530273438, -0.01614999771118164, -0.015112876892089844, -0.014075756072998047, -0.01303863525390625, -0.012001514434814453, -0.010964393615722656, -0.00992727279663086, -0.008890151977539062, -0.007853031158447266, -0.006815910339355469, -0.005778789520263672, -0.004741668701171875, -0.003704547882080078, -0.0026674270629882812, -0.0016303062438964844, -0.0005931854248046875, 0.0004439353942871094, 0.0014810562133789062, 0.002518177032470703, 0.0035552978515625, 0.004592418670654297, 0.005629539489746094, 0.006666660308837891, 0.0077037811279296875, 0.008740901947021484, 0.009778022766113281, 0.010815143585205078, 0.011852264404296875, 0.012889385223388672, 0.013926506042480469, 0.014963626861572266, 0.016000747680664062, 0.01703786849975586, 0.018074989318847656, 0.019112110137939453, 0.02014923095703125, 0.021186351776123047, 0.022223472595214844, 0.02326059341430664, 0.024297714233398438, 0.025334835052490234, 0.02637195587158203, 0.027409076690673828, 0.028446197509765625, 0.029483318328857422, 0.03052043914794922, 0.031557559967041016, 0.03259468078613281, 0.03363180160522461, 0.034668922424316406, 0.0357060432434082, 0.0367431640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 3.0, 8.0, 7.0, 4.0, 11.0, 21.0, 18.0, 19.0, 27.0, 28.0, 29.0, 59.0, 56.0, 61.0, 97.0, 124.0, 181.0, 365.0, 793.0, 2618.0, 19865.0, 752093.0, 256893.0, 11589.0, 1930.0, 591.0, 293.0, 167.0, 111.0, 105.0, 67.0, 59.0, 44.0, 53.0, 32.0, 17.0, 22.0, 15.0, 15.0, 16.0, 3.0, 7.0, 8.0, 8.0, 3.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09930419921875, -0.09628486633300781, -0.09326553344726562, -0.09024620056152344, -0.08722686767578125, -0.08420753479003906, -0.08118820190429688, -0.07816886901855469, -0.0751495361328125, -0.07213020324707031, -0.06911087036132812, -0.06609153747558594, -0.06307220458984375, -0.06005287170410156, -0.057033538818359375, -0.05401420593261719, -0.050994873046875, -0.04797554016113281, -0.044956207275390625, -0.04193687438964844, -0.03891754150390625, -0.03589820861816406, -0.032878875732421875, -0.029859542846679688, -0.0268402099609375, -0.023820877075195312, -0.020801544189453125, -0.017782211303710938, -0.01476287841796875, -0.011743545532226562, -0.008724212646484375, -0.0057048797607421875, -0.002685546875, 0.0003337860107421875, 0.003353118896484375, 0.0063724517822265625, 0.00939178466796875, 0.012411117553710938, 0.015430450439453125, 0.018449783325195312, 0.0214691162109375, 0.024488449096679688, 0.027507781982421875, 0.030527114868164062, 0.03354644775390625, 0.03656578063964844, 0.039585113525390625, 0.04260444641113281, 0.045623779296875, 0.04864311218261719, 0.051662445068359375, 0.05468177795410156, 0.05770111083984375, 0.06072044372558594, 0.06373977661132812, 0.06675910949707031, 0.0697784423828125, 0.07279777526855469, 0.07581710815429688, 0.07883644104003906, 0.08185577392578125, 0.08487510681152344, 0.08789443969726562, 0.09091377258300781, 0.09393310546875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 3.0, 8.0, 7.0, 3.0, 11.0, 18.0, 17.0, 11.0, 19.0, 10.0, 19.0, 27.0, 17.0, 28.0, 26.0, 25.0, 36.0, 39.0, 33.0, 34.0, 38.0, 45.0, 38.0, 51.0, 30.0, 28.0, 40.0, 41.0, 29.0, 41.0, 31.0, 14.0, 27.0, 32.0, 18.0, 11.0, 12.0, 12.0, 12.0, 15.0, 2.0, 6.0, 8.0, 8.0, 3.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.090576171875, -0.08782196044921875, -0.0850677490234375, -0.08231353759765625, -0.079559326171875, -0.07680511474609375, -0.0740509033203125, -0.07129669189453125, -0.06854248046875, -0.06578826904296875, -0.0630340576171875, -0.06027984619140625, -0.057525634765625, -0.05477142333984375, -0.0520172119140625, -0.04926300048828125, -0.0465087890625, -0.04375457763671875, -0.0410003662109375, -0.03824615478515625, -0.035491943359375, -0.03273773193359375, -0.0299835205078125, -0.02722930908203125, -0.02447509765625, -0.02172088623046875, -0.0189666748046875, -0.01621246337890625, -0.013458251953125, -0.01070404052734375, -0.0079498291015625, -0.00519561767578125, -0.00244140625, 0.00031280517578125, 0.0030670166015625, 0.00582122802734375, 0.008575439453125, 0.01132965087890625, 0.0140838623046875, 0.01683807373046875, 0.01959228515625, 0.02234649658203125, 0.0251007080078125, 0.02785491943359375, 0.030609130859375, 0.03336334228515625, 0.0361175537109375, 0.03887176513671875, 0.0416259765625, 0.04438018798828125, 0.0471343994140625, 0.04988861083984375, 0.052642822265625, 0.05539703369140625, 0.0581512451171875, 0.06090545654296875, 0.06365966796875, 0.06641387939453125, 0.0691680908203125, 0.07192230224609375, 0.074676513671875, 0.07743072509765625, 0.0801849365234375, 0.08293914794921875, 0.085693359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 9.0, 12.0, 21.0, 23.0, 42.0, 67.0, 110.0, 250.0, 598.0, 1780.0, 8229.0, 146175.0, 869942.0, 16962.0, 2821.0, 806.0, 327.0, 155.0, 69.0, 49.0, 27.0, 17.0, 14.0, 10.0, 9.0, 10.0, 2.0, 4.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.976987838745117e-05, -4.822295159101486e-05, -4.667602479457855e-05, -4.512909799814224e-05, -4.358217120170593e-05, -4.203524440526962e-05, -4.048831760883331e-05, -3.8941390812397e-05, -3.739446401596069e-05, -3.5847537219524384e-05, -3.4300610423088074e-05, -3.2753683626651764e-05, -3.1206756830215454e-05, -2.9659830033779144e-05, -2.8112903237342834e-05, -2.6565976440906525e-05, -2.5019049644470215e-05, -2.3472122848033905e-05, -2.1925196051597595e-05, -2.0378269255161285e-05, -1.8831342458724976e-05, -1.7284415662288666e-05, -1.5737488865852356e-05, -1.4190562069416046e-05, -1.2643635272979736e-05, -1.1096708476543427e-05, -9.549781680107117e-06, -8.002854883670807e-06, -6.455928087234497e-06, -4.909001290798187e-06, -3.3620744943618774e-06, -1.8151476979255676e-06, -2.682209014892578e-07, 1.278705894947052e-06, 2.825632691383362e-06, 4.372559487819672e-06, 5.9194862842559814e-06, 7.466413080692291e-06, 9.013339877128601e-06, 1.0560266673564911e-05, 1.210719347000122e-05, 1.365412026643753e-05, 1.520104706287384e-05, 1.674797385931015e-05, 1.829490065574646e-05, 1.984182745218277e-05, 2.138875424861908e-05, 2.293568104505539e-05, 2.44826078414917e-05, 2.602953463792801e-05, 2.757646143436432e-05, 2.912338823080063e-05, 3.067031502723694e-05, 3.221724182367325e-05, 3.376416862010956e-05, 3.531109541654587e-05, 3.685802221298218e-05, 3.840494900941849e-05, 3.99518758058548e-05, 4.149880260229111e-05, 4.304572939872742e-05, 4.459265619516373e-05, 4.613958299160004e-05, 4.7686509788036346e-05, 4.9233436584472656e-05]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 10.0, 14.0, 21.0, 20.0, 17.0, 23.0, 30.0, 37.0, 39.0, 46.0, 80.0, 60.0, 63.0, 58.0, 58.0, 67.0, 47.0, 35.0, 51.0, 40.0, 31.0, 17.0, 26.0, 30.0, 16.0, 6.0, 10.0, 4.0, 9.0, 2.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.516674041748047e-06, -3.3928081393241882e-06, -3.2689422369003296e-06, -3.145076334476471e-06, -3.0212104320526123e-06, -2.8973445296287537e-06, -2.773478627204895e-06, -2.6496127247810364e-06, -2.5257468223571777e-06, -2.401880919933319e-06, -2.2780150175094604e-06, -2.154149115085602e-06, -2.030283212661743e-06, -1.9064173102378845e-06, -1.7825514078140259e-06, -1.6586855053901672e-06, -1.5348196029663086e-06, -1.41095370054245e-06, -1.2870877981185913e-06, -1.1632218956947327e-06, -1.039355993270874e-06, -9.154900908470154e-07, -7.916241884231567e-07, -6.677582859992981e-07, -5.438923835754395e-07, -4.200264811515808e-07, -2.9616057872772217e-07, -1.7229467630386353e-07, -4.842877388000488e-08, 7.543712854385376e-08, 1.993030309677124e-07, 3.2316893339157104e-07, 4.470348358154297e-07, 5.709007382392883e-07, 6.94766640663147e-07, 8.186325430870056e-07, 9.424984455108643e-07, 1.066364347934723e-06, 1.1902302503585815e-06, 1.3140961527824402e-06, 1.4379620552062988e-06, 1.5618279576301575e-06, 1.6856938600540161e-06, 1.8095597624778748e-06, 1.9334256649017334e-06, 2.057291567325592e-06, 2.1811574697494507e-06, 2.3050233721733093e-06, 2.428889274597168e-06, 2.5527551770210266e-06, 2.6766210794448853e-06, 2.800486981868744e-06, 2.9243528842926025e-06, 3.048218786716461e-06, 3.17208468914032e-06, 3.2959505915641785e-06, 3.419816493988037e-06, 3.5436823964118958e-06, 3.6675482988357544e-06, 3.791414201259613e-06, 3.915280103683472e-06, 4.03914600610733e-06, 4.163011908531189e-06, 4.286877810955048e-06, 4.410743713378906e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 10.0, 14.0, 21.0, 26.0, 33.0, 48.0, 53.0, 83.0, 111.0, 172.0, 381.0, 1008.0, 7469.0, 674984.0, 356281.0, 6082.0, 903.0, 322.0, 150.0, 118.0, 66.0, 57.0, 29.0, 26.0, 18.0, 19.0, 14.0, 9.0, 13.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.491474151611328e-05, -2.3875385522842407e-05, -2.2836029529571533e-05, -2.179667353630066e-05, -2.0757317543029785e-05, -1.971796154975891e-05, -1.8678605556488037e-05, -1.7639249563217163e-05, -1.659989356994629e-05, -1.5560537576675415e-05, -1.4521181583404541e-05, -1.3481825590133667e-05, -1.2442469596862793e-05, -1.1403113603591919e-05, -1.0363757610321045e-05, -9.324401617050171e-06, -8.285045623779297e-06, -7.245689630508423e-06, -6.206333637237549e-06, -5.166977643966675e-06, -4.127621650695801e-06, -3.0882656574249268e-06, -2.0489096641540527e-06, -1.0095536708831787e-06, 2.9802322387695312e-08, 1.0691583156585693e-06, 2.1085143089294434e-06, 3.1478703022003174e-06, 4.187226295471191e-06, 5.2265822887420654e-06, 6.2659382820129395e-06, 7.3052942752838135e-06, 8.344650268554688e-06, 9.384006261825562e-06, 1.0423362255096436e-05, 1.146271824836731e-05, 1.2502074241638184e-05, 1.3541430234909058e-05, 1.4580786228179932e-05, 1.5620142221450806e-05, 1.665949821472168e-05, 1.7698854207992554e-05, 1.8738210201263428e-05, 1.9777566194534302e-05, 2.0816922187805176e-05, 2.185627818107605e-05, 2.2895634174346924e-05, 2.3934990167617798e-05, 2.4974346160888672e-05, 2.6013702154159546e-05, 2.705305814743042e-05, 2.8092414140701294e-05, 2.9131770133972168e-05, 3.0171126127243042e-05, 3.1210482120513916e-05, 3.224983811378479e-05, 3.3289194107055664e-05, 3.432855010032654e-05, 3.536790609359741e-05, 3.6407262086868286e-05, 3.744661808013916e-05, 3.8485974073410034e-05, 3.952533006668091e-05, 4.056468605995178e-05, 4.1604042053222656e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 7.0, 11.0, 16.0, 16.0, 20.0, 22.0, 19.0, 35.0, 37.0, 39.0, 49.0, 60.0, 64.0, 84.0, 68.0, 72.0, 74.0, 52.0, 40.0, 31.0, 35.0, 28.0, 18.0, 16.0, 10.0, 17.0, 12.0, 9.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2709369659423828e-05, -2.176128327846527e-05, -2.0813196897506714e-05, -1.9865110516548157e-05, -1.89170241355896e-05, -1.7968937754631042e-05, -1.7020851373672485e-05, -1.6072764992713928e-05, -1.5124678611755371e-05, -1.4176592230796814e-05, -1.3228505849838257e-05, -1.22804194688797e-05, -1.1332333087921143e-05, -1.0384246706962585e-05, -9.436160326004028e-06, -8.488073945045471e-06, -7.539987564086914e-06, -6.591901183128357e-06, -5.6438148021698e-06, -4.695728421211243e-06, -3.7476420402526855e-06, -2.7995556592941284e-06, -1.8514692783355713e-06, -9.033828973770142e-07, 4.470348358154297e-08, 9.927898645401e-07, 1.9408762454986572e-06, 2.8889626264572144e-06, 3.8370490074157715e-06, 4.785135388374329e-06, 5.733221769332886e-06, 6.681308150291443e-06, 7.62939453125e-06, 8.577480912208557e-06, 9.525567293167114e-06, 1.0473653674125671e-05, 1.1421740055084229e-05, 1.2369826436042786e-05, 1.3317912817001343e-05, 1.42659991979599e-05, 1.5214085578918457e-05, 1.6162171959877014e-05, 1.711025834083557e-05, 1.805834472179413e-05, 1.9006431102752686e-05, 1.9954517483711243e-05, 2.09026038646698e-05, 2.1850690245628357e-05, 2.2798776626586914e-05, 2.374686300754547e-05, 2.469494938850403e-05, 2.5643035769462585e-05, 2.6591122150421143e-05, 2.75392085313797e-05, 2.8487294912338257e-05, 2.9435381293296814e-05, 3.038346767425537e-05, 3.133155405521393e-05, 3.2279640436172485e-05, 3.322772681713104e-05, 3.41758131980896e-05, 3.512389957904816e-05, 3.6071985960006714e-05, 3.702007234096527e-05, 3.796815872192383e-05]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 18.0, 857.0, 128.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.635565757751465, -3.5704493522644043, -3.5053329467773438, -3.440216541290283, -3.3751001358032227, -3.309983968734741, -3.2448675632476807, -3.17975115776062, -3.1146347522735596, -3.049518346786499, -2.9844019412994385, -2.919285535812378, -2.8541693687438965, -2.789052963256836, -2.7239365577697754, -2.658820152282715, -2.5937037467956543, -2.5285873413085938, -2.463470935821533, -2.3983545303344727, -2.333238124847412, -2.2681219577789307, -2.20300555229187, -2.1378891468048096, -2.072772741317749, -2.0076563358306885, -1.942539930343628, -1.877423644065857, -1.8123072385787964, -1.7471908330917358, -1.6820745468139648, -1.6169581413269043, -1.5518417358398438, -1.4867253303527832, -1.4216089248657227, -1.3564926385879517, -1.2913762331008911, -1.2262598276138306, -1.1611435413360596, -1.096027135848999, -1.0309107303619385, -0.9657943248748779, -0.9006779789924622, -0.8355616331100464, -0.7704452276229858, -0.7053288221359253, -0.6402124762535095, -0.5750961303710938, -0.509979784488678, -0.4448634088039398, -0.37974703311920166, -0.3146306574344635, -0.24951428174972534, -0.18439790606498718, -0.11928153038024902, -0.054165154695510864, 0.010951220989227295, 0.07606759667396545, 0.1411839723587036, 0.20630034804344177, 0.27141672372817993, 0.3365330994129181, 0.40164947509765625, 0.4667658507823944, 0.5318822264671326]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 10.0, 13.0, 20.0, 35.0, 65.0, 123.0, 167.0, 192.0, 134.0, 84.0, 44.0, 27.0, 10.0, 8.0, 7.0, 9.0, 7.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.210785388946533, -2.137617588043213, -2.0644497871398926, -1.9912818670272827, -1.9181140661239624, -1.844946265220642, -1.7717783451080322, -1.698610544204712, -1.6254427433013916, -1.5522749423980713, -1.479107141494751, -1.4059392213821411, -1.3327714204788208, -1.2596036195755005, -1.1864356994628906, -1.1132678985595703, -1.04010009765625, -0.9669322967529297, -0.8937644362449646, -0.8205965757369995, -0.7474287748336792, -0.6742609739303589, -0.6010931134223938, -0.5279252529144287, -0.4547574520111084, -0.3815896213054657, -0.308421790599823, -0.2352539598941803, -0.1620861291885376, -0.0889182984828949, -0.015750467777252197, 0.05741739273071289, 0.1305854320526123, 0.203753262758255, 0.2769210934638977, 0.3500889241695404, 0.4232567548751831, 0.4964245855808258, 0.5695924162864685, 0.6427602767944336, 0.7159280776977539, 0.7890958786010742, 0.8622637391090393, 0.9354315996170044, 1.0085994005203247, 1.081767201423645, 1.1549351215362549, 1.2281029224395752, 1.3012707233428955, 1.3744385242462158, 1.4476063251495361, 1.520774245262146, 1.5939420461654663, 1.6671098470687866, 1.7402777671813965, 1.8134455680847168, 1.886613368988037, 1.9597811698913574, 2.0329489707946777, 2.106116771697998, 2.1792845726013184, 2.2524526119232178, 2.325620412826538, 2.3987882137298584, 2.4719560146331787]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 5.0, 7.0, 10.0, 22.0, 33.0, 58.0, 118.0, 244.0, 645.0, 1733.0, 6680.0, 4167648.0, 13709.0, 2270.0, 631.0, 222.0, 92.0, 41.0, 39.0, 17.0, 14.0, 8.0, 5.0, 7.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388671875, -0.3755760192871094, -0.36248016357421875, -0.3493843078613281, -0.3362884521484375, -0.3231925964355469, -0.31009674072265625, -0.2970008850097656, -0.283905029296875, -0.2708091735839844, -0.25771331787109375, -0.24461746215820312, -0.2315216064453125, -0.21842575073242188, -0.20532989501953125, -0.19223403930664062, -0.17913818359375, -0.16604232788085938, -0.15294647216796875, -0.13985061645507812, -0.1267547607421875, -0.11365890502929688, -0.10056304931640625, -0.08746719360351562, -0.074371337890625, -0.061275482177734375, -0.04817962646484375, -0.035083770751953125, -0.0219879150390625, -0.008892059326171875, 0.00420379638671875, 0.017299652099609375, 0.0303955078125, 0.043491363525390625, 0.05658721923828125, 0.06968307495117188, 0.0827789306640625, 0.09587478637695312, 0.10897064208984375, 0.12206649780273438, 0.135162353515625, 0.14825820922851562, 0.16135406494140625, 0.17444992065429688, 0.1875457763671875, 0.20064163208007812, 0.21373748779296875, 0.22683334350585938, 0.23992919921875, 0.2530250549316406, 0.26612091064453125, 0.2792167663574219, 0.2923126220703125, 0.3054084777832031, 0.31850433349609375, 0.3316001892089844, 0.344696044921875, 0.3577919006347656, 0.37088775634765625, 0.3839836120605469, 0.3970794677734375, 0.4101753234863281, 0.42327117919921875, 0.4363670349121094, 0.449462890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 11.0, 15.0, 19.0, 13.0, 21.0, 621.0, 179.0, 17.0, 12.0, 13.0, 15.0, 4.0, 8.0, 4.0, 5.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0253143310546875, -0.02446269989013672, -0.023611068725585938, -0.022759437561035156, -0.021907806396484375, -0.021056175231933594, -0.020204544067382812, -0.01935291290283203, -0.01850128173828125, -0.01764965057373047, -0.016798019409179688, -0.015946388244628906, -0.015094757080078125, -0.014243125915527344, -0.013391494750976562, -0.012539863586425781, -0.011688232421875, -0.010836601257324219, -0.009984970092773438, -0.009133338928222656, -0.008281707763671875, -0.007430076599121094, -0.0065784454345703125, -0.005726814270019531, -0.00487518310546875, -0.004023551940917969, -0.0031719207763671875, -0.0023202896118164062, -0.001468658447265625, -0.0006170272827148438, 0.0002346038818359375, 0.0010862350463867188, 0.0019378662109375, 0.0027894973754882812, 0.0036411285400390625, 0.004492759704589844, 0.005344390869140625, 0.006196022033691406, 0.0070476531982421875, 0.007899284362792969, 0.00875091552734375, 0.009602546691894531, 0.010454177856445312, 0.011305809020996094, 0.012157440185546875, 0.013009071350097656, 0.013860702514648438, 0.014712333679199219, 0.01556396484375, 0.01641559600830078, 0.017267227172851562, 0.018118858337402344, 0.018970489501953125, 0.019822120666503906, 0.020673751831054688, 0.02152538299560547, 0.02237701416015625, 0.02322864532470703, 0.024080276489257812, 0.024931907653808594, 0.025783538818359375, 0.026635169982910156, 0.027486801147460938, 0.02833843231201172, 0.0291900634765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 12.0, 12.0, 15.0, 10.0, 16.0, 19.0, 25.0, 36.0, 48.0, 107.0, 159.0, 342.0, 1107.0, 5478.0, 71232.0, 4100418.0, 12328.0, 1815.0, 506.0, 205.0, 118.0, 69.0, 40.0, 24.0, 26.0, 11.0, 17.0, 14.0, 10.0, 7.0, 14.0, 4.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2890625, -0.28035736083984375, -0.2716522216796875, -0.26294708251953125, -0.254241943359375, -0.24553680419921875, -0.2368316650390625, -0.22812652587890625, -0.21942138671875, -0.21071624755859375, -0.2020111083984375, -0.19330596923828125, -0.184600830078125, -0.17589569091796875, -0.1671905517578125, -0.15848541259765625, -0.1497802734375, -0.14107513427734375, -0.1323699951171875, -0.12366485595703125, -0.114959716796875, -0.10625457763671875, -0.0975494384765625, -0.08884429931640625, -0.08013916015625, -0.07143402099609375, -0.0627288818359375, -0.05402374267578125, -0.045318603515625, -0.03661346435546875, -0.0279083251953125, -0.01920318603515625, -0.010498046875, -0.00179290771484375, 0.0069122314453125, 0.01561737060546875, 0.024322509765625, 0.03302764892578125, 0.0417327880859375, 0.05043792724609375, 0.05914306640625, 0.06784820556640625, 0.0765533447265625, 0.08525848388671875, 0.093963623046875, 0.10266876220703125, 0.1113739013671875, 0.12007904052734375, 0.1287841796875, 0.13748931884765625, 0.1461944580078125, 0.15489959716796875, 0.163604736328125, 0.17230987548828125, 0.1810150146484375, 0.18972015380859375, 0.19842529296875, 0.20713043212890625, 0.2158355712890625, 0.22454071044921875, 0.233245849609375, 0.24195098876953125, 0.2506561279296875, 0.25936126708984375, 0.26806640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 8.0, 7.0, 6.0, 7.0, 6.0, 10.0, 12.0, 10.0, 11.0, 21.0, 19.0, 19.0, 23.0, 32.0, 85.0, 3585.0, 43.0, 29.0, 26.0, 18.0, 15.0, 16.0, 9.0, 4.0, 9.0, 3.0, 4.0, 5.0, 4.0, 3.0, 9.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04144287109375, -0.04019451141357422, -0.03894615173339844, -0.037697792053222656, -0.036449432373046875, -0.035201072692871094, -0.03395271301269531, -0.03270435333251953, -0.03145599365234375, -0.03020763397216797, -0.028959274291992188, -0.027710914611816406, -0.026462554931640625, -0.025214195251464844, -0.023965835571289062, -0.02271747589111328, -0.0214691162109375, -0.02022075653076172, -0.018972396850585938, -0.017724037170410156, -0.016475677490234375, -0.015227317810058594, -0.013978958129882812, -0.012730598449707031, -0.01148223876953125, -0.010233879089355469, -0.008985519409179688, -0.007737159729003906, -0.006488800048828125, -0.005240440368652344, -0.0039920806884765625, -0.0027437210083007812, -0.001495361328125, -0.00024700164794921875, 0.0010013580322265625, 0.0022497177124023438, 0.003498077392578125, 0.004746437072753906, 0.0059947967529296875, 0.007243156433105469, 0.00849151611328125, 0.009739875793457031, 0.010988235473632812, 0.012236595153808594, 0.013484954833984375, 0.014733314514160156, 0.015981674194335938, 0.01723003387451172, 0.0184783935546875, 0.01972675323486328, 0.020975112915039062, 0.022223472595214844, 0.023471832275390625, 0.024720191955566406, 0.025968551635742188, 0.02721691131591797, 0.02846527099609375, 0.02971363067626953, 0.030961990356445312, 0.032210350036621094, 0.033458709716796875, 0.034707069396972656, 0.03595542907714844, 0.03720378875732422, 0.0384521484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 10.0, 26.0, 299.0, 626.0, 34.0, 9.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.20011991262435913, -0.19661298394203186, -0.1931060552597046, -0.18959912657737732, -0.18609221279621124, -0.18258528411388397, -0.1790783554315567, -0.17557142674922943, -0.17206449806690216, -0.1685575693845749, -0.16505064070224762, -0.16154372692108154, -0.15803679823875427, -0.154529869556427, -0.15102294087409973, -0.14751601219177246, -0.1440090835094452, -0.14050215482711792, -0.13699522614479065, -0.13348829746246338, -0.1299813836812973, -0.12647445499897003, -0.12296752631664276, -0.11946059763431549, -0.11595368385314941, -0.11244675517082214, -0.10893983393907547, -0.1054329052567482, -0.10192597657442093, -0.09841905534267426, -0.09491212666034698, -0.09140519797801971, -0.08789826929569244, -0.08439134061336517, -0.0808844193816185, -0.07737749069929123, -0.07387056201696396, -0.07036364078521729, -0.06685671210289001, -0.06334978342056274, -0.059842854738235474, -0.0563359297811985, -0.05282900109887123, -0.04932207614183426, -0.04581514745950699, -0.042308222502470016, -0.038801297545433044, -0.035294368863105774, -0.0317874439060688, -0.02828051708638668, -0.02477359026670456, -0.021266665309667587, -0.017759738489985466, -0.014252811670303345, -0.010745886713266373, -0.007238959893584251, -0.00373203307390213, -0.00022510671988129616, 0.003281819634139538, 0.0067887455224990845, 0.010295672342181206, 0.013802599161863327, 0.0173095241189003, 0.02081645093858242, 0.02432337775826454]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 3.0, 10.0, 9.0, 21.0, 28.0, 61.0, 111.0, 161.0, 190.0, 141.0, 94.0, 47.0, 28.0, 13.0, 8.0, 13.0, 3.0, 6.0, 9.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18961292505264282, -0.1826980859041214, -0.17578324675559998, -0.16886842250823975, -0.16195358335971832, -0.1550387442111969, -0.14812391996383667, -0.14120908081531525, -0.13429424166679382, -0.1273794025182724, -0.12046457082033157, -0.11354973912239075, -0.10663489997386932, -0.0997200608253479, -0.09280522912740707, -0.08589039742946625, -0.07897555828094482, -0.0720607191324234, -0.06514588743448257, -0.05823105201125145, -0.051316216588020325, -0.0444013811647892, -0.037486545741558075, -0.03057171031832695, -0.023656874895095825, -0.0167420394718647, -0.009827204048633575, -0.0029123686254024506, 0.004002466797828674, 0.0109173022210598, 0.017832137644290924, 0.02474697306752205, 0.031661808490753174, 0.0385766439139843, 0.045491479337215424, 0.05240631476044655, 0.05932115018367767, 0.0662359893321991, 0.07315082103013992, 0.08006565272808075, 0.08698049187660217, 0.0938953310251236, 0.10081016272306442, 0.10772499442100525, 0.11463983356952667, 0.1215546727180481, 0.12846949696540833, 0.13538433611392975, 0.14229917526245117, 0.1492140144109726, 0.15612885355949402, 0.16304367780685425, 0.16995851695537567, 0.1768733561038971, 0.18378818035125732, 0.19070301949977875, 0.19761785864830017, 0.2045326977968216, 0.21144753694534302, 0.21836236119270325, 0.22527720034122467, 0.2321920394897461, 0.23910686373710632, 0.24602170288562775, 0.25293654203414917]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 6.0, 17.0, 14.0, 17.0, 33.0, 37.0, 57.0, 90.0, 125.0, 173.0, 269.0, 378.0, 551.0, 1000.0, 1575.0, 2601.0, 4615.0, 8950.0, 20573.0, 129116.0, 830909.0, 24282.0, 10234.0, 5273.0, 3030.0, 1662.0, 974.0, 682.0, 413.0, 259.0, 192.0, 113.0, 74.0, 75.0, 42.0, 48.0, 24.0, 18.0, 12.0, 10.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.0831298828125, -0.08069133758544922, -0.07825279235839844, -0.07581424713134766, -0.07337570190429688, -0.0709371566772461, -0.06849861145019531, -0.06606006622314453, -0.06362152099609375, -0.06118297576904297, -0.05874443054199219, -0.056305885314941406, -0.053867340087890625, -0.051428794860839844, -0.04899024963378906, -0.04655170440673828, -0.0441131591796875, -0.04167461395263672, -0.03923606872558594, -0.036797523498535156, -0.034358978271484375, -0.031920433044433594, -0.029481887817382812, -0.02704334259033203, -0.02460479736328125, -0.02216625213623047, -0.019727706909179688, -0.017289161682128906, -0.014850616455078125, -0.012412071228027344, -0.009973526000976562, -0.007534980773925781, -0.005096435546875, -0.0026578903198242188, -0.0002193450927734375, 0.0022192001342773438, 0.004657745361328125, 0.007096290588378906, 0.009534835815429688, 0.011973381042480469, 0.01441192626953125, 0.01685047149658203, 0.019289016723632812, 0.021727561950683594, 0.024166107177734375, 0.026604652404785156, 0.029043197631835938, 0.03148174285888672, 0.0339202880859375, 0.03635883331298828, 0.03879737854003906, 0.041235923767089844, 0.043674468994140625, 0.046113014221191406, 0.04855155944824219, 0.05099010467529297, 0.05342864990234375, 0.05586719512939453, 0.05830574035644531, 0.060744285583496094, 0.06318283081054688, 0.06562137603759766, 0.06805992126464844, 0.07049846649169922, 0.07293701171875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 5.0, 14.0, 13.0, 17.0, 17.0, 51.0, 727.0, 39.0, 18.0, 9.0, 17.0, 11.0, 5.0, 8.0, 2.0, 7.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02294921875, -0.022167682647705078, -0.021386146545410156, -0.020604610443115234, -0.019823074340820312, -0.01904153823852539, -0.01826000213623047, -0.017478466033935547, -0.016696929931640625, -0.015915393829345703, -0.015133857727050781, -0.01435232162475586, -0.013570785522460938, -0.012789249420166016, -0.012007713317871094, -0.011226177215576172, -0.01044464111328125, -0.009663105010986328, -0.008881568908691406, -0.008100032806396484, -0.0073184967041015625, -0.006536960601806641, -0.005755424499511719, -0.004973888397216797, -0.004192352294921875, -0.003410816192626953, -0.0026292800903320312, -0.0018477439880371094, -0.0010662078857421875, -0.0002846717834472656, 0.0004968643188476562, 0.0012784004211425781, 0.0020599365234375, 0.002841472625732422, 0.0036230087280273438, 0.004404544830322266, 0.0051860809326171875, 0.005967617034912109, 0.006749153137207031, 0.007530689239501953, 0.008312225341796875, 0.009093761444091797, 0.009875297546386719, 0.01065683364868164, 0.011438369750976562, 0.012219905853271484, 0.013001441955566406, 0.013782978057861328, 0.01456451416015625, 0.015346050262451172, 0.016127586364746094, 0.016909122467041016, 0.017690658569335938, 0.01847219467163086, 0.01925373077392578, 0.020035266876220703, 0.020816802978515625, 0.021598339080810547, 0.02237987518310547, 0.02316141128540039, 0.023942947387695312, 0.024724483489990234, 0.025506019592285156, 0.026287555694580078, 0.027069091796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 10.0, 13.0, 15.0, 22.0, 24.0, 23.0, 35.0, 48.0, 52.0, 63.0, 84.0, 95.0, 111.0, 137.0, 171.0, 232.0, 412.0, 1149.0, 9004.0, 681718.0, 346324.0, 6339.0, 959.0, 382.0, 216.0, 186.0, 138.0, 102.0, 102.0, 76.0, 64.0, 49.0, 36.0, 36.0, 30.0, 24.0, 11.0, 15.0, 11.0, 3.0, 7.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1221923828125, -0.11836814880371094, -0.11454391479492188, -0.11071968078613281, -0.10689544677734375, -0.10307121276855469, -0.09924697875976562, -0.09542274475097656, -0.0915985107421875, -0.08777427673339844, -0.08395004272460938, -0.08012580871582031, -0.07630157470703125, -0.07247734069824219, -0.06865310668945312, -0.06482887268066406, -0.061004638671875, -0.05718040466308594, -0.053356170654296875, -0.04953193664550781, -0.04570770263671875, -0.04188346862792969, -0.038059234619140625, -0.03423500061035156, -0.0304107666015625, -0.026586532592773438, -0.022762298583984375, -0.018938064575195312, -0.01511383056640625, -0.011289596557617188, -0.007465362548828125, -0.0036411285400390625, 0.00018310546875, 0.0040073394775390625, 0.007831573486328125, 0.011655807495117188, 0.01548004150390625, 0.019304275512695312, 0.023128509521484375, 0.026952743530273438, 0.0307769775390625, 0.03460121154785156, 0.038425445556640625, 0.04224967956542969, 0.04607391357421875, 0.04989814758300781, 0.053722381591796875, 0.05754661560058594, 0.061370849609375, 0.06519508361816406, 0.06901931762695312, 0.07284355163574219, 0.07666778564453125, 0.08049201965332031, 0.08431625366210938, 0.08814048767089844, 0.0919647216796875, 0.09578895568847656, 0.09961318969726562, 0.10343742370605469, 0.10726165771484375, 0.11108589172363281, 0.11491012573242188, 0.11873435974121094, 0.12255859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 8.0, 11.0, 14.0, 13.0, 20.0, 15.0, 21.0, 22.0, 17.0, 32.0, 31.0, 35.0, 30.0, 26.0, 37.0, 40.0, 44.0, 40.0, 38.0, 31.0, 50.0, 37.0, 37.0, 31.0, 43.0, 29.0, 32.0, 33.0, 28.0, 20.0, 17.0, 13.0, 16.0, 17.0, 13.0, 8.0, 11.0, 8.0, 1.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0570068359375, -0.05522298812866211, -0.05343914031982422, -0.05165529251098633, -0.04987144470214844, -0.04808759689331055, -0.046303749084472656, -0.044519901275634766, -0.042736053466796875, -0.040952205657958984, -0.039168357849121094, -0.0373845100402832, -0.03560066223144531, -0.03381681442260742, -0.03203296661376953, -0.03024911880493164, -0.02846527099609375, -0.02668142318725586, -0.02489757537841797, -0.023113727569580078, -0.021329879760742188, -0.019546031951904297, -0.017762184143066406, -0.015978336334228516, -0.014194488525390625, -0.012410640716552734, -0.010626792907714844, -0.008842945098876953, -0.0070590972900390625, -0.005275249481201172, -0.0034914016723632812, -0.0017075538635253906, 7.62939453125e-05, 0.0018601417541503906, 0.0036439895629882812, 0.005427837371826172, 0.0072116851806640625, 0.008995532989501953, 0.010779380798339844, 0.012563228607177734, 0.014347076416015625, 0.016130924224853516, 0.017914772033691406, 0.019698619842529297, 0.021482467651367188, 0.023266315460205078, 0.02505016326904297, 0.02683401107788086, 0.02861785888671875, 0.03040170669555664, 0.03218555450439453, 0.03396940231323242, 0.03575325012207031, 0.0375370979309082, 0.039320945739746094, 0.041104793548583984, 0.042888641357421875, 0.044672489166259766, 0.046456336975097656, 0.04824018478393555, 0.05002403259277344, 0.05180788040161133, 0.05359172821044922, 0.05537557601928711, 0.057159423828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 5.0, 14.0, 13.0, 26.0, 30.0, 52.0, 85.0, 134.0, 255.0, 518.0, 1428.0, 5489.0, 81645.0, 937713.0, 16653.0, 2769.0, 870.0, 379.0, 174.0, 120.0, 60.0, 33.0, 27.0, 20.0, 13.0, 9.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016033649444580078, -0.00015551596879959106, -0.00015069544315338135, -0.00014587491750717163, -0.00014105439186096191, -0.0001362338662147522, -0.00013141334056854248, -0.00012659281492233276, -0.00012177228927612305, -0.00011695176362991333, -0.00011213123798370361, -0.0001073107123374939, -0.00010249018669128418, -9.766966104507446e-05, -9.284913539886475e-05, -8.802860975265503e-05, -8.320808410644531e-05, -7.83875584602356e-05, -7.356703281402588e-05, -6.874650716781616e-05, -6.392598152160645e-05, -5.910545587539673e-05, -5.428493022918701e-05, -4.9464404582977295e-05, -4.464387893676758e-05, -3.982335329055786e-05, -3.5002827644348145e-05, -3.0182301998138428e-05, -2.536177635192871e-05, -2.0541250705718994e-05, -1.5720725059509277e-05, -1.090019941329956e-05, -6.079673767089844e-06, -1.259148120880127e-06, 3.56137752532959e-06, 8.381903171539307e-06, 1.3202428817749023e-05, 1.802295446395874e-05, 2.2843480110168457e-05, 2.7664005756378174e-05, 3.248453140258789e-05, 3.730505704879761e-05, 4.2125582695007324e-05, 4.694610834121704e-05, 5.176663398742676e-05, 5.6587159633636475e-05, 6.140768527984619e-05, 6.622821092605591e-05, 7.104873657226562e-05, 7.586926221847534e-05, 8.068978786468506e-05, 8.551031351089478e-05, 9.033083915710449e-05, 9.515136480331421e-05, 9.997189044952393e-05, 0.00010479241609573364, 0.00010961294174194336, 0.00011443346738815308, 0.00011925399303436279, 0.0001240745186805725, 0.00012889504432678223, 0.00013371556997299194, 0.00013853609561920166, 0.00014335662126541138, 0.0001481771469116211]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 18.0, 22.0, 34.0, 44.0, 91.0, 86.0, 133.0, 96.0, 163.0, 113.0, 65.0, 48.0, 30.0, 21.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.62939453125e-06, -7.352791726589203e-06, -7.076188921928406e-06, -6.799586117267609e-06, -6.5229833126068115e-06, -6.246380507946014e-06, -5.969777703285217e-06, -5.69317489862442e-06, -5.416572093963623e-06, -5.139969289302826e-06, -4.863366484642029e-06, -4.586763679981232e-06, -4.3101608753204346e-06, -4.0335580706596375e-06, -3.7569552659988403e-06, -3.4803524613380432e-06, -3.203749656677246e-06, -2.927146852016449e-06, -2.650544047355652e-06, -2.3739412426948547e-06, -2.0973384380340576e-06, -1.8207356333732605e-06, -1.5441328287124634e-06, -1.2675300240516663e-06, -9.909272193908691e-07, -7.14324414730072e-07, -4.377216100692749e-07, -1.6111880540847778e-07, 1.1548399925231934e-07, 3.9208680391311646e-07, 6.686896085739136e-07, 9.452924132347107e-07, 1.2218952178955078e-06, 1.498498022556305e-06, 1.775100827217102e-06, 2.051703631877899e-06, 2.3283064365386963e-06, 2.6049092411994934e-06, 2.8815120458602905e-06, 3.1581148505210876e-06, 3.4347176551818848e-06, 3.711320459842682e-06, 3.987923264503479e-06, 4.264526069164276e-06, 4.541128873825073e-06, 4.81773167848587e-06, 5.0943344831466675e-06, 5.370937287807465e-06, 5.647540092468262e-06, 5.924142897129059e-06, 6.200745701789856e-06, 6.477348506450653e-06, 6.75395131111145e-06, 7.030554115772247e-06, 7.3071569204330444e-06, 7.5837597250938416e-06, 7.860362529754639e-06, 8.136965334415436e-06, 8.413568139076233e-06, 8.69017094373703e-06, 8.966773748397827e-06, 9.243376553058624e-06, 9.519979357719421e-06, 9.796582162380219e-06, 1.0073184967041016e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 4.0, 5.0, 3.0, 8.0, 12.0, 12.0, 16.0, 33.0, 39.0, 49.0, 61.0, 102.0, 130.0, 183.0, 286.0, 726.0, 6480.0, 996730.0, 40891.0, 1580.0, 440.0, 235.0, 151.0, 115.0, 67.0, 54.0, 46.0, 20.0, 14.0, 20.0, 9.0, 13.0, 10.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00010514259338378906, -0.00010160170495510101, -9.806081652641296e-05, -9.451992809772491e-05, -9.097903966903687e-05, -8.743815124034882e-05, -8.389726281166077e-05, -8.035637438297272e-05, -7.681548595428467e-05, -7.327459752559662e-05, -6.973370909690857e-05, -6.619282066822052e-05, -6.265193223953247e-05, -5.911104381084442e-05, -5.557015538215637e-05, -5.202926695346832e-05, -4.8488378524780273e-05, -4.4947490096092224e-05, -4.1406601667404175e-05, -3.7865713238716125e-05, -3.4324824810028076e-05, -3.078393638134003e-05, -2.7243047952651978e-05, -2.3702159523963928e-05, -2.016127109527588e-05, -1.662038266658783e-05, -1.307949423789978e-05, -9.538605809211731e-06, -5.997717380523682e-06, -2.4568289518356323e-06, 1.084059476852417e-06, 4.624947905540466e-06, 8.165836334228516e-06, 1.1706724762916565e-05, 1.5247613191604614e-05, 1.8788501620292664e-05, 2.2329390048980713e-05, 2.5870278477668762e-05, 2.941116690635681e-05, 3.295205533504486e-05, 3.649294376373291e-05, 4.003383219242096e-05, 4.357472062110901e-05, 4.711560904979706e-05, 5.065649747848511e-05, 5.419738590717316e-05, 5.7738274335861206e-05, 6.127916276454926e-05, 6.48200511932373e-05, 6.836093962192535e-05, 7.19018280506134e-05, 7.544271647930145e-05, 7.89836049079895e-05, 8.252449333667755e-05, 8.60653817653656e-05, 8.960627019405365e-05, 9.31471586227417e-05, 9.668804705142975e-05, 0.0001002289354801178, 0.00010376982390880585, 0.0001073107123374939, 0.00011085160076618195, 0.00011439248919487, 0.00011793337762355804, 0.0001214742660522461]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 16.0, 23.0, 25.0, 25.0, 38.0, 33.0, 46.0, 53.0, 54.0, 83.0, 91.0, 94.0, 71.0, 65.0, 59.0, 40.0, 39.0, 20.0, 22.0, 25.0, 7.0, 7.0, 11.0, 5.0, 9.0, 5.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9054622650146484e-05, -4.7402456402778625e-05, -4.5750290155410767e-05, -4.409812390804291e-05, -4.244595766067505e-05, -4.079379141330719e-05, -3.914162516593933e-05, -3.748945891857147e-05, -3.583729267120361e-05, -3.4185126423835754e-05, -3.2532960176467896e-05, -3.088079392910004e-05, -2.9228627681732178e-05, -2.757646143436432e-05, -2.592429518699646e-05, -2.42721289396286e-05, -2.2619962692260742e-05, -2.0967796444892883e-05, -1.9315630197525024e-05, -1.7663463950157166e-05, -1.6011297702789307e-05, -1.4359131455421448e-05, -1.2706965208053589e-05, -1.105479896068573e-05, -9.402632713317871e-06, -7.750466465950012e-06, -6.098300218582153e-06, -4.4461339712142944e-06, -2.7939677238464355e-06, -1.1418014764785767e-06, 5.103647708892822e-07, 2.162531018257141e-06, 3.814697265625e-06, 5.466863512992859e-06, 7.119029760360718e-06, 8.771196007728577e-06, 1.0423362255096436e-05, 1.2075528502464294e-05, 1.3727694749832153e-05, 1.5379860997200012e-05, 1.703202724456787e-05, 1.868419349193573e-05, 2.033635973930359e-05, 2.1988525986671448e-05, 2.3640692234039307e-05, 2.5292858481407166e-05, 2.6945024728775024e-05, 2.8597190976142883e-05, 3.0249357223510742e-05, 3.19015234708786e-05, 3.355368971824646e-05, 3.520585596561432e-05, 3.685802221298218e-05, 3.851018846035004e-05, 4.0162354707717896e-05, 4.1814520955085754e-05, 4.346668720245361e-05, 4.511885344982147e-05, 4.677101969718933e-05, 4.842318594455719e-05, 5.007535219192505e-05, 5.172751843929291e-05, 5.3379684686660767e-05, 5.5031850934028625e-05, 5.6684017181396484e-05]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 22.0, 993.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.128461241722107, -1.0280100107192993, -0.9275587201118469, -0.8271074891090393, -0.7266561985015869, -0.6262049674987793, -0.5257537364959717, -0.4253024458885193, -0.32485121488571167, -0.22439995408058167, -0.12394870817661285, -0.023497462272644043, 0.07695379853248596, 0.17740505933761597, 0.2778562903404236, 0.378307580947876, 0.4787588119506836, 0.5792100429534912, 0.6796613335609436, 0.7801125645637512, 0.8805638551712036, 0.9810150861740112, 1.0814663171768188, 1.181917667388916, 1.2823688983917236, 1.3828201293945312, 1.4832713603973389, 1.5837225914001465, 1.6841739416122437, 1.7846251726150513, 1.8850764036178589, 1.985527753829956, 2.0859787464141846, 2.186429977416992, 2.2868812084198, 2.3873324394226074, 2.487783670425415, 2.5882349014282227, 2.6886863708496094, 2.789137601852417, 2.8895888328552246, 2.9900400638580322, 3.09049129486084, 3.1909425258636475, 3.291393756866455, 3.391845226287842, 3.4922962188720703, 3.592747688293457, 3.6931986808776855, 3.793649911880493, 3.894101142883301, 3.9945523738861084, 4.095003604888916, 4.195455074310303, 4.295906066894531, 4.396357536315918, 4.496809005737305, 4.597260475158691, 4.69771146774292, 4.798162937164307, 4.898613929748535, 4.999065399169922, 5.09951639175415, 5.199967861175537, 5.300418853759766]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 5.0, 7.0, 7.0, 8.0, 21.0, 28.0, 43.0, 60.0, 81.0, 91.0, 102.0, 117.0, 119.0, 92.0, 65.0, 47.0, 30.0, 16.0, 16.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.0344904661178589, -1.0088820457458496, -0.9832736253738403, -0.957665205001831, -0.9320568442344666, -0.9064484238624573, -0.880840003490448, -0.8552315831184387, -0.8296232223510742, -0.8040148019790649, -0.7784063816070557, -0.7527979612350464, -0.7271896004676819, -0.7015811800956726, -0.6759727597236633, -0.650364339351654, -0.6247559189796448, -0.5991474986076355, -0.5735390782356262, -0.5479307174682617, -0.5223222970962524, -0.49671387672424316, -0.4711054563522339, -0.4454970359802246, -0.4198886454105377, -0.39428022503852844, -0.36867183446884155, -0.3430634140968323, -0.317454993724823, -0.2918466031551361, -0.26623818278312683, -0.24062977731227875, -0.21502143144607544, -0.18941302597522736, -0.16380462050437927, -0.13819620013237, -0.11258779466152191, -0.08697938919067383, -0.06137096881866455, -0.03576256334781647, -0.010154157876968384, 0.015454251319169998, 0.04106266051530838, 0.06667107343673706, 0.09227947890758514, 0.11788788437843323, 0.1434963047504425, 0.1691047102212906, 0.19471311569213867, 0.22032152116298676, 0.24592992663383484, 0.2715383470058441, 0.297146737575531, 0.3227551579475403, 0.34836357831954956, 0.37397199869155884, 0.3995803892612457, 0.425188809633255, 0.4507972002029419, 0.47640562057495117, 0.5020140409469604, 0.5276224613189697, 0.553230881690979, 0.5788392424583435, 0.6044476628303528]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 0.0, 3.0, 6.0, 8.0, 11.0, 12.0, 17.0, 23.0, 41.0, 59.0, 119.0, 169.0, 306.0, 576.0, 1192.0, 2535.0, 6648.0, 38377.0, 4126789.0, 11676.0, 3314.0, 1265.0, 519.0, 263.0, 144.0, 71.0, 52.0, 31.0, 12.0, 16.0, 11.0, 8.0, 4.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2269287109375, -0.21966171264648438, -0.21239471435546875, -0.20512771606445312, -0.1978607177734375, -0.19059371948242188, -0.18332672119140625, -0.17605972290039062, -0.168792724609375, -0.16152572631835938, -0.15425872802734375, -0.14699172973632812, -0.1397247314453125, -0.13245773315429688, -0.12519073486328125, -0.11792373657226562, -0.11065673828125, -0.10338973999023438, -0.09612274169921875, -0.08885574340820312, -0.0815887451171875, -0.07432174682617188, -0.06705474853515625, -0.059787750244140625, -0.052520751953125, -0.045253753662109375, -0.03798675537109375, -0.030719757080078125, -0.0234527587890625, -0.016185760498046875, -0.00891876220703125, -0.001651763916015625, 0.005615234375, 0.012882232666015625, 0.02014923095703125, 0.027416229248046875, 0.0346832275390625, 0.041950225830078125, 0.04921722412109375, 0.056484222412109375, 0.063751220703125, 0.07101821899414062, 0.07828521728515625, 0.08555221557617188, 0.0928192138671875, 0.10008621215820312, 0.10735321044921875, 0.11462020874023438, 0.12188720703125, 0.12915420532226562, 0.13642120361328125, 0.14368820190429688, 0.1509552001953125, 0.15822219848632812, 0.16548919677734375, 0.17275619506835938, 0.180023193359375, 0.18729019165039062, 0.19455718994140625, 0.20182418823242188, 0.2090911865234375, 0.21635818481445312, 0.22362518310546875, 0.23089218139648438, 0.2381591796875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 2.0, 3.0, 6.0, 2.0, 7.0, 2.0, 15.0, 7.0, 14.0, 17.0, 18.0, 130.0, 632.0, 45.0, 18.0, 12.0, 12.0, 12.0, 6.0, 9.0, 4.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021514892578125, -0.02082514762878418, -0.02013540267944336, -0.01944565773010254, -0.01875591278076172, -0.0180661678314209, -0.017376422882080078, -0.016686677932739258, -0.015996932983398438, -0.015307188034057617, -0.014617443084716797, -0.013927698135375977, -0.013237953186035156, -0.012548208236694336, -0.011858463287353516, -0.011168718338012695, -0.010478973388671875, -0.009789228439331055, -0.009099483489990234, -0.008409738540649414, -0.007719993591308594, -0.0070302486419677734, -0.006340503692626953, -0.005650758743286133, -0.0049610137939453125, -0.004271268844604492, -0.003581523895263672, -0.0028917789459228516, -0.0022020339965820312, -0.001512289047241211, -0.0008225440979003906, -0.0001327991485595703, 0.00055694580078125, 0.0012466907501220703, 0.0019364356994628906, 0.002626180648803711, 0.0033159255981445312, 0.0040056705474853516, 0.004695415496826172, 0.005385160446166992, 0.0060749053955078125, 0.006764650344848633, 0.007454395294189453, 0.008144140243530273, 0.008833885192871094, 0.009523630142211914, 0.010213375091552734, 0.010903120040893555, 0.011592864990234375, 0.012282609939575195, 0.012972354888916016, 0.013662099838256836, 0.014351844787597656, 0.015041589736938477, 0.015731334686279297, 0.016421079635620117, 0.017110824584960938, 0.017800569534301758, 0.018490314483642578, 0.0191800594329834, 0.01986980438232422, 0.02055954933166504, 0.02124929428100586, 0.02193903923034668, 0.0226287841796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 7.0, 14.0, 13.0, 16.0, 15.0, 22.0, 27.0, 40.0, 63.0, 74.0, 99.0, 203.0, 391.0, 1049.0, 7661.0, 4132536.0, 48679.0, 2023.0, 562.0, 276.0, 139.0, 85.0, 68.0, 51.0, 33.0, 24.0, 17.0, 12.0, 16.0, 13.0, 12.0, 10.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357177734375, -0.3462677001953125, -0.335357666015625, -0.3244476318359375, -0.31353759765625, -0.3026275634765625, -0.291717529296875, -0.2808074951171875, -0.2698974609375, -0.2589874267578125, -0.248077392578125, -0.2371673583984375, -0.22625732421875, -0.2153472900390625, -0.204437255859375, -0.1935272216796875, -0.1826171875, -0.1717071533203125, -0.160797119140625, -0.1498870849609375, -0.13897705078125, -0.1280670166015625, -0.117156982421875, -0.1062469482421875, -0.0953369140625, -0.0844268798828125, -0.073516845703125, -0.0626068115234375, -0.05169677734375, -0.0407867431640625, -0.029876708984375, -0.0189666748046875, -0.008056640625, 0.0028533935546875, 0.013763427734375, 0.0246734619140625, 0.03558349609375, 0.0464935302734375, 0.057403564453125, 0.0683135986328125, 0.0792236328125, 0.0901336669921875, 0.101043701171875, 0.1119537353515625, 0.12286376953125, 0.1337738037109375, 0.144683837890625, 0.1555938720703125, 0.16650390625, 0.1774139404296875, 0.188323974609375, 0.1992340087890625, 0.21014404296875, 0.2210540771484375, 0.231964111328125, 0.2428741455078125, 0.2537841796875, 0.2646942138671875, 0.275604248046875, 0.2865142822265625, 0.29742431640625, 0.3083343505859375, 0.319244384765625, 0.3301544189453125, 0.341064453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 8.0, 6.0, 7.0, 9.0, 11.0, 9.0, 15.0, 20.0, 20.0, 27.0, 40.0, 51.0, 73.0, 86.0, 136.0, 486.0, 2588.0, 148.0, 90.0, 63.0, 48.0, 24.0, 16.0, 15.0, 19.0, 10.0, 2.0, 9.0, 1.0, 5.0, 5.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052825927734375, -0.05136442184448242, -0.049902915954589844, -0.048441410064697266, -0.04697990417480469, -0.04551839828491211, -0.04405689239501953, -0.04259538650512695, -0.041133880615234375, -0.0396723747253418, -0.03821086883544922, -0.03674936294555664, -0.03528785705566406, -0.033826351165771484, -0.032364845275878906, -0.030903339385986328, -0.02944183349609375, -0.027980327606201172, -0.026518821716308594, -0.025057315826416016, -0.023595809936523438, -0.02213430404663086, -0.02067279815673828, -0.019211292266845703, -0.017749786376953125, -0.016288280487060547, -0.014826774597167969, -0.01336526870727539, -0.011903762817382812, -0.010442256927490234, -0.008980751037597656, -0.007519245147705078, -0.0060577392578125, -0.004596233367919922, -0.0031347274780273438, -0.0016732215881347656, -0.0002117156982421875, 0.0012497901916503906, 0.0027112960815429688, 0.004172801971435547, 0.005634307861328125, 0.007095813751220703, 0.008557319641113281, 0.01001882553100586, 0.011480331420898438, 0.012941837310791016, 0.014403343200683594, 0.015864849090576172, 0.01732635498046875, 0.018787860870361328, 0.020249366760253906, 0.021710872650146484, 0.023172378540039062, 0.02463388442993164, 0.02609539031982422, 0.027556896209716797, 0.029018402099609375, 0.030479907989501953, 0.03194141387939453, 0.03340291976928711, 0.03486442565917969, 0.036325931549072266, 0.037787437438964844, 0.03924894332885742, 0.04071044921875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 52.0, 962.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4700276553630829, -0.43908369541168213, -0.40813976526260376, -0.377195805311203, -0.34625184535980225, -0.3153079152107239, -0.2843639552593231, -0.25341999530792236, -0.222476065158844, -0.19153212010860443, -0.16058817505836487, -0.1296442151069641, -0.09870027005672455, -0.06775632500648499, -0.03681236505508423, -0.0058684200048446655, 0.025075525045394897, 0.05601947382092476, 0.08696342259645462, 0.11790737509727478, 0.14885132014751434, 0.1797952651977539, 0.21073922514915466, 0.24168317019939423, 0.2726271152496338, 0.30357107520103455, 0.3345150053501129, 0.36545896530151367, 0.39640289545059204, 0.4273468554019928, 0.45829081535339355, 0.4892347455024719, 0.5201786756515503, 0.5511226058006287, 0.5820665955543518, 0.6130105257034302, 0.6439544558525085, 0.6748983860015869, 0.7058423757553101, 0.7367863059043884, 0.7677302360534668, 0.7986741662025452, 0.8296181559562683, 0.8605620861053467, 0.891506016254425, 0.9224499464035034, 0.9533939361572266, 0.9843378663063049, 1.0152819156646729, 1.046225905418396, 1.0771697759628296, 1.1081137657165527, 1.1390577554702759, 1.1700016260147095, 1.2009456157684326, 1.2318896055221558, 1.2628334760665894, 1.2937774658203125, 1.324721336364746, 1.3556653261184692, 1.3866093158721924, 1.417553186416626, 1.4484971761703491, 1.4794411659240723, 1.5103850364685059]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 15.0, 16.0, 17.0, 26.0, 40.0, 63.0, 63.0, 93.0, 88.0, 90.0, 90.0, 103.0, 76.0, 52.0, 47.0, 36.0, 25.0, 14.0, 11.0, 10.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31139427423477173, -0.30238795280456543, -0.29338163137435913, -0.28437530994415283, -0.27536898851394653, -0.26636266708374023, -0.25735634565353394, -0.24834999442100525, -0.23934367299079895, -0.23033735156059265, -0.22133103013038635, -0.21232470870018005, -0.20331837236881256, -0.19431205093860626, -0.18530572950839996, -0.17629939317703247, -0.16729308664798737, -0.15828676521778107, -0.14928044378757477, -0.14027410745620728, -0.13126778602600098, -0.12226146459579468, -0.11325514316558838, -0.10424881428480148, -0.09524249285459518, -0.08623617142438889, -0.07722984254360199, -0.06822352111339569, -0.059217195957899094, -0.050210870802402496, -0.0412045493721962, -0.0321982204914093, -0.023191899061203003, -0.01418557483702898, -0.005179250612854958, 0.0038270726799964905, 0.012833397835493088, 0.021839722990989685, 0.030846044421195984, 0.03985237330198288, 0.04885869473218918, 0.057865019887685776, 0.06687134504318237, 0.07587766647338867, 0.08488398790359497, 0.09389031678438187, 0.10289663821458817, 0.11190296709537506, 0.12090928852558136, 0.12991560995578766, 0.13892193138599396, 0.14792826771736145, 0.15693458914756775, 0.16594091057777405, 0.17494723200798035, 0.18395355343818665, 0.19295987486839294, 0.20196619629859924, 0.21097251772880554, 0.21997883915901184, 0.22898517549037933, 0.23799149692058563, 0.24699781835079193, 0.2560041546821594, 0.2650104761123657]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 10.0, 9.0, 15.0, 12.0, 23.0, 29.0, 34.0, 56.0, 67.0, 92.0, 123.0, 182.0, 276.0, 409.0, 578.0, 919.0, 1541.0, 2599.0, 4915.0, 10643.0, 30571.0, 907988.0, 58795.0, 14289.0, 6205.0, 3191.0, 1801.0, 1085.0, 651.0, 483.0, 284.0, 192.0, 144.0, 98.0, 73.0, 56.0, 29.0, 18.0, 14.0, 15.0, 8.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.066436767578125, -0.06427001953125, -0.062103271484375, -0.0599365234375, -0.057769775390625, -0.05560302734375, -0.053436279296875, -0.05126953125, -0.049102783203125, -0.04693603515625, -0.044769287109375, -0.0426025390625, -0.040435791015625, -0.03826904296875, -0.036102294921875, -0.033935546875, -0.031768798828125, -0.02960205078125, -0.027435302734375, -0.0252685546875, -0.023101806640625, -0.02093505859375, -0.018768310546875, -0.0166015625, -0.014434814453125, -0.01226806640625, -0.010101318359375, -0.0079345703125, -0.005767822265625, -0.00360107421875, -0.001434326171875, 0.000732421875, 0.002899169921875, 0.00506591796875, 0.007232666015625, 0.0093994140625, 0.011566162109375, 0.01373291015625, 0.015899658203125, 0.01806640625, 0.020233154296875, 0.02239990234375, 0.024566650390625, 0.0267333984375, 0.028900146484375, 0.03106689453125, 0.033233642578125, 0.035400390625, 0.037567138671875, 0.03973388671875, 0.041900634765625, 0.0440673828125, 0.046234130859375, 0.04840087890625, 0.050567626953125, 0.052734375, 0.054901123046875, 0.05706787109375, 0.059234619140625, 0.0614013671875, 0.063568115234375, 0.06573486328125, 0.067901611328125, 0.070068359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 8.0, 0.0, 4.0, 3.0, 4.0, 5.0, 6.0, 3.0, 13.0, 5.0, 13.0, 16.0, 16.0, 60.0, 395.0, 326.0, 36.0, 17.0, 9.0, 13.0, 11.0, 8.0, 8.0, 4.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185546875, -0.01797032356262207, -0.01738595962524414, -0.01680159568786621, -0.01621723175048828, -0.01563286781311035, -0.015048503875732422, -0.014464139938354492, -0.013879776000976562, -0.013295412063598633, -0.012711048126220703, -0.012126684188842773, -0.011542320251464844, -0.010957956314086914, -0.010373592376708984, -0.009789228439331055, -0.009204864501953125, -0.008620500564575195, -0.008036136627197266, -0.007451772689819336, -0.006867408752441406, -0.0062830448150634766, -0.005698680877685547, -0.005114316940307617, -0.0045299530029296875, -0.003945589065551758, -0.003361225128173828, -0.0027768611907958984, -0.0021924972534179688, -0.001608133316040039, -0.0010237693786621094, -0.0004394054412841797, 0.00014495849609375, 0.0007293224334716797, 0.0013136863708496094, 0.001898050308227539, 0.0024824142456054688, 0.0030667781829833984, 0.003651142120361328, 0.004235506057739258, 0.0048198699951171875, 0.005404233932495117, 0.005988597869873047, 0.0065729618072509766, 0.007157325744628906, 0.007741689682006836, 0.008326053619384766, 0.008910417556762695, 0.009494781494140625, 0.010079145431518555, 0.010663509368896484, 0.011247873306274414, 0.011832237243652344, 0.012416601181030273, 0.013000965118408203, 0.013585329055786133, 0.014169692993164062, 0.014754056930541992, 0.015338420867919922, 0.01592278480529785, 0.01650714874267578, 0.01709151268005371, 0.01767587661743164, 0.01826024055480957, 0.0188446044921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 8.0, 5.0, 10.0, 17.0, 20.0, 27.0, 29.0, 30.0, 56.0, 60.0, 73.0, 81.0, 134.0, 121.0, 168.0, 208.0, 335.0, 894.0, 6846.0, 892135.0, 142360.0, 3064.0, 649.0, 262.0, 204.0, 130.0, 130.0, 94.0, 66.0, 76.0, 59.0, 47.0, 29.0, 32.0, 16.0, 22.0, 12.0, 10.0, 8.0, 8.0, 5.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.169189453125, -0.16403770446777344, -0.15888595581054688, -0.1537342071533203, -0.14858245849609375, -0.1434307098388672, -0.13827896118164062, -0.13312721252441406, -0.1279754638671875, -0.12282371520996094, -0.11767196655273438, -0.11252021789550781, -0.10736846923828125, -0.10221672058105469, -0.09706497192382812, -0.09191322326660156, -0.086761474609375, -0.08160972595214844, -0.07645797729492188, -0.07130622863769531, -0.06615447998046875, -0.06100273132324219, -0.055850982666015625, -0.05069923400878906, -0.0455474853515625, -0.04039573669433594, -0.035243988037109375, -0.030092239379882812, -0.02494049072265625, -0.019788742065429688, -0.014636993408203125, -0.009485244750976562, -0.00433349609375, 0.0008182525634765625, 0.005970001220703125, 0.011121749877929688, 0.01627349853515625, 0.021425247192382812, 0.026576995849609375, 0.03172874450683594, 0.0368804931640625, 0.04203224182128906, 0.047183990478515625, 0.05233573913574219, 0.05748748779296875, 0.06263923645019531, 0.06779098510742188, 0.07294273376464844, 0.078094482421875, 0.08324623107910156, 0.08839797973632812, 0.09354972839355469, 0.09870147705078125, 0.10385322570800781, 0.10900497436523438, 0.11415672302246094, 0.1193084716796875, 0.12446022033691406, 0.12961196899414062, 0.1347637176513672, 0.13991546630859375, 0.1450672149658203, 0.15021896362304688, 0.15537071228027344, 0.1605224609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 7.0, 10.0, 14.0, 14.0, 16.0, 10.0, 18.0, 29.0, 33.0, 33.0, 47.0, 27.0, 42.0, 45.0, 38.0, 35.0, 46.0, 39.0, 47.0, 48.0, 37.0, 39.0, 39.0, 35.0, 42.0, 24.0, 24.0, 27.0, 24.0, 20.0, 12.0, 19.0, 7.0, 15.0, 7.0, 7.0, 4.0, 6.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.053863525390625, -0.05222320556640625, -0.0505828857421875, -0.04894256591796875, -0.04730224609375, -0.04566192626953125, -0.0440216064453125, -0.04238128662109375, -0.040740966796875, -0.03910064697265625, -0.0374603271484375, -0.03582000732421875, -0.0341796875, -0.03253936767578125, -0.0308990478515625, -0.02925872802734375, -0.027618408203125, -0.02597808837890625, -0.0243377685546875, -0.02269744873046875, -0.02105712890625, -0.01941680908203125, -0.0177764892578125, -0.01613616943359375, -0.014495849609375, -0.01285552978515625, -0.0112152099609375, -0.00957489013671875, -0.0079345703125, -0.00629425048828125, -0.0046539306640625, -0.00301361083984375, -0.001373291015625, 0.00026702880859375, 0.0019073486328125, 0.00354766845703125, 0.00518798828125, 0.00682830810546875, 0.0084686279296875, 0.01010894775390625, 0.011749267578125, 0.01338958740234375, 0.0150299072265625, 0.01667022705078125, 0.018310546875, 0.01995086669921875, 0.0215911865234375, 0.02323150634765625, 0.024871826171875, 0.02651214599609375, 0.0281524658203125, 0.02979278564453125, 0.03143310546875, 0.03307342529296875, 0.0347137451171875, 0.03635406494140625, 0.037994384765625, 0.03963470458984375, 0.0412750244140625, 0.04291534423828125, 0.0445556640625, 0.04619598388671875, 0.0478363037109375, 0.04947662353515625, 0.051116943359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 12.0, 16.0, 23.0, 62.0, 62.0, 82.0, 158.0, 277.0, 579.0, 1487.0, 8230.0, 992684.0, 40439.0, 2682.0, 822.0, 377.0, 250.0, 120.0, 66.0, 39.0, 24.0, 15.0, 11.0, 12.0, 7.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002751350402832031, -0.0002672094851732254, -0.0002592839300632477, -0.00025135837495326996, -0.00024343281984329224, -0.00023550726473331451, -0.0002275817096233368, -0.00021965615451335907, -0.00021173059940338135, -0.00020380504429340363, -0.0001958794891834259, -0.00018795393407344818, -0.00018002837896347046, -0.00017210282385349274, -0.00016417726874351501, -0.0001562517136335373, -0.00014832615852355957, -0.00014040060341358185, -0.00013247504830360413, -0.0001245494931936264, -0.00011662393808364868, -0.00010869838297367096, -0.00010077282786369324, -9.284727275371552e-05, -8.492171764373779e-05, -7.699616253376007e-05, -6.907060742378235e-05, -6.114505231380463e-05, -5.3219497203826904e-05, -4.529394209384918e-05, -3.736838698387146e-05, -2.9442831873893738e-05, -2.1517276763916016e-05, -1.3591721653938293e-05, -5.666166543960571e-06, 2.259388566017151e-06, 1.0184943675994873e-05, 1.8110498785972595e-05, 2.6036053895950317e-05, 3.396160900592804e-05, 4.188716411590576e-05, 4.9812719225883484e-05, 5.7738274335861206e-05, 6.566382944583893e-05, 7.358938455581665e-05, 8.151493966579437e-05, 8.94404947757721e-05, 9.736604988574982e-05, 0.00010529160499572754, 0.00011321716010570526, 0.00012114271521568298, 0.0001290682703256607, 0.00013699382543563843, 0.00014491938054561615, 0.00015284493565559387, 0.0001607704907655716, 0.00016869604587554932, 0.00017662160098552704, 0.00018454715609550476, 0.00019247271120548248, 0.0002003982663154602, 0.00020832382142543793, 0.00021624937653541565, 0.00022417493164539337, 0.0002321004867553711]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 7.0, 11.0, 10.0, 25.0, 28.0, 42.0, 65.0, 74.0, 94.0, 73.0, 118.0, 89.0, 102.0, 55.0, 50.0, 42.0, 29.0, 16.0, 12.0, 14.0, 4.0, 5.0, 6.0, 10.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.477588951587677e-06, -7.266178727149963e-06, -7.05476850271225e-06, -6.843358278274536e-06, -6.6319480538368225e-06, -6.420537829399109e-06, -6.209127604961395e-06, -5.997717380523682e-06, -5.786307156085968e-06, -5.574896931648254e-06, -5.363486707210541e-06, -5.152076482772827e-06, -4.9406662583351135e-06, -4.7292560338974e-06, -4.517845809459686e-06, -4.306435585021973e-06, -4.095025360584259e-06, -3.883615136146545e-06, -3.6722049117088318e-06, -3.460794687271118e-06, -3.2493844628334045e-06, -3.037974238395691e-06, -2.8265640139579773e-06, -2.6151537895202637e-06, -2.40374356508255e-06, -2.1923333406448364e-06, -1.980923116207123e-06, -1.7695128917694092e-06, -1.5581026673316956e-06, -1.346692442893982e-06, -1.1352822184562683e-06, -9.238719940185547e-07, -7.124617695808411e-07, -5.010515451431274e-07, -2.896413207054138e-07, -7.82310962677002e-08, 1.3317912817001343e-07, 3.4458935260772705e-07, 5.559995770454407e-07, 7.674098014831543e-07, 9.78820025920868e-07, 1.1902302503585815e-06, 1.4016404747962952e-06, 1.6130506992340088e-06, 1.8244609236717224e-06, 2.035871148109436e-06, 2.2472813725471497e-06, 2.4586915969848633e-06, 2.670101821422577e-06, 2.8815120458602905e-06, 3.092922270298004e-06, 3.3043324947357178e-06, 3.5157427191734314e-06, 3.727152943611145e-06, 3.938563168048859e-06, 4.149973392486572e-06, 4.361383616924286e-06, 4.5727938413619995e-06, 4.784204065799713e-06, 4.995614290237427e-06, 5.20702451467514e-06, 5.418434739112854e-06, 5.629844963550568e-06, 5.841255187988281e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 8.0, 9.0, 18.0, 24.0, 28.0, 64.0, 75.0, 134.0, 257.0, 751.0, 15056.0, 1028984.0, 2182.0, 417.0, 207.0, 120.0, 70.0, 45.0, 32.0, 21.0, 15.0, 12.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00038933753967285156, -0.0003788955509662628, -0.00036845356225967407, -0.00035801157355308533, -0.0003475695848464966, -0.00033712759613990784, -0.0003266856074333191, -0.00031624361872673035, -0.0003058016300201416, -0.00029535964131355286, -0.0002849176526069641, -0.00027447566390037537, -0.0002640336751937866, -0.0002535916864871979, -0.00024314969778060913, -0.00023270770907402039, -0.00022226572036743164, -0.0002118237316608429, -0.00020138174295425415, -0.0001909397542476654, -0.00018049776554107666, -0.00017005577683448792, -0.00015961378812789917, -0.00014917179942131042, -0.00013872981071472168, -0.00012828782200813293, -0.00011784583330154419, -0.00010740384459495544, -9.69618558883667e-05, -8.651986718177795e-05, -7.607787847518921e-05, -6.563588976860046e-05, -5.519390106201172e-05, -4.4751912355422974e-05, -3.430992364883423e-05, -2.3867934942245483e-05, -1.3425946235656738e-05, -2.983957529067993e-06, 7.458031177520752e-06, 1.7900019884109497e-05, 2.8342008590698242e-05, 3.878399729728699e-05, 4.922598600387573e-05, 5.966797471046448e-05, 7.010996341705322e-05, 8.055195212364197e-05, 9.099394083023071e-05, 0.00010143592953681946, 0.0001118779182434082, 0.00012231990694999695, 0.0001327618956565857, 0.00014320388436317444, 0.00015364587306976318, 0.00016408786177635193, 0.00017452985048294067, 0.00018497183918952942, 0.00019541382789611816, 0.0002058558166027069, 0.00021629780530929565, 0.0002267397940158844, 0.00023718178272247314, 0.0002476237714290619, 0.00025806576013565063, 0.0002685077488422394, 0.0002789497375488281]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 8.0, 9.0, 8.0, 24.0, 18.0, 28.0, 40.0, 65.0, 91.0, 119.0, 123.0, 106.0, 84.0, 68.0, 61.0, 41.0, 27.0, 20.0, 13.0, 13.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.0001239776611328125, -0.00012112874537706375, -0.000118279829621315, -0.00011543091386556625, -0.0001125819981098175, -0.00010973308235406876, -0.00010688416659832001, -0.00010403525084257126, -0.00010118633508682251, -9.833741933107376e-05, -9.548850357532501e-05, -9.263958781957626e-05, -8.979067206382751e-05, -8.694175630807877e-05, -8.409284055233002e-05, -8.124392479658127e-05, -7.839500904083252e-05, -7.554609328508377e-05, -7.269717752933502e-05, -6.984826177358627e-05, -6.699934601783752e-05, -6.415043026208878e-05, -6.130151450634003e-05, -5.845259875059128e-05, -5.560368299484253e-05, -5.275476723909378e-05, -4.990585148334503e-05, -4.705693572759628e-05, -4.4208019971847534e-05, -4.1359104216098785e-05, -3.851018846035004e-05, -3.566127270460129e-05, -3.281235694885254e-05, -2.996344119310379e-05, -2.711452543735504e-05, -2.4265609681606293e-05, -2.1416693925857544e-05, -1.8567778170108795e-05, -1.5718862414360046e-05, -1.2869946658611298e-05, -1.0021030902862549e-05, -7.1721151471138e-06, -4.323199391365051e-06, -1.4742836356163025e-06, 1.3746321201324463e-06, 4.223547875881195e-06, 7.072463631629944e-06, 9.921379387378693e-06, 1.2770295143127441e-05, 1.561921089887619e-05, 1.846812665462494e-05, 2.1317042410373688e-05, 2.4165958166122437e-05, 2.7014873921871185e-05, 2.9863789677619934e-05, 3.271270543336868e-05, 3.556162118911743e-05, 3.841053694486618e-05, 4.125945270061493e-05, 4.410836845636368e-05, 4.695728421211243e-05, 4.9806199967861176e-05, 5.2655115723609924e-05, 5.550403147935867e-05, 5.835294723510742e-05]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 86.0, 920.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.172924280166626, -1.1366114616394043, -1.1002987623214722, -1.06398606300354, -1.0276732444763184, -0.9913604855537415, -0.9550477266311646, -0.9187349677085876, -0.8824222087860107, -0.8461094498634338, -0.8097966909408569, -0.77348393201828, -0.7371711730957031, -0.7008584141731262, -0.6645456552505493, -0.6282328963279724, -0.5919201374053955, -0.5556073784828186, -0.5192946195602417, -0.4829818606376648, -0.4466691017150879, -0.410356342792511, -0.3740435838699341, -0.3377308249473572, -0.3014180660247803, -0.26510530710220337, -0.22879254817962646, -0.19247978925704956, -0.15616703033447266, -0.11985427141189575, -0.08354151248931885, -0.04722875356674194, -0.01091611385345459, 0.025396645069122314, 0.06170940399169922, 0.09802216291427612, 0.13433492183685303, 0.17064768075942993, 0.20696043968200684, 0.24327319860458374, 0.27958595752716064, 0.31589871644973755, 0.35221147537231445, 0.38852423429489136, 0.42483699321746826, 0.46114975214004517, 0.49746251106262207, 0.533775269985199, 0.5700880289077759, 0.6064007878303528, 0.6427135467529297, 0.6790263056755066, 0.7153390645980835, 0.7516518235206604, 0.7879645824432373, 0.8242773413658142, 0.8605901002883911, 0.896902859210968, 0.9332156181335449, 0.9695283770561218, 1.0058411359786987, 1.0421538352966309, 1.0784666538238525, 1.1147794723510742, 1.1510921716690063]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 6.0, 24.0, 24.0, 11.0, 24.0, 26.0, 40.0, 36.0, 48.0, 50.0, 41.0, 43.0, 56.0, 59.0, 64.0, 59.0, 36.0, 55.0, 51.0, 41.0, 44.0, 24.0, 21.0, 20.0, 16.0, 21.0, 20.0, 6.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4240266680717468, -0.41023263335227966, -0.3964385986328125, -0.38264456391334534, -0.3688505291938782, -0.3550565242767334, -0.34126245975494385, -0.3274684548377991, -0.3136744201183319, -0.29988038539886475, -0.2860863506793976, -0.2722923159599304, -0.25849828124046326, -0.2447042614221573, -0.23091022670269012, -0.21711620688438416, -0.2033221572637558, -0.18952812254428864, -0.17573408782482147, -0.1619400680065155, -0.14814603328704834, -0.13435199856758118, -0.12055796384811401, -0.10676393657922745, -0.09296990185976028, -0.07917586714029312, -0.06538183987140656, -0.05158780515193939, -0.03779377415776253, -0.023999743163585663, -0.0102057084441185, 0.0035883188247680664, 0.01738235354423523, 0.031176384538412094, 0.04497041553258896, 0.05876445025205612, 0.07255847752094269, 0.08635251224040985, 0.10014654695987701, 0.11394057422876358, 0.12773460149765015, 0.1415286362171173, 0.15532267093658447, 0.16911670565605164, 0.1829107254743576, 0.19670476019382477, 0.21049879491329193, 0.2242928147315979, 0.23808686435222626, 0.2518808841705322, 0.2656749188899994, 0.27946895360946655, 0.2932629883289337, 0.3070570230484009, 0.32085105776786804, 0.3346450924873352, 0.34843912720680237, 0.36223316192626953, 0.3760271966457367, 0.38982123136520386, 0.403615266084671, 0.4174093008041382, 0.43120330572128296, 0.4449973404407501, 0.4587913751602173]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 0.0, 6.0, 9.0, 9.0, 9.0, 23.0, 34.0, 64.0, 109.0, 258.0, 735.0, 2978.0, 4179007.0, 9421.0, 1073.0, 287.0, 102.0, 50.0, 35.0, 16.0, 9.0, 4.0, 12.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.2629241943359375, -0.254364013671875, -0.2458038330078125, -0.23724365234375, -0.2286834716796875, -0.220123291015625, -0.2115631103515625, -0.2030029296875, -0.1944427490234375, -0.185882568359375, -0.1773223876953125, -0.16876220703125, -0.1602020263671875, -0.151641845703125, -0.1430816650390625, -0.134521484375, -0.1259613037109375, -0.117401123046875, -0.1088409423828125, -0.10028076171875, -0.0917205810546875, -0.083160400390625, -0.0746002197265625, -0.0660400390625, -0.0574798583984375, -0.048919677734375, -0.0403594970703125, -0.03179931640625, -0.0232391357421875, -0.014678955078125, -0.0061187744140625, 0.00244140625, 0.0110015869140625, 0.019561767578125, 0.0281219482421875, 0.03668212890625, 0.0452423095703125, 0.053802490234375, 0.0623626708984375, 0.0709228515625, 0.0794830322265625, 0.088043212890625, 0.0966033935546875, 0.10516357421875, 0.1137237548828125, 0.122283935546875, 0.1308441162109375, 0.139404296875, 0.1479644775390625, 0.156524658203125, 0.1650848388671875, 0.17364501953125, 0.1822052001953125, 0.190765380859375, 0.1993255615234375, 0.2078857421875, 0.2164459228515625, 0.225006103515625, 0.2335662841796875, 0.24212646484375, 0.2506866455078125, 0.259246826171875, 0.2678070068359375, 0.2763671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 0.0, 4.0, 7.0, 3.0, 1.0, 7.0, 9.0, 11.0, 13.0, 14.0, 20.0, 73.0, 389.0, 297.0, 52.0, 20.0, 8.0, 15.0, 11.0, 7.0, 6.0, 2.0, 7.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0180511474609375, -0.017482280731201172, -0.016913414001464844, -0.016344547271728516, -0.015775680541992188, -0.01520681381225586, -0.014637947082519531, -0.014069080352783203, -0.013500213623046875, -0.012931346893310547, -0.012362480163574219, -0.01179361343383789, -0.011224746704101562, -0.010655879974365234, -0.010087013244628906, -0.009518146514892578, -0.00894927978515625, -0.008380413055419922, -0.007811546325683594, -0.007242679595947266, -0.0066738128662109375, -0.006104946136474609, -0.005536079406738281, -0.004967212677001953, -0.004398345947265625, -0.003829479217529297, -0.0032606124877929688, -0.0026917457580566406, -0.0021228790283203125, -0.0015540122985839844, -0.0009851455688476562, -0.0004162788391113281, 0.000152587890625, 0.0007214546203613281, 0.0012903213500976562, 0.0018591880798339844, 0.0024280548095703125, 0.0029969215393066406, 0.0035657882690429688, 0.004134654998779297, 0.004703521728515625, 0.005272388458251953, 0.005841255187988281, 0.006410121917724609, 0.0069789886474609375, 0.007547855377197266, 0.008116722106933594, 0.008685588836669922, 0.00925445556640625, 0.009823322296142578, 0.010392189025878906, 0.010961055755615234, 0.011529922485351562, 0.01209878921508789, 0.012667655944824219, 0.013236522674560547, 0.013805389404296875, 0.014374256134033203, 0.014943122863769531, 0.01551198959350586, 0.016080856323242188, 0.016649723052978516, 0.017218589782714844, 0.017787456512451172, 0.0183563232421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 14.0, 7.0, 12.0, 7.0, 18.0, 27.0, 24.0, 25.0, 44.0, 61.0, 89.0, 103.0, 239.0, 680.0, 5916.0, 4168043.0, 17028.0, 1078.0, 340.0, 165.0, 91.0, 72.0, 38.0, 31.0, 23.0, 22.0, 21.0, 7.0, 9.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.180908203125, -0.1743640899658203, -0.16781997680664062, -0.16127586364746094, -0.15473175048828125, -0.14818763732910156, -0.14164352416992188, -0.1350994110107422, -0.1285552978515625, -0.12201118469238281, -0.11546707153320312, -0.10892295837402344, -0.10237884521484375, -0.09583473205566406, -0.08929061889648438, -0.08274650573730469, -0.076202392578125, -0.06965827941894531, -0.06311416625976562, -0.05657005310058594, -0.05002593994140625, -0.04348182678222656, -0.036937713623046875, -0.030393600463867188, -0.0238494873046875, -0.017305374145507812, -0.010761260986328125, -0.0042171478271484375, 0.00232696533203125, 0.008871078491210938, 0.015415191650390625, 0.021959304809570312, 0.02850341796875, 0.03504753112792969, 0.041591644287109375, 0.04813575744628906, 0.05467987060546875, 0.06122398376464844, 0.06776809692382812, 0.07431221008300781, 0.0808563232421875, 0.08740043640136719, 0.09394454956054688, 0.10048866271972656, 0.10703277587890625, 0.11357688903808594, 0.12012100219726562, 0.1266651153564453, 0.133209228515625, 0.1397533416748047, 0.14629745483398438, 0.15284156799316406, 0.15938568115234375, 0.16592979431152344, 0.17247390747070312, 0.1790180206298828, 0.1855621337890625, 0.1921062469482422, 0.19865036010742188, 0.20519447326660156, 0.21173858642578125, 0.21828269958496094, 0.22482681274414062, 0.2313709259033203, 0.2379150390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 9.0, 3.0, 7.0, 2.0, 4.0, 8.0, 11.0, 10.0, 20.0, 18.0, 22.0, 24.0, 27.0, 53.0, 193.0, 3206.0, 238.0, 61.0, 35.0, 35.0, 19.0, 9.0, 12.0, 9.0, 7.0, 5.0, 3.0, 3.0, 4.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0270538330078125, -0.026075124740600586, -0.025096416473388672, -0.024117708206176758, -0.023138999938964844, -0.02216029167175293, -0.021181583404541016, -0.0202028751373291, -0.019224166870117188, -0.018245458602905273, -0.01726675033569336, -0.016288042068481445, -0.015309333801269531, -0.014330625534057617, -0.013351917266845703, -0.012373208999633789, -0.011394500732421875, -0.010415792465209961, -0.009437084197998047, -0.008458375930786133, -0.007479667663574219, -0.006500959396362305, -0.005522251129150391, -0.0045435428619384766, -0.0035648345947265625, -0.0025861263275146484, -0.0016074180603027344, -0.0006287097930908203, 0.00034999847412109375, 0.0013287067413330078, 0.002307415008544922, 0.003286123275756836, 0.00426483154296875, 0.005243539810180664, 0.006222248077392578, 0.007200956344604492, 0.008179664611816406, 0.00915837287902832, 0.010137081146240234, 0.011115789413452148, 0.012094497680664062, 0.013073205947875977, 0.01405191421508789, 0.015030622482299805, 0.01600933074951172, 0.016988039016723633, 0.017966747283935547, 0.01894545555114746, 0.019924163818359375, 0.02090287208557129, 0.021881580352783203, 0.022860288619995117, 0.02383899688720703, 0.024817705154418945, 0.02579641342163086, 0.026775121688842773, 0.027753829956054688, 0.0287325382232666, 0.029711246490478516, 0.03068995475769043, 0.031668663024902344, 0.03264737129211426, 0.03362607955932617, 0.034604787826538086, 0.03558349609375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1017.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36682894825935364, -0.3237524628639221, -0.280676007270813, -0.23759952187538147, -0.19452305138111115, -0.15144658088684082, -0.1083700954914093, -0.06529363989830017, -0.022217154502868652, 0.02085931971669197, 0.0639357939362526, 0.10701227188110352, 0.15008874237537384, 0.19316521286964417, 0.23624169826507568, 0.2793181538581848, 0.32239463925361633, 0.36547112464904785, 0.408547580242157, 0.4516240656375885, 0.49470055103302, 0.5377770066261292, 0.5808534622192383, 0.6239299774169922, 0.6670064330101013, 0.7100828886032104, 0.7531594038009644, 0.7962358593940735, 0.8393123149871826, 0.8823888301849365, 0.9254652857780457, 0.9685417413711548, 1.0116182565689087, 1.0546947717666626, 1.097771167755127, 1.1408476829528809, 1.1839241981506348, 1.2270005941390991, 1.270077109336853, 1.3131535053253174, 1.3562300205230713, 1.3993065357208252, 1.4423829317092896, 1.4854594469070435, 1.5285359621047974, 1.5716123580932617, 1.6146888732910156, 1.6577653884887695, 1.7008419036865234, 1.7439184188842773, 1.7869948148727417, 1.8300713300704956, 1.8731478452682495, 1.9162242412567139, 1.9593007564544678, 2.0023772716522217, 2.0454535484313965, 2.0885300636291504, 2.1316065788269043, 2.174683094024658, 2.217759370803833, 2.260835886001587, 2.303912401199341, 2.3469889163970947, 2.3900654315948486]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 8.0, 8.0, 7.0, 8.0, 5.0, 14.0, 20.0, 24.0, 22.0, 18.0, 37.0, 43.0, 57.0, 50.0, 69.0, 68.0, 69.0, 47.0, 71.0, 49.0, 53.0, 39.0, 46.0, 40.0, 22.0, 19.0, 27.0, 20.0, 15.0, 5.0, 8.0, 5.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08975297212600708, -0.086431123316288, -0.08310927450656891, -0.07978742569684982, -0.07646557688713074, -0.07314373552799225, -0.06982188671827316, -0.06650003790855408, -0.06317818909883499, -0.059856340289115906, -0.05653449147939682, -0.05321264639496803, -0.04989079758524895, -0.04656894877552986, -0.043247103691101074, -0.03992525488138199, -0.0366034060716629, -0.03328155726194382, -0.02995971031486988, -0.026637863367795944, -0.02331601455807686, -0.019994165748357773, -0.016672318801283836, -0.0133504718542099, -0.010028623044490814, -0.006706775166094303, -0.003384927287697792, -6.307940930128098e-05, 0.00325876846909523, 0.006580617278814316, 0.009902464225888252, 0.013224311172962189, 0.016546159982681274, 0.01986800879240036, 0.023189855739474297, 0.026511702686548233, 0.02983355149626732, 0.033155400305986404, 0.03647724539041519, 0.03979909420013428, 0.04312094300985336, 0.04644279181957245, 0.049764640629291534, 0.05308648571372032, 0.05640833452343941, 0.05973018333315849, 0.06305202841758728, 0.06637387722730637, 0.06969572603702545, 0.07301757484674454, 0.07633942365646362, 0.07966127246618271, 0.0829831212759018, 0.08630496263504028, 0.08962681144475937, 0.09294866025447845, 0.09627050906419754, 0.09959235787391663, 0.10291420668363571, 0.1062360554933548, 0.10955789685249329, 0.11287975311279297, 0.11620159447193146, 0.11952344328165054, 0.12284529209136963]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 11.0, 7.0, 7.0, 14.0, 17.0, 31.0, 48.0, 56.0, 82.0, 148.0, 230.0, 356.0, 603.0, 944.0, 1752.0, 3354.0, 7005.0, 17669.0, 133361.0, 839572.0, 25092.0, 9028.0, 4060.0, 2122.0, 1176.0, 699.0, 374.0, 257.0, 151.0, 98.0, 74.0, 53.0, 38.0, 22.0, 19.0, 9.0, 3.0, 6.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05902099609375, -0.05718517303466797, -0.05534934997558594, -0.053513526916503906, -0.051677703857421875, -0.049841880798339844, -0.04800605773925781, -0.04617023468017578, -0.04433441162109375, -0.04249858856201172, -0.04066276550292969, -0.038826942443847656, -0.036991119384765625, -0.035155296325683594, -0.03331947326660156, -0.03148365020751953, -0.0296478271484375, -0.02781200408935547, -0.025976181030273438, -0.024140357971191406, -0.022304534912109375, -0.020468711853027344, -0.018632888793945312, -0.01679706573486328, -0.01496124267578125, -0.013125419616699219, -0.011289596557617188, -0.009453773498535156, -0.007617950439453125, -0.005782127380371094, -0.0039463043212890625, -0.0021104812622070312, -0.000274658203125, 0.0015611648559570312, 0.0033969879150390625, 0.005232810974121094, 0.007068634033203125, 0.008904457092285156, 0.010740280151367188, 0.012576103210449219, 0.01441192626953125, 0.01624774932861328, 0.018083572387695312, 0.019919395446777344, 0.021755218505859375, 0.023591041564941406, 0.025426864624023438, 0.02726268768310547, 0.0290985107421875, 0.03093433380126953, 0.03277015686035156, 0.034605979919433594, 0.036441802978515625, 0.038277626037597656, 0.04011344909667969, 0.04194927215576172, 0.04378509521484375, 0.04562091827392578, 0.04745674133300781, 0.049292564392089844, 0.051128387451171875, 0.052964210510253906, 0.05480003356933594, 0.05663585662841797, 0.0584716796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 6.0, 3.0, 4.0, 5.0, 10.0, 8.0, 14.0, 13.0, 20.0, 66.0, 311.0, 344.0, 89.0, 22.0, 9.0, 12.0, 11.0, 8.0, 8.0, 3.0, 7.0, 2.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01763916015625, -0.017086267471313477, -0.016533374786376953, -0.01598048210144043, -0.015427589416503906, -0.014874696731567383, -0.01432180404663086, -0.013768911361694336, -0.013216018676757812, -0.012663125991821289, -0.012110233306884766, -0.011557340621948242, -0.011004447937011719, -0.010451555252075195, -0.009898662567138672, -0.009345769882202148, -0.008792877197265625, -0.008239984512329102, -0.007687091827392578, -0.007134199142456055, -0.006581306457519531, -0.006028413772583008, -0.005475521087646484, -0.004922628402709961, -0.0043697357177734375, -0.003816843032836914, -0.0032639503479003906, -0.002711057662963867, -0.0021581649780273438, -0.0016052722930908203, -0.0010523796081542969, -0.0004994869232177734, 5.340576171875e-05, 0.0006062984466552734, 0.0011591911315917969, 0.0017120838165283203, 0.0022649765014648438, 0.002817869186401367, 0.0033707618713378906, 0.003923654556274414, 0.0044765472412109375, 0.005029439926147461, 0.005582332611083984, 0.006135225296020508, 0.006688117980957031, 0.007241010665893555, 0.007793903350830078, 0.008346796035766602, 0.008899688720703125, 0.009452581405639648, 0.010005474090576172, 0.010558366775512695, 0.011111259460449219, 0.011664152145385742, 0.012217044830322266, 0.012769937515258789, 0.013322830200195312, 0.013875722885131836, 0.01442861557006836, 0.014981508255004883, 0.015534400939941406, 0.01608729362487793, 0.016640186309814453, 0.017193078994750977, 0.0177459716796875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 4.0, 8.0, 10.0, 8.0, 9.0, 16.0, 19.0, 22.0, 27.0, 30.0, 24.0, 29.0, 31.0, 38.0, 53.0, 57.0, 72.0, 95.0, 94.0, 98.0, 129.0, 213.0, 318.0, 562.0, 1462.0, 9754.0, 825654.0, 202029.0, 4819.0, 1061.0, 499.0, 284.0, 195.0, 130.0, 101.0, 96.0, 74.0, 65.0, 53.0, 53.0, 33.0, 36.0, 25.0, 29.0, 30.0, 28.0, 21.0, 19.0, 9.0, 10.0, 10.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.10028076171875, -0.09703254699707031, -0.09378433227539062, -0.09053611755371094, -0.08728790283203125, -0.08403968811035156, -0.08079147338867188, -0.07754325866699219, -0.0742950439453125, -0.07104682922363281, -0.06779861450195312, -0.06455039978027344, -0.06130218505859375, -0.05805397033691406, -0.054805755615234375, -0.05155754089355469, -0.048309326171875, -0.04506111145019531, -0.041812896728515625, -0.03856468200683594, -0.03531646728515625, -0.03206825256347656, -0.028820037841796875, -0.025571823120117188, -0.0223236083984375, -0.019075393676757812, -0.015827178955078125, -0.012578964233398438, -0.00933074951171875, -0.0060825347900390625, -0.002834320068359375, 0.0004138946533203125, 0.003662109375, 0.0069103240966796875, 0.010158538818359375, 0.013406753540039062, 0.01665496826171875, 0.019903182983398438, 0.023151397705078125, 0.026399612426757812, 0.0296478271484375, 0.03289604187011719, 0.036144256591796875, 0.03939247131347656, 0.04264068603515625, 0.04588890075683594, 0.049137115478515625, 0.05238533020019531, 0.055633544921875, 0.05888175964355469, 0.062129974365234375, 0.06537818908691406, 0.06862640380859375, 0.07187461853027344, 0.07512283325195312, 0.07837104797363281, 0.0816192626953125, 0.08486747741699219, 0.08811569213867188, 0.09136390686035156, 0.09461212158203125, 0.09786033630371094, 0.10110855102539062, 0.10435676574707031, 0.10760498046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 9.0, 7.0, 9.0, 9.0, 9.0, 8.0, 8.0, 12.0, 12.0, 20.0, 17.0, 26.0, 32.0, 27.0, 23.0, 25.0, 29.0, 33.0, 40.0, 30.0, 49.0, 38.0, 52.0, 53.0, 44.0, 46.0, 35.0, 47.0, 34.0, 23.0, 22.0, 20.0, 20.0, 18.0, 18.0, 14.0, 14.0, 8.0, 7.0, 13.0, 8.0, 7.0, 9.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03961181640625, -0.03832864761352539, -0.03704547882080078, -0.03576231002807617, -0.03447914123535156, -0.03319597244262695, -0.031912803649902344, -0.030629634857177734, -0.029346466064453125, -0.028063297271728516, -0.026780128479003906, -0.025496959686279297, -0.024213790893554688, -0.022930622100830078, -0.02164745330810547, -0.02036428451538086, -0.01908111572265625, -0.01779794692993164, -0.01651477813720703, -0.015231609344482422, -0.013948440551757812, -0.012665271759033203, -0.011382102966308594, -0.010098934173583984, -0.008815765380859375, -0.007532596588134766, -0.006249427795410156, -0.004966259002685547, -0.0036830902099609375, -0.002399921417236328, -0.0011167526245117188, 0.00016641616821289062, 0.0014495849609375, 0.0027327537536621094, 0.004015922546386719, 0.005299091339111328, 0.0065822601318359375, 0.007865428924560547, 0.009148597717285156, 0.010431766510009766, 0.011714935302734375, 0.012998104095458984, 0.014281272888183594, 0.015564441680908203, 0.016847610473632812, 0.018130779266357422, 0.01941394805908203, 0.02069711685180664, 0.02198028564453125, 0.02326345443725586, 0.02454662322998047, 0.025829792022705078, 0.027112960815429688, 0.028396129608154297, 0.029679298400878906, 0.030962467193603516, 0.032245635986328125, 0.033528804779052734, 0.034811973571777344, 0.03609514236450195, 0.03737831115722656, 0.03866147994995117, 0.03994464874267578, 0.04122781753540039, 0.042510986328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 18.0, 22.0, 24.0, 40.0, 69.0, 117.0, 209.0, 480.0, 1727.0, 26661.0, 1012371.0, 5092.0, 960.0, 345.0, 161.0, 77.0, 49.0, 30.0, 19.0, 14.0, 14.0, 8.0, 7.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00026607513427734375, -0.0002591237425804138, -0.0002521723508834839, -0.00024522095918655396, -0.00023826956748962402, -0.0002313181757926941, -0.00022436678409576416, -0.00021741539239883423, -0.0002104640007019043, -0.00020351260900497437, -0.00019656121730804443, -0.0001896098256111145, -0.00018265843391418457, -0.00017570704221725464, -0.0001687556505203247, -0.00016180425882339478, -0.00015485286712646484, -0.0001479014754295349, -0.00014095008373260498, -0.00013399869203567505, -0.00012704730033874512, -0.00012009590864181519, -0.00011314451694488525, -0.00010619312524795532, -9.924173355102539e-05, -9.229034185409546e-05, -8.533895015716553e-05, -7.83875584602356e-05, -7.143616676330566e-05, -6.448477506637573e-05, -5.75333833694458e-05, -5.058199167251587e-05, -4.363059997558594e-05, -3.6679208278656006e-05, -2.9727816581726074e-05, -2.2776424884796143e-05, -1.582503318786621e-05, -8.87364149093628e-06, -1.9222497940063477e-06, 5.029141902923584e-06, 1.1980533599853516e-05, 1.8931925296783447e-05, 2.588331699371338e-05, 3.283470869064331e-05, 3.978610038757324e-05, 4.6737492084503174e-05, 5.3688883781433105e-05, 6.064027547836304e-05, 6.759166717529297e-05, 7.45430588722229e-05, 8.149445056915283e-05, 8.844584226608276e-05, 9.53972339630127e-05, 0.00010234862565994263, 0.00010930001735687256, 0.00011625140905380249, 0.00012320280075073242, 0.00013015419244766235, 0.00013710558414459229, 0.00014405697584152222, 0.00015100836753845215, 0.00015795975923538208, 0.000164911150932312, 0.00017186254262924194, 0.00017881393432617188]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 11.0, 22.0, 21.0, 23.0, 33.0, 25.0, 35.0, 14.0, 35.0, 51.0, 50.0, 44.0, 62.0, 59.0, 58.0, 38.0, 57.0, 50.0, 40.0, 37.0, 18.0, 27.0, 29.0, 24.0, 11.0, 17.0, 19.0, 9.0, 7.0, 15.0, 7.0, 2.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.635883331298828e-06, -3.5213306546211243e-06, -3.4067779779434204e-06, -3.2922253012657166e-06, -3.1776726245880127e-06, -3.063119947910309e-06, -2.948567271232605e-06, -2.834014594554901e-06, -2.7194619178771973e-06, -2.6049092411994934e-06, -2.4903565645217896e-06, -2.3758038878440857e-06, -2.261251211166382e-06, -2.146698534488678e-06, -2.032145857810974e-06, -1.9175931811332703e-06, -1.8030405044555664e-06, -1.6884878277778625e-06, -1.5739351511001587e-06, -1.4593824744224548e-06, -1.344829797744751e-06, -1.2302771210670471e-06, -1.1157244443893433e-06, -1.0011717677116394e-06, -8.866190910339355e-07, -7.720664143562317e-07, -6.575137376785278e-07, -5.42961061000824e-07, -4.284083843231201e-07, -3.1385570764541626e-07, -1.993030309677124e-07, -8.475035429000854e-08, 2.9802322387695312e-08, 1.4435499906539917e-07, 2.5890767574310303e-07, 3.734603524208069e-07, 4.880130290985107e-07, 6.025657057762146e-07, 7.171183824539185e-07, 8.316710591316223e-07, 9.462237358093262e-07, 1.06077641248703e-06, 1.1753290891647339e-06, 1.2898817658424377e-06, 1.4044344425201416e-06, 1.5189871191978455e-06, 1.6335397958755493e-06, 1.7480924725532532e-06, 1.862645149230957e-06, 1.977197825908661e-06, 2.0917505025863647e-06, 2.2063031792640686e-06, 2.3208558559417725e-06, 2.4354085326194763e-06, 2.54996120929718e-06, 2.664513885974884e-06, 2.779066562652588e-06, 2.8936192393302917e-06, 3.0081719160079956e-06, 3.1227245926856995e-06, 3.2372772693634033e-06, 3.351829946041107e-06, 3.466382622718811e-06, 3.580935299396515e-06, 3.6954879760742188e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 7.0, 13.0, 20.0, 32.0, 45.0, 63.0, 101.0, 205.0, 444.0, 2100.0, 1024700.0, 19364.0, 770.0, 293.0, 133.0, 101.0, 45.0, 37.0, 21.0, 10.0, 7.0, 8.0, 7.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002617835998535156, -0.0002540312707424164, -0.00024627894163131714, -0.0002385266125202179, -0.00023077428340911865, -0.0002230219542980194, -0.00021526962518692017, -0.00020751729607582092, -0.00019976496696472168, -0.00019201263785362244, -0.0001842603087425232, -0.00017650797963142395, -0.0001687556505203247, -0.00016100332140922546, -0.00015325099229812622, -0.00014549866318702698, -0.00013774633407592773, -0.0001299940049648285, -0.00012224167585372925, -0.00011448934674263, -0.00010673701763153076, -9.898468852043152e-05, -9.123235940933228e-05, -8.348003029823303e-05, -7.572770118713379e-05, -6.797537207603455e-05, -6.02230429649353e-05, -5.247071385383606e-05, -4.4718384742736816e-05, -3.696605563163757e-05, -2.921372652053833e-05, -2.1461397409439087e-05, -1.3709068298339844e-05, -5.956739187240601e-06, 1.7955899238586426e-06, 9.547919034957886e-06, 1.730024814605713e-05, 2.5052577257156372e-05, 3.2804906368255615e-05, 4.055723547935486e-05, 4.83095645904541e-05, 5.6061893701553345e-05, 6.381422281265259e-05, 7.156655192375183e-05, 7.931888103485107e-05, 8.707121014595032e-05, 9.482353925704956e-05, 0.0001025758683681488, 0.00011032819747924805, 0.00011808052659034729, 0.00012583285570144653, 0.00013358518481254578, 0.00014133751392364502, 0.00014908984303474426, 0.0001568421721458435, 0.00016459450125694275, 0.000172346830368042, 0.00018009915947914124, 0.00018785148859024048, 0.00019560381770133972, 0.00020335614681243896, 0.0002111084759235382, 0.00021886080503463745, 0.0002266131341457367, 0.00023436546325683594]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 10.0, 12.0, 18.0, 17.0, 26.0, 52.0, 73.0, 105.0, 125.0, 143.0, 127.0, 90.0, 49.0, 42.0, 26.0, 24.0, 14.0, 11.0, 7.0, 6.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0001036524772644043, -0.00010126456618309021, -9.887665510177612e-05, -9.648874402046204e-05, -9.410083293914795e-05, -9.171292185783386e-05, -8.932501077651978e-05, -8.693709969520569e-05, -8.45491886138916e-05, -8.216127753257751e-05, -7.977336645126343e-05, -7.738545536994934e-05, -7.499754428863525e-05, -7.260963320732117e-05, -7.022172212600708e-05, -6.783381104469299e-05, -6.54458999633789e-05, -6.305798888206482e-05, -6.067007780075073e-05, -5.8282166719436646e-05, -5.589425563812256e-05, -5.350634455680847e-05, -5.1118433475494385e-05, -4.87305223941803e-05, -4.634261131286621e-05, -4.3954700231552124e-05, -4.156678915023804e-05, -3.917887806892395e-05, -3.679096698760986e-05, -3.4403055906295776e-05, -3.201514482498169e-05, -2.9627233743667603e-05, -2.7239322662353516e-05, -2.485141158103943e-05, -2.2463500499725342e-05, -2.0075589418411255e-05, -1.7687678337097168e-05, -1.529976725578308e-05, -1.2911856174468994e-05, -1.0523945093154907e-05, -8.13603401184082e-06, -5.748122930526733e-06, -3.3602118492126465e-06, -9.723007678985596e-07, 1.4156103134155273e-06, 3.8035213947296143e-06, 6.191432476043701e-06, 8.579343557357788e-06, 1.0967254638671875e-05, 1.3355165719985962e-05, 1.574307680130005e-05, 1.8130987882614136e-05, 2.0518898963928223e-05, 2.290681004524231e-05, 2.5294721126556396e-05, 2.7682632207870483e-05, 3.007054328918457e-05, 3.245845437049866e-05, 3.4846365451812744e-05, 3.723427653312683e-05, 3.962218761444092e-05, 4.2010098695755005e-05, 4.439800977706909e-05, 4.678592085838318e-05, 4.9173831939697266e-05]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 20.0, 991.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12164776772260666, -0.07050877809524536, -0.019369788467884064, 0.03176919370889664, 0.08290819078683853, 0.13404718041419983, 0.18518614768981934, 0.23632514476776123, 0.2874641418457031, 0.338603138923645, 0.3897421360015869, 0.4408811032772064, 0.4920201003551483, 0.5431591272354126, 0.5942980647087097, 0.6454370617866516, 0.6965760588645935, 0.7477150559425354, 0.7988540530204773, 0.8499929904937744, 0.9011319875717163, 0.9522709846496582, 1.0034099817276, 1.054548978805542, 1.1056879758834839, 1.1568269729614258, 1.2079659700393677, 1.2591049671173096, 1.3102439641952515, 1.3613829612731934, 1.4125218391418457, 1.4636609554290771, 1.5147998332977295, 1.5659388303756714, 1.6170778274536133, 1.6682168245315552, 1.719355821609497, 1.770494818687439, 1.8216338157653809, 1.8727726936340332, 1.9239118099212646, 1.9750508069992065, 2.0261898040771484, 2.077328681945801, 2.1284677982330322, 2.1796066761016846, 2.230745792388916, 2.2818846702575684, 2.3330235481262207, 2.384162425994873, 2.4353015422821045, 2.486440420150757, 2.5375795364379883, 2.5887184143066406, 2.639857530593872, 2.6909964084625244, 2.742135524749756, 2.793274402618408, 2.8444135189056396, 2.895552396774292, 2.9466915130615234, 2.997830390930176, 3.0489695072174072, 3.1001083850860596, 3.151247501373291]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 7.0, 10.0, 7.0, 14.0, 25.0, 19.0, 23.0, 35.0, 22.0, 48.0, 42.0, 44.0, 72.0, 62.0, 62.0, 58.0, 52.0, 46.0, 58.0, 55.0, 48.0, 29.0, 26.0, 31.0, 18.0, 23.0, 20.0, 5.0, 5.0, 9.0, 10.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29127877950668335, -0.27896028757095337, -0.2666417956352234, -0.2543233036994934, -0.24200479686260223, -0.22968630492687225, -0.21736779808998108, -0.2050493061542511, -0.19273081421852112, -0.18041232228279114, -0.16809383034706116, -0.15577532351016998, -0.14345683157444, -0.13113833963871002, -0.11881984025239944, -0.10650134086608887, -0.09418284893035889, -0.0818643569946289, -0.06954585760831833, -0.05722736194729805, -0.04490886628627777, -0.03259037062525749, -0.020271874964237213, -0.007953375577926636, 0.004365116357803345, 0.016683612018823624, 0.029002107679843903, 0.04132060334086418, 0.05363909900188446, 0.06595759093761444, 0.07827609032392502, 0.0905945897102356, 0.10291308164596558, 0.11523157358169556, 0.12755006551742554, 0.1398685723543167, 0.1521870642900467, 0.16450555622577667, 0.17682406306266785, 0.18914255499839783, 0.2014610469341278, 0.2137795388698578, 0.22609803080558777, 0.23841653764247894, 0.2507350444793701, 0.2630535364151001, 0.2753720283508301, 0.28769052028656006, 0.30000901222229004, 0.31232750415802, 0.32464599609375, 0.33696448802948, 0.34928297996520996, 0.36160150170326233, 0.3739199936389923, 0.3862384855747223, 0.39855697751045227, 0.41087546944618225, 0.42319396138191223, 0.4355124533176422, 0.4478309750556946, 0.46014946699142456, 0.47246795892715454, 0.4847864508628845, 0.4971049427986145]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 2.0, 4.0, 8.0, 8.0, 17.0, 19.0, 13.0, 28.0, 49.0, 53.0, 67.0, 110.0, 141.0, 232.0, 340.0, 601.0, 1294.0, 11502.0, 4164692.0, 12449.0, 1203.0, 553.0, 328.0, 197.0, 130.0, 82.0, 43.0, 35.0, 28.0, 13.0, 10.0, 11.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.06447315216064453, -0.06235694885253906, -0.060240745544433594, -0.058124542236328125, -0.056008338928222656, -0.05389213562011719, -0.05177593231201172, -0.04965972900390625, -0.04754352569580078, -0.04542732238769531, -0.043311119079589844, -0.041194915771484375, -0.039078712463378906, -0.03696250915527344, -0.03484630584716797, -0.0327301025390625, -0.03061389923095703, -0.028497695922851562, -0.026381492614746094, -0.024265289306640625, -0.022149085998535156, -0.020032882690429688, -0.01791667938232422, -0.01580047607421875, -0.013684272766113281, -0.011568069458007812, -0.009451866149902344, -0.007335662841796875, -0.005219459533691406, -0.0031032562255859375, -0.0009870529174804688, 0.001129150390625, 0.0032453536987304688, 0.0053615570068359375, 0.007477760314941406, 0.009593963623046875, 0.011710166931152344, 0.013826370239257812, 0.01594257354736328, 0.01805877685546875, 0.02017498016357422, 0.022291183471679688, 0.024407386779785156, 0.026523590087890625, 0.028639793395996094, 0.030755996704101562, 0.03287220001220703, 0.0349884033203125, 0.03710460662841797, 0.03922080993652344, 0.041337013244628906, 0.043453216552734375, 0.045569419860839844, 0.04768562316894531, 0.04980182647705078, 0.05191802978515625, 0.05403423309326172, 0.05615043640136719, 0.058266639709472656, 0.060382843017578125, 0.062499046325683594, 0.06461524963378906, 0.06673145294189453, 0.06884765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 2.0, 6.0, 4.0, 2.0, 10.0, 9.0, 10.0, 10.0, 21.0, 26.0, 149.0, 364.0, 232.0, 54.0, 19.0, 7.0, 16.0, 10.0, 9.0, 5.0, 4.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017303466796875, -0.016755104064941406, -0.016206741333007812, -0.01565837860107422, -0.015110015869140625, -0.014561653137207031, -0.014013290405273438, -0.013464927673339844, -0.01291656494140625, -0.012368202209472656, -0.011819839477539062, -0.011271476745605469, -0.010723114013671875, -0.010174751281738281, -0.009626388549804688, -0.009078025817871094, -0.0085296630859375, -0.007981300354003906, -0.0074329376220703125, -0.006884574890136719, -0.006336212158203125, -0.005787849426269531, -0.0052394866943359375, -0.004691123962402344, -0.00414276123046875, -0.0035943984985351562, -0.0030460357666015625, -0.0024976730346679688, -0.001949310302734375, -0.0014009475708007812, -0.0008525848388671875, -0.00030422210693359375, 0.000244140625, 0.0007925033569335938, 0.0013408660888671875, 0.0018892288208007812, 0.002437591552734375, 0.0029859542846679688, 0.0035343170166015625, 0.004082679748535156, 0.00463104248046875, 0.005179405212402344, 0.0057277679443359375, 0.006276130676269531, 0.006824493408203125, 0.007372856140136719, 0.007921218872070312, 0.008469581604003906, 0.0090179443359375, 0.009566307067871094, 0.010114669799804688, 0.010663032531738281, 0.011211395263671875, 0.011759757995605469, 0.012308120727539062, 0.012856483459472656, 0.01340484619140625, 0.013953208923339844, 0.014501571655273438, 0.015049934387207031, 0.015598297119140625, 0.01614665985107422, 0.016695022583007812, 0.017243385314941406, 0.017791748046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 7.0, 13.0, 18.0, 21.0, 20.0, 22.0, 49.0, 97.0, 140.0, 290.0, 2003.0, 514773.0, 3674205.0, 1881.0, 311.0, 146.0, 74.0, 53.0, 41.0, 19.0, 14.0, 12.0, 11.0, 7.0, 4.0, 7.0, 6.0, 3.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136962890625, -0.13254547119140625, -0.1281280517578125, -0.12371063232421875, -0.119293212890625, -0.11487579345703125, -0.1104583740234375, -0.10604095458984375, -0.10162353515625, -0.09720611572265625, -0.0927886962890625, -0.08837127685546875, -0.083953857421875, -0.07953643798828125, -0.0751190185546875, -0.07070159912109375, -0.0662841796875, -0.06186676025390625, -0.0574493408203125, -0.05303192138671875, -0.048614501953125, -0.04419708251953125, -0.0397796630859375, -0.03536224365234375, -0.03094482421875, -0.02652740478515625, -0.0221099853515625, -0.01769256591796875, -0.013275146484375, -0.00885772705078125, -0.0044403076171875, -2.288818359375e-05, 0.00439453125, 0.00881195068359375, 0.0132293701171875, 0.01764678955078125, 0.022064208984375, 0.02648162841796875, 0.0308990478515625, 0.03531646728515625, 0.03973388671875, 0.04415130615234375, 0.0485687255859375, 0.05298614501953125, 0.057403564453125, 0.06182098388671875, 0.0662384033203125, 0.07065582275390625, 0.0750732421875, 0.07949066162109375, 0.0839080810546875, 0.08832550048828125, 0.092742919921875, 0.09716033935546875, 0.1015777587890625, 0.10599517822265625, 0.11041259765625, 0.11483001708984375, 0.1192474365234375, 0.12366485595703125, 0.128082275390625, 0.13249969482421875, 0.1369171142578125, 0.14133453369140625, 0.145751953125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 15.0, 16.0, 13.0, 17.0, 42.0, 187.0, 3391.0, 214.0, 62.0, 27.0, 15.0, 11.0, 8.0, 6.0, 3.0, 9.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0281524658203125, -0.02731466293334961, -0.02647686004638672, -0.025639057159423828, -0.024801254272460938, -0.023963451385498047, -0.023125648498535156, -0.022287845611572266, -0.021450042724609375, -0.020612239837646484, -0.019774436950683594, -0.018936634063720703, -0.018098831176757812, -0.017261028289794922, -0.01642322540283203, -0.01558542251586914, -0.01474761962890625, -0.01390981674194336, -0.013072013854980469, -0.012234210968017578, -0.011396408081054688, -0.010558605194091797, -0.009720802307128906, -0.008882999420166016, -0.008045196533203125, -0.007207393646240234, -0.006369590759277344, -0.005531787872314453, -0.0046939849853515625, -0.003856182098388672, -0.0030183792114257812, -0.0021805763244628906, -0.0013427734375, -0.0005049705505371094, 0.00033283233642578125, 0.0011706352233886719, 0.0020084381103515625, 0.002846240997314453, 0.0036840438842773438, 0.004521846771240234, 0.005359649658203125, 0.006197452545166016, 0.007035255432128906, 0.007873058319091797, 0.008710861206054688, 0.009548664093017578, 0.010386466979980469, 0.01122426986694336, 0.01206207275390625, 0.01289987564086914, 0.013737678527832031, 0.014575481414794922, 0.015413284301757812, 0.016251087188720703, 0.017088890075683594, 0.017926692962646484, 0.018764495849609375, 0.019602298736572266, 0.020440101623535156, 0.021277904510498047, 0.022115707397460938, 0.022953510284423828, 0.02379131317138672, 0.02462911605834961, 0.0254669189453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 214.0, 797.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39401137828826904, -0.38417524099349976, -0.37433910369873047, -0.36450299620628357, -0.3546668589115143, -0.344830721616745, -0.3349945843219757, -0.3251584470272064, -0.3153223395347595, -0.30548620223999023, -0.29565006494522095, -0.28581395745277405, -0.27597782015800476, -0.2661416828632355, -0.2563055455684662, -0.2464694082736969, -0.2366332709789276, -0.22679713368415833, -0.21696101129055023, -0.20712487399578094, -0.19728875160217285, -0.18745261430740356, -0.17761647701263428, -0.167780339717865, -0.1579442173242569, -0.1481080800294876, -0.13827195763587952, -0.12843582034111023, -0.11859969049692154, -0.10876356065273285, -0.09892742335796356, -0.08909129351377487, -0.07925516366958618, -0.06941903382539749, -0.0595829002559185, -0.049746766686439514, -0.039910636842250824, -0.030074506998062134, -0.020238373428583145, -0.010402239859104156, -0.0005661100149154663, 0.009270021691918373, 0.019106153398752213, 0.028942285105586052, 0.03877841681241989, 0.04861454665660858, 0.05845068022608757, 0.06828681379556656, 0.07812294363975525, 0.08795907348394394, 0.09779520332813263, 0.10763134062290192, 0.1174674704670906, 0.1273036003112793, 0.13713973760604858, 0.14697587490081787, 0.15681199729442596, 0.16664813458919525, 0.17648425698280334, 0.18632039427757263, 0.19615653157234192, 0.20599265396595, 0.2158287912607193, 0.2256649136543274, 0.23550105094909668]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 3.0, 4.0, 12.0, 10.0, 10.0, 8.0, 24.0, 13.0, 29.0, 25.0, 36.0, 31.0, 24.0, 42.0, 38.0, 55.0, 37.0, 49.0, 58.0, 46.0, 65.0, 45.0, 36.0, 41.0, 30.0, 30.0, 27.0, 24.0, 16.0, 21.0, 18.0, 20.0, 14.0, 10.0, 10.0, 9.0, 11.0, 6.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050300538539886475, -0.04870740324258804, -0.04711426794528961, -0.04552113264799118, -0.04392799735069275, -0.04233486205339432, -0.040741726756095886, -0.039148591458797455, -0.03755545616149902, -0.03596232086420059, -0.03436918556690216, -0.03277605026960373, -0.031182914972305298, -0.029589779675006866, -0.027996644377708435, -0.026403509080410004, -0.024810373783111572, -0.02321723848581314, -0.02162410318851471, -0.020030967891216278, -0.018437832593917847, -0.016844697296619415, -0.015251561999320984, -0.013658426702022552, -0.012065291404724121, -0.01047215610742569, -0.008879020810127258, -0.007285885512828827, -0.0056927502155303955, -0.004099614918231964, -0.0025064796209335327, -0.0009133443236351013, 0.0006797909736633301, 0.0022729262709617615, 0.003866061568260193, 0.005459196865558624, 0.007052332162857056, 0.008645467460155487, 0.010238602757453918, 0.01183173805475235, 0.013424873352050781, 0.015018008649349213, 0.016611143946647644, 0.018204279243946075, 0.019797414541244507, 0.021390549838542938, 0.02298368513584137, 0.0245768204331398, 0.026169955730438232, 0.027763091027736664, 0.029356226325035095, 0.030949361622333527, 0.03254249691963196, 0.03413563221693039, 0.03572876751422882, 0.03732190281152725, 0.038915038108825684, 0.040508173406124115, 0.042101308703422546, 0.04369444400072098, 0.04528757929801941, 0.04688071459531784, 0.04847384989261627, 0.0500669851899147, 0.051660120487213135]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 7.0, 8.0, 9.0, 19.0, 23.0, 29.0, 37.0, 46.0, 85.0, 107.0, 159.0, 222.0, 324.0, 489.0, 705.0, 1184.0, 1837.0, 3266.0, 5883.0, 12555.0, 41062.0, 882571.0, 66012.0, 15467.0, 6912.0, 3709.0, 2069.0, 1251.0, 780.0, 510.0, 362.0, 249.0, 145.0, 129.0, 74.0, 64.0, 49.0, 37.0, 25.0, 14.0, 16.0, 15.0, 9.0, 5.0, 5.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.036895751953125, -0.03572845458984375, -0.0345611572265625, -0.03339385986328125, -0.0322265625, -0.03105926513671875, -0.0298919677734375, -0.02872467041015625, -0.027557373046875, -0.02639007568359375, -0.0252227783203125, -0.02405548095703125, -0.02288818359375, -0.02172088623046875, -0.0205535888671875, -0.01938629150390625, -0.018218994140625, -0.01705169677734375, -0.0158843994140625, -0.01471710205078125, -0.0135498046875, -0.01238250732421875, -0.0112152099609375, -0.01004791259765625, -0.008880615234375, -0.00771331787109375, -0.0065460205078125, -0.00537872314453125, -0.00421142578125, -0.00304412841796875, -0.0018768310546875, -0.00070953369140625, 0.000457763671875, 0.00162506103515625, 0.0027923583984375, 0.00395965576171875, 0.005126953125, 0.00629425048828125, 0.0074615478515625, 0.00862884521484375, 0.009796142578125, 0.01096343994140625, 0.0121307373046875, 0.01329803466796875, 0.01446533203125, 0.01563262939453125, 0.0167999267578125, 0.01796722412109375, 0.019134521484375, 0.02030181884765625, 0.0214691162109375, 0.02263641357421875, 0.0238037109375, 0.02497100830078125, 0.0261383056640625, 0.02730560302734375, 0.028472900390625, 0.02964019775390625, 0.0308074951171875, 0.03197479248046875, 0.03314208984375, 0.03430938720703125, 0.0354766845703125, 0.03664398193359375, 0.037811279296875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 1.0, 5.0, 6.0, 2.0, 7.0, 10.0, 11.0, 12.0, 20.0, 28.0, 133.0, 359.0, 238.0, 63.0, 20.0, 12.0, 14.0, 9.0, 7.0, 7.0, 3.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017181396484375, -0.01663804054260254, -0.016094684600830078, -0.015551328659057617, -0.015007972717285156, -0.014464616775512695, -0.013921260833740234, -0.013377904891967773, -0.012834548950195312, -0.012291193008422852, -0.01174783706665039, -0.01120448112487793, -0.010661125183105469, -0.010117769241333008, -0.009574413299560547, -0.009031057357788086, -0.008487701416015625, -0.007944345474243164, -0.007400989532470703, -0.006857633590698242, -0.006314277648925781, -0.00577092170715332, -0.005227565765380859, -0.0046842098236083984, -0.0041408538818359375, -0.0035974979400634766, -0.0030541419982910156, -0.0025107860565185547, -0.0019674301147460938, -0.0014240741729736328, -0.0008807182312011719, -0.00033736228942871094, 0.00020599365234375, 0.0007493495941162109, 0.0012927055358886719, 0.0018360614776611328, 0.0023794174194335938, 0.0029227733612060547, 0.0034661293029785156, 0.0040094852447509766, 0.0045528411865234375, 0.0050961971282958984, 0.005639553070068359, 0.00618290901184082, 0.006726264953613281, 0.007269620895385742, 0.007812976837158203, 0.008356332778930664, 0.008899688720703125, 0.009443044662475586, 0.009986400604248047, 0.010529756546020508, 0.011073112487792969, 0.01161646842956543, 0.01215982437133789, 0.012703180313110352, 0.013246536254882812, 0.013789892196655273, 0.014333248138427734, 0.014876604080200195, 0.015419960021972656, 0.015963315963745117, 0.016506671905517578, 0.01705002784729004, 0.0175933837890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 2.0, 6.0, 5.0, 7.0, 11.0, 11.0, 19.0, 23.0, 25.0, 42.0, 49.0, 64.0, 78.0, 97.0, 104.0, 139.0, 151.0, 226.0, 337.0, 605.0, 1465.0, 8562.0, 902724.0, 127361.0, 3700.0, 1011.0, 457.0, 270.0, 208.0, 158.0, 134.0, 96.0, 89.0, 77.0, 49.0, 46.0, 31.0, 26.0, 27.0, 12.0, 13.0, 7.0, 5.0, 9.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.090576171875, -0.08772945404052734, -0.08488273620605469, -0.08203601837158203, -0.07918930053710938, -0.07634258270263672, -0.07349586486816406, -0.0706491470336914, -0.06780242919921875, -0.0649557113647461, -0.06210899353027344, -0.05926227569580078, -0.056415557861328125, -0.05356884002685547, -0.05072212219238281, -0.047875404357910156, -0.0450286865234375, -0.042181968688964844, -0.03933525085449219, -0.03648853302001953, -0.033641815185546875, -0.03079509735107422, -0.027948379516601562, -0.025101661682128906, -0.02225494384765625, -0.019408226013183594, -0.016561508178710938, -0.013714790344238281, -0.010868072509765625, -0.008021354675292969, -0.0051746368408203125, -0.0023279190063476562, 0.000518798828125, 0.0033655166625976562, 0.0062122344970703125, 0.009058952331542969, 0.011905670166015625, 0.014752388000488281, 0.017599105834960938, 0.020445823669433594, 0.02329254150390625, 0.026139259338378906, 0.028985977172851562, 0.03183269500732422, 0.034679412841796875, 0.03752613067626953, 0.04037284851074219, 0.043219566345214844, 0.0460662841796875, 0.048913002014160156, 0.05175971984863281, 0.05460643768310547, 0.057453155517578125, 0.06029987335205078, 0.06314659118652344, 0.0659933090209961, 0.06884002685546875, 0.0716867446899414, 0.07453346252441406, 0.07738018035888672, 0.08022689819335938, 0.08307361602783203, 0.08592033386230469, 0.08876705169677734, 0.09161376953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 10.0, 12.0, 16.0, 21.0, 27.0, 21.0, 25.0, 37.0, 22.0, 39.0, 37.0, 38.0, 43.0, 43.0, 54.0, 41.0, 47.0, 45.0, 32.0, 38.0, 44.0, 36.0, 39.0, 33.0, 28.0, 31.0, 27.0, 18.0, 16.0, 11.0, 11.0, 14.0, 4.0, 5.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04437255859375, -0.04297780990600586, -0.04158306121826172, -0.04018831253051758, -0.03879356384277344, -0.0373988151550293, -0.036004066467285156, -0.034609317779541016, -0.033214569091796875, -0.031819820404052734, -0.030425071716308594, -0.029030323028564453, -0.027635574340820312, -0.026240825653076172, -0.02484607696533203, -0.02345132827758789, -0.02205657958984375, -0.02066183090209961, -0.01926708221435547, -0.017872333526611328, -0.016477584838867188, -0.015082836151123047, -0.013688087463378906, -0.012293338775634766, -0.010898590087890625, -0.009503841400146484, -0.008109092712402344, -0.006714344024658203, -0.0053195953369140625, -0.003924846649169922, -0.0025300979614257812, -0.0011353492736816406, 0.0002593994140625, 0.0016541481018066406, 0.0030488967895507812, 0.004443645477294922, 0.0058383941650390625, 0.007233142852783203, 0.008627891540527344, 0.010022640228271484, 0.011417388916015625, 0.012812137603759766, 0.014206886291503906, 0.015601634979248047, 0.016996383666992188, 0.018391132354736328, 0.01978588104248047, 0.02118062973022461, 0.02257537841796875, 0.02397012710571289, 0.02536487579345703, 0.026759624481201172, 0.028154373168945312, 0.029549121856689453, 0.030943870544433594, 0.032338619232177734, 0.033733367919921875, 0.035128116607666016, 0.036522865295410156, 0.0379176139831543, 0.03931236267089844, 0.04070711135864258, 0.04210186004638672, 0.04349660873413086, 0.044891357421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 7.0, 5.0, 8.0, 17.0, 20.0, 26.0, 25.0, 30.0, 53.0, 50.0, 100.0, 192.0, 245.0, 467.0, 985.0, 3169.0, 37585.0, 980267.0, 20864.0, 2443.0, 873.0, 392.0, 195.0, 172.0, 96.0, 53.0, 54.0, 37.0, 17.0, 29.0, 20.0, 12.0, 10.0, 7.0, 3.0, 3.0, 4.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.908178329467773e-05, -6.701424717903137e-05, -6.494671106338501e-05, -6.287917494773865e-05, -6.0811638832092285e-05, -5.874410271644592e-05, -5.667656660079956e-05, -5.46090304851532e-05, -5.2541494369506836e-05, -5.0473958253860474e-05, -4.840642213821411e-05, -4.633888602256775e-05, -4.427134990692139e-05, -4.2203813791275024e-05, -4.013627767562866e-05, -3.80687415599823e-05, -3.600120544433594e-05, -3.3933669328689575e-05, -3.186613321304321e-05, -2.979859709739685e-05, -2.7731060981750488e-05, -2.5663524866104126e-05, -2.3595988750457764e-05, -2.15284526348114e-05, -1.946091651916504e-05, -1.7393380403518677e-05, -1.5325844287872314e-05, -1.3258308172225952e-05, -1.119077205657959e-05, -9.123235940933228e-06, -7.055699825286865e-06, -4.988163709640503e-06, -2.9206275939941406e-06, -8.530914783477783e-07, 1.214444637298584e-06, 3.2819807529449463e-06, 5.349516868591309e-06, 7.417052984237671e-06, 9.484589099884033e-06, 1.1552125215530396e-05, 1.3619661331176758e-05, 1.568719744682312e-05, 1.7754733562469482e-05, 1.9822269678115845e-05, 2.1889805793762207e-05, 2.395734190940857e-05, 2.602487802505493e-05, 2.8092414140701294e-05, 3.0159950256347656e-05, 3.222748637199402e-05, 3.429502248764038e-05, 3.636255860328674e-05, 3.8430094718933105e-05, 4.049763083457947e-05, 4.256516695022583e-05, 4.463270306587219e-05, 4.6700239181518555e-05, 4.876777529716492e-05, 5.083531141281128e-05, 5.290284752845764e-05, 5.4970383644104004e-05, 5.7037919759750366e-05, 5.910545587539673e-05, 6.117299199104309e-05, 6.324052810668945e-05]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 8.0, 7.0, 10.0, 7.0, 20.0, 22.0, 25.0, 32.0, 37.0, 58.0, 89.0, 89.0, 85.0, 96.0, 96.0, 72.0, 62.0, 43.0, 30.0, 23.0, 18.0, 9.0, 13.0, 13.0, 5.0, 1.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-8.52346420288086e-06, -8.291564881801605e-06, -8.059665560722351e-06, -7.827766239643097e-06, -7.595866918563843e-06, -7.363967597484589e-06, -7.1320682764053345e-06, -6.90016895532608e-06, -6.668269634246826e-06, -6.436370313167572e-06, -6.204470992088318e-06, -5.972571671009064e-06, -5.7406723499298096e-06, -5.508773028850555e-06, -5.276873707771301e-06, -5.044974386692047e-06, -4.813075065612793e-06, -4.581175744533539e-06, -4.349276423454285e-06, -4.1173771023750305e-06, -3.885477781295776e-06, -3.6535784602165222e-06, -3.421679139137268e-06, -3.189779818058014e-06, -2.9578804969787598e-06, -2.7259811758995056e-06, -2.4940818548202515e-06, -2.2621825337409973e-06, -2.030283212661743e-06, -1.798383891582489e-06, -1.5664845705032349e-06, -1.3345852494239807e-06, -1.1026859283447266e-06, -8.707866072654724e-07, -6.388872861862183e-07, -4.069879651069641e-07, -1.7508864402770996e-07, 5.681067705154419e-08, 2.8870999813079834e-07, 5.206093192100525e-07, 7.525086402893066e-07, 9.844079613685608e-07, 1.216307282447815e-06, 1.448206603527069e-06, 1.6801059246063232e-06, 1.9120052456855774e-06, 2.1439045667648315e-06, 2.3758038878440857e-06, 2.60770320892334e-06, 2.839602530002594e-06, 3.071501851081848e-06, 3.3034011721611023e-06, 3.5353004932403564e-06, 3.7671998143196106e-06, 3.999099135398865e-06, 4.230998456478119e-06, 4.462897777557373e-06, 4.694797098636627e-06, 4.926696419715881e-06, 5.1585957407951355e-06, 5.39049506187439e-06, 5.622394382953644e-06, 5.854293704032898e-06, 6.086193025112152e-06, 6.318092346191406e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 7.0, 7.0, 3.0, 13.0, 14.0, 24.0, 30.0, 42.0, 54.0, 74.0, 141.0, 202.0, 473.0, 1532.0, 46205.0, 995088.0, 3220.0, 617.0, 273.0, 180.0, 102.0, 58.0, 48.0, 43.0, 22.0, 18.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00011897087097167969, -0.00011548958718776703, -0.00011200830340385437, -0.00010852701961994171, -0.00010504573583602905, -0.0001015644520521164, -9.808316826820374e-05, -9.460188448429108e-05, -9.112060070037842e-05, -8.763931691646576e-05, -8.41580331325531e-05, -8.067674934864044e-05, -7.719546556472778e-05, -7.371418178081512e-05, -7.023289799690247e-05, -6.675161421298981e-05, -6.327033042907715e-05, -5.978904664516449e-05, -5.630776286125183e-05, -5.282647907733917e-05, -4.9345195293426514e-05, -4.5863911509513855e-05, -4.2382627725601196e-05, -3.890134394168854e-05, -3.542006015777588e-05, -3.193877637386322e-05, -2.845749258995056e-05, -2.4976208806037903e-05, -2.1494925022125244e-05, -1.8013641238212585e-05, -1.4532357454299927e-05, -1.1051073670387268e-05, -7.569789886474609e-06, -4.088506102561951e-06, -6.07222318649292e-07, 2.8740614652633667e-06, 6.355345249176025e-06, 9.836629033088684e-06, 1.3317912817001343e-05, 1.6799196600914e-05, 2.028048038482666e-05, 2.376176416873932e-05, 2.7243047952651978e-05, 3.0724331736564636e-05, 3.4205615520477295e-05, 3.7686899304389954e-05, 4.116818308830261e-05, 4.464946687221527e-05, 4.813075065612793e-05, 5.161203444004059e-05, 5.509331822395325e-05, 5.8574602007865906e-05, 6.205588579177856e-05, 6.553716957569122e-05, 6.901845335960388e-05, 7.249973714351654e-05, 7.59810209274292e-05, 7.946230471134186e-05, 8.294358849525452e-05, 8.642487227916718e-05, 8.990615606307983e-05, 9.338743984699249e-05, 9.686872363090515e-05, 0.00010035000741481781, 0.00010383129119873047]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 7.0, 14.0, 6.0, 15.0, 11.0, 15.0, 29.0, 35.0, 61.0, 105.0, 112.0, 176.0, 126.0, 68.0, 49.0, 43.0, 37.0, 28.0, 17.0, 9.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.835294723510742e-05, -5.665980279445648e-05, -5.496665835380554e-05, -5.32735139131546e-05, -5.158036947250366e-05, -4.988722503185272e-05, -4.819408059120178e-05, -4.650093615055084e-05, -4.48077917098999e-05, -4.311464726924896e-05, -4.142150282859802e-05, -3.972835838794708e-05, -3.803521394729614e-05, -3.63420695066452e-05, -3.464892506599426e-05, -3.295578062534332e-05, -3.126263618469238e-05, -2.9569491744041443e-05, -2.7876347303390503e-05, -2.6183202862739563e-05, -2.4490058422088623e-05, -2.2796913981437683e-05, -2.1103769540786743e-05, -1.9410625100135803e-05, -1.7717480659484863e-05, -1.6024336218833923e-05, -1.4331191778182983e-05, -1.2638047337532043e-05, -1.0944902896881104e-05, -9.251758456230164e-06, -7.558614015579224e-06, -5.865469574928284e-06, -4.172325134277344e-06, -2.479180693626404e-06, -7.860362529754639e-07, 9.071081876754761e-07, 2.600252628326416e-06, 4.293397068977356e-06, 5.986541509628296e-06, 7.679685950279236e-06, 9.372830390930176e-06, 1.1065974831581116e-05, 1.2759119272232056e-05, 1.4452263712882996e-05, 1.6145408153533936e-05, 1.7838552594184875e-05, 1.9531697034835815e-05, 2.1224841475486755e-05, 2.2917985916137695e-05, 2.4611130356788635e-05, 2.6304274797439575e-05, 2.7997419238090515e-05, 2.9690563678741455e-05, 3.1383708119392395e-05, 3.3076852560043335e-05, 3.4769997000694275e-05, 3.6463141441345215e-05, 3.8156285881996155e-05, 3.9849430322647095e-05, 4.1542574763298035e-05, 4.3235719203948975e-05, 4.4928863644599915e-05, 4.6622008085250854e-05, 4.8315152525901794e-05, 5.0008296966552734e-05]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 15.0, 357.0, 629.0, 12.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9460000395774841, -0.9288132786750793, -0.9116265177726746, -0.894439697265625, -0.8772529363632202, -0.8600661754608154, -0.8428794145584106, -0.8256926536560059, -0.8085058927536011, -0.7913191318511963, -0.7741323709487915, -0.7569455504417419, -0.7397587895393372, -0.7225720286369324, -0.7053852677345276, -0.6881985068321228, -0.6710116863250732, -0.6538249254226685, -0.6366381645202637, -0.6194513440132141, -0.6022645831108093, -0.5850778222084045, -0.5678910613059998, -0.550704300403595, -0.5335174798965454, -0.5163307189941406, -0.49914392828941345, -0.48195716738700867, -0.4647703766822815, -0.4475836157798767, -0.4303968548774719, -0.41321009397506714, -0.39602333307266235, -0.37883657217025757, -0.3616497814655304, -0.3444630205631256, -0.32727622985839844, -0.31008946895599365, -0.29290270805358887, -0.2757159471511841, -0.2585291564464569, -0.24134238064289093, -0.22415560483932495, -0.20696884393692017, -0.1897820681333542, -0.1725952923297882, -0.15540853142738342, -0.13822175562381744, -0.12103497982025146, -0.10384820401668549, -0.0866614356637001, -0.06947466731071472, -0.05228789150714874, -0.035101115703582764, -0.01791434735059738, -0.0007275789976119995, 0.01645919680595398, 0.03364596888422966, 0.05083274096250534, 0.06801950931549072, 0.0852062851190567, 0.10239306092262268, 0.11957982927560806, 0.13676659762859344, 0.15395337343215942]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 8.0, 2.0, 14.0, 10.0, 16.0, 20.0, 28.0, 29.0, 30.0, 47.0, 46.0, 40.0, 49.0, 64.0, 61.0, 63.0, 47.0, 60.0, 59.0, 43.0, 48.0, 43.0, 33.0, 28.0, 14.0, 21.0, 15.0, 17.0, 11.0, 10.0, 2.0, 8.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.35643166303634644, -0.3463435471057892, -0.3362554609775543, -0.32616734504699707, -0.3160792291164398, -0.30599114298820496, -0.2959030270576477, -0.28581494092941284, -0.2757268249988556, -0.26563870906829834, -0.2555506229400635, -0.24546250700950623, -0.23537440598011017, -0.2252863049507141, -0.21519818902015686, -0.2051100879907608, -0.19502197206020355, -0.1849338710308075, -0.17484575510025024, -0.1647576540708542, -0.15466955304145813, -0.14458143711090088, -0.13449333608150482, -0.12440523505210876, -0.11431712657213211, -0.10422901809215546, -0.0941409170627594, -0.08405280858278275, -0.07396470010280609, -0.06387659907341003, -0.05378849059343338, -0.04370038956403732, -0.03361228108406067, -0.023524176329374313, -0.013436069712042809, -0.0033479630947113037, 0.006740141659975052, 0.016828246414661407, 0.02691635489463806, 0.03700445592403412, 0.04709256440401077, 0.05718066915869713, 0.06726877391338348, 0.07735688239336014, 0.08744499087333679, 0.09753309190273285, 0.1076212003827095, 0.11770930141210556, 0.12779740989208221, 0.13788551092147827, 0.14797362685203552, 0.15806172788143158, 0.16814982891082764, 0.1782379448413849, 0.18832604587078094, 0.198414146900177, 0.20850226283073425, 0.2185903638601303, 0.22867847979068756, 0.23876658082008362, 0.24885468184947968, 0.25894278287887573, 0.269030898809433, 0.27911901473999023, 0.2892071008682251]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 8.0, 3.0, 10.0, 14.0, 14.0, 18.0, 20.0, 25.0, 28.0, 36.0, 52.0, 71.0, 95.0, 154.0, 259.0, 828.0, 23548.0, 4164625.0, 3516.0, 358.0, 158.0, 119.0, 80.0, 51.0, 39.0, 38.0, 24.0, 18.0, 16.0, 14.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05975341796875, -0.05789804458618164, -0.05604267120361328, -0.05418729782104492, -0.05233192443847656, -0.0504765510559082, -0.048621177673339844, -0.046765804290771484, -0.044910430908203125, -0.043055057525634766, -0.041199684143066406, -0.03934431076049805, -0.03748893737792969, -0.03563356399536133, -0.03377819061279297, -0.03192281723022461, -0.03006744384765625, -0.02821207046508789, -0.02635669708251953, -0.024501323699951172, -0.022645950317382812, -0.020790576934814453, -0.018935203552246094, -0.017079830169677734, -0.015224456787109375, -0.013369083404541016, -0.011513710021972656, -0.009658336639404297, -0.0078029632568359375, -0.005947589874267578, -0.004092216491699219, -0.0022368431091308594, -0.0003814697265625, 0.0014739036560058594, 0.0033292770385742188, 0.005184650421142578, 0.0070400238037109375, 0.008895397186279297, 0.010750770568847656, 0.012606143951416016, 0.014461517333984375, 0.016316890716552734, 0.018172264099121094, 0.020027637481689453, 0.021883010864257812, 0.023738384246826172, 0.02559375762939453, 0.02744913101196289, 0.02930450439453125, 0.03115987777709961, 0.03301525115966797, 0.03487062454223633, 0.03672599792480469, 0.03858137130737305, 0.040436744689941406, 0.042292118072509766, 0.044147491455078125, 0.046002864837646484, 0.047858238220214844, 0.0497136116027832, 0.05156898498535156, 0.05342435836791992, 0.05527973175048828, 0.05713510513305664, 0.058990478515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 1.0, 4.0, 7.0, 1.0, 5.0, 7.0, 14.0, 8.0, 14.0, 19.0, 51.0, 204.0, 331.0, 187.0, 53.0, 15.0, 10.0, 12.0, 9.0, 7.0, 8.0, 2.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0168914794921875, -0.016368865966796875, -0.01584625244140625, -0.015323638916015625, -0.014801025390625, -0.014278411865234375, -0.01375579833984375, -0.013233184814453125, -0.0127105712890625, -0.012187957763671875, -0.01166534423828125, -0.011142730712890625, -0.0106201171875, -0.010097503662109375, -0.00957489013671875, -0.009052276611328125, -0.0085296630859375, -0.008007049560546875, -0.00748443603515625, -0.006961822509765625, -0.006439208984375, -0.005916595458984375, -0.00539398193359375, -0.004871368408203125, -0.0043487548828125, -0.003826141357421875, -0.00330352783203125, -0.002780914306640625, -0.00225830078125, -0.001735687255859375, -0.00121307373046875, -0.000690460205078125, -0.0001678466796875, 0.000354766845703125, 0.00087738037109375, 0.001399993896484375, 0.001922607421875, 0.002445220947265625, 0.00296783447265625, 0.003490447998046875, 0.0040130615234375, 0.004535675048828125, 0.00505828857421875, 0.005580902099609375, 0.006103515625, 0.006626129150390625, 0.00714874267578125, 0.007671356201171875, 0.0081939697265625, 0.008716583251953125, 0.00923919677734375, 0.009761810302734375, 0.010284423828125, 0.010807037353515625, 0.01132965087890625, 0.011852264404296875, 0.0123748779296875, 0.012897491455078125, 0.01342010498046875, 0.013942718505859375, 0.01446533203125, 0.014987945556640625, 0.01551055908203125, 0.016033172607421875, 0.0165557861328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 16.0, 27.0, 21.0, 67.0, 244.0, 896.0, 7765.0, 4179912.0, 4557.0, 458.0, 136.0, 55.0, 33.0, 16.0, 15.0, 8.0, 5.0, 4.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0616455078125, -0.05931282043457031, -0.056980133056640625, -0.05464744567871094, -0.05231475830078125, -0.04998207092285156, -0.047649383544921875, -0.04531669616699219, -0.0429840087890625, -0.04065132141113281, -0.038318634033203125, -0.03598594665527344, -0.03365325927734375, -0.03132057189941406, -0.028987884521484375, -0.026655197143554688, -0.024322509765625, -0.021989822387695312, -0.019657135009765625, -0.017324447631835938, -0.01499176025390625, -0.012659072875976562, -0.010326385498046875, -0.007993698120117188, -0.0056610107421875, -0.0033283233642578125, -0.000995635986328125, 0.0013370513916015625, 0.00366973876953125, 0.0060024261474609375, 0.008335113525390625, 0.010667800903320312, 0.01300048828125, 0.015333175659179688, 0.017665863037109375, 0.019998550415039062, 0.02233123779296875, 0.024663925170898438, 0.026996612548828125, 0.029329299926757812, 0.0316619873046875, 0.03399467468261719, 0.036327362060546875, 0.03866004943847656, 0.04099273681640625, 0.04332542419433594, 0.045658111572265625, 0.04799079895019531, 0.050323486328125, 0.05265617370605469, 0.054988861083984375, 0.05732154846191406, 0.05965423583984375, 0.06198692321777344, 0.06431961059570312, 0.06665229797363281, 0.0689849853515625, 0.07131767272949219, 0.07365036010742188, 0.07598304748535156, 0.07831573486328125, 0.08064842224121094, 0.08298110961914062, 0.08531379699707031, 0.087646484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 12.0, 20.0, 41.0, 55.0, 189.0, 3469.0, 154.0, 57.0, 29.0, 15.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0182647705078125, -0.017824292182922363, -0.017383813858032227, -0.01694333553314209, -0.016502857208251953, -0.016062378883361816, -0.01562190055847168, -0.015181422233581543, -0.014740943908691406, -0.01430046558380127, -0.013859987258911133, -0.013419508934020996, -0.01297903060913086, -0.012538552284240723, -0.012098073959350586, -0.01165759563446045, -0.011217117309570312, -0.010776638984680176, -0.010336160659790039, -0.009895682334899902, -0.009455204010009766, -0.009014725685119629, -0.008574247360229492, -0.008133769035339355, -0.007693290710449219, -0.007252812385559082, -0.006812334060668945, -0.006371855735778809, -0.005931377410888672, -0.005490899085998535, -0.0050504207611083984, -0.004609942436218262, -0.004169464111328125, -0.0037289857864379883, -0.0032885074615478516, -0.002848029136657715, -0.002407550811767578, -0.0019670724868774414, -0.0015265941619873047, -0.001086115837097168, -0.0006456375122070312, -0.00020515918731689453, 0.0002353191375732422, 0.0006757974624633789, 0.0011162757873535156, 0.0015567541122436523, 0.001997232437133789, 0.0024377107620239258, 0.0028781890869140625, 0.0033186674118041992, 0.003759145736694336, 0.004199624061584473, 0.004640102386474609, 0.005080580711364746, 0.005521059036254883, 0.0059615373611450195, 0.006402015686035156, 0.006842494010925293, 0.00728297233581543, 0.007723450660705566, 0.008163928985595703, 0.00860440731048584, 0.009044885635375977, 0.009485363960266113, 0.00992584228515625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 11.0, 994.0, 11.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23863057792186737, -0.23426498472690582, -0.22989939153194427, -0.22553378343582153, -0.22116819024085999, -0.21680259704589844, -0.2124370038509369, -0.20807141065597534, -0.2037058174610138, -0.19934022426605225, -0.1949746310710907, -0.19060902297496796, -0.1862434297800064, -0.18187783658504486, -0.1775122433900833, -0.17314665019512177, -0.16878104209899902, -0.16441544890403748, -0.16004985570907593, -0.15568424761295319, -0.15131865441799164, -0.1469530612230301, -0.14258746802806854, -0.138221874833107, -0.13385626673698425, -0.1294906735420227, -0.12512508034706116, -0.12075947970151901, -0.11639387905597687, -0.11202828586101532, -0.10766269266605377, -0.10329709947109222, -0.09893152117729187, -0.09456592798233032, -0.09020032733678818, -0.08583473414182663, -0.08146913349628448, -0.07710354030132294, -0.07273794710636139, -0.06837235391139984, -0.0640067532658577, -0.05964115634560585, -0.055275559425354004, -0.050909966230392456, -0.04654436931014061, -0.04217877238988876, -0.037813179194927216, -0.03344758227467537, -0.029081985354423523, -0.024716388434171677, -0.02035079337656498, -0.015985198318958282, -0.011619601398706436, -0.00725400447845459, -0.0028884094208478928, 0.0014771856367588043, 0.005842782557010651, 0.010208378545939922, 0.014573974534869194, 0.01893956959247589, 0.023305166512727737, 0.027670763432979584, 0.03203635662794113, 0.03640195354819298, 0.040767550468444824]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 5.0, 8.0, 8.0, 7.0, 19.0, 23.0, 17.0, 26.0, 36.0, 51.0, 37.0, 61.0, 53.0, 66.0, 64.0, 69.0, 65.0, 59.0, 56.0, 56.0, 40.0, 43.0, 35.0, 24.0, 19.0, 14.0, 20.0, 10.0, 7.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0346912145614624, -0.03365989029407501, -0.03262856975197792, -0.03159724920988083, -0.03056592494249344, -0.029534602537751198, -0.028503280133008957, -0.027471957728266716, -0.026440635323524475, -0.025409312918782234, -0.024377990514039993, -0.023346668109297752, -0.02231534570455551, -0.02128402329981327, -0.02025270089507103, -0.01922137849032879, -0.018190056085586548, -0.017158733680844307, -0.016127411276102066, -0.015096088871359825, -0.014064766466617584, -0.013033444061875343, -0.012002121657133102, -0.010970799252390862, -0.00993947684764862, -0.00890815444290638, -0.007876832038164139, -0.006845509633421898, -0.005814187228679657, -0.004782864823937416, -0.003751542419195175, -0.0027202200144529343, -0.0016888976097106934, -0.0006575752049684525, 0.00037374719977378845, 0.0014050696045160294, 0.0024363920092582703, 0.003467714414000511, 0.004499036818742752, 0.005530359223484993, 0.006561681628227234, 0.007593004032969475, 0.008624326437711716, 0.009655648842453957, 0.010686971247196198, 0.011718293651938438, 0.01274961605668068, 0.01378093846142292, 0.014812260866165161, 0.015843583270907402, 0.016874905675649643, 0.017906228080391884, 0.018937550485134125, 0.019968872889876366, 0.021000195294618607, 0.022031517699360847, 0.02306284010410309, 0.02409416250884533, 0.02512548491358757, 0.02615680731832981, 0.027188129723072052, 0.028219452127814293, 0.029250774532556534, 0.030282096937298775, 0.031313419342041016]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 9.0, 8.0, 10.0, 13.0, 10.0, 17.0, 19.0, 37.0, 53.0, 57.0, 74.0, 99.0, 140.0, 209.0, 291.0, 372.0, 533.0, 807.0, 1181.0, 1932.0, 2999.0, 4941.0, 9131.0, 19710.0, 117572.0, 819327.0, 37882.0, 13201.0, 6772.0, 3832.0, 2403.0, 1493.0, 999.0, 715.0, 460.0, 345.0, 227.0, 172.0, 132.0, 82.0, 70.0, 62.0, 48.0, 27.0, 23.0, 11.0, 5.0, 7.0, 6.0, 7.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0216522216796875, -0.0209810733795166, -0.020309925079345703, -0.019638776779174805, -0.018967628479003906, -0.018296480178833008, -0.01762533187866211, -0.01695418357849121, -0.016283035278320312, -0.015611886978149414, -0.014940738677978516, -0.014269590377807617, -0.013598442077636719, -0.01292729377746582, -0.012256145477294922, -0.011584997177124023, -0.010913848876953125, -0.010242700576782227, -0.009571552276611328, -0.00890040397644043, -0.008229255676269531, -0.007558107376098633, -0.006886959075927734, -0.006215810775756836, -0.0055446624755859375, -0.004873514175415039, -0.004202365875244141, -0.003531217575073242, -0.0028600692749023438, -0.0021889209747314453, -0.0015177726745605469, -0.0008466243743896484, -0.00017547607421875, 0.0004956722259521484, 0.0011668205261230469, 0.0018379688262939453, 0.0025091171264648438, 0.003180265426635742, 0.0038514137268066406, 0.004522562026977539, 0.0051937103271484375, 0.005864858627319336, 0.006536006927490234, 0.007207155227661133, 0.007878303527832031, 0.00854945182800293, 0.009220600128173828, 0.009891748428344727, 0.010562896728515625, 0.011234045028686523, 0.011905193328857422, 0.01257634162902832, 0.013247489929199219, 0.013918638229370117, 0.014589786529541016, 0.015260934829711914, 0.015932083129882812, 0.01660323143005371, 0.01727437973022461, 0.017945528030395508, 0.018616676330566406, 0.019287824630737305, 0.019958972930908203, 0.0206301212310791, 0.02130126953125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 1.0, 5.0, 6.0, 1.0, 5.0, 8.0, 13.0, 8.0, 12.0, 19.0, 54.0, 192.0, 328.0, 198.0, 55.0, 13.0, 12.0, 14.0, 7.0, 7.0, 7.0, 4.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0168304443359375, -0.01631021499633789, -0.01578998565673828, -0.015269756317138672, -0.014749526977539062, -0.014229297637939453, -0.013709068298339844, -0.013188838958740234, -0.012668609619140625, -0.012148380279541016, -0.011628150939941406, -0.011107921600341797, -0.010587692260742188, -0.010067462921142578, -0.009547233581542969, -0.00902700424194336, -0.00850677490234375, -0.00798654556274414, -0.007466316223144531, -0.006946086883544922, -0.0064258575439453125, -0.005905628204345703, -0.005385398864746094, -0.004865169525146484, -0.004344940185546875, -0.0038247108459472656, -0.0033044815063476562, -0.002784252166748047, -0.0022640228271484375, -0.0017437934875488281, -0.0012235641479492188, -0.0007033348083496094, -0.00018310546875, 0.0003371238708496094, 0.0008573532104492188, 0.0013775825500488281, 0.0018978118896484375, 0.002418041229248047, 0.0029382705688476562, 0.0034584999084472656, 0.003978729248046875, 0.004498958587646484, 0.005019187927246094, 0.005539417266845703, 0.0060596466064453125, 0.006579875946044922, 0.007100105285644531, 0.007620334625244141, 0.00814056396484375, 0.00866079330444336, 0.009181022644042969, 0.009701251983642578, 0.010221481323242188, 0.010741710662841797, 0.011261940002441406, 0.011782169342041016, 0.012302398681640625, 0.012822628021240234, 0.013342857360839844, 0.013863086700439453, 0.014383316040039062, 0.014903545379638672, 0.015423774719238281, 0.01594400405883789, 0.0164642333984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 10.0, 9.0, 11.0, 10.0, 13.0, 19.0, 28.0, 23.0, 32.0, 37.0, 61.0, 67.0, 81.0, 99.0, 149.0, 202.0, 284.0, 475.0, 898.0, 2163.0, 14932.0, 944854.0, 77349.0, 3607.0, 1198.0, 629.0, 349.0, 237.0, 155.0, 114.0, 89.0, 80.0, 60.0, 47.0, 38.0, 36.0, 22.0, 20.0, 14.0, 18.0, 6.0, 5.0, 6.0, 2.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.06787109375, -0.06558609008789062, -0.06330108642578125, -0.061016082763671875, -0.0587310791015625, -0.056446075439453125, -0.05416107177734375, -0.051876068115234375, -0.049591064453125, -0.047306060791015625, -0.04502105712890625, -0.042736053466796875, -0.0404510498046875, -0.038166046142578125, -0.03588104248046875, -0.033596038818359375, -0.03131103515625, -0.029026031494140625, -0.02674102783203125, -0.024456024169921875, -0.0221710205078125, -0.019886016845703125, -0.01760101318359375, -0.015316009521484375, -0.013031005859375, -0.010746002197265625, -0.00846099853515625, -0.006175994873046875, -0.0038909912109375, -0.001605987548828125, 0.00067901611328125, 0.002964019775390625, 0.0052490234375, 0.007534027099609375, 0.00981903076171875, 0.012104034423828125, 0.0143890380859375, 0.016674041748046875, 0.01895904541015625, 0.021244049072265625, 0.023529052734375, 0.025814056396484375, 0.02809906005859375, 0.030384063720703125, 0.0326690673828125, 0.034954071044921875, 0.03723907470703125, 0.039524078369140625, 0.04180908203125, 0.044094085693359375, 0.04637908935546875, 0.048664093017578125, 0.0509490966796875, 0.053234100341796875, 0.05551910400390625, 0.057804107666015625, 0.060089111328125, 0.062374114990234375, 0.06465911865234375, 0.06694412231445312, 0.0692291259765625, 0.07151412963867188, 0.07379913330078125, 0.07608413696289062, 0.078369140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 7.0, 7.0, 14.0, 15.0, 9.0, 12.0, 20.0, 28.0, 23.0, 28.0, 27.0, 38.0, 40.0, 33.0, 47.0, 35.0, 47.0, 39.0, 42.0, 41.0, 42.0, 37.0, 47.0, 39.0, 31.0, 33.0, 27.0, 22.0, 26.0, 23.0, 18.0, 16.0, 18.0, 10.0, 10.0, 6.0, 10.0, 4.0, 3.0, 4.0, 0.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.039215087890625, -0.037894248962402344, -0.03657341003417969, -0.03525257110595703, -0.033931732177734375, -0.03261089324951172, -0.03129005432128906, -0.029969215393066406, -0.02864837646484375, -0.027327537536621094, -0.026006698608398438, -0.02468585968017578, -0.023365020751953125, -0.02204418182373047, -0.020723342895507812, -0.019402503967285156, -0.0180816650390625, -0.016760826110839844, -0.015439987182617188, -0.014119148254394531, -0.012798309326171875, -0.011477470397949219, -0.010156631469726562, -0.008835792541503906, -0.00751495361328125, -0.006194114685058594, -0.0048732757568359375, -0.0035524368286132812, -0.002231597900390625, -0.0009107589721679688, 0.0004100799560546875, 0.0017309188842773438, 0.0030517578125, 0.004372596740722656, 0.0056934356689453125, 0.007014274597167969, 0.008335113525390625, 0.009655952453613281, 0.010976791381835938, 0.012297630310058594, 0.01361846923828125, 0.014939308166503906, 0.016260147094726562, 0.01758098602294922, 0.018901824951171875, 0.02022266387939453, 0.021543502807617188, 0.022864341735839844, 0.0241851806640625, 0.025506019592285156, 0.026826858520507812, 0.02814769744873047, 0.029468536376953125, 0.03078937530517578, 0.03211021423339844, 0.033431053161621094, 0.03475189208984375, 0.036072731018066406, 0.03739356994628906, 0.03871440887451172, 0.040035247802734375, 0.04135608673095703, 0.04267692565917969, 0.043997764587402344, 0.045318603515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 3.0, 5.0, 7.0, 4.0, 7.0, 18.0, 31.0, 38.0, 71.0, 134.0, 220.0, 564.0, 1914.0, 16022.0, 1000923.0, 25225.0, 2169.0, 604.0, 249.0, 155.0, 66.0, 31.0, 24.0, 17.0, 13.0, 12.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.76837158203125e-05, -4.5818276703357697e-05, -4.395283758640289e-05, -4.208739846944809e-05, -4.0221959352493286e-05, -3.835652023553848e-05, -3.649108111858368e-05, -3.4625642001628876e-05, -3.276020288467407e-05, -3.089476376771927e-05, -2.9029324650764465e-05, -2.7163885533809662e-05, -2.529844641685486e-05, -2.3433007299900055e-05, -2.156756818294525e-05, -1.9702129065990448e-05, -1.7836689949035645e-05, -1.597125083208084e-05, -1.4105811715126038e-05, -1.2240372598171234e-05, -1.037493348121643e-05, -8.509494364261627e-06, -6.644055247306824e-06, -4.77861613035202e-06, -2.913177013397217e-06, -1.0477378964424133e-06, 8.177012205123901e-07, 2.6831403374671936e-06, 4.548579454421997e-06, 6.4140185713768005e-06, 8.279457688331604e-06, 1.0144896805286407e-05, 1.2010335922241211e-05, 1.3875775039196014e-05, 1.5741214156150818e-05, 1.760665327310562e-05, 1.9472092390060425e-05, 2.1337531507015228e-05, 2.3202970623970032e-05, 2.5068409740924835e-05, 2.693384885787964e-05, 2.8799287974834442e-05, 3.0664727091789246e-05, 3.253016620874405e-05, 3.439560532569885e-05, 3.6261044442653656e-05, 3.812648355960846e-05, 3.999192267656326e-05, 4.1857361793518066e-05, 4.372280091047287e-05, 4.558824002742767e-05, 4.745367914438248e-05, 4.931911826133728e-05, 5.1184557378292084e-05, 5.304999649524689e-05, 5.491543561220169e-05, 5.6780874729156494e-05, 5.86463138461113e-05, 6.05117529630661e-05, 6.23771920800209e-05, 6.424263119697571e-05, 6.610807031393051e-05, 6.797350943088531e-05, 6.983894854784012e-05, 7.170438766479492e-05]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 12.0, 10.0, 10.0, 16.0, 30.0, 22.0, 20.0, 24.0, 47.0, 51.0, 56.0, 45.0, 46.0, 86.0, 48.0, 63.0, 48.0, 66.0, 39.0, 41.0, 41.0, 36.0, 16.0, 16.0, 11.0, 22.0, 16.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.708766937255859e-06, -4.575587809085846e-06, -4.4424086809158325e-06, -4.309229552745819e-06, -4.176050424575806e-06, -4.042871296405792e-06, -3.909692168235779e-06, -3.7765130400657654e-06, -3.643333911895752e-06, -3.5101547837257385e-06, -3.376975655555725e-06, -3.2437965273857117e-06, -3.1106173992156982e-06, -2.977438271045685e-06, -2.8442591428756714e-06, -2.711080014705658e-06, -2.5779008865356445e-06, -2.444721758365631e-06, -2.3115426301956177e-06, -2.1783635020256042e-06, -2.045184373855591e-06, -1.9120052456855774e-06, -1.778826117515564e-06, -1.6456469893455505e-06, -1.5124678611755371e-06, -1.3792887330055237e-06, -1.2461096048355103e-06, -1.1129304766654968e-06, -9.797513484954834e-07, -8.4657222032547e-07, -7.133930921554565e-07, -5.802139639854431e-07, -4.470348358154297e-07, -3.1385570764541626e-07, -1.8067657947540283e-07, -4.7497451305389404e-08, 8.568167686462402e-08, 2.1886080503463745e-07, 3.520399332046509e-07, 4.852190613746643e-07, 6.183981895446777e-07, 7.515773177146912e-07, 8.847564458847046e-07, 1.017935574054718e-06, 1.1511147022247314e-06, 1.2842938303947449e-06, 1.4174729585647583e-06, 1.5506520867347717e-06, 1.6838312149047852e-06, 1.8170103430747986e-06, 1.950189471244812e-06, 2.0833685994148254e-06, 2.216547727584839e-06, 2.3497268557548523e-06, 2.4829059839248657e-06, 2.616085112094879e-06, 2.7492642402648926e-06, 2.882443368434906e-06, 3.0156224966049194e-06, 3.148801624774933e-06, 3.2819807529449463e-06, 3.4151598811149597e-06, 3.548339009284973e-06, 3.6815181374549866e-06, 3.814697265625e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 11.0, 7.0, 13.0, 12.0, 31.0, 36.0, 67.0, 110.0, 257.0, 643.0, 4261.0, 1033385.0, 8277.0, 822.0, 280.0, 132.0, 68.0, 56.0, 23.0, 19.0, 12.0, 9.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.581710815429688e-05, -7.32550397515297e-05, -7.069297134876251e-05, -6.813090294599533e-05, -6.556883454322815e-05, -6.300676614046097e-05, -6.044469773769379e-05, -5.7882629334926605e-05, -5.5320560932159424e-05, -5.275849252939224e-05, -5.019642412662506e-05, -4.763435572385788e-05, -4.50722873210907e-05, -4.251021891832352e-05, -3.9948150515556335e-05, -3.7386082112789154e-05, -3.482401371002197e-05, -3.226194530725479e-05, -2.969987690448761e-05, -2.713780850172043e-05, -2.4575740098953247e-05, -2.2013671696186066e-05, -1.9451603293418884e-05, -1.6889534890651703e-05, -1.4327466487884521e-05, -1.176539808511734e-05, -9.203329682350159e-06, -6.641261279582977e-06, -4.079192876815796e-06, -1.5171244740486145e-06, 1.044943928718567e-06, 3.6070123314857483e-06, 6.16908073425293e-06, 8.731149137020111e-06, 1.1293217539787292e-05, 1.3855285942554474e-05, 1.6417354345321655e-05, 1.8979422748088837e-05, 2.1541491150856018e-05, 2.41035595536232e-05, 2.666562795639038e-05, 2.9227696359157562e-05, 3.1789764761924744e-05, 3.4351833164691925e-05, 3.6913901567459106e-05, 3.947596997022629e-05, 4.203803837299347e-05, 4.460010677576065e-05, 4.716217517852783e-05, 4.9724243581295013e-05, 5.2286311984062195e-05, 5.4848380386829376e-05, 5.741044878959656e-05, 5.997251719236374e-05, 6.253458559513092e-05, 6.50966539978981e-05, 6.765872240066528e-05, 7.022079080343246e-05, 7.278285920619965e-05, 7.534492760896683e-05, 7.790699601173401e-05, 8.046906441450119e-05, 8.303113281726837e-05, 8.559320122003555e-05, 8.815526962280273e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 9.0, 10.0, 19.0, 24.0, 32.0, 69.0, 94.0, 162.0, 229.0, 111.0, 75.0, 56.0, 32.0, 22.0, 15.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.017353057861328e-05, -3.8751401007175446e-05, -3.732927143573761e-05, -3.5907141864299774e-05, -3.448501229286194e-05, -3.30628827214241e-05, -3.164075314998627e-05, -3.021862357854843e-05, -2.8796494007110596e-05, -2.737436443567276e-05, -2.5952234864234924e-05, -2.453010529279709e-05, -2.3107975721359253e-05, -2.1685846149921417e-05, -2.026371657848358e-05, -1.8841587007045746e-05, -1.741945743560791e-05, -1.5997327864170074e-05, -1.4575198292732239e-05, -1.3153068721294403e-05, -1.1730939149856567e-05, -1.0308809578418732e-05, -8.886680006980896e-06, -7.46455043554306e-06, -6.042420864105225e-06, -4.620291292667389e-06, -3.1981617212295532e-06, -1.7760321497917175e-06, -3.5390257835388184e-07, 1.0682269930839539e-06, 2.4903565645217896e-06, 3.912486135959625e-06, 5.334615707397461e-06, 6.756745278835297e-06, 8.178874850273132e-06, 9.601004421710968e-06, 1.1023133993148804e-05, 1.244526356458664e-05, 1.3867393136024475e-05, 1.528952270746231e-05, 1.6711652278900146e-05, 1.8133781850337982e-05, 1.9555911421775818e-05, 2.0978040993213654e-05, 2.240017056465149e-05, 2.3822300136089325e-05, 2.524442970752716e-05, 2.6666559278964996e-05, 2.8088688850402832e-05, 2.9510818421840668e-05, 3.0932947993278503e-05, 3.235507756471634e-05, 3.3777207136154175e-05, 3.519933670759201e-05, 3.6621466279029846e-05, 3.804359585046768e-05, 3.946572542190552e-05, 4.088785499334335e-05, 4.230998456478119e-05, 4.3732114136219025e-05, 4.515424370765686e-05, 4.6576373279094696e-05, 4.799850285053253e-05, 4.942063242197037e-05, 5.08427619934082e-05]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 45.0, 637.0, 263.0, 31.0, 10.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.489690363407135, -0.48059576749801636, -0.4715012013912201, -0.46240660548210144, -0.4533120393753052, -0.4442174434661865, -0.43512284755706787, -0.4260282814502716, -0.41693368554115295, -0.4078390896320343, -0.39874452352523804, -0.3896499276161194, -0.3805553615093231, -0.37146076560020447, -0.3623661994934082, -0.35327160358428955, -0.3441770076751709, -0.33508241176605225, -0.325987845659256, -0.31689324975013733, -0.30779868364334106, -0.2987040877342224, -0.28960949182510376, -0.2805149257183075, -0.27142035961151123, -0.2623257637023926, -0.2532311975955963, -0.24413660168647766, -0.2350420206785202, -0.22594743967056274, -0.21685285866260529, -0.20775827765464783, -0.19866369664669037, -0.1895691156387329, -0.18047453463077545, -0.171379953622818, -0.16228535771369934, -0.15319077670574188, -0.14409619569778442, -0.13500159978866577, -0.1259070336818695, -0.11681245267391205, -0.10771786421537399, -0.09862328320741653, -0.08952869474887848, -0.08043411374092102, -0.07133953273296356, -0.06224494427442551, -0.05315035581588745, -0.044055771082639694, -0.03496118634939194, -0.02586660534143448, -0.016772020608186722, -0.007677435874938965, 0.0014171451330184937, 0.010511733591556549, 0.019606314599514008, 0.028700899332761765, 0.03779548406600952, 0.04689006507396698, 0.05598464980721474, 0.0650792345404625, 0.07417381554841995, 0.08326840400695801, 0.09236298501491547]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 10.0, 18.0, 28.0, 31.0, 45.0, 49.0, 73.0, 66.0, 70.0, 71.0, 90.0, 86.0, 71.0, 61.0, 61.0, 32.0, 32.0, 28.0, 20.0, 13.0, 8.0, 10.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5326033234596252, -0.5182681083679199, -0.5039328336715698, -0.4895976185798645, -0.4752623736858368, -0.4609271287918091, -0.44659191370010376, -0.43225666880607605, -0.41792142391204834, -0.40358617901802063, -0.3892509639263153, -0.3749157190322876, -0.3605804741382599, -0.3462452292442322, -0.33191001415252686, -0.31757476925849915, -0.30323952436447144, -0.2889042794704437, -0.2745690643787384, -0.2602338194847107, -0.24589857459068298, -0.23156334459781647, -0.21722811460494995, -0.20289286971092224, -0.18855765461921692, -0.1742224246263504, -0.1598871797323227, -0.14555194973945618, -0.13121670484542847, -0.11688147485256195, -0.10254623740911484, -0.08821099996566772, -0.07387575507164001, -0.0595405176281929, -0.04520528018474579, -0.030870046466588974, -0.01653480902314186, -0.0021995753049850464, 0.012135662138462067, 0.02647089958190918, 0.04080613702535629, 0.055141374468803406, 0.06947661191225052, 0.08381184935569763, 0.09814707934856415, 0.11248231679201126, 0.12681755423545837, 0.14115279912948608, 0.1554880291223526, 0.16982325911521912, 0.18415850400924683, 0.19849373400211334, 0.21282897889614105, 0.22716420888900757, 0.24149945378303528, 0.255834698677063, 0.2701699137687683, 0.284505158662796, 0.29884037375450134, 0.31317561864852905, 0.32751086354255676, 0.3418461084365845, 0.3561813235282898, 0.3705165684223175, 0.3848518133163452]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 8.0, 5.0, 16.0, 9.0, 15.0, 20.0, 30.0, 34.0, 62.0, 73.0, 114.0, 149.0, 258.0, 424.0, 1465.0, 37745.0, 4120524.0, 29438.0, 2835.0, 414.0, 220.0, 140.0, 93.0, 57.0, 40.0, 22.0, 17.0, 12.0, 14.0, 10.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045196533203125, -0.04384469985961914, -0.04249286651611328, -0.04114103317260742, -0.03978919982910156, -0.0384373664855957, -0.037085533142089844, -0.035733699798583984, -0.034381866455078125, -0.033030033111572266, -0.031678199768066406, -0.030326366424560547, -0.028974533081054688, -0.027622699737548828, -0.02627086639404297, -0.02491903305053711, -0.02356719970703125, -0.02221536636352539, -0.02086353302001953, -0.019511699676513672, -0.018159866333007812, -0.016808032989501953, -0.015456199645996094, -0.014104366302490234, -0.012752532958984375, -0.011400699615478516, -0.010048866271972656, -0.008697032928466797, -0.0073451995849609375, -0.005993366241455078, -0.004641532897949219, -0.0032896995544433594, -0.0019378662109375, -0.0005860328674316406, 0.0007658004760742188, 0.002117633819580078, 0.0034694671630859375, 0.004821300506591797, 0.006173133850097656, 0.007524967193603516, 0.008876800537109375, 0.010228633880615234, 0.011580467224121094, 0.012932300567626953, 0.014284133911132812, 0.015635967254638672, 0.01698780059814453, 0.01833963394165039, 0.01969146728515625, 0.02104330062866211, 0.02239513397216797, 0.023746967315673828, 0.025098800659179688, 0.026450634002685547, 0.027802467346191406, 0.029154300689697266, 0.030506134033203125, 0.031857967376708984, 0.033209800720214844, 0.0345616340637207, 0.03591346740722656, 0.03726530075073242, 0.03861713409423828, 0.03996896743774414, 0.04132080078125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 2.0, 2.0, 8.0, 1.0, 5.0, 8.0, 11.0, 7.0, 15.0, 17.0, 37.0, 133.0, 296.0, 240.0, 107.0, 23.0, 14.0, 10.0, 10.0, 9.0, 7.0, 5.0, 3.0, 6.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016510009765625, -0.01601994037628174, -0.015529870986938477, -0.015039801597595215, -0.014549732208251953, -0.014059662818908691, -0.01356959342956543, -0.013079524040222168, -0.012589454650878906, -0.012099385261535645, -0.011609315872192383, -0.011119246482849121, -0.01062917709350586, -0.010139107704162598, -0.009649038314819336, -0.009158968925476074, -0.008668899536132812, -0.00817883014678955, -0.007688760757446289, -0.007198691368103027, -0.006708621978759766, -0.006218552589416504, -0.005728483200073242, -0.0052384138107299805, -0.004748344421386719, -0.004258275032043457, -0.0037682056427001953, -0.0032781362533569336, -0.002788066864013672, -0.00229799747467041, -0.0018079280853271484, -0.0013178586959838867, -0.000827789306640625, -0.0003377199172973633, 0.00015234947204589844, 0.0006424188613891602, 0.0011324882507324219, 0.0016225576400756836, 0.0021126270294189453, 0.002602696418762207, 0.0030927658081054688, 0.0035828351974487305, 0.004072904586791992, 0.004562973976135254, 0.005053043365478516, 0.005543112754821777, 0.006033182144165039, 0.006523251533508301, 0.0070133209228515625, 0.007503390312194824, 0.007993459701538086, 0.008483529090881348, 0.00897359848022461, 0.009463667869567871, 0.009953737258911133, 0.010443806648254395, 0.010933876037597656, 0.011423945426940918, 0.01191401481628418, 0.012404084205627441, 0.012894153594970703, 0.013384222984313965, 0.013874292373657227, 0.014364361763000488, 0.01485443115234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 6.0, 12.0, 7.0, 15.0, 12.0, 19.0, 37.0, 58.0, 82.0, 189.0, 522.0, 2685.0, 47255.0, 4137458.0, 4652.0, 697.0, 248.0, 94.0, 50.0, 54.0, 25.0, 19.0, 10.0, 13.0, 10.0, 7.0, 7.0, 7.0, 1.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06146240234375, -0.05942726135253906, -0.057392120361328125, -0.05535697937011719, -0.05332183837890625, -0.05128669738769531, -0.049251556396484375, -0.04721641540527344, -0.0451812744140625, -0.04314613342285156, -0.041110992431640625, -0.03907585144042969, -0.03704071044921875, -0.03500556945800781, -0.032970428466796875, -0.030935287475585938, -0.028900146484375, -0.026865005493164062, -0.024829864501953125, -0.022794723510742188, -0.02075958251953125, -0.018724441528320312, -0.016689300537109375, -0.014654159545898438, -0.0126190185546875, -0.010583877563476562, -0.008548736572265625, -0.0065135955810546875, -0.00447845458984375, -0.0024433135986328125, -0.000408172607421875, 0.0016269683837890625, 0.003662109375, 0.0056972503662109375, 0.007732391357421875, 0.009767532348632812, 0.01180267333984375, 0.013837814331054688, 0.015872955322265625, 0.017908096313476562, 0.0199432373046875, 0.021978378295898438, 0.024013519287109375, 0.026048660278320312, 0.02808380126953125, 0.030118942260742188, 0.032154083251953125, 0.03418922424316406, 0.036224365234375, 0.03825950622558594, 0.040294647216796875, 0.04232978820800781, 0.04436492919921875, 0.04640007019042969, 0.048435211181640625, 0.05047035217285156, 0.0525054931640625, 0.05454063415527344, 0.056575775146484375, 0.05861091613769531, 0.06064605712890625, 0.06268119812011719, 0.06471633911132812, 0.06675148010253906, 0.06878662109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 5.0, 5.0, 10.0, 10.0, 23.0, 66.0, 169.0, 477.0, 2332.0, 626.0, 196.0, 67.0, 27.0, 11.0, 6.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0225677490234375, -0.02195143699645996, -0.021335124969482422, -0.020718812942504883, -0.020102500915527344, -0.019486188888549805, -0.018869876861572266, -0.018253564834594727, -0.017637252807617188, -0.01702094078063965, -0.01640462875366211, -0.01578831672668457, -0.015172004699707031, -0.014555692672729492, -0.013939380645751953, -0.013323068618774414, -0.012706756591796875, -0.012090444564819336, -0.011474132537841797, -0.010857820510864258, -0.010241508483886719, -0.00962519645690918, -0.00900888442993164, -0.008392572402954102, -0.0077762603759765625, -0.0071599483489990234, -0.006543636322021484, -0.005927324295043945, -0.005311012268066406, -0.004694700241088867, -0.004078388214111328, -0.003462076187133789, -0.00284576416015625, -0.002229452133178711, -0.0016131401062011719, -0.0009968280792236328, -0.00038051605224609375, 0.0002357959747314453, 0.0008521080017089844, 0.0014684200286865234, 0.0020847320556640625, 0.0027010440826416016, 0.0033173561096191406, 0.00393366813659668, 0.004549980163574219, 0.005166292190551758, 0.005782604217529297, 0.006398916244506836, 0.007015228271484375, 0.007631540298461914, 0.008247852325439453, 0.008864164352416992, 0.009480476379394531, 0.01009678840637207, 0.01071310043334961, 0.011329412460327148, 0.011945724487304688, 0.012562036514282227, 0.013178348541259766, 0.013794660568237305, 0.014410972595214844, 0.015027284622192383, 0.015643596649169922, 0.01625990867614746, 0.016876220703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 272.0, 744.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312051922082901, -0.2972142696380615, -0.28237658739089966, -0.2675389051437378, -0.2527012526988983, -0.23786358535289764, -0.22302591800689697, -0.2081882506608963, -0.19335058331489563, -0.17851291596889496, -0.1636752486228943, -0.14883758127689362, -0.13399991393089294, -0.11916224658489227, -0.1043245792388916, -0.08948691189289093, -0.07464924454689026, -0.05981157720088959, -0.044973909854888916, -0.030136242508888245, -0.015298575162887573, -0.00046090781688690186, 0.01437675952911377, 0.02921442687511444, 0.04405209422111511, 0.058889761567115784, 0.07372742891311646, 0.08856509625911713, 0.1034027636051178, 0.11824043095111847, 0.13307809829711914, 0.1479157656431198, 0.16275346279144287, 0.17759113013744354, 0.1924287974834442, 0.20726646482944489, 0.22210413217544556, 0.23694179952144623, 0.2517794668674469, 0.2666171193122864, 0.28145480155944824, 0.2962924838066101, 0.3111301362514496, 0.32596778869628906, 0.3408054709434509, 0.3556431531906128, 0.37048080563545227, 0.38531845808029175, 0.4001561403274536, 0.4149938225746155, 0.42983147501945496, 0.44466912746429443, 0.4595068097114563, 0.47434449195861816, 0.48918214440345764, 0.5040197968482971, 0.518857479095459, 0.5336951613426208, 0.5485328435897827, 0.5633704662322998, 0.5782081484794617, 0.5930458307266235, 0.6078834533691406, 0.6227211356163025, 0.6375588178634644]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 9.0, 8.0, 8.0, 21.0, 14.0, 11.0, 22.0, 16.0, 31.0, 34.0, 28.0, 38.0, 44.0, 32.0, 47.0, 44.0, 62.0, 52.0, 61.0, 55.0, 41.0, 43.0, 36.0, 36.0, 35.0, 26.0, 27.0, 21.0, 22.0, 8.0, 13.0, 14.0, 11.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04668515920639038, -0.04504138231277466, -0.043397609144449234, -0.04175383597612381, -0.04011005908250809, -0.038466282188892365, -0.03682250902056694, -0.035178735852241516, -0.03353495895862579, -0.03189118206501007, -0.030247408896684647, -0.028603633865714073, -0.0269598588347435, -0.025316083803772926, -0.023672308772802353, -0.02202853374183178, -0.020384758710861206, -0.018740983679890633, -0.01709720864892006, -0.015453433617949486, -0.013809658586978912, -0.012165883556008339, -0.010522108525037766, -0.008878333494067192, -0.007234558463096619, -0.005590783432126045, -0.003947008401155472, -0.0023032333701848984, -0.000659458339214325, 0.0009843166917562485, 0.002628091722726822, 0.004271866753697395, 0.005915641784667969, 0.007559416815638542, 0.009203191846609116, 0.010846966877579689, 0.012490741908550262, 0.014134516939520836, 0.01577829197049141, 0.017422067001461983, 0.019065842032432556, 0.02070961706340313, 0.022353392094373703, 0.023997167125344276, 0.02564094215631485, 0.027284717187285423, 0.028928492218255997, 0.03057226724922657, 0.032216042280197144, 0.033859819173812866, 0.03550359234213829, 0.037147365510463715, 0.03879114240407944, 0.04043491929769516, 0.042078692466020584, 0.04372246563434601, 0.04536624252796173, 0.047010019421577454, 0.04865379258990288, 0.0502975657582283, 0.051941342651844025, 0.05358511954545975, 0.05522889271378517, 0.056872665882110596, 0.05851644277572632]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 15.0, 11.0, 19.0, 28.0, 31.0, 36.0, 61.0, 86.0, 124.0, 148.0, 253.0, 416.0, 492.0, 848.0, 1396.0, 2166.0, 3799.0, 7244.0, 15863.0, 65562.0, 868657.0, 50795.0, 14340.0, 6707.0, 3649.0, 2031.0, 1310.0, 797.0, 495.0, 341.0, 252.0, 155.0, 111.0, 69.0, 59.0, 59.0, 39.0, 23.0, 12.0, 12.0, 10.0, 12.0, 4.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.02239990234375, -0.021664142608642578, -0.020928382873535156, -0.020192623138427734, -0.019456863403320312, -0.01872110366821289, -0.01798534393310547, -0.017249584197998047, -0.016513824462890625, -0.015778064727783203, -0.015042304992675781, -0.01430654525756836, -0.013570785522460938, -0.012835025787353516, -0.012099266052246094, -0.011363506317138672, -0.01062774658203125, -0.009891986846923828, -0.009156227111816406, -0.008420467376708984, -0.0076847076416015625, -0.006948947906494141, -0.006213188171386719, -0.005477428436279297, -0.004741668701171875, -0.004005908966064453, -0.0032701492309570312, -0.0025343894958496094, -0.0017986297607421875, -0.0010628700256347656, -0.00032711029052734375, 0.0004086494445800781, 0.0011444091796875, 0.0018801689147949219, 0.0026159286499023438, 0.0033516883850097656, 0.0040874481201171875, 0.004823207855224609, 0.005558967590332031, 0.006294727325439453, 0.007030487060546875, 0.007766246795654297, 0.008502006530761719, 0.00923776626586914, 0.009973526000976562, 0.010709285736083984, 0.011445045471191406, 0.012180805206298828, 0.01291656494140625, 0.013652324676513672, 0.014388084411621094, 0.015123844146728516, 0.015859603881835938, 0.01659536361694336, 0.01733112335205078, 0.018066883087158203, 0.018802642822265625, 0.019538402557373047, 0.02027416229248047, 0.02100992202758789, 0.021745681762695312, 0.022481441497802734, 0.023217201232910156, 0.023952960968017578, 0.024688720703125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 8.0, 0.0, 6.0, 8.0, 11.0, 9.0, 13.0, 19.0, 44.0, 135.0, 313.0, 231.0, 93.0, 20.0, 12.0, 13.0, 7.0, 8.0, 8.0, 6.0, 3.0, 7.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0164947509765625, -0.016003966331481934, -0.015513181686401367, -0.0150223970413208, -0.014531612396240234, -0.014040827751159668, -0.013550043106079102, -0.013059258460998535, -0.012568473815917969, -0.012077689170837402, -0.011586904525756836, -0.01109611988067627, -0.010605335235595703, -0.010114550590515137, -0.00962376594543457, -0.009132981300354004, -0.008642196655273438, -0.008151412010192871, -0.007660627365112305, -0.007169842720031738, -0.006679058074951172, -0.0061882734298706055, -0.005697488784790039, -0.005206704139709473, -0.004715919494628906, -0.00422513484954834, -0.0037343502044677734, -0.003243565559387207, -0.0027527809143066406, -0.0022619962692260742, -0.0017712116241455078, -0.0012804269790649414, -0.000789642333984375, -0.0002988576889038086, 0.0001919269561767578, 0.0006827116012573242, 0.0011734962463378906, 0.001664280891418457, 0.0021550655364990234, 0.00264585018157959, 0.0031366348266601562, 0.0036274194717407227, 0.004118204116821289, 0.0046089887619018555, 0.005099773406982422, 0.005590558052062988, 0.006081342697143555, 0.006572127342224121, 0.0070629119873046875, 0.007553696632385254, 0.00804448127746582, 0.008535265922546387, 0.009026050567626953, 0.00951683521270752, 0.010007619857788086, 0.010498404502868652, 0.010989189147949219, 0.011479973793029785, 0.011970758438110352, 0.012461543083190918, 0.012952327728271484, 0.01344311237335205, 0.013933897018432617, 0.014424681663513184, 0.01491546630859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 15.0, 10.0, 13.0, 24.0, 24.0, 25.0, 29.0, 40.0, 67.0, 75.0, 99.0, 131.0, 183.0, 286.0, 438.0, 821.0, 2420.0, 55267.0, 975121.0, 10088.0, 1474.0, 612.0, 389.0, 224.0, 152.0, 127.0, 91.0, 63.0, 46.0, 43.0, 42.0, 30.0, 15.0, 22.0, 11.0, 14.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06591796875, -0.06366825103759766, -0.06141853332519531, -0.05916881561279297, -0.056919097900390625, -0.05466938018798828, -0.05241966247558594, -0.050169944763183594, -0.04792022705078125, -0.045670509338378906, -0.04342079162597656, -0.04117107391357422, -0.038921356201171875, -0.03667163848876953, -0.03442192077636719, -0.032172203063964844, -0.0299224853515625, -0.027672767639160156, -0.025423049926757812, -0.02317333221435547, -0.020923614501953125, -0.01867389678955078, -0.016424179077148438, -0.014174461364746094, -0.01192474365234375, -0.009675025939941406, -0.0074253082275390625, -0.005175590515136719, -0.002925872802734375, -0.0006761550903320312, 0.0015735626220703125, 0.0038232803344726562, 0.006072998046875, 0.008322715759277344, 0.010572433471679688, 0.012822151184082031, 0.015071868896484375, 0.01732158660888672, 0.019571304321289062, 0.021821022033691406, 0.02407073974609375, 0.026320457458496094, 0.028570175170898438, 0.03081989288330078, 0.033069610595703125, 0.03531932830810547, 0.03756904602050781, 0.039818763732910156, 0.0420684814453125, 0.044318199157714844, 0.04656791687011719, 0.04881763458251953, 0.051067352294921875, 0.05331707000732422, 0.05556678771972656, 0.057816505432128906, 0.06006622314453125, 0.062315940856933594, 0.06456565856933594, 0.06681537628173828, 0.06906509399414062, 0.07131481170654297, 0.07356452941894531, 0.07581424713134766, 0.07806396484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 14.0, 5.0, 10.0, 17.0, 14.0, 15.0, 15.0, 23.0, 32.0, 33.0, 37.0, 32.0, 38.0, 46.0, 42.0, 35.0, 40.0, 40.0, 49.0, 40.0, 48.0, 43.0, 39.0, 39.0, 36.0, 44.0, 29.0, 29.0, 17.0, 23.0, 20.0, 15.0, 5.0, 11.0, 7.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03887939453125, -0.037549495697021484, -0.03621959686279297, -0.03488969802856445, -0.03355979919433594, -0.03222990036010742, -0.030900001525878906, -0.02957010269165039, -0.028240203857421875, -0.02691030502319336, -0.025580406188964844, -0.024250507354736328, -0.022920608520507812, -0.021590709686279297, -0.02026081085205078, -0.018930912017822266, -0.01760101318359375, -0.016271114349365234, -0.014941215515136719, -0.013611316680908203, -0.012281417846679688, -0.010951519012451172, -0.009621620178222656, -0.00829172134399414, -0.006961822509765625, -0.005631923675537109, -0.004302024841308594, -0.002972126007080078, -0.0016422271728515625, -0.0003123283386230469, 0.0010175704956054688, 0.0023474693298339844, 0.0036773681640625, 0.005007266998291016, 0.006337165832519531, 0.007667064666748047, 0.008996963500976562, 0.010326862335205078, 0.011656761169433594, 0.01298666000366211, 0.014316558837890625, 0.01564645767211914, 0.016976356506347656, 0.018306255340576172, 0.019636154174804688, 0.020966053009033203, 0.02229595184326172, 0.023625850677490234, 0.02495574951171875, 0.026285648345947266, 0.02761554718017578, 0.028945446014404297, 0.030275344848632812, 0.03160524368286133, 0.032935142517089844, 0.03426504135131836, 0.035594940185546875, 0.03692483901977539, 0.038254737854003906, 0.03958463668823242, 0.04091453552246094, 0.04224443435668945, 0.04357433319091797, 0.044904232025146484, 0.046234130859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 7.0, 10.0, 22.0, 23.0, 26.0, 45.0, 89.0, 143.0, 263.0, 568.0, 1155.0, 3796.0, 18942.0, 659567.0, 344516.0, 14327.0, 2885.0, 1094.0, 495.0, 209.0, 140.0, 68.0, 51.0, 31.0, 21.0, 17.0, 5.0, 15.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7894973754882812e-05, -2.713967114686966e-05, -2.6384368538856506e-05, -2.5629065930843353e-05, -2.48737633228302e-05, -2.4118460714817047e-05, -2.3363158106803894e-05, -2.260785549879074e-05, -2.1852552890777588e-05, -2.1097250282764435e-05, -2.0341947674751282e-05, -1.958664506673813e-05, -1.8831342458724976e-05, -1.8076039850711823e-05, -1.732073724269867e-05, -1.6565434634685516e-05, -1.5810132026672363e-05, -1.505482941865921e-05, -1.4299526810646057e-05, -1.3544224202632904e-05, -1.2788921594619751e-05, -1.2033618986606598e-05, -1.1278316378593445e-05, -1.0523013770580292e-05, -9.767711162567139e-06, -9.012408554553986e-06, -8.257105946540833e-06, -7.5018033385276794e-06, -6.746500730514526e-06, -5.991198122501373e-06, -5.23589551448822e-06, -4.480592906475067e-06, -3.725290298461914e-06, -2.969987690448761e-06, -2.214685082435608e-06, -1.4593824744224548e-06, -7.040798664093018e-07, 5.122274160385132e-08, 8.065253496170044e-07, 1.5618279576301575e-06, 2.3171305656433105e-06, 3.0724331736564636e-06, 3.827735781669617e-06, 4.58303838968277e-06, 5.338340997695923e-06, 6.093643605709076e-06, 6.848946213722229e-06, 7.604248821735382e-06, 8.359551429748535e-06, 9.114854037761688e-06, 9.870156645774841e-06, 1.0625459253787994e-05, 1.1380761861801147e-05, 1.21360644698143e-05, 1.2891367077827454e-05, 1.3646669685840607e-05, 1.440197229385376e-05, 1.5157274901866913e-05, 1.5912577509880066e-05, 1.666788011789322e-05, 1.7423182725906372e-05, 1.8178485333919525e-05, 1.8933787941932678e-05, 1.968909054994583e-05, 2.0444393157958984e-05]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 8.0, 7.0, 5.0, 12.0, 15.0, 16.0, 27.0, 22.0, 29.0, 39.0, 58.0, 73.0, 63.0, 59.0, 80.0, 84.0, 72.0, 61.0, 61.0, 46.0, 40.0, 24.0, 9.0, 18.0, 11.0, 10.0, 8.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.887580871582031e-06, -4.715286195278168e-06, -4.542991518974304e-06, -4.370696842670441e-06, -4.198402166366577e-06, -4.026107490062714e-06, -3.85381281375885e-06, -3.6815181374549866e-06, -3.509223461151123e-06, -3.3369287848472595e-06, -3.164634108543396e-06, -2.9923394322395325e-06, -2.820044755935669e-06, -2.6477500796318054e-06, -2.475455403327942e-06, -2.3031607270240784e-06, -2.130866050720215e-06, -1.9585713744163513e-06, -1.7862766981124878e-06, -1.6139820218086243e-06, -1.4416873455047607e-06, -1.2693926692008972e-06, -1.0970979928970337e-06, -9.248033165931702e-07, -7.525086402893066e-07, -5.802139639854431e-07, -4.079192876815796e-07, -2.3562461137771606e-07, -6.332993507385254e-08, 1.0896474123001099e-07, 2.812594175338745e-07, 4.5355409383773804e-07, 6.258487701416016e-07, 7.981434464454651e-07, 9.704381227493286e-07, 1.1427327990531921e-06, 1.3150274753570557e-06, 1.4873221516609192e-06, 1.6596168279647827e-06, 1.8319115042686462e-06, 2.0042061805725098e-06, 2.1765008568763733e-06, 2.348795533180237e-06, 2.5210902094841003e-06, 2.693384885787964e-06, 2.8656795620918274e-06, 3.037974238395691e-06, 3.2102689146995544e-06, 3.382563591003418e-06, 3.5548582673072815e-06, 3.727152943611145e-06, 3.8994476199150085e-06, 4.071742296218872e-06, 4.244036972522736e-06, 4.416331648826599e-06, 4.588626325130463e-06, 4.760921001434326e-06, 4.93321567773819e-06, 5.105510354042053e-06, 5.277805030345917e-06, 5.45009970664978e-06, 5.622394382953644e-06, 5.794689059257507e-06, 5.966983735561371e-06, 6.139278411865234e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 9.0, 16.0, 21.0, 35.0, 55.0, 120.0, 310.0, 1482.0, 1035415.0, 10124.0, 571.0, 163.0, 97.0, 46.0, 26.0, 15.0, 9.0, 10.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.053945541381836e-05, -8.793268352746964e-05, -8.532591164112091e-05, -8.271913975477219e-05, -8.011236786842346e-05, -7.750559598207474e-05, -7.489882409572601e-05, -7.229205220937729e-05, -6.968528032302856e-05, -6.707850843667984e-05, -6.447173655033112e-05, -6.186496466398239e-05, -5.925819277763367e-05, -5.665142089128494e-05, -5.404464900493622e-05, -5.1437877118587494e-05, -4.883110523223877e-05, -4.6224333345890045e-05, -4.361756145954132e-05, -4.1010789573192596e-05, -3.840401768684387e-05, -3.579724580049515e-05, -3.319047391414642e-05, -3.05837020277977e-05, -2.7976930141448975e-05, -2.537015825510025e-05, -2.2763386368751526e-05, -2.01566144824028e-05, -1.7549842596054077e-05, -1.4943070709705353e-05, -1.2336298823356628e-05, -9.729526937007904e-06, -7.12275505065918e-06, -4.515983164310455e-06, -1.909211277961731e-06, 6.975606083869934e-07, 3.3043324947357178e-06, 5.911104381084442e-06, 8.517876267433167e-06, 1.1124648153781891e-05, 1.3731420040130615e-05, 1.633819192647934e-05, 1.8944963812828064e-05, 2.155173569917679e-05, 2.4158507585525513e-05, 2.6765279471874237e-05, 2.937205135822296e-05, 3.1978823244571686e-05, 3.458559513092041e-05, 3.7192367017269135e-05, 3.979913890361786e-05, 4.240591078996658e-05, 4.501268267631531e-05, 4.761945456266403e-05, 5.0226226449012756e-05, 5.283299833536148e-05, 5.5439770221710205e-05, 5.804654210805893e-05, 6.0653313994407654e-05, 6.326008588075638e-05, 6.58668577671051e-05, 6.847362965345383e-05, 7.108040153980255e-05, 7.368717342615128e-05, 7.62939453125e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 6.0, 7.0, 6.0, 15.0, 21.0, 27.0, 41.0, 106.0, 183.0, 349.0, 95.0, 54.0, 32.0, 22.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-05, -5.223974585533142e-05, -5.083531141281128e-05, -4.943087697029114e-05, -4.8026442527770996e-05, -4.6622008085250854e-05, -4.521757364273071e-05, -4.381313920021057e-05, -4.240870475769043e-05, -4.100427031517029e-05, -3.9599835872650146e-05, -3.8195401430130005e-05, -3.679096698760986e-05, -3.538653254508972e-05, -3.398209810256958e-05, -3.257766366004944e-05, -3.11732292175293e-05, -2.9768794775009155e-05, -2.8364360332489014e-05, -2.6959925889968872e-05, -2.555549144744873e-05, -2.415105700492859e-05, -2.2746622562408447e-05, -2.1342188119888306e-05, -1.9937753677368164e-05, -1.8533319234848022e-05, -1.712888479232788e-05, -1.572445034980774e-05, -1.4320015907287598e-05, -1.2915581464767456e-05, -1.1511147022247314e-05, -1.0106712579727173e-05, -8.702278137207031e-06, -7.29784369468689e-06, -5.893409252166748e-06, -4.4889748096466064e-06, -3.084540367126465e-06, -1.6801059246063232e-06, -2.7567148208618164e-07, 1.12876296043396e-06, 2.5331974029541016e-06, 3.937631845474243e-06, 5.342066287994385e-06, 6.746500730514526e-06, 8.150935173034668e-06, 9.55536961555481e-06, 1.0959804058074951e-05, 1.2364238500595093e-05, 1.3768672943115234e-05, 1.5173107385635376e-05, 1.6577541828155518e-05, 1.798197627067566e-05, 1.93864107131958e-05, 2.0790845155715942e-05, 2.2195279598236084e-05, 2.3599714040756226e-05, 2.5004148483276367e-05, 2.640858292579651e-05, 2.781301736831665e-05, 2.9217451810836792e-05, 3.0621886253356934e-05, 3.2026320695877075e-05, 3.343075513839722e-05, 3.483518958091736e-05, 3.62396240234375e-05]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 89.0, 820.0, 81.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5508574843406677, -0.5394999980926514, -0.528142511844635, -0.5167850852012634, -0.5054275989532471, -0.4940701127052307, -0.48271262645721436, -0.4713551700115204, -0.45999768376350403, -0.44864019751548767, -0.4372827410697937, -0.42592525482177734, -0.4145677983760834, -0.403210312128067, -0.39185285568237305, -0.3804953694343567, -0.36913788318634033, -0.357780396938324, -0.34642294049263, -0.33506545424461365, -0.3237079977989197, -0.3123505115509033, -0.30099302530288696, -0.289635568857193, -0.278278112411499, -0.26692062616348267, -0.2555631697177887, -0.24420568346977234, -0.23284821212291718, -0.221490740776062, -0.21013326942920685, -0.19877579808235168, -0.18741831183433533, -0.17606084048748016, -0.164703369140625, -0.15334588289260864, -0.14198841154575348, -0.13063094019889832, -0.11927346885204315, -0.10791599005460739, -0.09655851870775223, -0.08520104736089706, -0.0738435685634613, -0.06248609721660614, -0.05112862214446068, -0.039771147072315216, -0.028413675725460052, -0.017056196928024292, -0.005698725581169128, 0.005658748559653759, 0.017016222700476646, 0.02837369590997696, 0.03973117098212242, 0.05108864605426788, 0.06244611740112305, 0.07380359619855881, 0.08516106754541397, 0.09651853889226913, 0.1078760176897049, 0.11923348903656006, 0.13059096038341522, 0.14194843173027039, 0.15330591797828674, 0.1646633893251419, 0.17602086067199707]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 8.0, 10.0, 7.0, 12.0, 19.0, 22.0, 28.0, 23.0, 32.0, 36.0, 35.0, 51.0, 50.0, 51.0, 61.0, 62.0, 53.0, 55.0, 38.0, 50.0, 59.0, 43.0, 34.0, 32.0, 29.0, 16.0, 14.0, 16.0, 16.0, 13.0, 4.0, 10.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.24950659275054932, -0.24082477390766144, -0.23214295506477356, -0.22346115112304688, -0.214779332280159, -0.20609751343727112, -0.19741569459438324, -0.18873387575149536, -0.18005207180976868, -0.1713702529668808, -0.16268843412399292, -0.15400663018226624, -0.14532481133937836, -0.13664299249649048, -0.1279611736536026, -0.11927935481071472, -0.11059753596782684, -0.10191571712493896, -0.09323390573263168, -0.0845520868897438, -0.07587027549743652, -0.06718845665454865, -0.05850663781166077, -0.04982482269406319, -0.04114300757646561, -0.03246119245886803, -0.023779375478625298, -0.015097558498382568, -0.006415743380784988, 0.0022660717368125916, 0.01094789057970047, 0.01962970569729805, 0.02831152081489563, 0.03699333593249321, 0.04567515105009079, 0.05435696989297867, 0.06303878128528595, 0.07172060012817383, 0.0804024189710617, 0.08908423781394958, 0.09776604920625687, 0.10644786804914474, 0.11512967944145203, 0.1238114982843399, 0.13249331712722778, 0.14117512106895447, 0.14985695481300354, 0.15853875875473022, 0.1672205775976181, 0.17590239644050598, 0.18458421528339386, 0.19326603412628174, 0.20194783806800842, 0.2106296569108963, 0.21931147575378418, 0.22799329459667206, 0.23667511343955994, 0.24535693228244781, 0.2540387511253357, 0.2627205550670624, 0.27140238881111145, 0.28008419275283813, 0.2887660264968872, 0.2974478304386139, 0.3061296343803406]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 10.0, 4.0, 12.0, 15.0, 21.0, 27.0, 41.0, 53.0, 133.0, 1210.0, 4083624.0, 106961.0, 1681.0, 276.0, 59.0, 43.0, 21.0, 20.0, 16.0, 6.0, 4.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0408935546875, -0.03968954086303711, -0.03848552703857422, -0.03728151321411133, -0.03607749938964844, -0.03487348556518555, -0.033669471740722656, -0.032465457916259766, -0.031261444091796875, -0.030057430267333984, -0.028853416442871094, -0.027649402618408203, -0.026445388793945312, -0.025241374969482422, -0.02403736114501953, -0.02283334732055664, -0.02162933349609375, -0.02042531967163086, -0.01922130584716797, -0.018017292022705078, -0.016813278198242188, -0.015609264373779297, -0.014405250549316406, -0.013201236724853516, -0.011997222900390625, -0.010793209075927734, -0.009589195251464844, -0.008385181427001953, -0.0071811676025390625, -0.005977153778076172, -0.004773139953613281, -0.0035691261291503906, -0.0023651123046875, -0.0011610984802246094, 4.291534423828125e-05, 0.0012469291687011719, 0.0024509429931640625, 0.003654956817626953, 0.004858970642089844, 0.006062984466552734, 0.007266998291015625, 0.008471012115478516, 0.009675025939941406, 0.010879039764404297, 0.012083053588867188, 0.013287067413330078, 0.014491081237792969, 0.01569509506225586, 0.01689910888671875, 0.01810312271118164, 0.01930713653564453, 0.020511150360107422, 0.021715164184570312, 0.022919178009033203, 0.024123191833496094, 0.025327205657958984, 0.026531219482421875, 0.027735233306884766, 0.028939247131347656, 0.030143260955810547, 0.03134727478027344, 0.03255128860473633, 0.03375530242919922, 0.03495931625366211, 0.036163330078125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 5.0, 8.0, 12.0, 6.0, 14.0, 15.0, 26.0, 68.0, 217.0, 305.0, 154.0, 59.0, 20.0, 11.0, 12.0, 7.0, 9.0, 6.0, 4.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016326904296875, -0.01584911346435547, -0.015371322631835938, -0.014893531799316406, -0.014415740966796875, -0.013937950134277344, -0.013460159301757812, -0.012982368469238281, -0.01250457763671875, -0.012026786804199219, -0.011548995971679688, -0.011071205139160156, -0.010593414306640625, -0.010115623474121094, -0.009637832641601562, -0.009160041809082031, -0.0086822509765625, -0.008204460144042969, -0.0077266693115234375, -0.007248878479003906, -0.006771087646484375, -0.006293296813964844, -0.0058155059814453125, -0.005337715148925781, -0.00485992431640625, -0.004382133483886719, -0.0039043426513671875, -0.0034265518188476562, -0.002948760986328125, -0.0024709701538085938, -0.0019931793212890625, -0.0015153884887695312, -0.00103759765625, -0.0005598068237304688, -8.20159912109375e-05, 0.00039577484130859375, 0.000873565673828125, 0.0013513565063476562, 0.0018291473388671875, 0.0023069381713867188, 0.00278472900390625, 0.0032625198364257812, 0.0037403106689453125, 0.004218101501464844, 0.004695892333984375, 0.005173683166503906, 0.0056514739990234375, 0.006129264831542969, 0.0066070556640625, 0.007084846496582031, 0.0075626373291015625, 0.008040428161621094, 0.008518218994140625, 0.008996009826660156, 0.009473800659179688, 0.009951591491699219, 0.01042938232421875, 0.010907173156738281, 0.011384963989257812, 0.011862754821777344, 0.012340545654296875, 0.012818336486816406, 0.013296127319335938, 0.013773918151855469, 0.014251708984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 12.0, 16.0, 29.0, 45.0, 133.0, 386.0, 1930.0, 301145.0, 3887901.0, 2045.0, 378.0, 134.0, 40.0, 24.0, 14.0, 15.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02783203125, -0.02683877944946289, -0.02584552764892578, -0.024852275848388672, -0.023859024047851562, -0.022865772247314453, -0.021872520446777344, -0.020879268646240234, -0.019886016845703125, -0.018892765045166016, -0.017899513244628906, -0.016906261444091797, -0.015913009643554688, -0.014919757843017578, -0.013926506042480469, -0.01293325424194336, -0.01194000244140625, -0.01094675064086914, -0.009953498840332031, -0.008960247039794922, -0.007966995239257812, -0.006973743438720703, -0.005980491638183594, -0.004987239837646484, -0.003993988037109375, -0.0030007362365722656, -0.0020074844360351562, -0.0010142326354980469, -2.09808349609375e-05, 0.0009722709655761719, 0.0019655227661132812, 0.0029587745666503906, 0.0039520263671875, 0.004945278167724609, 0.005938529968261719, 0.006931781768798828, 0.007925033569335938, 0.008918285369873047, 0.009911537170410156, 0.010904788970947266, 0.011898040771484375, 0.012891292572021484, 0.013884544372558594, 0.014877796173095703, 0.015871047973632812, 0.016864299774169922, 0.01785755157470703, 0.01885080337524414, 0.01984405517578125, 0.02083730697631836, 0.02183055877685547, 0.022823810577392578, 0.023817062377929688, 0.024810314178466797, 0.025803565979003906, 0.026796817779541016, 0.027790069580078125, 0.028783321380615234, 0.029776573181152344, 0.030769824981689453, 0.03176307678222656, 0.03275632858276367, 0.03374958038330078, 0.03474283218383789, 0.035736083984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 6.0, 26.0, 42.0, 111.0, 857.0, 2865.0, 86.0, 37.0, 15.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01180267333984375, -0.011475205421447754, -0.011147737503051758, -0.010820269584655762, -0.010492801666259766, -0.01016533374786377, -0.009837865829467773, -0.009510397911071777, -0.009182929992675781, -0.008855462074279785, -0.008527994155883789, -0.008200526237487793, -0.007873058319091797, -0.007545590400695801, -0.007218122482299805, -0.006890654563903809, -0.0065631866455078125, -0.006235718727111816, -0.00590825080871582, -0.005580782890319824, -0.005253314971923828, -0.004925847053527832, -0.004598379135131836, -0.00427091121673584, -0.003943443298339844, -0.0036159753799438477, -0.0032885074615478516, -0.0029610395431518555, -0.0026335716247558594, -0.0023061037063598633, -0.001978635787963867, -0.001651167869567871, -0.001323699951171875, -0.000996232032775879, -0.0006687641143798828, -0.0003412961959838867, -1.3828277587890625e-05, 0.00031363964080810547, 0.0006411075592041016, 0.0009685754776000977, 0.0012960433959960938, 0.0016235113143920898, 0.001950979232788086, 0.002278447151184082, 0.002605915069580078, 0.0029333829879760742, 0.0032608509063720703, 0.0035883188247680664, 0.0039157867431640625, 0.004243254661560059, 0.004570722579956055, 0.004898190498352051, 0.005225658416748047, 0.005553126335144043, 0.005880594253540039, 0.006208062171936035, 0.006535530090332031, 0.006862998008728027, 0.0071904659271240234, 0.0075179338455200195, 0.007845401763916016, 0.008172869682312012, 0.008500337600708008, 0.008827805519104004, 0.0091552734375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 1003.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13570308685302734, -0.1322835385799408, -0.12886397540569305, -0.1254444122314453, -0.12202486395835876, -0.11860530823469162, -0.11518575251102448, -0.11176619678735733, -0.10834664106369019, -0.10492708534002304, -0.1015075296163559, -0.09808797389268875, -0.0946684181690216, -0.09124886244535446, -0.08782930672168732, -0.08440975099802017, -0.08099019527435303, -0.07757063955068588, -0.07415108382701874, -0.07073152810335159, -0.06731197237968445, -0.0638924166560173, -0.06047286093235016, -0.057053305208683014, -0.05363374948501587, -0.050214193761348724, -0.04679463803768158, -0.043375082314014435, -0.03995552659034729, -0.036535970866680145, -0.033116415143013, -0.029696859419345856, -0.02627730369567871, -0.022857747972011566, -0.01943819224834442, -0.016018636524677277, -0.012599080801010132, -0.009179525077342987, -0.005759969353675842, -0.0023404136300086975, 0.0010791420936584473, 0.004498697817325592, 0.007918253540992737, 0.011337809264659882, 0.014757364988327026, 0.01817692071199417, 0.021596476435661316, 0.02501603215932846, 0.028435587882995605, 0.03185514360666275, 0.035274699330329895, 0.03869425505399704, 0.042113810777664185, 0.04553336650133133, 0.048952922224998474, 0.05237247794866562, 0.055792033672332764, 0.05921158939599991, 0.06263114511966705, 0.0660507008433342, 0.06947025656700134, 0.07288981229066849, 0.07630936801433563, 0.07972892373800278, 0.08314847946166992]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 1.0, 7.0, 16.0, 9.0, 12.0, 21.0, 21.0, 20.0, 22.0, 22.0, 30.0, 30.0, 33.0, 43.0, 51.0, 54.0, 52.0, 42.0, 47.0, 53.0, 26.0, 50.0, 42.0, 46.0, 36.0, 31.0, 31.0, 23.0, 24.0, 19.0, 23.0, 18.0, 13.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.01308673620223999, -0.012709271162748337, -0.012331806123256683, -0.01195434108376503, -0.011576876044273376, -0.011199411004781723, -0.01082194596529007, -0.010444480925798416, -0.010067015886306763, -0.00968955084681511, -0.009312085807323456, -0.008934620767831802, -0.008557155728340149, -0.008179690688848495, -0.007802225649356842, -0.007424760609865189, -0.007047295570373535, -0.006669830530881882, -0.006292365491390228, -0.005914900451898575, -0.005537435412406921, -0.005159970372915268, -0.0047825053334236145, -0.004405040293931961, -0.004027575254440308, -0.003650110214948654, -0.0032726451754570007, -0.0028951801359653473, -0.002517715096473694, -0.0021402500569820404, -0.001762785017490387, -0.0013853199779987335, -0.00100785493850708, -0.0006303898990154266, -0.0002529248595237732, 0.00012454017996788025, 0.0005020052194595337, 0.0008794702589511871, 0.0012569352984428406, 0.001634400337934494, 0.0020118653774261475, 0.002389330416917801, 0.0027667954564094543, 0.003144260495901108, 0.0035217255353927612, 0.0038991905748844147, 0.004276655614376068, 0.0046541206538677216, 0.005031585693359375, 0.0054090507328510284, 0.005786515772342682, 0.006163980811834335, 0.006541445851325989, 0.006918910890817642, 0.007296375930309296, 0.007673840969800949, 0.008051306009292603, 0.008428771048784256, 0.00880623608827591, 0.009183701127767563, 0.009561166167259216, 0.00993863120675087, 0.010316096246242523, 0.010693561285734177, 0.01107102632522583]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 8.0, 14.0, 14.0, 18.0, 26.0, 26.0, 47.0, 42.0, 76.0, 106.0, 146.0, 241.0, 351.0, 671.0, 1092.0, 2397.0, 5585.0, 16761.0, 184244.0, 801738.0, 21766.0, 6990.0, 2888.0, 1323.0, 717.0, 416.0, 225.0, 152.0, 103.0, 86.0, 67.0, 46.0, 28.0, 25.0, 16.0, 17.0, 15.0, 10.0, 8.0, 11.0, 5.0, 4.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.0299530029296875, -0.029074668884277344, -0.028196334838867188, -0.02731800079345703, -0.026439666748046875, -0.02556133270263672, -0.024682998657226562, -0.023804664611816406, -0.02292633056640625, -0.022047996520996094, -0.021169662475585938, -0.02029132843017578, -0.019412994384765625, -0.01853466033935547, -0.017656326293945312, -0.016777992248535156, -0.015899658203125, -0.015021324157714844, -0.014142990112304688, -0.013264656066894531, -0.012386322021484375, -0.011507987976074219, -0.010629653930664062, -0.009751319885253906, -0.00887298583984375, -0.007994651794433594, -0.0071163177490234375, -0.006237983703613281, -0.005359649658203125, -0.004481315612792969, -0.0036029815673828125, -0.0027246475219726562, -0.0018463134765625, -0.0009679794311523438, -8.96453857421875e-05, 0.0007886886596679688, 0.001667022705078125, 0.0025453567504882812, 0.0034236907958984375, 0.004302024841308594, 0.00518035888671875, 0.006058692932128906, 0.0069370269775390625, 0.007815361022949219, 0.008693695068359375, 0.009572029113769531, 0.010450363159179688, 0.011328697204589844, 0.01220703125, 0.013085365295410156, 0.013963699340820312, 0.014842033386230469, 0.015720367431640625, 0.01659870147705078, 0.017477035522460938, 0.018355369567871094, 0.01923370361328125, 0.020112037658691406, 0.020990371704101562, 0.02186870574951172, 0.022747039794921875, 0.02362537384033203, 0.024503707885742188, 0.025382041931152344, 0.0262603759765625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 12.0, 6.0, 14.0, 15.0, 29.0, 70.0, 217.0, 303.0, 154.0, 56.0, 20.0, 11.0, 12.0, 9.0, 8.0, 5.0, 4.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016326904296875, -0.015848755836486816, -0.015370607376098633, -0.01489245891571045, -0.014414310455322266, -0.013936161994934082, -0.013458013534545898, -0.012979865074157715, -0.012501716613769531, -0.012023568153381348, -0.011545419692993164, -0.01106727123260498, -0.010589122772216797, -0.010110974311828613, -0.00963282585144043, -0.009154677391052246, -0.008676528930664062, -0.008198380470275879, -0.007720232009887695, -0.007242083549499512, -0.006763935089111328, -0.0062857866287231445, -0.005807638168334961, -0.005329489707946777, -0.004851341247558594, -0.00437319278717041, -0.0038950443267822266, -0.003416895866394043, -0.0029387474060058594, -0.0024605989456176758, -0.001982450485229492, -0.0015043020248413086, -0.001026153564453125, -0.0005480051040649414, -6.985664367675781e-05, 0.0004082918167114258, 0.0008864402770996094, 0.001364588737487793, 0.0018427371978759766, 0.00232088565826416, 0.0027990341186523438, 0.0032771825790405273, 0.003755331039428711, 0.0042334794998168945, 0.004711627960205078, 0.005189776420593262, 0.005667924880981445, 0.006146073341369629, 0.0066242218017578125, 0.007102370262145996, 0.00758051872253418, 0.008058667182922363, 0.008536815643310547, 0.00901496410369873, 0.009493112564086914, 0.009971261024475098, 0.010449409484863281, 0.010927557945251465, 0.011405706405639648, 0.011883854866027832, 0.012362003326416016, 0.0128401517868042, 0.013318300247192383, 0.013796448707580566, 0.01427459716796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 2.0, 4.0, 7.0, 13.0, 16.0, 10.0, 18.0, 22.0, 19.0, 29.0, 53.0, 46.0, 56.0, 58.0, 78.0, 107.0, 137.0, 196.0, 309.0, 520.0, 884.0, 2257.0, 27001.0, 998030.0, 14325.0, 1937.0, 836.0, 421.0, 283.0, 191.0, 146.0, 105.0, 99.0, 68.0, 66.0, 35.0, 31.0, 26.0, 27.0, 23.0, 17.0, 7.0, 7.0, 9.0, 3.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.0634765625, -0.061632633209228516, -0.05978870391845703, -0.05794477462768555, -0.05610084533691406, -0.05425691604614258, -0.052412986755371094, -0.05056905746459961, -0.048725128173828125, -0.04688119888305664, -0.045037269592285156, -0.04319334030151367, -0.04134941101074219, -0.0395054817199707, -0.03766155242919922, -0.035817623138427734, -0.03397369384765625, -0.032129764556884766, -0.03028583526611328, -0.028441905975341797, -0.026597976684570312, -0.024754047393798828, -0.022910118103027344, -0.02106618881225586, -0.019222259521484375, -0.01737833023071289, -0.015534400939941406, -0.013690471649169922, -0.011846542358398438, -0.010002613067626953, -0.008158683776855469, -0.006314754486083984, -0.0044708251953125, -0.0026268959045410156, -0.0007829666137695312, 0.0010609626770019531, 0.0029048919677734375, 0.004748821258544922, 0.006592750549316406, 0.00843667984008789, 0.010280609130859375, 0.01212453842163086, 0.013968467712402344, 0.015812397003173828, 0.017656326293945312, 0.019500255584716797, 0.02134418487548828, 0.023188114166259766, 0.02503204345703125, 0.026875972747802734, 0.02871990203857422, 0.030563831329345703, 0.03240776062011719, 0.03425168991088867, 0.036095619201660156, 0.03793954849243164, 0.039783477783203125, 0.04162740707397461, 0.043471336364746094, 0.04531526565551758, 0.04715919494628906, 0.04900312423706055, 0.05084705352783203, 0.052690982818603516, 0.054534912109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 8.0, 10.0, 9.0, 11.0, 15.0, 24.0, 28.0, 24.0, 32.0, 26.0, 33.0, 30.0, 31.0, 33.0, 38.0, 36.0, 34.0, 33.0, 32.0, 41.0, 52.0, 33.0, 32.0, 43.0, 44.0, 34.0, 31.0, 33.0, 26.0, 19.0, 13.0, 13.0, 13.0, 12.0, 17.0, 6.0, 5.0, 4.0, 6.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0], "bins": [-0.038299560546875, -0.03719615936279297, -0.03609275817871094, -0.034989356994628906, -0.033885955810546875, -0.032782554626464844, -0.03167915344238281, -0.03057575225830078, -0.02947235107421875, -0.02836894989013672, -0.027265548706054688, -0.026162147521972656, -0.025058746337890625, -0.023955345153808594, -0.022851943969726562, -0.02174854278564453, -0.0206451416015625, -0.01954174041748047, -0.018438339233398438, -0.017334938049316406, -0.016231536865234375, -0.015128135681152344, -0.014024734497070312, -0.012921333312988281, -0.01181793212890625, -0.010714530944824219, -0.009611129760742188, -0.008507728576660156, -0.007404327392578125, -0.006300926208496094, -0.0051975250244140625, -0.004094123840332031, -0.00299072265625, -0.0018873214721679688, -0.0007839202880859375, 0.00031948089599609375, 0.001422882080078125, 0.0025262832641601562, 0.0036296844482421875, 0.004733085632324219, 0.00583648681640625, 0.006939888000488281, 0.008043289184570312, 0.009146690368652344, 0.010250091552734375, 0.011353492736816406, 0.012456893920898438, 0.013560295104980469, 0.0146636962890625, 0.01576709747314453, 0.016870498657226562, 0.017973899841308594, 0.019077301025390625, 0.020180702209472656, 0.021284103393554688, 0.02238750457763672, 0.02349090576171875, 0.02459430694580078, 0.025697708129882812, 0.026801109313964844, 0.027904510498046875, 0.029007911682128906, 0.030111312866210938, 0.03121471405029297, 0.032318115234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 2.0, 6.0, 5.0, 3.0, 7.0, 9.0, 14.0, 31.0, 20.0, 31.0, 43.0, 65.0, 69.0, 116.0, 207.0, 429.0, 822.0, 2213.0, 6711.0, 35288.0, 881223.0, 102644.0, 13276.0, 2890.0, 1232.0, 483.0, 264.0, 123.0, 91.0, 46.0, 46.0, 29.0, 31.0, 22.0, 18.0, 18.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4543533325195312e-05, -1.4098361134529114e-05, -1.3653188943862915e-05, -1.3208016753196716e-05, -1.2762844562530518e-05, -1.2317672371864319e-05, -1.187250018119812e-05, -1.1427327990531921e-05, -1.0982155799865723e-05, -1.0536983609199524e-05, -1.0091811418533325e-05, -9.646639227867126e-06, -9.201467037200928e-06, -8.756294846534729e-06, -8.31112265586853e-06, -7.865950465202332e-06, -7.420778274536133e-06, -6.975606083869934e-06, -6.530433893203735e-06, -6.085261702537537e-06, -5.640089511871338e-06, -5.194917321205139e-06, -4.7497451305389404e-06, -4.304572939872742e-06, -3.859400749206543e-06, -3.4142285585403442e-06, -2.9690563678741455e-06, -2.5238841772079468e-06, -2.078711986541748e-06, -1.6335397958755493e-06, -1.1883676052093506e-06, -7.431954145431519e-07, -2.980232238769531e-07, 1.471489667892456e-07, 5.923211574554443e-07, 1.037493348121643e-06, 1.4826655387878418e-06, 1.9278377294540405e-06, 2.3730099201202393e-06, 2.818182110786438e-06, 3.2633543014526367e-06, 3.7085264921188354e-06, 4.153698682785034e-06, 4.598870873451233e-06, 5.044043064117432e-06, 5.48921525478363e-06, 5.934387445449829e-06, 6.379559636116028e-06, 6.8247318267822266e-06, 7.269904017448425e-06, 7.715076208114624e-06, 8.160248398780823e-06, 8.605420589447021e-06, 9.05059278011322e-06, 9.495764970779419e-06, 9.940937161445618e-06, 1.0386109352111816e-05, 1.0831281542778015e-05, 1.1276453733444214e-05, 1.1721625924110413e-05, 1.2166798114776611e-05, 1.261197030544281e-05, 1.3057142496109009e-05, 1.3502314686775208e-05, 1.3947486877441406e-05]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 6.0, 3.0, 4.0, 8.0, 11.0, 20.0, 15.0, 12.0, 14.0, 33.0, 43.0, 33.0, 74.0, 68.0, 78.0, 97.0, 59.0, 71.0, 73.0, 62.0, 36.0, 30.0, 38.0, 13.0, 19.0, 5.0, 15.0, 11.0, 6.0, 10.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.046627044677734e-06, -7.821246981620789e-06, -7.595866918563843e-06, -7.370486855506897e-06, -7.145106792449951e-06, -6.919726729393005e-06, -6.6943466663360596e-06, -6.468966603279114e-06, -6.243586540222168e-06, -6.018206477165222e-06, -5.792826414108276e-06, -5.5674463510513306e-06, -5.342066287994385e-06, -5.116686224937439e-06, -4.891306161880493e-06, -4.665926098823547e-06, -4.4405460357666016e-06, -4.215165972709656e-06, -3.98978590965271e-06, -3.764405846595764e-06, -3.5390257835388184e-06, -3.3136457204818726e-06, -3.0882656574249268e-06, -2.862885594367981e-06, -2.637505531311035e-06, -2.4121254682540894e-06, -2.1867454051971436e-06, -1.9613653421401978e-06, -1.735985279083252e-06, -1.5106052160263062e-06, -1.2852251529693604e-06, -1.0598450899124146e-06, -8.344650268554688e-07, -6.09084963798523e-07, -3.8370490074157715e-07, -1.5832483768463135e-07, 6.705522537231445e-08, 2.9243528842926025e-07, 5.178153514862061e-07, 7.431954145431519e-07, 9.685754776000977e-07, 1.1939555406570435e-06, 1.4193356037139893e-06, 1.644715666770935e-06, 1.8700957298278809e-06, 2.0954757928848267e-06, 2.3208558559417725e-06, 2.5462359189987183e-06, 2.771615982055664e-06, 2.99699604511261e-06, 3.2223761081695557e-06, 3.4477561712265015e-06, 3.6731362342834473e-06, 3.898516297340393e-06, 4.123896360397339e-06, 4.349276423454285e-06, 4.5746564865112305e-06, 4.800036549568176e-06, 5.025416612625122e-06, 5.250796675682068e-06, 5.476176738739014e-06, 5.7015568017959595e-06, 5.926936864852905e-06, 6.152316927909851e-06, 6.377696990966797e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 5.0, 9.0, 9.0, 8.0, 19.0, 21.0, 30.0, 50.0, 82.0, 118.0, 254.0, 608.0, 4053.0, 1035415.0, 6541.0, 673.0, 241.0, 144.0, 84.0, 56.0, 24.0, 30.0, 16.0, 8.0, 11.0, 7.0, 7.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6312808990478516e-05, -4.4745393097400665e-05, -4.3177977204322815e-05, -4.1610561311244965e-05, -4.0043145418167114e-05, -3.8475729525089264e-05, -3.6908313632011414e-05, -3.534089773893356e-05, -3.377348184585571e-05, -3.220606595277786e-05, -3.063865005970001e-05, -2.9071234166622162e-05, -2.750381827354431e-05, -2.593640238046646e-05, -2.436898648738861e-05, -2.280157059431076e-05, -2.123415470123291e-05, -1.966673880815506e-05, -1.809932291507721e-05, -1.653190702199936e-05, -1.4964491128921509e-05, -1.3397075235843658e-05, -1.1829659342765808e-05, -1.0262243449687958e-05, -8.694827556610107e-06, -7.127411663532257e-06, -5.559995770454407e-06, -3.992579877376556e-06, -2.425163984298706e-06, -8.577480912208557e-07, 7.096678018569946e-07, 2.277083694934845e-06, 3.844499588012695e-06, 5.411915481090546e-06, 6.979331374168396e-06, 8.546747267246246e-06, 1.0114163160324097e-05, 1.1681579053401947e-05, 1.3248994946479797e-05, 1.4816410839557648e-05, 1.6383826732635498e-05, 1.795124262571335e-05, 1.95186585187912e-05, 2.108607441186905e-05, 2.26534903049469e-05, 2.422090619802475e-05, 2.57883220911026e-05, 2.735573798418045e-05, 2.89231538772583e-05, 3.049056977033615e-05, 3.2057985663414e-05, 3.362540155649185e-05, 3.51928174495697e-05, 3.676023334264755e-05, 3.83276492357254e-05, 3.989506512880325e-05, 4.1462481021881104e-05, 4.3029896914958954e-05, 4.4597312808036804e-05, 4.6164728701114655e-05, 4.7732144594192505e-05, 4.9299560487270355e-05, 5.0866976380348206e-05, 5.2434392273426056e-05, 5.4001808166503906e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 6.0, 9.0, 4.0, 13.0, 19.0, 23.0, 21.0, 42.0, 78.0, 123.0, 308.0, 119.0, 73.0, 30.0, 37.0, 24.0, 17.0, 12.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7835369110107422e-05, -2.6891008019447327e-05, -2.594664692878723e-05, -2.5002285838127136e-05, -2.405792474746704e-05, -2.3113563656806946e-05, -2.216920256614685e-05, -2.1224841475486755e-05, -2.028048038482666e-05, -1.9336119294166565e-05, -1.839175820350647e-05, -1.7447397112846375e-05, -1.650303602218628e-05, -1.5558674931526184e-05, -1.4614313840866089e-05, -1.3669952750205994e-05, -1.2725591659545898e-05, -1.1781230568885803e-05, -1.0836869478225708e-05, -9.892508387565613e-06, -8.948147296905518e-06, -8.003786206245422e-06, -7.059425115585327e-06, -6.115064024925232e-06, -5.170702934265137e-06, -4.2263418436050415e-06, -3.2819807529449463e-06, -2.337619662284851e-06, -1.3932585716247559e-06, -4.4889748096466064e-07, 4.954636096954346e-07, 1.4398247003555298e-06, 2.384185791015625e-06, 3.3285468816757202e-06, 4.2729079723358154e-06, 5.217269062995911e-06, 6.161630153656006e-06, 7.105991244316101e-06, 8.050352334976196e-06, 8.994713425636292e-06, 9.939074516296387e-06, 1.0883435606956482e-05, 1.1827796697616577e-05, 1.2772157788276672e-05, 1.3716518878936768e-05, 1.4660879969596863e-05, 1.5605241060256958e-05, 1.6549602150917053e-05, 1.749396324157715e-05, 1.8438324332237244e-05, 1.938268542289734e-05, 2.0327046513557434e-05, 2.127140760421753e-05, 2.2215768694877625e-05, 2.316012978553772e-05, 2.4104490876197815e-05, 2.504885196685791e-05, 2.5993213057518005e-05, 2.69375741481781e-05, 2.7881935238838196e-05, 2.882629632949829e-05, 2.9770657420158386e-05, 3.071501851081848e-05, 3.165937960147858e-05, 3.260374069213867e-05]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 398.0, 616.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.1275577545166016, -2.090240478515625, -2.0529232025146484, -2.015605926513672, -1.9782886505126953, -1.9409712553024292, -1.9036539793014526, -1.866336703300476, -1.8290194272994995, -1.791702151298523, -1.7543848752975464, -1.7170675992965698, -1.6797502040863037, -1.6424329280853271, -1.6051156520843506, -1.567798376083374, -1.5304811000823975, -1.493163824081421, -1.4558465480804443, -1.4185292720794678, -1.3812119960784912, -1.343894600868225, -1.3065773248672485, -1.269260048866272, -1.2319427728652954, -1.1946254968643188, -1.1573082208633423, -1.1199909448623657, -1.0826735496520996, -1.045356273651123, -1.0080389976501465, -0.9707217216491699, -0.9334044456481934, -0.8960871696472168, -0.8587698936462402, -0.8214525580406189, -0.7841352820396423, -0.7468180060386658, -0.7095006704330444, -0.6721833944320679, -0.6348661184310913, -0.5975488424301147, -0.5602315664291382, -0.5229142308235168, -0.4855969548225403, -0.4482796788215637, -0.41096237301826477, -0.3736450672149658, -0.33632776141166687, -0.2990104556083679, -0.26169317960739136, -0.2243758887052536, -0.18705859780311584, -0.1497413069009781, -0.11242401599884033, -0.07510671019554138, -0.03778943419456482, -0.000472143292427063, 0.03684514760971069, 0.07416243851184845, 0.1114797294139862, 0.14879702031612396, 0.18611431121826172, 0.22343161702156067, 0.26074889302253723]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 14.0, 8.0, 12.0, 12.0, 8.0, 11.0, 13.0, 12.0, 17.0, 25.0, 23.0, 33.0, 37.0, 32.0, 50.0, 46.0, 37.0, 37.0, 39.0, 45.0, 46.0, 51.0, 35.0, 42.0, 52.0, 33.0, 31.0, 30.0, 31.0, 34.0, 18.0, 18.0, 12.0, 12.0, 8.0, 12.0, 6.0, 5.0, 5.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21565335988998413, -0.20882388949394226, -0.2019944190979004, -0.19516494870185852, -0.18833547830581665, -0.18150600790977478, -0.1746765375137329, -0.16784706711769104, -0.16101759672164917, -0.1541881263256073, -0.14735865592956543, -0.14052918553352356, -0.1336997151374817, -0.12687024474143982, -0.12004077434539795, -0.11321130394935608, -0.10638183355331421, -0.09955236315727234, -0.09272289276123047, -0.0858934223651886, -0.07906395196914673, -0.07223448157310486, -0.06540501117706299, -0.05857554078102112, -0.05174607038497925, -0.04491659998893738, -0.03808712959289551, -0.03125765919685364, -0.024428188800811768, -0.017598718404769897, -0.010769248008728027, -0.003939777612686157, 0.002889692783355713, 0.009719163179397583, 0.016548633575439453, 0.023378103971481323, 0.030207574367523193, 0.037037044763565063, 0.043866515159606934, 0.050695985555648804, 0.057525455951690674, 0.06435492634773254, 0.07118439674377441, 0.07801386713981628, 0.08484333753585815, 0.09167280793190002, 0.0985022783279419, 0.10533174872398376, 0.11216121912002563, 0.1189906895160675, 0.12582015991210938, 0.13264963030815125, 0.13947910070419312, 0.14630857110023499, 0.15313804149627686, 0.15996751189231873, 0.1667969822883606, 0.17362645268440247, 0.18045592308044434, 0.1872853934764862, 0.19411486387252808, 0.20094433426856995, 0.20777380466461182, 0.2146032750606537, 0.22143274545669556]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 6.0, 3.0, 4.0, 8.0, 7.0, 9.0, 15.0, 23.0, 41.0, 95.0, 1123.0, 4192526.0, 225.0, 83.0, 27.0, 11.0, 12.0, 8.0, 9.0, 7.0, 3.0, 6.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21533203125, -0.2090435028076172, -0.20275497436523438, -0.19646644592285156, -0.19017791748046875, -0.18388938903808594, -0.17760086059570312, -0.1713123321533203, -0.1650238037109375, -0.1587352752685547, -0.15244674682617188, -0.14615821838378906, -0.13986968994140625, -0.13358116149902344, -0.12729263305664062, -0.12100410461425781, -0.114715576171875, -0.10842704772949219, -0.10213851928710938, -0.09584999084472656, -0.08956146240234375, -0.08327293395996094, -0.07698440551757812, -0.07069587707519531, -0.0644073486328125, -0.05811882019042969, -0.051830291748046875, -0.04554176330566406, -0.03925323486328125, -0.03296470642089844, -0.026676177978515625, -0.020387649536132812, -0.01409912109375, -0.0078105926513671875, -0.001522064208984375, 0.0047664642333984375, 0.01105499267578125, 0.017343521118164062, 0.023632049560546875, 0.029920578002929688, 0.0362091064453125, 0.04249763488769531, 0.048786163330078125, 0.05507469177246094, 0.06136322021484375, 0.06765174865722656, 0.07394027709960938, 0.08022880554199219, 0.086517333984375, 0.09280586242675781, 0.09909439086914062, 0.10538291931152344, 0.11167144775390625, 0.11795997619628906, 0.12424850463867188, 0.1305370330810547, 0.1368255615234375, 0.1431140899658203, 0.14940261840820312, 0.15569114685058594, 0.16197967529296875, 0.16826820373535156, 0.17455673217773438, 0.1808452606201172, 0.1871337890625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 2.0, 4.0, 7.0, 7.0, 10.0, 11.0, 16.0, 26.0, 59.0, 177.0, 301.0, 182.0, 82.0, 21.0, 13.0, 13.0, 7.0, 10.0, 8.0, 3.0, 6.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0161895751953125, -0.015718817710876465, -0.01524806022644043, -0.014777302742004395, -0.01430654525756836, -0.013835787773132324, -0.013365030288696289, -0.012894272804260254, -0.012423515319824219, -0.011952757835388184, -0.011482000350952148, -0.011011242866516113, -0.010540485382080078, -0.010069727897644043, -0.009598970413208008, -0.009128212928771973, -0.008657455444335938, -0.008186697959899902, -0.007715940475463867, -0.007245182991027832, -0.006774425506591797, -0.006303668022155762, -0.0058329105377197266, -0.005362153053283691, -0.004891395568847656, -0.004420638084411621, -0.003949880599975586, -0.0034791231155395508, -0.0030083656311035156, -0.0025376081466674805, -0.0020668506622314453, -0.0015960931777954102, -0.001125335693359375, -0.0006545782089233398, -0.0001838207244873047, 0.00028693675994873047, 0.0007576942443847656, 0.0012284517288208008, 0.001699209213256836, 0.002169966697692871, 0.0026407241821289062, 0.0031114816665649414, 0.0035822391510009766, 0.004052996635437012, 0.004523754119873047, 0.004994511604309082, 0.005465269088745117, 0.005936026573181152, 0.0064067840576171875, 0.006877541542053223, 0.007348299026489258, 0.007819056510925293, 0.008289813995361328, 0.008760571479797363, 0.009231328964233398, 0.009702086448669434, 0.010172843933105469, 0.010643601417541504, 0.011114358901977539, 0.011585116386413574, 0.01205587387084961, 0.012526631355285645, 0.01299738883972168, 0.013468146324157715, 0.01393890380859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 14.0, 17.0, 15.0, 77.0, 182.0, 737.0, 5616.0, 4179647.0, 6710.0, 841.0, 260.0, 81.0, 27.0, 22.0, 11.0, 4.0, 1.0, 1.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03509521484375, -0.03404855728149414, -0.03300189971923828, -0.03195524215698242, -0.030908584594726562, -0.029861927032470703, -0.028815269470214844, -0.027768611907958984, -0.026721954345703125, -0.025675296783447266, -0.024628639221191406, -0.023581981658935547, -0.022535324096679688, -0.021488666534423828, -0.02044200897216797, -0.01939535140991211, -0.01834869384765625, -0.01730203628540039, -0.01625537872314453, -0.015208721160888672, -0.014162063598632812, -0.013115406036376953, -0.012068748474121094, -0.011022090911865234, -0.009975433349609375, -0.008928775787353516, -0.007882118225097656, -0.006835460662841797, -0.0057888031005859375, -0.004742145538330078, -0.0036954879760742188, -0.0026488304138183594, -0.0016021728515625, -0.0005555152893066406, 0.0004911422729492188, 0.0015377998352050781, 0.0025844573974609375, 0.003631114959716797, 0.004677772521972656, 0.005724430084228516, 0.006771087646484375, 0.007817745208740234, 0.008864402770996094, 0.009911060333251953, 0.010957717895507812, 0.012004375457763672, 0.013051033020019531, 0.01409769058227539, 0.01514434814453125, 0.01619100570678711, 0.01723766326904297, 0.018284320831298828, 0.019330978393554688, 0.020377635955810547, 0.021424293518066406, 0.022470951080322266, 0.023517608642578125, 0.024564266204833984, 0.025610923767089844, 0.026657581329345703, 0.027704238891601562, 0.028750896453857422, 0.02979755401611328, 0.03084421157836914, 0.031890869140625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 14.0, 18.0, 46.0, 118.0, 599.0, 3003.0, 167.0, 56.0, 29.0, 9.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00897979736328125, -0.008623123168945312, -0.008266448974609375, -0.007909774780273438, -0.0075531005859375, -0.0071964263916015625, -0.006839752197265625, -0.0064830780029296875, -0.00612640380859375, -0.0057697296142578125, -0.005413055419921875, -0.0050563812255859375, -0.00469970703125, -0.0043430328369140625, -0.003986358642578125, -0.0036296844482421875, -0.00327301025390625, -0.0029163360595703125, -0.002559661865234375, -0.0022029876708984375, -0.0018463134765625, -0.0014896392822265625, -0.001132965087890625, -0.0007762908935546875, -0.00041961669921875, -6.29425048828125e-05, 0.000293731689453125, 0.0006504058837890625, 0.001007080078125, 0.0013637542724609375, 0.001720428466796875, 0.0020771026611328125, 0.00243377685546875, 0.0027904510498046875, 0.003147125244140625, 0.0035037994384765625, 0.0038604736328125, 0.0042171478271484375, 0.004573822021484375, 0.0049304962158203125, 0.00528717041015625, 0.0056438446044921875, 0.006000518798828125, 0.0063571929931640625, 0.0067138671875, 0.0070705413818359375, 0.007427215576171875, 0.0077838897705078125, 0.00814056396484375, 0.008497238159179688, 0.008853912353515625, 0.009210586547851562, 0.0095672607421875, 0.009923934936523438, 0.010280609130859375, 0.010637283325195312, 0.01099395751953125, 0.011350631713867188, 0.011707305908203125, 0.012063980102539062, 0.012420654296875, 0.012777328491210938, 0.013134002685546875, 0.013490676879882812, 0.01384735107421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1017.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022792378440499306, 0.007710134610533714, 0.017699506133794785, 0.027688879519701004, 0.037678252905607224, 0.04766762629151344, 0.057656995952129364, 0.06764636933803558, 0.0776357427239418, 0.08762511610984802, 0.09761448949575424, 0.10760386288166046, 0.11759322881698608, 0.1275826096534729, 0.13757197558879852, 0.14756134152412415, 0.15755072236061096, 0.16754008829593658, 0.1775294691324234, 0.18751883506774902, 0.19750821590423584, 0.20749758183956146, 0.21748694777488708, 0.2274763286113739, 0.23746569454669952, 0.24745506048202515, 0.25744444131851196, 0.2674338221549988, 0.2774231731891632, 0.28741255402565, 0.29740193486213684, 0.30739128589630127, 0.3173806965351105, 0.3273700773715973, 0.3373594284057617, 0.34734880924224854, 0.35733819007873535, 0.36732757091522217, 0.3773169219493866, 0.3873063027858734, 0.39729568362236023, 0.40728506445884705, 0.4172744154930115, 0.4272637963294983, 0.4372531771659851, 0.4472425580024719, 0.45723190903663635, 0.46722128987312317, 0.4772106409072876, 0.4872000217437744, 0.49718937277793884, 0.507178783416748, 0.5171681046485901, 0.5271574854850769, 0.5371468663215637, 0.5471362471580505, 0.5571256279945374, 0.5671150088310242, 0.577104389667511, 0.5870937705039978, 0.5970830917358398, 0.6070724725723267, 0.6170618534088135, 0.6270512342453003, 0.6370406150817871]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 9.0, 21.0, 19.0, 32.0, 32.0, 38.0, 42.0, 64.0, 50.0, 55.0, 64.0, 81.0, 78.0, 57.0, 65.0, 43.0, 48.0, 44.0, 31.0, 22.0, 27.0, 25.0, 15.0, 12.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.025221288204193115, -0.02449130080640316, -0.023761313408613205, -0.02303132601082325, -0.022301338613033295, -0.02157135121524334, -0.020841363817453384, -0.02011137641966343, -0.019381389021873474, -0.01865140162408352, -0.017921414226293564, -0.01719142682850361, -0.016461439430713654, -0.0157314520329237, -0.015001464635133743, -0.014271477237343788, -0.013541489839553833, -0.012811502441763878, -0.012081515043973923, -0.011351527646183968, -0.010621540248394012, -0.009891552850604057, -0.009161565452814102, -0.008431578055024147, -0.007701590657234192, -0.006971603259444237, -0.006241615861654282, -0.0055116284638643265, -0.004781641066074371, -0.004051653668284416, -0.003321666270494461, -0.002591678872704506, -0.0018616914749145508, -0.0011317040771245956, -0.0004017166793346405, 0.00032827071845531464, 0.0010582581162452698, 0.001788245514035225, 0.00251823291182518, 0.003248220309615135, 0.00397820770740509, 0.0047081951051950455, 0.005438182502985001, 0.006168169900774956, 0.006898157298564911, 0.007628144696354866, 0.008358132094144821, 0.009088119491934776, 0.009818106889724731, 0.010548094287514687, 0.011278081685304642, 0.012008069083094597, 0.012738056480884552, 0.013468043878674507, 0.014198031276464462, 0.014928018674254417, 0.015658006072044373, 0.016387993469834328, 0.017117980867624283, 0.017847968265414238, 0.018577955663204193, 0.019307943060994148, 0.020037930458784103, 0.02076791785657406, 0.021497905254364014]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 6.0, 13.0, 4.0, 13.0, 14.0, 20.0, 51.0, 56.0, 67.0, 99.0, 159.0, 231.0, 352.0, 583.0, 999.0, 1805.0, 3641.0, 8561.0, 27800.0, 868585.0, 108227.0, 15262.0, 5712.0, 2681.0, 1435.0, 796.0, 455.0, 341.0, 184.0, 108.0, 85.0, 51.0, 50.0, 28.0, 20.0, 12.0, 12.0, 6.0, 10.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0171966552734375, -0.016619205474853516, -0.01604175567626953, -0.015464305877685547, -0.014886856079101562, -0.014309406280517578, -0.013731956481933594, -0.01315450668334961, -0.012577056884765625, -0.01199960708618164, -0.011422157287597656, -0.010844707489013672, -0.010267257690429688, -0.009689807891845703, -0.009112358093261719, -0.008534908294677734, -0.00795745849609375, -0.007380008697509766, -0.006802558898925781, -0.006225109100341797, -0.0056476593017578125, -0.005070209503173828, -0.004492759704589844, -0.003915309906005859, -0.003337860107421875, -0.0027604103088378906, -0.0021829605102539062, -0.0016055107116699219, -0.0010280609130859375, -0.0004506111145019531, 0.00012683868408203125, 0.0007042884826660156, 0.00128173828125, 0.0018591880798339844, 0.0024366378784179688, 0.003014087677001953, 0.0035915374755859375, 0.004168987274169922, 0.004746437072753906, 0.005323886871337891, 0.005901336669921875, 0.006478786468505859, 0.007056236267089844, 0.007633686065673828, 0.008211135864257812, 0.008788585662841797, 0.009366035461425781, 0.009943485260009766, 0.01052093505859375, 0.011098384857177734, 0.011675834655761719, 0.012253284454345703, 0.012830734252929688, 0.013408184051513672, 0.013985633850097656, 0.01456308364868164, 0.015140533447265625, 0.01571798324584961, 0.016295433044433594, 0.016872882843017578, 0.017450332641601562, 0.018027782440185547, 0.01860523223876953, 0.019182682037353516, 0.0197601318359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 2.0, 4.0, 7.0, 7.0, 10.0, 11.0, 15.0, 24.0, 60.0, 173.0, 303.0, 185.0, 83.0, 20.0, 14.0, 13.0, 6.0, 11.0, 8.0, 3.0, 6.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016204833984375, -0.015733838081359863, -0.015262842178344727, -0.01479184627532959, -0.014320850372314453, -0.013849854469299316, -0.01337885856628418, -0.012907862663269043, -0.012436866760253906, -0.01196587085723877, -0.011494874954223633, -0.011023879051208496, -0.01055288314819336, -0.010081887245178223, -0.009610891342163086, -0.00913989543914795, -0.008668899536132812, -0.008197903633117676, -0.007726907730102539, -0.007255911827087402, -0.006784915924072266, -0.006313920021057129, -0.005842924118041992, -0.0053719282150268555, -0.004900932312011719, -0.004429936408996582, -0.003958940505981445, -0.0034879446029663086, -0.003016948699951172, -0.002545952796936035, -0.0020749568939208984, -0.0016039609909057617, -0.001132965087890625, -0.0006619691848754883, -0.00019097328186035156, 0.00028002262115478516, 0.0007510185241699219, 0.0012220144271850586, 0.0016930103302001953, 0.002164006233215332, 0.0026350021362304688, 0.0031059980392456055, 0.003576993942260742, 0.004047989845275879, 0.004518985748291016, 0.004989981651306152, 0.005460977554321289, 0.005931973457336426, 0.0064029693603515625, 0.006873965263366699, 0.007344961166381836, 0.007815957069396973, 0.00828695297241211, 0.008757948875427246, 0.009228944778442383, 0.00969994068145752, 0.010170936584472656, 0.010641932487487793, 0.01111292839050293, 0.011583924293518066, 0.012054920196533203, 0.01252591609954834, 0.012996912002563477, 0.013467907905578613, 0.01393890380859375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 7.0, 8.0, 11.0, 13.0, 16.0, 23.0, 21.0, 29.0, 57.0, 76.0, 106.0, 120.0, 164.0, 241.0, 421.0, 770.0, 1996.0, 58993.0, 976859.0, 5791.0, 1189.0, 554.0, 314.0, 191.0, 135.0, 125.0, 80.0, 59.0, 42.0, 36.0, 24.0, 24.0, 11.0, 17.0, 5.0, 11.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048553466796875, -0.047176361083984375, -0.04579925537109375, -0.044422149658203125, -0.0430450439453125, -0.041667938232421875, -0.04029083251953125, -0.038913726806640625, -0.03753662109375, -0.036159515380859375, -0.03478240966796875, -0.033405303955078125, -0.0320281982421875, -0.030651092529296875, -0.02927398681640625, -0.027896881103515625, -0.026519775390625, -0.025142669677734375, -0.02376556396484375, -0.022388458251953125, -0.0210113525390625, -0.019634246826171875, -0.01825714111328125, -0.016880035400390625, -0.0155029296875, -0.014125823974609375, -0.01274871826171875, -0.011371612548828125, -0.0099945068359375, -0.008617401123046875, -0.00724029541015625, -0.005863189697265625, -0.004486083984375, -0.003108978271484375, -0.00173187255859375, -0.000354766845703125, 0.0010223388671875, 0.002399444580078125, 0.00377655029296875, 0.005153656005859375, 0.00653076171875, 0.007907867431640625, 0.00928497314453125, 0.010662078857421875, 0.0120391845703125, 0.013416290283203125, 0.01479339599609375, 0.016170501708984375, 0.017547607421875, 0.018924713134765625, 0.02030181884765625, 0.021678924560546875, 0.0230560302734375, 0.024433135986328125, 0.02581024169921875, 0.027187347412109375, 0.028564453125, 0.029941558837890625, 0.03131866455078125, 0.032695770263671875, 0.0340728759765625, 0.035449981689453125, 0.03682708740234375, 0.038204193115234375, 0.039581298828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 7.0, 6.0, 11.0, 11.0, 14.0, 18.0, 15.0, 20.0, 20.0, 33.0, 31.0, 28.0, 33.0, 47.0, 44.0, 40.0, 46.0, 45.0, 44.0, 51.0, 48.0, 44.0, 49.0, 37.0, 31.0, 40.0, 29.0, 23.0, 24.0, 20.0, 17.0, 21.0, 11.0, 15.0, 5.0, 11.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.041961669921875, -0.0407719612121582, -0.039582252502441406, -0.03839254379272461, -0.03720283508300781, -0.036013126373291016, -0.03482341766357422, -0.03363370895385742, -0.032444000244140625, -0.03125429153442383, -0.03006458282470703, -0.028874874114990234, -0.027685165405273438, -0.02649545669555664, -0.025305747985839844, -0.024116039276123047, -0.02292633056640625, -0.021736621856689453, -0.020546913146972656, -0.01935720443725586, -0.018167495727539062, -0.016977787017822266, -0.01578807830810547, -0.014598369598388672, -0.013408660888671875, -0.012218952178955078, -0.011029243469238281, -0.009839534759521484, -0.008649826049804688, -0.007460117340087891, -0.006270408630371094, -0.005080699920654297, -0.0038909912109375, -0.002701282501220703, -0.0015115737915039062, -0.0003218650817871094, 0.0008678436279296875, 0.0020575523376464844, 0.0032472610473632812, 0.004436969757080078, 0.005626678466796875, 0.006816387176513672, 0.008006095886230469, 0.009195804595947266, 0.010385513305664062, 0.01157522201538086, 0.012764930725097656, 0.013954639434814453, 0.01514434814453125, 0.016334056854248047, 0.017523765563964844, 0.01871347427368164, 0.019903182983398438, 0.021092891693115234, 0.02228260040283203, 0.023472309112548828, 0.024662017822265625, 0.025851726531982422, 0.02704143524169922, 0.028231143951416016, 0.029420852661132812, 0.03061056137084961, 0.031800270080566406, 0.0329899787902832, 0.0341796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 2.0, 7.0, 5.0, 5.0, 11.0, 12.0, 25.0, 33.0, 32.0, 57.0, 94.0, 123.0, 193.0, 422.0, 1298.0, 3319.0, 14636.0, 200794.0, 790861.0, 31029.0, 3257.0, 1118.0, 502.0, 296.0, 139.0, 69.0, 55.0, 49.0, 28.0, 14.0, 17.0, 22.0, 5.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.377696990966797e-06, -6.184913218021393e-06, -5.992129445075989e-06, -5.799345672130585e-06, -5.606561899185181e-06, -5.413778126239777e-06, -5.2209943532943726e-06, -5.0282105803489685e-06, -4.8354268074035645e-06, -4.64264303445816e-06, -4.449859261512756e-06, -4.257075488567352e-06, -4.064291715621948e-06, -3.871507942676544e-06, -3.67872416973114e-06, -3.485940396785736e-06, -3.293156623840332e-06, -3.100372850894928e-06, -2.907589077949524e-06, -2.71480530500412e-06, -2.522021532058716e-06, -2.3292377591133118e-06, -2.1364539861679077e-06, -1.9436702132225037e-06, -1.7508864402770996e-06, -1.5581026673316956e-06, -1.3653188943862915e-06, -1.1725351214408875e-06, -9.797513484954834e-07, -7.869675755500793e-07, -5.941838026046753e-07, -4.0140002965927124e-07, -2.086162567138672e-07, -1.5832483768463135e-08, 1.7695128917694092e-07, 3.6973506212234497e-07, 5.62518835067749e-07, 7.553026080131531e-07, 9.480863809585571e-07, 1.1408701539039612e-06, 1.3336539268493652e-06, 1.5264376997947693e-06, 1.7192214727401733e-06, 1.9120052456855774e-06, 2.1047890186309814e-06, 2.2975727915763855e-06, 2.4903565645217896e-06, 2.6831403374671936e-06, 2.8759241104125977e-06, 3.0687078833580017e-06, 3.2614916563034058e-06, 3.45427542924881e-06, 3.647059202194214e-06, 3.839842975139618e-06, 4.032626748085022e-06, 4.225410521030426e-06, 4.41819429397583e-06, 4.610978066921234e-06, 4.803761839866638e-06, 4.996545612812042e-06, 5.189329385757446e-06, 5.38211315870285e-06, 5.574896931648254e-06, 5.7676807045936584e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 8.0, 10.0, 14.0, 10.0, 19.0, 27.0, 32.0, 31.0, 53.0, 58.0, 71.0, 79.0, 123.0, 88.0, 83.0, 60.0, 77.0, 34.0, 27.0, 23.0, 15.0, 13.0, 9.0, 9.0, 5.0, 9.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.973743438720703e-06, -6.792135536670685e-06, -6.6105276346206665e-06, -6.428919732570648e-06, -6.24731183052063e-06, -6.0657039284706116e-06, -5.884096026420593e-06, -5.702488124370575e-06, -5.520880222320557e-06, -5.339272320270538e-06, -5.15766441822052e-06, -4.976056516170502e-06, -4.794448614120483e-06, -4.612840712070465e-06, -4.431232810020447e-06, -4.2496249079704285e-06, -4.06801700592041e-06, -3.886409103870392e-06, -3.7048012018203735e-06, -3.5231932997703552e-06, -3.341585397720337e-06, -3.1599774956703186e-06, -2.9783695936203003e-06, -2.796761691570282e-06, -2.6151537895202637e-06, -2.4335458874702454e-06, -2.251937985420227e-06, -2.0703300833702087e-06, -1.8887221813201904e-06, -1.7071142792701721e-06, -1.5255063772201538e-06, -1.3438984751701355e-06, -1.1622905731201172e-06, -9.806826710700989e-07, -7.990747690200806e-07, -6.174668669700623e-07, -4.3585896492004395e-07, -2.5425106287002563e-07, -7.264316082000732e-08, 1.0896474123001099e-07, 2.905726432800293e-07, 4.721805453300476e-07, 6.537884473800659e-07, 8.353963494300842e-07, 1.0170042514801025e-06, 1.1986121535301208e-06, 1.3802200555801392e-06, 1.5618279576301575e-06, 1.7434358596801758e-06, 1.925043761730194e-06, 2.1066516637802124e-06, 2.2882595658302307e-06, 2.469867467880249e-06, 2.6514753699302673e-06, 2.8330832719802856e-06, 3.014691174030304e-06, 3.1962990760803223e-06, 3.3779069781303406e-06, 3.559514880180359e-06, 3.741122782230377e-06, 3.9227306842803955e-06, 4.104338586330414e-06, 4.285946488380432e-06, 4.4675543904304504e-06, 4.649162292480469e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 13.0, 17.0, 24.0, 47.0, 108.0, 271.0, 1538.0, 1043141.0, 2827.0, 313.0, 111.0, 64.0, 28.0, 20.0, 9.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.950429916381836e-05, -2.8570182621479034e-05, -2.763606607913971e-05, -2.6701949536800385e-05, -2.576783299446106e-05, -2.4833716452121735e-05, -2.389959990978241e-05, -2.2965483367443085e-05, -2.203136682510376e-05, -2.1097250282764435e-05, -2.016313374042511e-05, -1.9229017198085785e-05, -1.829490065574646e-05, -1.7360784113407135e-05, -1.642666757106781e-05, -1.5492551028728485e-05, -1.455843448638916e-05, -1.3624317944049835e-05, -1.269020140171051e-05, -1.1756084859371185e-05, -1.082196831703186e-05, -9.887851774692535e-06, -8.95373523235321e-06, -8.019618690013885e-06, -7.0855021476745605e-06, -6.151385605335236e-06, -5.217269062995911e-06, -4.283152520656586e-06, -3.3490359783172607e-06, -2.414919435977936e-06, -1.4808028936386108e-06, -5.466863512992859e-07, 3.8743019104003906e-07, 1.321546733379364e-06, 2.255663275718689e-06, 3.189779818058014e-06, 4.123896360397339e-06, 5.058012902736664e-06, 5.992129445075989e-06, 6.926245987415314e-06, 7.860362529754639e-06, 8.794479072093964e-06, 9.728595614433289e-06, 1.0662712156772614e-05, 1.1596828699111938e-05, 1.2530945241451263e-05, 1.3465061783790588e-05, 1.4399178326129913e-05, 1.5333294868469238e-05, 1.6267411410808563e-05, 1.7201527953147888e-05, 1.8135644495487213e-05, 1.9069761037826538e-05, 2.0003877580165863e-05, 2.0937994122505188e-05, 2.1872110664844513e-05, 2.2806227207183838e-05, 2.3740343749523163e-05, 2.4674460291862488e-05, 2.5608576834201813e-05, 2.6542693376541138e-05, 2.7476809918880463e-05, 2.8410926461219788e-05, 2.9345043003559113e-05, 3.0279159545898438e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 11.0, 8.0, 9.0, 18.0, 32.0, 49.0, 99.0, 528.0, 112.0, 44.0, 36.0, 20.0, 13.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5451183319091797e-05, -2.4645589292049408e-05, -2.383999526500702e-05, -2.303440123796463e-05, -2.222880721092224e-05, -2.1423213183879852e-05, -2.0617619156837463e-05, -1.9812025129795074e-05, -1.9006431102752686e-05, -1.8200837075710297e-05, -1.7395243048667908e-05, -1.658964902162552e-05, -1.578405499458313e-05, -1.4978460967540741e-05, -1.4172866940498352e-05, -1.3367272913455963e-05, -1.2561678886413574e-05, -1.1756084859371185e-05, -1.0950490832328796e-05, -1.0144896805286407e-05, -9.339302778244019e-06, -8.53370875120163e-06, -7.72811472415924e-06, -6.922520697116852e-06, -6.116926670074463e-06, -5.311332643032074e-06, -4.505738615989685e-06, -3.700144588947296e-06, -2.8945505619049072e-06, -2.0889565348625183e-06, -1.2833625078201294e-06, -4.777684807777405e-07, 3.2782554626464844e-07, 1.1334195733070374e-06, 1.9390136003494263e-06, 2.744607627391815e-06, 3.550201654434204e-06, 4.355795681476593e-06, 5.161389708518982e-06, 5.966983735561371e-06, 6.77257776260376e-06, 7.578171789646149e-06, 8.383765816688538e-06, 9.189359843730927e-06, 9.994953870773315e-06, 1.0800547897815704e-05, 1.1606141924858093e-05, 1.2411735951900482e-05, 1.3217329978942871e-05, 1.402292400598526e-05, 1.4828518033027649e-05, 1.5634112060070038e-05, 1.6439706087112427e-05, 1.7245300114154816e-05, 1.8050894141197205e-05, 1.8856488168239594e-05, 1.9662082195281982e-05, 2.046767622232437e-05, 2.127327024936676e-05, 2.207886427640915e-05, 2.2884458303451538e-05, 2.3690052330493927e-05, 2.4495646357536316e-05, 2.5301240384578705e-05, 2.6106834411621094e-05]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 70.0, 871.0, 62.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7223028540611267, -0.7092974781990051, -0.6962921023368835, -0.6832866668701172, -0.6702812910079956, -0.657275915145874, -0.6442705392837524, -0.6312651634216309, -0.6182597279548645, -0.6052543520927429, -0.5922489762306213, -0.579243540763855, -0.5662381649017334, -0.5532327890396118, -0.5402274131774902, -0.5272220373153687, -0.5142166614532471, -0.5012112855911255, -0.4882058799266815, -0.47520050406455994, -0.46219509840011597, -0.4491897225379944, -0.4361843466758728, -0.42317894101142883, -0.41017353534698486, -0.3971681594848633, -0.3841627538204193, -0.37115737795829773, -0.35815197229385376, -0.3451465964317322, -0.3321412205696106, -0.3191358149051666, -0.30613040924072266, -0.2931250333786011, -0.2801196277141571, -0.2671142518520355, -0.25410884618759155, -0.24110347032546997, -0.2280980795621872, -0.21509268879890442, -0.20208731293678284, -0.18908192217350006, -0.17607653141021729, -0.1630711555480957, -0.15006574988365173, -0.13706037402153015, -0.12405498325824738, -0.1110495924949646, -0.09804419428110123, -0.08503880351781845, -0.07203342020511627, -0.059028029441833496, -0.04602263867855072, -0.033017247915267944, -0.020011864602565765, -0.0070064738392829895, 0.005998916923999786, 0.019004305824637413, 0.03200969472527504, 0.04501508176326752, 0.05802047252655029, 0.07102586328983307, 0.08403124660253525, 0.09703663736581802, 0.1100420281291008]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 9.0, 15.0, 9.0, 16.0, 17.0, 19.0, 22.0, 16.0, 23.0, 25.0, 31.0, 35.0, 41.0, 38.0, 41.0, 43.0, 48.0, 47.0, 42.0, 36.0, 48.0, 46.0, 41.0, 30.0, 34.0, 30.0, 25.0, 30.0, 19.0, 23.0, 17.0, 20.0, 13.0, 6.0, 10.0, 3.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15088272094726562, -0.14540554583072662, -0.13992835581302643, -0.13445118069648743, -0.12897400557994843, -0.12349682301282883, -0.11801964044570923, -0.11254246532917023, -0.10706528276205063, -0.10158810019493103, -0.09611092507839203, -0.09063374251127243, -0.08515655994415283, -0.07967938482761383, -0.07420220226049423, -0.06872501969337463, -0.06324784457683563, -0.05777066573500633, -0.05229348689317703, -0.046816304326057434, -0.041339125484228134, -0.035861946642398834, -0.030384764075279236, -0.024907585233449936, -0.019430406391620636, -0.013953226618468761, -0.008476046845316887, -0.0029988661408424377, 0.002478312700986862, 0.007955491542816162, 0.01343267410993576, 0.01890985295176506, 0.02438703179359436, 0.02986421063542366, 0.03534138947725296, 0.04081857204437256, 0.04629575088620186, 0.05177292972803116, 0.05725011229515076, 0.06272728741168976, 0.06820446997880936, 0.07368165254592896, 0.07915882766246796, 0.08463601022958755, 0.09011319279670715, 0.09559036791324615, 0.10106755048036575, 0.10654473304748535, 0.11202190816402435, 0.11749909073114395, 0.12297626584768295, 0.12845344841480255, 0.13393062353134155, 0.13940781354904175, 0.14488498866558075, 0.15036216378211975, 0.15583935379981995, 0.16131652891635895, 0.16679371893405914, 0.17227089405059814, 0.17774806916713715, 0.18322524428367615, 0.18870243430137634, 0.19417960941791534, 0.19965678453445435]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 5.0, 2.0, 8.0, 4.0, 9.0, 8.0, 16.0, 22.0, 42.0, 142.0, 3702.0, 4189026.0, 1089.0, 89.0, 27.0, 15.0, 10.0, 7.0, 11.0, 7.0, 4.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0596923828125, -0.057951927185058594, -0.05621147155761719, -0.05447101593017578, -0.052730560302734375, -0.05099010467529297, -0.04924964904785156, -0.047509193420410156, -0.04576873779296875, -0.044028282165527344, -0.04228782653808594, -0.04054737091064453, -0.038806915283203125, -0.03706645965576172, -0.03532600402832031, -0.033585548400878906, -0.0318450927734375, -0.030104637145996094, -0.028364181518554688, -0.02662372589111328, -0.024883270263671875, -0.02314281463623047, -0.021402359008789062, -0.019661903381347656, -0.01792144775390625, -0.016180992126464844, -0.014440536499023438, -0.012700080871582031, -0.010959625244140625, -0.009219169616699219, -0.0074787139892578125, -0.005738258361816406, -0.003997802734375, -0.0022573471069335938, -0.0005168914794921875, 0.0012235641479492188, 0.002964019775390625, 0.004704475402832031, 0.0064449310302734375, 0.008185386657714844, 0.00992584228515625, 0.011666297912597656, 0.013406753540039062, 0.015147209167480469, 0.016887664794921875, 0.01862812042236328, 0.020368576049804688, 0.022109031677246094, 0.0238494873046875, 0.025589942932128906, 0.027330398559570312, 0.02907085418701172, 0.030811309814453125, 0.03255176544189453, 0.03429222106933594, 0.036032676696777344, 0.03777313232421875, 0.039513587951660156, 0.04125404357910156, 0.04299449920654297, 0.044734954833984375, 0.04647541046142578, 0.04821586608886719, 0.049956321716308594, 0.05169677734375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 6.0, 5.0, 9.0, 10.0, 12.0, 13.0, 31.0, 61.0, 189.0, 286.0, 181.0, 80.0, 20.0, 15.0, 11.0, 6.0, 12.0, 6.0, 5.0, 4.0, 5.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015960693359375, -0.015496134757995605, -0.015031576156616211, -0.014567017555236816, -0.014102458953857422, -0.013637900352478027, -0.013173341751098633, -0.012708783149719238, -0.012244224548339844, -0.01177966594696045, -0.011315107345581055, -0.01085054874420166, -0.010385990142822266, -0.009921431541442871, -0.009456872940063477, -0.008992314338684082, -0.008527755737304688, -0.008063197135925293, -0.0075986385345458984, -0.007134079933166504, -0.006669521331787109, -0.006204962730407715, -0.00574040412902832, -0.005275845527648926, -0.004811286926269531, -0.004346728324890137, -0.003882169723510742, -0.0034176111221313477, -0.002953052520751953, -0.0024884939193725586, -0.002023935317993164, -0.0015593767166137695, -0.001094818115234375, -0.0006302595138549805, -0.00016570091247558594, 0.0002988576889038086, 0.0007634162902832031, 0.0012279748916625977, 0.0016925334930419922, 0.0021570920944213867, 0.0026216506958007812, 0.0030862092971801758, 0.0035507678985595703, 0.004015326499938965, 0.004479885101318359, 0.004944443702697754, 0.0054090023040771484, 0.005873560905456543, 0.0063381195068359375, 0.006802678108215332, 0.0072672367095947266, 0.007731795310974121, 0.008196353912353516, 0.00866091251373291, 0.009125471115112305, 0.0095900297164917, 0.010054588317871094, 0.010519146919250488, 0.010983705520629883, 0.011448264122009277, 0.011912822723388672, 0.012377381324768066, 0.012841939926147461, 0.013306498527526855, 0.01377105712890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 16.0, 35.0, 94.0, 361.0, 1116.0, 4137348.0, 53967.0, 931.0, 270.0, 93.0, 25.0, 12.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033355712890625, -0.032277584075927734, -0.03119945526123047, -0.030121326446533203, -0.029043197631835938, -0.027965068817138672, -0.026886940002441406, -0.02580881118774414, -0.024730682373046875, -0.02365255355834961, -0.022574424743652344, -0.021496295928955078, -0.020418167114257812, -0.019340038299560547, -0.01826190948486328, -0.017183780670166016, -0.01610565185546875, -0.015027523040771484, -0.013949394226074219, -0.012871265411376953, -0.011793136596679688, -0.010715007781982422, -0.009636878967285156, -0.00855875015258789, -0.007480621337890625, -0.006402492523193359, -0.005324363708496094, -0.004246234893798828, -0.0031681060791015625, -0.002089977264404297, -0.0010118484497070312, 6.628036499023438e-05, 0.0011444091796875, 0.0022225379943847656, 0.0033006668090820312, 0.004378795623779297, 0.0054569244384765625, 0.006535053253173828, 0.007613182067871094, 0.00869131088256836, 0.009769439697265625, 0.01084756851196289, 0.011925697326660156, 0.013003826141357422, 0.014081954956054688, 0.015160083770751953, 0.01623821258544922, 0.017316341400146484, 0.01839447021484375, 0.019472599029541016, 0.02055072784423828, 0.021628856658935547, 0.022706985473632812, 0.023785114288330078, 0.024863243103027344, 0.02594137191772461, 0.027019500732421875, 0.02809762954711914, 0.029175758361816406, 0.030253887176513672, 0.03133201599121094, 0.0324101448059082, 0.03348827362060547, 0.034566402435302734, 0.03564453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 12.0, 40.0, 277.0, 3681.0, 46.0, 11.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01213836669921875, -0.0117720365524292, -0.011405706405639648, -0.011039376258850098, -0.010673046112060547, -0.010306715965270996, -0.009940385818481445, -0.009574055671691895, -0.009207725524902344, -0.008841395378112793, -0.008475065231323242, -0.008108735084533691, -0.007742404937744141, -0.00737607479095459, -0.007009744644165039, -0.006643414497375488, -0.0062770843505859375, -0.005910754203796387, -0.005544424057006836, -0.005178093910217285, -0.004811763763427734, -0.004445433616638184, -0.004079103469848633, -0.003712773323059082, -0.0033464431762695312, -0.0029801130294799805, -0.0026137828826904297, -0.002247452735900879, -0.0018811225891113281, -0.0015147924423217773, -0.0011484622955322266, -0.0007821321487426758, -0.000415802001953125, -4.947185516357422e-05, 0.00031685829162597656, 0.0006831884384155273, 0.0010495185852050781, 0.001415848731994629, 0.0017821788787841797, 0.0021485090255737305, 0.0025148391723632812, 0.002881169319152832, 0.003247499465942383, 0.0036138296127319336, 0.003980159759521484, 0.004346489906311035, 0.004712820053100586, 0.005079150199890137, 0.0054454803466796875, 0.005811810493469238, 0.006178140640258789, 0.00654447078704834, 0.006910800933837891, 0.007277131080627441, 0.007643461227416992, 0.008009791374206543, 0.008376121520996094, 0.008742451667785645, 0.009108781814575195, 0.009475111961364746, 0.009841442108154297, 0.010207772254943848, 0.010574102401733398, 0.01094043254852295, 0.0113067626953125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1002.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07299946993589401, -0.06930620223283768, -0.06561294198036194, -0.0619196742773056, -0.058226410299539566, -0.05453314632177353, -0.050839878618717194, -0.04714661464095116, -0.04345335066318512, -0.03976008668541908, -0.036066822707653046, -0.03237355500459671, -0.028680291026830673, -0.024987027049064636, -0.02129376120865345, -0.017600495368242264, -0.013907231390476227, -0.010213966481387615, -0.006520701572299004, -0.002827436663210392, 0.0008658282458782196, 0.004559092223644257, 0.008252358064055443, 0.011945623904466629, 0.015638887882232666, 0.019332151859998703, 0.02302541770040989, 0.026718683540821075, 0.030411947518587112, 0.03410521149635315, 0.037798479199409485, 0.04149174317717552, 0.04518499970436096, 0.048878263682127, 0.052571527659893036, 0.05626479536294937, 0.05995805934071541, 0.06365132331848145, 0.06734459102153778, 0.07103785872459412, 0.07473111897706985, 0.07842438668012619, 0.08211764693260193, 0.08581091463565826, 0.0895041823387146, 0.09319744259119034, 0.09689071029424667, 0.10058397054672241, 0.10427723824977875, 0.10797050595283508, 0.11166376620531082, 0.11535703390836716, 0.1190502941608429, 0.12274356186389923, 0.12643682956695557, 0.1301300972700119, 0.13382336497306824, 0.13751663267612457, 0.1412099003791809, 0.14490315318107605, 0.14859642088413239, 0.15228968858718872, 0.15598295629024506, 0.1596762239933014, 0.16336947679519653]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 11.0, 16.0, 23.0, 20.0, 37.0, 47.0, 59.0, 55.0, 93.0, 81.0, 78.0, 84.0, 75.0, 84.0, 61.0, 41.0, 36.0, 19.0, 24.0, 23.0, 14.0, 12.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021182239055633545, -0.020583298057317734, -0.019984357059001923, -0.01938541606068611, -0.0187864750623703, -0.01818753406405449, -0.017588593065738678, -0.016989652067422867, -0.016390711069107056, -0.015791770070791245, -0.015192829072475433, -0.014593888074159622, -0.013994947075843811, -0.013396006077528, -0.012797065079212189, -0.012198124080896378, -0.011599183082580566, -0.011000242084264755, -0.010401301085948944, -0.009802360087633133, -0.009203419089317322, -0.00860447809100151, -0.0080055370926857, -0.007406596094369888, -0.006807655096054077, -0.006208714097738266, -0.005609773099422455, -0.005010832101106644, -0.0044118911027908325, -0.0038129501044750214, -0.00321400910615921, -0.002615068107843399, -0.002016127109527588, -0.0014171861112117767, -0.0008182451128959656, -0.00021930411458015442, 0.00037963688373565674, 0.000978577882051468, 0.001577518880367279, 0.00217645987868309, 0.0027754008769989014, 0.0033743418753147125, 0.003973282873630524, 0.004572223871946335, 0.005171164870262146, 0.005770105868577957, 0.006369046866893768, 0.0069679878652095795, 0.007566928863525391, 0.008165869861841202, 0.008764810860157013, 0.009363751858472824, 0.009962692856788635, 0.010561633855104446, 0.011160574853420258, 0.011759515851736069, 0.01235845685005188, 0.012957397848367691, 0.013556338846683502, 0.014155279844999313, 0.014754220843315125, 0.015353161841630936, 0.015952102839946747, 0.016551043838262558, 0.01714998483657837]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 17.0, 23.0, 28.0, 31.0, 29.0, 45.0, 85.0, 114.0, 131.0, 200.0, 332.0, 554.0, 773.0, 1257.0, 2225.0, 4070.0, 8179.0, 20711.0, 185610.0, 773006.0, 29392.0, 10246.0, 4724.0, 2567.0, 1527.0, 900.0, 573.0, 365.0, 235.0, 151.0, 158.0, 89.0, 64.0, 32.0, 19.0, 17.0, 13.0, 16.0, 11.0, 13.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.017822265625, -0.017300128936767578, -0.016777992248535156, -0.016255855560302734, -0.015733718872070312, -0.01521158218383789, -0.014689445495605469, -0.014167308807373047, -0.013645172119140625, -0.013123035430908203, -0.012600898742675781, -0.01207876205444336, -0.011556625366210938, -0.011034488677978516, -0.010512351989746094, -0.009990215301513672, -0.00946807861328125, -0.008945941925048828, -0.008423805236816406, -0.007901668548583984, -0.0073795318603515625, -0.006857395172119141, -0.006335258483886719, -0.005813121795654297, -0.005290985107421875, -0.004768848419189453, -0.004246711730957031, -0.0037245750427246094, -0.0032024383544921875, -0.0026803016662597656, -0.0021581649780273438, -0.0016360282897949219, -0.0011138916015625, -0.0005917549133300781, -6.961822509765625e-05, 0.0004525184631347656, 0.0009746551513671875, 0.0014967918395996094, 0.0020189285278320312, 0.002541065216064453, 0.003063201904296875, 0.003585338592529297, 0.004107475280761719, 0.004629611968994141, 0.0051517486572265625, 0.005673885345458984, 0.006196022033691406, 0.006718158721923828, 0.00724029541015625, 0.007762432098388672, 0.008284568786621094, 0.008806705474853516, 0.009328842163085938, 0.00985097885131836, 0.010373115539550781, 0.010895252227783203, 0.011417388916015625, 0.011939525604248047, 0.012461662292480469, 0.01298379898071289, 0.013505935668945312, 0.014028072357177734, 0.014550209045410156, 0.015072345733642578, 0.015594482421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 6.0, 2.0, 5.0, 6.0, 9.0, 10.0, 12.0, 13.0, 31.0, 60.0, 187.0, 287.0, 182.0, 81.0, 20.0, 15.0, 11.0, 6.0, 12.0, 7.0, 4.0, 4.0, 5.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0159759521484375, -0.015511035919189453, -0.015046119689941406, -0.01458120346069336, -0.014116287231445312, -0.013651371002197266, -0.013186454772949219, -0.012721538543701172, -0.012256622314453125, -0.011791706085205078, -0.011326789855957031, -0.010861873626708984, -0.010396957397460938, -0.00993204116821289, -0.009467124938964844, -0.009002208709716797, -0.00853729248046875, -0.008072376251220703, -0.007607460021972656, -0.007142543792724609, -0.0066776275634765625, -0.006212711334228516, -0.005747795104980469, -0.005282878875732422, -0.004817962646484375, -0.004353046417236328, -0.0038881301879882812, -0.0034232139587402344, -0.0029582977294921875, -0.0024933815002441406, -0.0020284652709960938, -0.0015635490417480469, -0.0010986328125, -0.0006337165832519531, -0.00016880035400390625, 0.0002961158752441406, 0.0007610321044921875, 0.0012259483337402344, 0.0016908645629882812, 0.002155780792236328, 0.002620697021484375, 0.003085613250732422, 0.0035505294799804688, 0.004015445709228516, 0.0044803619384765625, 0.004945278167724609, 0.005410194396972656, 0.005875110626220703, 0.00634002685546875, 0.006804943084716797, 0.007269859313964844, 0.007734775543212891, 0.008199691772460938, 0.008664608001708984, 0.009129524230957031, 0.009594440460205078, 0.010059356689453125, 0.010524272918701172, 0.010989189147949219, 0.011454105377197266, 0.011919021606445312, 0.01238393783569336, 0.012848854064941406, 0.013313770294189453, 0.0137786865234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 2.0, 3.0, 6.0, 10.0, 12.0, 20.0, 11.0, 21.0, 22.0, 39.0, 35.0, 50.0, 62.0, 77.0, 96.0, 120.0, 177.0, 319.0, 513.0, 912.0, 2994.0, 102162.0, 927788.0, 9831.0, 1356.0, 649.0, 357.0, 221.0, 167.0, 109.0, 94.0, 50.0, 53.0, 44.0, 28.0, 23.0, 32.0, 16.0, 13.0, 13.0, 8.0, 10.0, 10.0, 3.0, 1.0, 1.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034332275390625, -0.033196449279785156, -0.03206062316894531, -0.03092479705810547, -0.029788970947265625, -0.02865314483642578, -0.027517318725585938, -0.026381492614746094, -0.02524566650390625, -0.024109840393066406, -0.022974014282226562, -0.02183818817138672, -0.020702362060546875, -0.01956653594970703, -0.018430709838867188, -0.017294883728027344, -0.0161590576171875, -0.015023231506347656, -0.013887405395507812, -0.012751579284667969, -0.011615753173828125, -0.010479927062988281, -0.009344100952148438, -0.008208274841308594, -0.00707244873046875, -0.005936622619628906, -0.0048007965087890625, -0.0036649703979492188, -0.002529144287109375, -0.0013933181762695312, -0.0002574920654296875, 0.0008783340454101562, 0.00201416015625, 0.0031499862670898438, 0.0042858123779296875, 0.005421638488769531, 0.006557464599609375, 0.007693290710449219, 0.008829116821289062, 0.009964942932128906, 0.01110076904296875, 0.012236595153808594, 0.013372421264648438, 0.014508247375488281, 0.015644073486328125, 0.01677989959716797, 0.017915725708007812, 0.019051551818847656, 0.0201873779296875, 0.021323204040527344, 0.022459030151367188, 0.02359485626220703, 0.024730682373046875, 0.02586650848388672, 0.027002334594726562, 0.028138160705566406, 0.02927398681640625, 0.030409812927246094, 0.03154563903808594, 0.03268146514892578, 0.033817291259765625, 0.03495311737060547, 0.03608894348144531, 0.037224769592285156, 0.038360595703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 6.0, 7.0, 6.0, 15.0, 9.0, 14.0, 13.0, 28.0, 19.0, 27.0, 27.0, 32.0, 34.0, 23.0, 29.0, 31.0, 47.0, 35.0, 43.0, 35.0, 46.0, 40.0, 43.0, 37.0, 42.0, 35.0, 33.0, 28.0, 30.0, 19.0, 20.0, 21.0, 16.0, 17.0, 24.0, 10.0, 7.0, 11.0, 5.0, 7.0, 9.0, 2.0, 1.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0301971435546875, -0.02919745445251465, -0.028197765350341797, -0.027198076248168945, -0.026198387145996094, -0.025198698043823242, -0.02419900894165039, -0.02319931983947754, -0.022199630737304688, -0.021199941635131836, -0.020200252532958984, -0.019200563430786133, -0.01820087432861328, -0.01720118522644043, -0.016201496124267578, -0.015201807022094727, -0.014202117919921875, -0.013202428817749023, -0.012202739715576172, -0.01120305061340332, -0.010203361511230469, -0.009203672409057617, -0.008203983306884766, -0.007204294204711914, -0.0062046051025390625, -0.005204916000366211, -0.004205226898193359, -0.003205537796020508, -0.0022058486938476562, -0.0012061595916748047, -0.00020647048950195312, 0.0007932186126708984, 0.00179290771484375, 0.0027925968170166016, 0.003792285919189453, 0.004791975021362305, 0.005791664123535156, 0.006791353225708008, 0.007791042327880859, 0.008790731430053711, 0.009790420532226562, 0.010790109634399414, 0.011789798736572266, 0.012789487838745117, 0.013789176940917969, 0.01478886604309082, 0.015788555145263672, 0.016788244247436523, 0.017787933349609375, 0.018787622451782227, 0.019787311553955078, 0.02078700065612793, 0.02178668975830078, 0.022786378860473633, 0.023786067962646484, 0.024785757064819336, 0.025785446166992188, 0.02678513526916504, 0.02778482437133789, 0.028784513473510742, 0.029784202575683594, 0.030783891677856445, 0.0317835807800293, 0.03278326988220215, 0.033782958984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 11.0, 10.0, 13.0, 20.0, 15.0, 28.0, 35.0, 55.0, 35.0, 58.0, 122.0, 185.0, 201.0, 507.0, 1215.0, 3131.0, 6077.0, 41515.0, 731667.0, 233790.0, 21976.0, 3766.0, 2187.0, 825.0, 381.0, 165.0, 178.0, 88.0, 88.0, 31.0, 34.0, 40.0, 29.0, 10.0, 16.0, 14.0, 15.0, 5.0, 0.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.245208740234375e-06, -5.080364644527435e-06, -4.915520548820496e-06, -4.750676453113556e-06, -4.585832357406616e-06, -4.4209882616996765e-06, -4.256144165992737e-06, -4.091300070285797e-06, -3.926455974578857e-06, -3.7616118788719177e-06, -3.596767783164978e-06, -3.4319236874580383e-06, -3.2670795917510986e-06, -3.102235496044159e-06, -2.9373914003372192e-06, -2.7725473046302795e-06, -2.60770320892334e-06, -2.4428591132164e-06, -2.2780150175094604e-06, -2.1131709218025208e-06, -1.948326826095581e-06, -1.7834827303886414e-06, -1.6186386346817017e-06, -1.453794538974762e-06, -1.2889504432678223e-06, -1.1241063475608826e-06, -9.592622518539429e-07, -7.944181561470032e-07, -6.295740604400635e-07, -4.647299647331238e-07, -2.998858690261841e-07, -1.3504177331924438e-07, 2.9802322387695312e-08, 1.94646418094635e-07, 3.594905138015747e-07, 5.243346095085144e-07, 6.891787052154541e-07, 8.540228009223938e-07, 1.0188668966293335e-06, 1.1837109923362732e-06, 1.3485550880432129e-06, 1.5133991837501526e-06, 1.6782432794570923e-06, 1.843087375164032e-06, 2.0079314708709717e-06, 2.1727755665779114e-06, 2.337619662284851e-06, 2.5024637579917908e-06, 2.6673078536987305e-06, 2.83215194940567e-06, 2.99699604511261e-06, 3.1618401408195496e-06, 3.3266842365264893e-06, 3.491528332233429e-06, 3.6563724279403687e-06, 3.821216523647308e-06, 3.986060619354248e-06, 4.150904715061188e-06, 4.3157488107681274e-06, 4.480592906475067e-06, 4.645437002182007e-06, 4.8102810978889465e-06, 4.975125193595886e-06, 5.139969289302826e-06, 5.304813385009766e-06]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 1.0, 8.0, 15.0, 5.0, 19.0, 12.0, 6.0, 19.0, 37.0, 12.0, 17.0, 42.0, 16.0, 35.0, 18.0, 43.0, 48.0, 46.0, 67.0, 56.0, 31.0, 45.0, 58.0, 32.0, 42.0, 26.0, 35.0, 30.0, 21.0, 20.0, 28.0, 8.0, 15.0, 17.0, 6.0, 13.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-3.0994415283203125e-06, -3.0016526579856873e-06, -2.903863787651062e-06, -2.8060749173164368e-06, -2.7082860469818115e-06, -2.6104971766471863e-06, -2.512708306312561e-06, -2.414919435977936e-06, -2.3171305656433105e-06, -2.2193416953086853e-06, -2.12155282497406e-06, -2.023763954639435e-06, -1.9259750843048096e-06, -1.8281862139701843e-06, -1.730397343635559e-06, -1.6326084733009338e-06, -1.5348196029663086e-06, -1.4370307326316833e-06, -1.339241862297058e-06, -1.2414529919624329e-06, -1.1436641216278076e-06, -1.0458752512931824e-06, -9.480863809585571e-07, -8.502975106239319e-07, -7.525086402893066e-07, -6.547197699546814e-07, -5.569308996200562e-07, -4.591420292854309e-07, -3.6135315895080566e-07, -2.635642886161804e-07, -1.6577541828155518e-07, -6.798654794692993e-08, 2.9802322387695312e-08, 1.2759119272232056e-07, 2.253800630569458e-07, 3.2316893339157104e-07, 4.209578037261963e-07, 5.187466740608215e-07, 6.165355443954468e-07, 7.14324414730072e-07, 8.121132850646973e-07, 9.099021553993225e-07, 1.0076910257339478e-06, 1.105479896068573e-06, 1.2032687664031982e-06, 1.3010576367378235e-06, 1.3988465070724487e-06, 1.496635377407074e-06, 1.5944242477416992e-06, 1.6922131180763245e-06, 1.7900019884109497e-06, 1.887790858745575e-06, 1.9855797290802e-06, 2.0833685994148254e-06, 2.1811574697494507e-06, 2.278946340084076e-06, 2.376735210418701e-06, 2.4745240807533264e-06, 2.5723129510879517e-06, 2.670101821422577e-06, 2.767890691757202e-06, 2.8656795620918274e-06, 2.9634684324264526e-06, 3.061257302761078e-06, 3.159046173095703e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 6.0, 13.0, 25.0, 26.0, 68.0, 131.0, 513.0, 13204.0, 1033028.0, 1105.0, 218.0, 84.0, 37.0, 26.0, 17.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.218650817871094e-05, -3.112107515335083e-05, -3.0055642127990723e-05, -2.8990209102630615e-05, -2.7924776077270508e-05, -2.68593430519104e-05, -2.5793910026550293e-05, -2.4728477001190186e-05, -2.3663043975830078e-05, -2.259761095046997e-05, -2.1532177925109863e-05, -2.0466744899749756e-05, -1.940131187438965e-05, -1.833587884902954e-05, -1.7270445823669434e-05, -1.6205012798309326e-05, -1.5139579772949219e-05, -1.4074146747589111e-05, -1.3008713722229004e-05, -1.1943280696868896e-05, -1.0877847671508789e-05, -9.812414646148682e-06, -8.746981620788574e-06, -7.681548595428467e-06, -6.616115570068359e-06, -5.550682544708252e-06, -4.4852495193481445e-06, -3.419816493988037e-06, -2.3543834686279297e-06, -1.2889504432678223e-06, -2.2351741790771484e-07, 8.419156074523926e-07, 1.9073486328125e-06, 2.9727816581726074e-06, 4.038214683532715e-06, 5.103647708892822e-06, 6.16908073425293e-06, 7.234513759613037e-06, 8.299946784973145e-06, 9.365379810333252e-06, 1.043081283569336e-05, 1.1496245861053467e-05, 1.2561678886413574e-05, 1.3627111911773682e-05, 1.4692544937133789e-05, 1.5757977962493896e-05, 1.6823410987854004e-05, 1.788884401321411e-05, 1.895427703857422e-05, 2.0019710063934326e-05, 2.1085143089294434e-05, 2.215057611465454e-05, 2.321600914001465e-05, 2.4281442165374756e-05, 2.5346875190734863e-05, 2.641230821609497e-05, 2.7477741241455078e-05, 2.8543174266815186e-05, 2.9608607292175293e-05, 3.06740403175354e-05, 3.173947334289551e-05, 3.2804906368255615e-05, 3.387033939361572e-05, 3.493577241897583e-05, 3.600120544433594e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 9.0, 7.0, 24.0, 26.0, 58.0, 122.0, 558.0, 79.0, 43.0, 23.0, 11.0, 11.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8371810913085938e-05, -2.7434900403022766e-05, -2.6497989892959595e-05, -2.5561079382896423e-05, -2.4624168872833252e-05, -2.368725836277008e-05, -2.275034785270691e-05, -2.1813437342643738e-05, -2.0876526832580566e-05, -1.9939616322517395e-05, -1.9002705812454224e-05, -1.8065795302391052e-05, -1.712888479232788e-05, -1.619197428226471e-05, -1.5255063772201538e-05, -1.4318153262138367e-05, -1.3381242752075195e-05, -1.2444332242012024e-05, -1.1507421731948853e-05, -1.0570511221885681e-05, -9.63360071182251e-06, -8.696690201759338e-06, -7.759779691696167e-06, -6.822869181632996e-06, -5.885958671569824e-06, -4.949048161506653e-06, -4.0121376514434814e-06, -3.07522714138031e-06, -2.1383166313171387e-06, -1.2014061212539673e-06, -2.644956111907959e-07, 6.724148988723755e-07, 1.6093254089355469e-06, 2.5462359189987183e-06, 3.4831464290618896e-06, 4.420056939125061e-06, 5.356967449188232e-06, 6.293877959251404e-06, 7.230788469314575e-06, 8.167698979377747e-06, 9.104609489440918e-06, 1.004151999950409e-05, 1.097843050956726e-05, 1.1915341019630432e-05, 1.2852251529693604e-05, 1.3789162039756775e-05, 1.4726072549819946e-05, 1.5662983059883118e-05, 1.659989356994629e-05, 1.753680408000946e-05, 1.8473714590072632e-05, 1.9410625100135803e-05, 2.0347535610198975e-05, 2.1284446120262146e-05, 2.2221356630325317e-05, 2.315826714038849e-05, 2.409517765045166e-05, 2.503208816051483e-05, 2.5968998670578003e-05, 2.6905909180641174e-05, 2.7842819690704346e-05, 2.8779730200767517e-05, 2.971664071083069e-05, 3.065355122089386e-05, 3.159046173095703e-05]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 34.0, 583.0, 385.0, 10.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6500817537307739, -0.6386701464653015, -0.6272584795951843, -0.6158468723297119, -0.6044352650642395, -0.5930235981941223, -0.5816119909286499, -0.5702003240585327, -0.5587887167930603, -0.5473771095275879, -0.5359654426574707, -0.5245538353919983, -0.5131422281265259, -0.5017305612564087, -0.4903189539909363, -0.4789073169231415, -0.4674956798553467, -0.4560840427875519, -0.44467243552207947, -0.43326079845428467, -0.42184916138648987, -0.41043752431869507, -0.39902591705322266, -0.38761427998542786, -0.37620267271995544, -0.36479103565216064, -0.35337942838668823, -0.34196779131889343, -0.33055615425109863, -0.31914451718330383, -0.3077329099178314, -0.2963212728500366, -0.2849096655845642, -0.2734980285167694, -0.262086421251297, -0.2506747841835022, -0.2392631471157074, -0.2278515249490738, -0.21643990278244019, -0.20502826571464539, -0.19361662864685059, -0.18220500648021698, -0.17079336941242218, -0.15938174724578857, -0.14797011017799377, -0.13655848801136017, -0.12514686584472656, -0.11373522877693176, -0.10232359170913696, -0.09091196209192276, -0.07950033247470856, -0.06808871030807495, -0.05667707696557045, -0.04526544734835625, -0.03385382145643234, -0.02244219183921814, -0.011030562222003937, 0.0003810664638876915, 0.01179269514977932, 0.023204322904348373, 0.034615952521562576, 0.04602758213877678, 0.057439208030700684, 0.06885083764791489, 0.08026246726512909]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 9.0, 11.0, 18.0, 8.0, 16.0, 10.0, 21.0, 28.0, 30.0, 33.0, 33.0, 47.0, 59.0, 42.0, 51.0, 57.0, 63.0, 57.0, 43.0, 36.0, 41.0, 51.0, 45.0, 30.0, 23.0, 24.0, 21.0, 19.0, 13.0, 12.0, 13.0, 9.0, 7.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1894260048866272, -0.18333856761455536, -0.17725111544132233, -0.1711636781692505, -0.16507622599601746, -0.15898878872394562, -0.15290135145187378, -0.14681389927864075, -0.14072644710540771, -0.13463900983333588, -0.12855155766010284, -0.122464120388031, -0.11637666821479797, -0.11028923094272614, -0.1042017862200737, -0.09811434149742126, -0.09202690422534943, -0.08593945950269699, -0.07985201478004456, -0.07376457750797272, -0.06767712533473969, -0.06158968433737755, -0.05550224334001541, -0.049414798617362976, -0.04332735389471054, -0.037239909172058105, -0.03115246631205082, -0.025065023452043533, -0.018977578729391098, -0.012890134006738663, -0.006802693009376526, -0.0007152482867240906, 0.005372196435928345, 0.011459640227258205, 0.017547084018588066, 0.023634526878595352, 0.029721971601247787, 0.03580941632390022, 0.04189685732126236, 0.047984302043914795, 0.05407174676656723, 0.060159191489219666, 0.0662466362118721, 0.07233408093452454, 0.07842151820659637, 0.0845089703798294, 0.09059640765190125, 0.09668385237455368, 0.10277129709720612, 0.10885874181985855, 0.11494618654251099, 0.12103362381458282, 0.12712107598781586, 0.1332085132598877, 0.13929596543312073, 0.14538340270519257, 0.1514708399772644, 0.15755827724933624, 0.16364572942256927, 0.1697331666946411, 0.17582061886787415, 0.18190805613994598, 0.18799549341201782, 0.19408294558525085, 0.2001703977584839]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 9.0, 14.0, 22.0, 40.0, 111.0, 735.0, 4192819.0, 289.0, 93.0, 28.0, 15.0, 13.0, 7.0, 11.0, 6.0, 4.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1602783203125, -0.1556072235107422, -0.15093612670898438, -0.14626502990722656, -0.14159393310546875, -0.13692283630371094, -0.13225173950195312, -0.1275806427001953, -0.1229095458984375, -0.11823844909667969, -0.11356735229492188, -0.10889625549316406, -0.10422515869140625, -0.09955406188964844, -0.09488296508789062, -0.09021186828613281, -0.085540771484375, -0.08086967468261719, -0.07619857788085938, -0.07152748107910156, -0.06685638427734375, -0.06218528747558594, -0.057514190673828125, -0.05284309387207031, -0.0481719970703125, -0.04350090026855469, -0.038829803466796875, -0.03415870666503906, -0.02948760986328125, -0.024816513061523438, -0.020145416259765625, -0.015474319458007812, -0.01080322265625, -0.0061321258544921875, -0.001461029052734375, 0.0032100677490234375, 0.00788116455078125, 0.012552261352539062, 0.017223358154296875, 0.021894454956054688, 0.0265655517578125, 0.031236648559570312, 0.035907745361328125, 0.04057884216308594, 0.04524993896484375, 0.04992103576660156, 0.054592132568359375, 0.05926322937011719, 0.063934326171875, 0.06860542297363281, 0.07327651977539062, 0.07794761657714844, 0.08261871337890625, 0.08728981018066406, 0.09196090698242188, 0.09663200378417969, 0.1013031005859375, 0.10597419738769531, 0.11064529418945312, 0.11531639099121094, 0.11998748779296875, 0.12465858459472656, 0.12932968139648438, 0.1340007781982422, 0.138671875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 9.0, 10.0, 11.0, 17.0, 27.0, 64.0, 184.0, 292.0, 183.0, 73.0, 20.0, 14.0, 14.0, 7.0, 11.0, 6.0, 4.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015716552734375, -0.01525866985321045, -0.014800786972045898, -0.014342904090881348, -0.013885021209716797, -0.013427138328552246, -0.012969255447387695, -0.012511372566223145, -0.012053489685058594, -0.011595606803894043, -0.011137723922729492, -0.010679841041564941, -0.01022195816040039, -0.00976407527923584, -0.009306192398071289, -0.008848309516906738, -0.008390426635742188, -0.007932543754577637, -0.007474660873413086, -0.007016777992248535, -0.006558895111083984, -0.006101012229919434, -0.005643129348754883, -0.005185246467590332, -0.004727363586425781, -0.0042694807052612305, -0.0038115978240966797, -0.003353714942932129, -0.002895832061767578, -0.0024379491806030273, -0.0019800662994384766, -0.0015221834182739258, -0.001064300537109375, -0.0006064176559448242, -0.00014853477478027344, 0.00030934810638427734, 0.0007672309875488281, 0.001225113868713379, 0.0016829967498779297, 0.0021408796310424805, 0.0025987625122070312, 0.003056645393371582, 0.003514528274536133, 0.003972411155700684, 0.004430294036865234, 0.004888176918029785, 0.005346059799194336, 0.005803942680358887, 0.0062618255615234375, 0.006719708442687988, 0.007177591323852539, 0.00763547420501709, 0.00809335708618164, 0.008551239967346191, 0.009009122848510742, 0.009467005729675293, 0.009924888610839844, 0.010382771492004395, 0.010840654373168945, 0.011298537254333496, 0.011756420135498047, 0.012214303016662598, 0.012672185897827148, 0.0131300687789917, 0.01358795166015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 27.0, 104.0, 244.0, 633.0, 11968.0, 4179964.0, 848.0, 303.0, 114.0, 49.0, 11.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0501708984375, -0.04870033264160156, -0.047229766845703125, -0.04575920104980469, -0.04428863525390625, -0.04281806945800781, -0.041347503662109375, -0.03987693786621094, -0.0384063720703125, -0.03693580627441406, -0.035465240478515625, -0.03399467468261719, -0.03252410888671875, -0.031053543090820312, -0.029582977294921875, -0.028112411499023438, -0.026641845703125, -0.025171279907226562, -0.023700714111328125, -0.022230148315429688, -0.02075958251953125, -0.019289016723632812, -0.017818450927734375, -0.016347885131835938, -0.0148773193359375, -0.013406753540039062, -0.011936187744140625, -0.010465621948242188, -0.00899505615234375, -0.0075244903564453125, -0.006053924560546875, -0.0045833587646484375, -0.00311279296875, -0.0016422271728515625, -0.000171661376953125, 0.0012989044189453125, 0.00276947021484375, 0.0042400360107421875, 0.005710601806640625, 0.0071811676025390625, 0.0086517333984375, 0.010122299194335938, 0.011592864990234375, 0.013063430786132812, 0.01453399658203125, 0.016004562377929688, 0.017475128173828125, 0.018945693969726562, 0.020416259765625, 0.021886825561523438, 0.023357391357421875, 0.024827957153320312, 0.02629852294921875, 0.027769088745117188, 0.029239654541015625, 0.030710220336914062, 0.0321807861328125, 0.03365135192871094, 0.035121917724609375, 0.03659248352050781, 0.03806304931640625, 0.03953361511230469, 0.041004180908203125, 0.04247474670410156, 0.0439453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 15.0, 115.0, 3924.0, 21.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0137176513671875, -0.013247013092041016, -0.012776374816894531, -0.012305736541748047, -0.011835098266601562, -0.011364459991455078, -0.010893821716308594, -0.01042318344116211, -0.009952545166015625, -0.00948190689086914, -0.009011268615722656, -0.008540630340576172, -0.008069992065429688, -0.007599353790283203, -0.007128715515136719, -0.006658077239990234, -0.00618743896484375, -0.005716800689697266, -0.005246162414550781, -0.004775524139404297, -0.0043048858642578125, -0.003834247589111328, -0.0033636093139648438, -0.0028929710388183594, -0.002422332763671875, -0.0019516944885253906, -0.0014810562133789062, -0.0010104179382324219, -0.0005397796630859375, -6.914138793945312e-05, 0.00040149688720703125, 0.0008721351623535156, 0.0013427734375, 0.0018134117126464844, 0.0022840499877929688, 0.002754688262939453, 0.0032253265380859375, 0.003695964813232422, 0.004166603088378906, 0.004637241363525391, 0.005107879638671875, 0.005578517913818359, 0.006049156188964844, 0.006519794464111328, 0.0069904327392578125, 0.007461071014404297, 0.007931709289550781, 0.008402347564697266, 0.00887298583984375, 0.009343624114990234, 0.009814262390136719, 0.010284900665283203, 0.010755538940429688, 0.011226177215576172, 0.011696815490722656, 0.01216745376586914, 0.012638092041015625, 0.01310873031616211, 0.013579368591308594, 0.014050006866455078, 0.014520645141601562, 0.014991283416748047, 0.015461921691894531, 0.015932559967041016, 0.0164031982421875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 97.0, 917.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04290713369846344, -0.03758405148983002, -0.032260969281196594, -0.02693789079785347, -0.021614808589220047, -0.016291726380586624, -0.0109686478972435, -0.005645565688610077, -0.00032248347997665405, 0.005000597797334194, 0.010323679074645042, 0.015646759420633316, 0.02096984162926674, 0.026292923837900162, 0.031616002321243286, 0.03693908452987671, 0.04226216673851013, 0.047585248947143555, 0.05290833115577698, 0.0582314096391201, 0.06355449557304382, 0.06887757778167725, 0.07420065253973007, 0.0795237347483635, 0.08484681695699692, 0.09016989916563034, 0.09549298137426376, 0.10081605613231659, 0.10613913834095001, 0.11146222054958344, 0.11678530275821686, 0.12210838496685028, 0.1274314522743225, 0.13275453448295593, 0.13807761669158936, 0.14340069890022278, 0.1487237811088562, 0.15404686331748962, 0.15936994552612305, 0.16469302773475647, 0.1700161099433899, 0.17533919215202332, 0.18066227436065674, 0.18598535656929016, 0.19130843877792358, 0.196631520986557, 0.20195460319519043, 0.20727768540382385, 0.21260075271129608, 0.2179238349199295, 0.22324691712856293, 0.22856999933719635, 0.23389308154582977, 0.2392161637544632, 0.24453923106193542, 0.24986231327056885, 0.25518539547920227, 0.2605084776878357, 0.2658315598964691, 0.27115464210510254, 0.27647772431373596, 0.2818008065223694, 0.2871238887310028, 0.29244697093963623, 0.29777005314826965]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 10.0, 5.0, 16.0, 34.0, 46.0, 70.0, 68.0, 92.0, 96.0, 96.0, 96.0, 98.0, 67.0, 52.0, 54.0, 40.0, 20.0, 11.0, 10.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028296470642089844, -0.027525432407855988, -0.026754392310976982, -0.025983352214097977, -0.02521231397986412, -0.024441275745630264, -0.02367023564875126, -0.022899195551872253, -0.022128157317638397, -0.02135711908340454, -0.020586078986525536, -0.01981503888964653, -0.019044000655412674, -0.018272962421178818, -0.017501922324299812, -0.016730882227420807, -0.01595984399318695, -0.01518880482763052, -0.014417765662074089, -0.013646726496517658, -0.012875687330961227, -0.012104648165404797, -0.011333608999848366, -0.010562569834291935, -0.009791530668735504, -0.009020491503179073, -0.008249452337622643, -0.007478413172066212, -0.006707374006509781, -0.00593633484095335, -0.005165295675396919, -0.0043942565098404884, -0.0036232173442840576, -0.002852178178727627, -0.002081139013171196, -0.0013100998476147652, -0.0005390606820583344, 0.00023197848349809647, 0.0010030176490545273, 0.001774056814610958, 0.002545095980167389, 0.0033161351457238197, 0.0040871743112802505, 0.004858213476836681, 0.005629252642393112, 0.006400291807949543, 0.007171330973505974, 0.007942370139062405, 0.008713409304618835, 0.009484448470175266, 0.010255487635731697, 0.011026526801288128, 0.011797565966844559, 0.01256860513240099, 0.01333964429795742, 0.014110683463513851, 0.014881722629070282, 0.015652760863304138, 0.016423800960183144, 0.01719484105706215, 0.017965879291296005, 0.01873691752552986, 0.019507957622408867, 0.020278997719287872, 0.02105003595352173]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 8.0, 17.0, 17.0, 28.0, 39.0, 64.0, 87.0, 126.0, 194.0, 333.0, 561.0, 985.0, 1740.0, 3595.0, 8257.0, 29247.0, 897780.0, 81916.0, 13165.0, 4945.0, 2378.0, 1206.0, 674.0, 405.0, 252.0, 180.0, 103.0, 74.0, 42.0, 35.0, 27.0, 21.0, 10.0, 16.0, 4.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0323486328125, -0.031260013580322266, -0.03017139434814453, -0.029082775115966797, -0.027994155883789062, -0.026905536651611328, -0.025816917419433594, -0.02472829818725586, -0.023639678955078125, -0.02255105972290039, -0.021462440490722656, -0.020373821258544922, -0.019285202026367188, -0.018196582794189453, -0.01710796356201172, -0.016019344329833984, -0.01493072509765625, -0.013842105865478516, -0.012753486633300781, -0.011664867401123047, -0.010576248168945312, -0.009487628936767578, -0.008399009704589844, -0.007310390472412109, -0.006221771240234375, -0.005133152008056641, -0.004044532775878906, -0.002955913543701172, -0.0018672943115234375, -0.0007786750793457031, 0.00030994415283203125, 0.0013985633850097656, 0.0024871826171875, 0.0035758018493652344, 0.004664421081542969, 0.005753040313720703, 0.0068416595458984375, 0.007930278778076172, 0.009018898010253906, 0.01010751724243164, 0.011196136474609375, 0.01228475570678711, 0.013373374938964844, 0.014461994171142578, 0.015550613403320312, 0.016639232635498047, 0.01772785186767578, 0.018816471099853516, 0.01990509033203125, 0.020993709564208984, 0.02208232879638672, 0.023170948028564453, 0.024259567260742188, 0.025348186492919922, 0.026436805725097656, 0.02752542495727539, 0.028614044189453125, 0.02970266342163086, 0.030791282653808594, 0.03187990188598633, 0.03296852111816406, 0.0340571403503418, 0.03514575958251953, 0.036234378814697266, 0.037322998046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 10.0, 9.0, 11.0, 18.0, 26.0, 66.0, 178.0, 297.0, 180.0, 75.0, 21.0, 13.0, 13.0, 8.0, 11.0, 6.0, 4.0, 5.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157318115234375, -0.015273571014404297, -0.014815330505371094, -0.01435708999633789, -0.013898849487304688, -0.013440608978271484, -0.012982368469238281, -0.012524127960205078, -0.012065887451171875, -0.011607646942138672, -0.011149406433105469, -0.010691165924072266, -0.010232925415039062, -0.00977468490600586, -0.009316444396972656, -0.008858203887939453, -0.00839996337890625, -0.007941722869873047, -0.007483482360839844, -0.007025241851806641, -0.0065670013427734375, -0.006108760833740234, -0.005650520324707031, -0.005192279815673828, -0.004734039306640625, -0.004275798797607422, -0.0038175582885742188, -0.0033593177795410156, -0.0029010772705078125, -0.0024428367614746094, -0.0019845962524414062, -0.0015263557434082031, -0.001068115234375, -0.0006098747253417969, -0.00015163421630859375, 0.0003066062927246094, 0.0007648468017578125, 0.0012230873107910156, 0.0016813278198242188, 0.002139568328857422, 0.002597808837890625, 0.003056049346923828, 0.0035142898559570312, 0.003972530364990234, 0.0044307708740234375, 0.004889011383056641, 0.005347251892089844, 0.005805492401123047, 0.00626373291015625, 0.006721973419189453, 0.007180213928222656, 0.007638454437255859, 0.008096694946289062, 0.008554935455322266, 0.009013175964355469, 0.009471416473388672, 0.009929656982421875, 0.010387897491455078, 0.010846138000488281, 0.011304378509521484, 0.011762619018554688, 0.01222085952758789, 0.012679100036621094, 0.013137340545654297, 0.0135955810546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 10.0, 13.0, 15.0, 15.0, 15.0, 17.0, 17.0, 20.0, 31.0, 41.0, 53.0, 90.0, 145.0, 190.0, 361.0, 760.0, 1678.0, 13797.0, 1021831.0, 6426.0, 1409.0, 650.0, 317.0, 177.0, 134.0, 80.0, 77.0, 38.0, 37.0, 19.0, 21.0, 15.0, 9.0, 14.0, 12.0, 4.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0587158203125, -0.05657386779785156, -0.054431915283203125, -0.05228996276855469, -0.05014801025390625, -0.04800605773925781, -0.045864105224609375, -0.04372215270996094, -0.0415802001953125, -0.03943824768066406, -0.037296295166015625, -0.03515434265136719, -0.03301239013671875, -0.030870437622070312, -0.028728485107421875, -0.026586532592773438, -0.024444580078125, -0.022302627563476562, -0.020160675048828125, -0.018018722534179688, -0.01587677001953125, -0.013734817504882812, -0.011592864990234375, -0.009450912475585938, -0.0073089599609375, -0.0051670074462890625, -0.003025054931640625, -0.0008831024169921875, 0.00125885009765625, 0.0034008026123046875, 0.005542755126953125, 0.0076847076416015625, 0.00982666015625, 0.011968612670898438, 0.014110565185546875, 0.016252517700195312, 0.01839447021484375, 0.020536422729492188, 0.022678375244140625, 0.024820327758789062, 0.0269622802734375, 0.029104232788085938, 0.031246185302734375, 0.03338813781738281, 0.03553009033203125, 0.03767204284667969, 0.039813995361328125, 0.04195594787597656, 0.044097900390625, 0.04623985290527344, 0.048381805419921875, 0.05052375793457031, 0.05266571044921875, 0.05480766296386719, 0.056949615478515625, 0.05909156799316406, 0.0612335205078125, 0.06337547302246094, 0.06551742553710938, 0.06765937805175781, 0.06980133056640625, 0.07194328308105469, 0.07408523559570312, 0.07622718811035156, 0.078369140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 12.0, 17.0, 13.0, 13.0, 16.0, 15.0, 20.0, 18.0, 27.0, 26.0, 39.0, 36.0, 39.0, 37.0, 41.0, 51.0, 44.0, 40.0, 61.0, 47.0, 45.0, 36.0, 51.0, 34.0, 30.0, 36.0, 19.0, 27.0, 18.0, 18.0, 13.0, 12.0, 10.0, 12.0, 4.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031341552734375, -0.0301971435546875, -0.029052734375, -0.0279083251953125, -0.026763916015625, -0.0256195068359375, -0.02447509765625, -0.0233306884765625, -0.022186279296875, -0.0210418701171875, -0.0198974609375, -0.0187530517578125, -0.017608642578125, -0.0164642333984375, -0.01531982421875, -0.0141754150390625, -0.013031005859375, -0.0118865966796875, -0.0107421875, -0.0095977783203125, -0.008453369140625, -0.0073089599609375, -0.00616455078125, -0.0050201416015625, -0.003875732421875, -0.0027313232421875, -0.0015869140625, -0.0004425048828125, 0.000701904296875, 0.0018463134765625, 0.00299072265625, 0.0041351318359375, 0.005279541015625, 0.0064239501953125, 0.007568359375, 0.0087127685546875, 0.009857177734375, 0.0110015869140625, 0.01214599609375, 0.0132904052734375, 0.014434814453125, 0.0155792236328125, 0.0167236328125, 0.0178680419921875, 0.019012451171875, 0.0201568603515625, 0.02130126953125, 0.0224456787109375, 0.023590087890625, 0.0247344970703125, 0.02587890625, 0.0270233154296875, 0.028167724609375, 0.0293121337890625, 0.03045654296875, 0.0316009521484375, 0.032745361328125, 0.0338897705078125, 0.0350341796875, 0.0361785888671875, 0.037322998046875, 0.0384674072265625, 0.03961181640625, 0.0407562255859375, 0.041900634765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 10.0, 15.0, 23.0, 47.0, 64.0, 120.0, 377.0, 976.0, 7619.0, 955137.0, 80379.0, 2754.0, 514.0, 218.0, 107.0, 62.0, 40.0, 28.0, 14.0, 13.0, 6.0, 6.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.574920654296875e-05, -2.50302255153656e-05, -2.431124448776245e-05, -2.3592263460159302e-05, -2.2873282432556152e-05, -2.2154301404953003e-05, -2.1435320377349854e-05, -2.0716339349746704e-05, -1.9997358322143555e-05, -1.9278377294540405e-05, -1.8559396266937256e-05, -1.7840415239334106e-05, -1.7121434211730957e-05, -1.6402453184127808e-05, -1.5683472156524658e-05, -1.4964491128921509e-05, -1.424551010131836e-05, -1.352652907371521e-05, -1.280754804611206e-05, -1.2088567018508911e-05, -1.1369585990905762e-05, -1.0650604963302612e-05, -9.931623935699463e-06, -9.212642908096313e-06, -8.493661880493164e-06, -7.774680852890015e-06, -7.055699825286865e-06, -6.336718797683716e-06, -5.617737770080566e-06, -4.898756742477417e-06, -4.179775714874268e-06, -3.460794687271118e-06, -2.7418136596679688e-06, -2.0228326320648193e-06, -1.30385160446167e-06, -5.848705768585205e-07, 1.341104507446289e-07, 8.530914783477783e-07, 1.5720725059509277e-06, 2.291053533554077e-06, 3.0100345611572266e-06, 3.729015588760376e-06, 4.447996616363525e-06, 5.166977643966675e-06, 5.885958671569824e-06, 6.604939699172974e-06, 7.323920726776123e-06, 8.042901754379272e-06, 8.761882781982422e-06, 9.480863809585571e-06, 1.019984483718872e-05, 1.091882586479187e-05, 1.163780689239502e-05, 1.2356787919998169e-05, 1.3075768947601318e-05, 1.3794749975204468e-05, 1.4513731002807617e-05, 1.5232712030410767e-05, 1.5951693058013916e-05, 1.6670674085617065e-05, 1.7389655113220215e-05, 1.8108636140823364e-05, 1.8827617168426514e-05, 1.9546598196029663e-05, 2.0265579223632812e-05]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 9.0, 12.0, 14.0, 21.0, 42.0, 47.0, 77.0, 99.0, 127.0, 110.0, 117.0, 97.0, 74.0, 38.0, 29.0, 21.0, 14.0, 21.0, 7.0, 2.0, 5.0, 8.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5139579772949219e-05, -1.473352313041687e-05, -1.4327466487884521e-05, -1.3921409845352173e-05, -1.3515353202819824e-05, -1.3109296560287476e-05, -1.2703239917755127e-05, -1.2297183275222778e-05, -1.189112663269043e-05, -1.1485069990158081e-05, -1.1079013347625732e-05, -1.0672956705093384e-05, -1.0266900062561035e-05, -9.860843420028687e-06, -9.454786777496338e-06, -9.04873013496399e-06, -8.64267349243164e-06, -8.236616849899292e-06, -7.830560207366943e-06, -7.424503564834595e-06, -7.018446922302246e-06, -6.6123902797698975e-06, -6.206333637237549e-06, -5.8002769947052e-06, -5.3942203521728516e-06, -4.988163709640503e-06, -4.582107067108154e-06, -4.176050424575806e-06, -3.769993782043457e-06, -3.3639371395111084e-06, -2.9578804969787598e-06, -2.551823854446411e-06, -2.1457672119140625e-06, -1.7397105693817139e-06, -1.3336539268493652e-06, -9.275972843170166e-07, -5.21540641784668e-07, -1.1548399925231934e-07, 2.905726432800293e-07, 6.966292858123779e-07, 1.1026859283447266e-06, 1.5087425708770752e-06, 1.914799213409424e-06, 2.3208558559417725e-06, 2.726912498474121e-06, 3.1329691410064697e-06, 3.5390257835388184e-06, 3.945082426071167e-06, 4.351139068603516e-06, 4.757195711135864e-06, 5.163252353668213e-06, 5.5693089962005615e-06, 5.97536563873291e-06, 6.381422281265259e-06, 6.787478923797607e-06, 7.193535566329956e-06, 7.599592208862305e-06, 8.005648851394653e-06, 8.411705493927002e-06, 8.81776213645935e-06, 9.2238187789917e-06, 9.629875421524048e-06, 1.0035932064056396e-05, 1.0441988706588745e-05, 1.0848045349121094e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 3.0, 10.0, 14.0, 6.0, 36.0, 32.0, 80.0, 167.0, 468.0, 6586.0, 1039368.0, 1253.0, 260.0, 109.0, 59.0, 33.0, 22.0, 6.0, 17.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.514787673950195e-05, -6.330106407403946e-05, -6.145425140857697e-05, -5.960743874311447e-05, -5.776062607765198e-05, -5.5913813412189484e-05, -5.406700074672699e-05, -5.2220188081264496e-05, -5.0373375415802e-05, -4.852656275033951e-05, -4.6679750084877014e-05, -4.483293741941452e-05, -4.2986124753952026e-05, -4.113931208848953e-05, -3.929249942302704e-05, -3.7445686757564545e-05, -3.559887409210205e-05, -3.375206142663956e-05, -3.190524876117706e-05, -3.005843609571457e-05, -2.8211623430252075e-05, -2.636481076478958e-05, -2.4517998099327087e-05, -2.2671185433864594e-05, -2.08243727684021e-05, -1.8977560102939606e-05, -1.7130747437477112e-05, -1.5283934772014618e-05, -1.3437122106552124e-05, -1.159030944108963e-05, -9.743496775627136e-06, -7.896684110164642e-06, -6.0498714447021484e-06, -4.2030587792396545e-06, -2.3562461137771606e-06, -5.094334483146667e-07, 1.3373792171478271e-06, 3.184191882610321e-06, 5.031004548072815e-06, 6.877817213535309e-06, 8.724629878997803e-06, 1.0571442544460297e-05, 1.241825520992279e-05, 1.4265067875385284e-05, 1.611188054084778e-05, 1.7958693206310272e-05, 1.9805505871772766e-05, 2.165231853723526e-05, 2.3499131202697754e-05, 2.5345943868160248e-05, 2.7192756533622742e-05, 2.9039569199085236e-05, 3.088638186454773e-05, 3.2733194530010223e-05, 3.458000719547272e-05, 3.642681986093521e-05, 3.8273632526397705e-05, 4.01204451918602e-05, 4.196725785732269e-05, 4.381407052278519e-05, 4.566088318824768e-05, 4.7507695853710175e-05, 4.935450851917267e-05, 5.120132118463516e-05, 5.3048133850097656e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 7.0, 5.0, 17.0, 14.0, 24.0, 41.0, 69.0, 141.0, 418.0, 124.0, 40.0, 23.0, 21.0, 13.0, 8.0, 6.0, 11.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4689903259277344e-05, -3.370549529790878e-05, -3.272108733654022e-05, -3.173667937517166e-05, -3.07522714138031e-05, -2.976786345243454e-05, -2.878345549106598e-05, -2.7799047529697418e-05, -2.6814639568328857e-05, -2.5830231606960297e-05, -2.4845823645591736e-05, -2.3861415684223175e-05, -2.2877007722854614e-05, -2.1892599761486053e-05, -2.0908191800117493e-05, -1.9923783838748932e-05, -1.893937587738037e-05, -1.795496791601181e-05, -1.697055995464325e-05, -1.598615199327469e-05, -1.5001744031906128e-05, -1.4017336070537567e-05, -1.3032928109169006e-05, -1.2048520147800446e-05, -1.1064112186431885e-05, -1.0079704225063324e-05, -9.095296263694763e-06, -8.110888302326202e-06, -7.126480340957642e-06, -6.142072379589081e-06, -5.15766441822052e-06, -4.173256456851959e-06, -3.1888484954833984e-06, -2.2044405341148376e-06, -1.2200325727462769e-06, -2.3562461137771606e-07, 7.487833499908447e-07, 1.7331913113594055e-06, 2.7175992727279663e-06, 3.702007234096527e-06, 4.686415195465088e-06, 5.670823156833649e-06, 6.6552311182022095e-06, 7.63963907957077e-06, 8.624047040939331e-06, 9.608455002307892e-06, 1.0592862963676453e-05, 1.1577270925045013e-05, 1.2561678886413574e-05, 1.3546086847782135e-05, 1.4530494809150696e-05, 1.5514902770519257e-05, 1.6499310731887817e-05, 1.7483718693256378e-05, 1.846812665462494e-05, 1.94525346159935e-05, 2.043694257736206e-05, 2.142135053873062e-05, 2.2405758500099182e-05, 2.3390166461467743e-05, 2.4374574422836304e-05, 2.5358982384204865e-05, 2.6343390345573425e-05, 2.7327798306941986e-05, 2.8312206268310547e-05]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 9.0, 57.0, 747.0, 183.0, 13.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4693419337272644, -0.45971786975860596, -0.4500938057899475, -0.4404697120189667, -0.4308456480503082, -0.4212215840816498, -0.41159749031066895, -0.4019734263420105, -0.39234936237335205, -0.3827252984046936, -0.37310123443603516, -0.3634771406650543, -0.3538530766963959, -0.3442290127277374, -0.3346049189567566, -0.32498085498809814, -0.3153567910194397, -0.30573272705078125, -0.2961086630821228, -0.28648456931114197, -0.2768605053424835, -0.2672364413738251, -0.25761234760284424, -0.2479882836341858, -0.23836421966552734, -0.2287401556968689, -0.21911607682704926, -0.20949199795722961, -0.19986793398857117, -0.19024387001991272, -0.18061979115009308, -0.17099571228027344, -0.1613716185092926, -0.15174755454063416, -0.14212347567081451, -0.13249939680099487, -0.12287533283233643, -0.11325126141309738, -0.10362718999385834, -0.0940031185746193, -0.08437904715538025, -0.0747549757361412, -0.06513090431690216, -0.055506832897663116, -0.04588276147842407, -0.03625869005918503, -0.026634618639945984, -0.01701054722070694, -0.0073864758014678955, 0.0022375956177711487, 0.011861667037010193, 0.021485738456249237, 0.03110980987548828, 0.040733881294727325, 0.05035795271396637, 0.059982024133205414, 0.06960609555244446, 0.0792301669716835, 0.08885423839092255, 0.09847830981016159, 0.10810238122940063, 0.11772645264863968, 0.12735052406787872, 0.13697460293769836, 0.1465986669063568]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 3.0, 3.0, 2.0, 12.0, 9.0, 2.0, 10.0, 14.0, 15.0, 22.0, 31.0, 24.0, 34.0, 33.0, 29.0, 53.0, 37.0, 49.0, 53.0, 47.0, 45.0, 45.0, 41.0, 56.0, 42.0, 36.0, 43.0, 28.0, 35.0, 22.0, 25.0, 17.0, 15.0, 19.0, 15.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17362594604492188, -0.16753961145877838, -0.1614532619714737, -0.1553669273853302, -0.1492805778980255, -0.14319424331188202, -0.13710790872573853, -0.13102155923843384, -0.12493521720170975, -0.11884887516498566, -0.11276253312826157, -0.10667619109153748, -0.10058985650539398, -0.0945035070180893, -0.0884171724319458, -0.08233083039522171, -0.07624448835849762, -0.07015814632177353, -0.06407180428504944, -0.057985465973615646, -0.051899123936891556, -0.045812781900167465, -0.03972644358873367, -0.03364010155200958, -0.027553759515285492, -0.0214674174785614, -0.01538107730448246, -0.009294737130403519, -0.003208395093679428, 0.0028779469430446625, 0.008964285254478455, 0.015050627291202545, 0.021136969327926636, 0.027223311364650726, 0.03330965340137482, 0.03939599171280861, 0.0454823337495327, 0.05156867578625679, 0.05765501409769058, 0.06374135613441467, 0.06982769817113876, 0.07591404020786285, 0.08200038224458694, 0.08808672428131104, 0.09417305886745453, 0.10025940835475922, 0.10634574294090271, 0.1124320849776268, 0.11851842701435089, 0.12460476905107498, 0.13069111108779907, 0.13677744567394257, 0.14286379516124725, 0.14895012974739075, 0.15503647923469543, 0.16112281382083893, 0.16720914840698242, 0.17329548299312592, 0.1793818324804306, 0.1854681670665741, 0.19155451655387878, 0.19764085114002228, 0.20372718572616577, 0.20981353521347046, 0.21589988470077515]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 9.0, 5.0, 5.0, 8.0, 14.0, 11.0, 19.0, 23.0, 27.0, 43.0, 59.0, 691.0, 6407.0, 4180736.0, 5006.0, 781.0, 246.0, 42.0, 35.0, 20.0, 19.0, 16.0, 9.0, 8.0, 6.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032379150390625, -0.03143906593322754, -0.030498981475830078, -0.029558897018432617, -0.028618812561035156, -0.027678728103637695, -0.026738643646240234, -0.025798559188842773, -0.024858474731445312, -0.02391839027404785, -0.02297830581665039, -0.02203822135925293, -0.02109813690185547, -0.020158052444458008, -0.019217967987060547, -0.018277883529663086, -0.017337799072265625, -0.016397714614868164, -0.015457630157470703, -0.014517545700073242, -0.013577461242675781, -0.01263737678527832, -0.01169729232788086, -0.010757207870483398, -0.009817123413085938, -0.008877038955688477, -0.007936954498291016, -0.006996870040893555, -0.006056785583496094, -0.005116701126098633, -0.004176616668701172, -0.003236532211303711, -0.00229644775390625, -0.001356363296508789, -0.0004162788391113281, 0.0005238056182861328, 0.0014638900756835938, 0.0024039745330810547, 0.0033440589904785156, 0.0042841434478759766, 0.0052242279052734375, 0.0061643123626708984, 0.007104396820068359, 0.00804448127746582, 0.008984565734863281, 0.009924650192260742, 0.010864734649658203, 0.011804819107055664, 0.012744903564453125, 0.013684988021850586, 0.014625072479248047, 0.015565156936645508, 0.01650524139404297, 0.01744532585144043, 0.01838541030883789, 0.01932549476623535, 0.020265579223632812, 0.021205663681030273, 0.022145748138427734, 0.023085832595825195, 0.024025917053222656, 0.024966001510620117, 0.025906085968017578, 0.02684617042541504, 0.0277862548828125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 2.0, 5.0, 7.0, 8.0, 9.0, 11.0, 19.0, 28.0, 61.0, 176.0, 301.0, 179.0, 77.0, 18.0, 13.0, 15.0, 9.0, 10.0, 6.0, 4.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01555633544921875, -0.015103340148925781, -0.014650344848632812, -0.014197349548339844, -0.013744354248046875, -0.013291358947753906, -0.012838363647460938, -0.012385368347167969, -0.011932373046875, -0.011479377746582031, -0.011026382446289062, -0.010573387145996094, -0.010120391845703125, -0.009667396545410156, -0.009214401245117188, -0.008761405944824219, -0.00830841064453125, -0.007855415344238281, -0.0074024200439453125, -0.006949424743652344, -0.006496429443359375, -0.006043434143066406, -0.0055904388427734375, -0.005137443542480469, -0.0046844482421875, -0.004231452941894531, -0.0037784576416015625, -0.0033254623413085938, -0.002872467041015625, -0.0024194717407226562, -0.0019664764404296875, -0.0015134811401367188, -0.00106048583984375, -0.0006074905395507812, -0.0001544952392578125, 0.00029850006103515625, 0.000751495361328125, 0.0012044906616210938, 0.0016574859619140625, 0.0021104812622070312, 0.0025634765625, 0.0030164718627929688, 0.0034694671630859375, 0.003922462463378906, 0.004375457763671875, 0.004828453063964844, 0.0052814483642578125, 0.005734443664550781, 0.00618743896484375, 0.006640434265136719, 0.0070934295654296875, 0.007546424865722656, 0.007999420166015625, 0.008452415466308594, 0.008905410766601562, 0.009358406066894531, 0.0098114013671875, 0.010264396667480469, 0.010717391967773438, 0.011170387268066406, 0.011623382568359375, 0.012076377868652344, 0.012529373168945312, 0.012982368469238281, 0.01343536376953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 8.0, 25.0, 60.0, 172.0, 615.0, 4753.0, 4183202.0, 4506.0, 631.0, 167.0, 66.0, 31.0, 14.0, 5.0, 4.0, 0.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019195556640625, -0.018497228622436523, -0.017798900604248047, -0.01710057258605957, -0.016402244567871094, -0.015703916549682617, -0.01500558853149414, -0.014307260513305664, -0.013608932495117188, -0.012910604476928711, -0.012212276458740234, -0.011513948440551758, -0.010815620422363281, -0.010117292404174805, -0.009418964385986328, -0.008720636367797852, -0.008022308349609375, -0.0073239803314208984, -0.006625652313232422, -0.005927324295043945, -0.005228996276855469, -0.004530668258666992, -0.0038323402404785156, -0.003134012222290039, -0.0024356842041015625, -0.001737356185913086, -0.0010390281677246094, -0.0003407001495361328, 0.00035762786865234375, 0.0010559558868408203, 0.0017542839050292969, 0.0024526119232177734, 0.00315093994140625, 0.0038492679595947266, 0.004547595977783203, 0.00524592399597168, 0.005944252014160156, 0.006642580032348633, 0.007340908050537109, 0.008039236068725586, 0.008737564086914062, 0.009435892105102539, 0.010134220123291016, 0.010832548141479492, 0.011530876159667969, 0.012229204177856445, 0.012927532196044922, 0.013625860214233398, 0.014324188232421875, 0.015022516250610352, 0.015720844268798828, 0.016419172286987305, 0.01711750030517578, 0.017815828323364258, 0.018514156341552734, 0.01921248435974121, 0.019910812377929688, 0.020609140396118164, 0.02130746841430664, 0.022005796432495117, 0.022704124450683594, 0.02340245246887207, 0.024100780487060547, 0.024799108505249023, 0.0254974365234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 12.0, 24.0, 29.0, 121.0, 3778.0, 65.0, 24.0, 15.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00901031494140625, -0.00878685712814331, -0.008563399314880371, -0.008339941501617432, -0.008116483688354492, -0.007893025875091553, -0.007669568061828613, -0.007446110248565674, -0.007222652435302734, -0.006999194622039795, -0.0067757368087768555, -0.006552278995513916, -0.0063288211822509766, -0.006105363368988037, -0.005881905555725098, -0.005658447742462158, -0.005434989929199219, -0.005211532115936279, -0.00498807430267334, -0.0047646164894104, -0.004541158676147461, -0.0043177008628845215, -0.004094243049621582, -0.0038707852363586426, -0.003647327423095703, -0.0034238696098327637, -0.0032004117965698242, -0.0029769539833068848, -0.0027534961700439453, -0.002530038356781006, -0.0023065805435180664, -0.002083122730255127, -0.0018596649169921875, -0.001636207103729248, -0.0014127492904663086, -0.0011892914772033691, -0.0009658336639404297, -0.0007423758506774902, -0.0005189180374145508, -0.00029546022415161133, -7.200241088867188e-05, 0.00015145540237426758, 0.00037491321563720703, 0.0005983710289001465, 0.0008218288421630859, 0.0010452866554260254, 0.0012687444686889648, 0.0014922022819519043, 0.0017156600952148438, 0.0019391179084777832, 0.0021625757217407227, 0.002386033535003662, 0.0026094913482666016, 0.002832949161529541, 0.0030564069747924805, 0.00327986478805542, 0.0035033226013183594, 0.003726780414581299, 0.003950238227844238, 0.004173696041107178, 0.004397153854370117, 0.004620611667633057, 0.004844069480895996, 0.0050675272941589355, 0.005290985107421875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1006.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14005768299102783, -0.13662545382976532, -0.1331932246685028, -0.1297610104084015, -0.12632878124713898, -0.12289655208587646, -0.11946432292461395, -0.11603209376335144, -0.11259986460208893, -0.10916763544082642, -0.1057354137301445, -0.10230318456888199, -0.09887095540761948, -0.09543873369693756, -0.09200650453567505, -0.08857427537441254, -0.08514205366373062, -0.08170982450246811, -0.0782776027917862, -0.07484537363052368, -0.07141314446926117, -0.06798091530799866, -0.06454869359731674, -0.06111646443605423, -0.057684239000082016, -0.0542520135641098, -0.05081978440284729, -0.047387558966875076, -0.04395533353090286, -0.04052310436964035, -0.03709087893366814, -0.03365865349769592, -0.03022642433643341, -0.026794197037816048, -0.023361969739198685, -0.01992974430322647, -0.016497517004609108, -0.013065289705991745, -0.009633064270019531, -0.006200836971402168, -0.0027686096727848053, 0.0006636171601712704, 0.004095843993127346, 0.007528070360422134, 0.010960297659039497, 0.01439252495765686, 0.017824750393629074, 0.021256977692246437, 0.0246892049908638, 0.028121432289481163, 0.031553659588098526, 0.03498588502407074, 0.03841811418533325, 0.041850339621305466, 0.04528256505727768, 0.04871479421854019, 0.052147019654512405, 0.05557924509048462, 0.05901147425174713, 0.062443699687719345, 0.06587592512369156, 0.06930815428495407, 0.07274037599563599, 0.0761726051568985, 0.07960483431816101]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 11.0, 10.0, 14.0, 24.0, 36.0, 44.0, 51.0, 67.0, 74.0, 93.0, 82.0, 88.0, 78.0, 72.0, 61.0, 52.0, 38.0, 33.0, 23.0, 16.0, 9.0, 9.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011494576930999756, -0.011146392673254013, -0.01079820841550827, -0.010450024157762527, -0.010101839900016785, -0.009753655642271042, -0.009405471384525299, -0.009057287126779556, -0.008709102869033813, -0.00836091861128807, -0.008012734353542328, -0.007664550095796585, -0.007316365838050842, -0.0069681815803050995, -0.006619997322559357, -0.006271813064813614, -0.005923628807067871, -0.005575444549322128, -0.0052272602915763855, -0.004879076033830643, -0.0045308917760849, -0.004182707518339157, -0.0038345232605934143, -0.0034863390028476715, -0.0031381547451019287, -0.002789970487356186, -0.002441786229610443, -0.0020936019718647003, -0.0017454177141189575, -0.0013972334563732147, -0.001049049198627472, -0.0007008649408817291, -0.00035268068313598633, -4.49642539024353e-06, 0.00034368783235549927, 0.0006918720901012421, 0.0010400563478469849, 0.0013882406055927277, 0.0017364248633384705, 0.0020846091210842133, 0.002432793378829956, 0.002780977636575699, 0.0031291618943214417, 0.0034773461520671844, 0.0038255304098129272, 0.00417371466755867, 0.004521898925304413, 0.004870083183050156, 0.0052182674407958984, 0.005566451698541641, 0.005914635956287384, 0.006262820214033127, 0.00661100447177887, 0.006959188729524612, 0.007307372987270355, 0.007655557245016098, 0.00800374150276184, 0.008351925760507584, 0.008700110018253326, 0.00904829427599907, 0.009396478533744812, 0.009744662791490555, 0.010092847049236298, 0.01044103130698204, 0.010789215564727783]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 0.0, 2.0, 7.0, 4.0, 10.0, 9.0, 16.0, 27.0, 39.0, 60.0, 75.0, 146.0, 243.0, 439.0, 892.0, 1939.0, 5538.0, 22755.0, 939082.0, 62352.0, 9144.0, 3101.0, 1329.0, 564.0, 331.0, 203.0, 91.0, 46.0, 35.0, 21.0, 15.0, 11.0, 9.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0269622802734375, -0.02605462074279785, -0.025146961212158203, -0.024239301681518555, -0.023331642150878906, -0.022423982620239258, -0.02151632308959961, -0.02060866355895996, -0.019701004028320312, -0.018793344497680664, -0.017885684967041016, -0.016978025436401367, -0.01607036590576172, -0.01516270637512207, -0.014255046844482422, -0.013347387313842773, -0.012439727783203125, -0.011532068252563477, -0.010624408721923828, -0.00971674919128418, -0.008809089660644531, -0.007901430130004883, -0.006993770599365234, -0.006086111068725586, -0.0051784515380859375, -0.004270792007446289, -0.0033631324768066406, -0.002455472946166992, -0.0015478134155273438, -0.0006401538848876953, 0.0002675056457519531, 0.0011751651763916016, 0.00208282470703125, 0.0029904842376708984, 0.003898143768310547, 0.004805803298950195, 0.005713462829589844, 0.006621122360229492, 0.007528781890869141, 0.008436441421508789, 0.009344100952148438, 0.010251760482788086, 0.011159420013427734, 0.012067079544067383, 0.012974739074707031, 0.01388239860534668, 0.014790058135986328, 0.015697717666625977, 0.016605377197265625, 0.017513036727905273, 0.018420696258544922, 0.01932835578918457, 0.02023601531982422, 0.021143674850463867, 0.022051334381103516, 0.022958993911743164, 0.023866653442382812, 0.02477431297302246, 0.02568197250366211, 0.026589632034301758, 0.027497291564941406, 0.028404951095581055, 0.029312610626220703, 0.03022027015686035, 0.0311279296875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 2.0, 5.0, 7.0, 8.0, 9.0, 11.0, 19.0, 27.0, 62.0, 179.0, 298.0, 177.0, 79.0, 18.0, 13.0, 15.0, 9.0, 10.0, 6.0, 5.0, 5.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01555633544921875, -0.015103340148925781, -0.014650344848632812, -0.014197349548339844, -0.013744354248046875, -0.013291358947753906, -0.012838363647460938, -0.012385368347167969, -0.011932373046875, -0.011479377746582031, -0.011026382446289062, -0.010573387145996094, -0.010120391845703125, -0.009667396545410156, -0.009214401245117188, -0.008761405944824219, -0.00830841064453125, -0.007855415344238281, -0.0074024200439453125, -0.006949424743652344, -0.006496429443359375, -0.006043434143066406, -0.0055904388427734375, -0.005137443542480469, -0.0046844482421875, -0.004231452941894531, -0.0037784576416015625, -0.0033254623413085938, -0.002872467041015625, -0.0024194717407226562, -0.0019664764404296875, -0.0015134811401367188, -0.00106048583984375, -0.0006074905395507812, -0.0001544952392578125, 0.00029850006103515625, 0.000751495361328125, 0.0012044906616210938, 0.0016574859619140625, 0.0021104812622070312, 0.0025634765625, 0.0030164718627929688, 0.0034694671630859375, 0.003922462463378906, 0.004375457763671875, 0.004828453063964844, 0.0052814483642578125, 0.005734443664550781, 0.00618743896484375, 0.006640434265136719, 0.0070934295654296875, 0.007546424865722656, 0.007999420166015625, 0.008452415466308594, 0.008905410766601562, 0.009358406066894531, 0.0098114013671875, 0.010264396667480469, 0.010717391967773438, 0.011170387268066406, 0.011623382568359375, 0.012076377868652344, 0.012529373168945312, 0.012982368469238281, 0.01343536376953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 15.0, 7.0, 5.0, 12.0, 19.0, 31.0, 24.0, 34.0, 59.0, 59.0, 102.0, 155.0, 230.0, 545.0, 1549.0, 17758.0, 1020960.0, 4814.0, 1086.0, 381.0, 211.0, 133.0, 95.0, 77.0, 42.0, 27.0, 37.0, 15.0, 17.0, 15.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0487060546875, -0.04698753356933594, -0.045269012451171875, -0.04355049133300781, -0.04183197021484375, -0.04011344909667969, -0.038394927978515625, -0.03667640686035156, -0.0349578857421875, -0.03323936462402344, -0.031520843505859375, -0.029802322387695312, -0.02808380126953125, -0.026365280151367188, -0.024646759033203125, -0.022928237915039062, -0.021209716796875, -0.019491195678710938, -0.017772674560546875, -0.016054153442382812, -0.01433563232421875, -0.012617111206054688, -0.010898590087890625, -0.009180068969726562, -0.0074615478515625, -0.0057430267333984375, -0.004024505615234375, -0.0023059844970703125, -0.00058746337890625, 0.0011310577392578125, 0.002849578857421875, 0.0045680999755859375, 0.00628662109375, 0.008005142211914062, 0.009723663330078125, 0.011442184448242188, 0.01316070556640625, 0.014879226684570312, 0.016597747802734375, 0.018316268920898438, 0.0200347900390625, 0.021753311157226562, 0.023471832275390625, 0.025190353393554688, 0.02690887451171875, 0.028627395629882812, 0.030345916748046875, 0.03206443786621094, 0.033782958984375, 0.03550148010253906, 0.037220001220703125, 0.03893852233886719, 0.04065704345703125, 0.04237556457519531, 0.044094085693359375, 0.04581260681152344, 0.0475311279296875, 0.04924964904785156, 0.050968170166015625, 0.05268669128417969, 0.05440521240234375, 0.05612373352050781, 0.057842254638671875, 0.05956077575683594, 0.061279296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 15.0, 7.0, 4.0, 12.0, 14.0, 29.0, 20.0, 24.0, 31.0, 35.0, 42.0, 44.0, 43.0, 39.0, 51.0, 50.0, 44.0, 61.0, 48.0, 52.0, 50.0, 44.0, 40.0, 41.0, 28.0, 20.0, 31.0, 15.0, 17.0, 14.0, 10.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034637451171875, -0.03341484069824219, -0.032192230224609375, -0.030969619750976562, -0.02974700927734375, -0.028524398803710938, -0.027301788330078125, -0.026079177856445312, -0.0248565673828125, -0.023633956909179688, -0.022411346435546875, -0.021188735961914062, -0.01996612548828125, -0.018743515014648438, -0.017520904541015625, -0.016298294067382812, -0.01507568359375, -0.013853073120117188, -0.012630462646484375, -0.011407852172851562, -0.01018524169921875, -0.008962631225585938, -0.007740020751953125, -0.0065174102783203125, -0.0052947998046875, -0.0040721893310546875, -0.002849578857421875, -0.0016269683837890625, -0.00040435791015625, 0.0008182525634765625, 0.002040863037109375, 0.0032634735107421875, 0.004486083984375, 0.0057086944580078125, 0.006931304931640625, 0.008153915405273438, 0.00937652587890625, 0.010599136352539062, 0.011821746826171875, 0.013044357299804688, 0.0142669677734375, 0.015489578247070312, 0.016712188720703125, 0.017934799194335938, 0.01915740966796875, 0.020380020141601562, 0.021602630615234375, 0.022825241088867188, 0.0240478515625, 0.025270462036132812, 0.026493072509765625, 0.027715682983398438, 0.02893829345703125, 0.030160903930664062, 0.031383514404296875, 0.03260612487792969, 0.0338287353515625, 0.03505134582519531, 0.036273956298828125, 0.03749656677246094, 0.03871917724609375, 0.03994178771972656, 0.041164398193359375, 0.04238700866699219, 0.043609619140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 7.0, 12.0, 12.0, 18.0, 25.0, 57.0, 86.0, 166.0, 328.0, 830.0, 3655.0, 39080.0, 985984.0, 14649.0, 2356.0, 671.0, 263.0, 148.0, 83.0, 43.0, 20.0, 28.0, 9.0, 8.0, 0.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.615285873413086e-05, -1.5540048480033875e-05, -1.492723822593689e-05, -1.4314427971839905e-05, -1.370161771774292e-05, -1.3088807463645935e-05, -1.247599720954895e-05, -1.1863186955451965e-05, -1.125037670135498e-05, -1.0637566447257996e-05, -1.002475619316101e-05, -9.411945939064026e-06, -8.799135684967041e-06, -8.186325430870056e-06, -7.573515176773071e-06, -6.9607049226760864e-06, -6.3478946685791016e-06, -5.735084414482117e-06, -5.122274160385132e-06, -4.509463906288147e-06, -3.896653652191162e-06, -3.2838433980941772e-06, -2.6710331439971924e-06, -2.0582228899002075e-06, -1.4454126358032227e-06, -8.326023817062378e-07, -2.1979212760925293e-07, 3.9301812648773193e-07, 1.0058283805847168e-06, 1.6186386346817017e-06, 2.2314488887786865e-06, 2.8442591428756714e-06, 3.4570693969726562e-06, 4.069879651069641e-06, 4.682689905166626e-06, 5.295500159263611e-06, 5.908310413360596e-06, 6.5211206674575806e-06, 7.1339309215545654e-06, 7.74674117565155e-06, 8.359551429748535e-06, 8.97236168384552e-06, 9.585171937942505e-06, 1.019798219203949e-05, 1.0810792446136475e-05, 1.142360270023346e-05, 1.2036412954330444e-05, 1.264922320842743e-05, 1.3262033462524414e-05, 1.3874843716621399e-05, 1.4487653970718384e-05, 1.5100464224815369e-05, 1.5713274478912354e-05, 1.632608473300934e-05, 1.6938894987106323e-05, 1.7551705241203308e-05, 1.8164515495300293e-05, 1.8777325749397278e-05, 1.9390136003494263e-05, 2.0002946257591248e-05, 2.0615756511688232e-05, 2.1228566765785217e-05, 2.1841377019882202e-05, 2.2454187273979187e-05, 2.3066997528076172e-05]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 9.0, 6.0, 17.0, 9.0, 14.0, 16.0, 32.0, 12.0, 30.0, 25.0, 56.0, 60.0, 84.0, 91.0, 158.0, 71.0, 78.0, 45.0, 34.0, 34.0, 32.0, 21.0, 14.0, 18.0, 8.0, 12.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.841255187988281e-06, -5.6335702538490295e-06, -5.425885319709778e-06, -5.218200385570526e-06, -5.010515451431274e-06, -4.802830517292023e-06, -4.595145583152771e-06, -4.387460649013519e-06, -4.179775714874268e-06, -3.972090780735016e-06, -3.764405846595764e-06, -3.5567209124565125e-06, -3.3490359783172607e-06, -3.141351044178009e-06, -2.9336661100387573e-06, -2.7259811758995056e-06, -2.518296241760254e-06, -2.310611307621002e-06, -2.1029263734817505e-06, -1.8952414393424988e-06, -1.687556505203247e-06, -1.4798715710639954e-06, -1.2721866369247437e-06, -1.064501702785492e-06, -8.568167686462402e-07, -6.491318345069885e-07, -4.414469003677368e-07, -2.337619662284851e-07, -2.60770320892334e-08, 1.816079020500183e-07, 3.8929283618927e-07, 5.969777703285217e-07, 8.046627044677734e-07, 1.0123476386070251e-06, 1.2200325727462769e-06, 1.4277175068855286e-06, 1.6354024410247803e-06, 1.843087375164032e-06, 2.0507723093032837e-06, 2.2584572434425354e-06, 2.466142177581787e-06, 2.673827111721039e-06, 2.8815120458602905e-06, 3.0891969799995422e-06, 3.296881914138794e-06, 3.5045668482780457e-06, 3.7122517824172974e-06, 3.919936716556549e-06, 4.127621650695801e-06, 4.3353065848350525e-06, 4.542991518974304e-06, 4.750676453113556e-06, 4.958361387252808e-06, 5.166046321392059e-06, 5.373731255531311e-06, 5.581416189670563e-06, 5.7891011238098145e-06, 5.996786057949066e-06, 6.204470992088318e-06, 6.41215592622757e-06, 6.619840860366821e-06, 6.827525794506073e-06, 7.035210728645325e-06, 7.242895662784576e-06, 7.450580596923828e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 8.0, 5.0, 15.0, 23.0, 23.0, 78.0, 118.0, 535.0, 1003753.0, 43306.0, 435.0, 128.0, 51.0, 24.0, 17.0, 5.0, 8.0, 6.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9723854064941406e-05, -5.806237459182739e-05, -5.640089511871338e-05, -5.4739415645599365e-05, -5.307793617248535e-05, -5.141645669937134e-05, -4.9754977226257324e-05, -4.809349775314331e-05, -4.64320182800293e-05, -4.477053880691528e-05, -4.310905933380127e-05, -4.1447579860687256e-05, -3.978610038757324e-05, -3.812462091445923e-05, -3.6463141441345215e-05, -3.48016619682312e-05, -3.314018249511719e-05, -3.1478703022003174e-05, -2.981722354888916e-05, -2.8155744075775146e-05, -2.6494264602661133e-05, -2.483278512954712e-05, -2.3171305656433105e-05, -2.1509826183319092e-05, -1.9848346710205078e-05, -1.8186867237091064e-05, -1.652538776397705e-05, -1.4863908290863037e-05, -1.3202428817749023e-05, -1.154094934463501e-05, -9.879469871520996e-06, -8.217990398406982e-06, -6.556510925292969e-06, -4.895031452178955e-06, -3.2335519790649414e-06, -1.5720725059509277e-06, 8.940696716308594e-08, 1.7508864402770996e-06, 3.4123659133911133e-06, 5.073845386505127e-06, 6.735324859619141e-06, 8.396804332733154e-06, 1.0058283805847168e-05, 1.1719763278961182e-05, 1.3381242752075195e-05, 1.5042722225189209e-05, 1.6704201698303223e-05, 1.8365681171417236e-05, 2.002716064453125e-05, 2.1688640117645264e-05, 2.3350119590759277e-05, 2.501159906387329e-05, 2.6673078536987305e-05, 2.833455801010132e-05, 2.9996037483215332e-05, 3.1657516956329346e-05, 3.331899642944336e-05, 3.498047590255737e-05, 3.664195537567139e-05, 3.83034348487854e-05, 3.9964914321899414e-05, 4.162639379501343e-05, 4.328787326812744e-05, 4.4949352741241455e-05, 4.661083221435547e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 10.0, 12.0, 7.0, 24.0, 29.0, 89.0, 461.0, 209.0, 69.0, 43.0, 16.0, 3.0, 8.0, 1.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2438507080078125e-05, -4.12575900554657e-05, -4.007667303085327e-05, -3.8895756006240845e-05, -3.771483898162842e-05, -3.653392195701599e-05, -3.5353004932403564e-05, -3.417208790779114e-05, -3.299117088317871e-05, -3.1810253858566284e-05, -3.062933683395386e-05, -2.944841980934143e-05, -2.8267502784729004e-05, -2.7086585760116577e-05, -2.590566873550415e-05, -2.4724751710891724e-05, -2.3543834686279297e-05, -2.236291766166687e-05, -2.1182000637054443e-05, -2.0001083612442017e-05, -1.882016658782959e-05, -1.7639249563217163e-05, -1.6458332538604736e-05, -1.527741551399231e-05, -1.4096498489379883e-05, -1.2915581464767456e-05, -1.173466444015503e-05, -1.0553747415542603e-05, -9.372830390930176e-06, -8.191913366317749e-06, -7.010996341705322e-06, -5.8300793170928955e-06, -4.649162292480469e-06, -3.468245267868042e-06, -2.2873282432556152e-06, -1.1064112186431885e-06, 7.450580596923828e-08, 1.255422830581665e-06, 2.436339855194092e-06, 3.6172568798065186e-06, 4.798173904418945e-06, 5.979090929031372e-06, 7.160007953643799e-06, 8.340924978256226e-06, 9.521842002868652e-06, 1.0702759027481079e-05, 1.1883676052093506e-05, 1.3064593076705933e-05, 1.424551010131836e-05, 1.5426427125930786e-05, 1.6607344150543213e-05, 1.778826117515564e-05, 1.8969178199768066e-05, 2.0150095224380493e-05, 2.133101224899292e-05, 2.2511929273605347e-05, 2.3692846298217773e-05, 2.48737633228302e-05, 2.6054680347442627e-05, 2.7235597372055054e-05, 2.841651439666748e-05, 2.9597431421279907e-05, 3.0778348445892334e-05, 3.195926547050476e-05, 3.314018249511719e-05]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 10.0, 72.0, 759.0, 142.0, 22.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18875259160995483, -0.1807757467031479, -0.17279891669750214, -0.1648220717906952, -0.15684524178504944, -0.1488683968782425, -0.14089155197143555, -0.1329147219657898, -0.12493788450956345, -0.1169610470533371, -0.10898420959711075, -0.1010073721408844, -0.09303052723407745, -0.0850536972284317, -0.07707685232162476, -0.06910001486539841, -0.06112317740917206, -0.05314633995294571, -0.04516950249671936, -0.03719266131520271, -0.029215823858976364, -0.021238986402750015, -0.013262145221233368, -0.005285307765007019, 0.00269152969121933, 0.010668368078768253, 0.018645206466317177, 0.026622045785188675, 0.034598883241415024, 0.04257572069764137, 0.05055256187915802, 0.05852939933538437, 0.06650623679161072, 0.07448307424783707, 0.08245991170406342, 0.09043675661087036, 0.09841358661651611, 0.10639043152332306, 0.11436726897954941, 0.12234410643577576, 0.1303209364414215, 0.13829778134822845, 0.1462746113538742, 0.15425145626068115, 0.1622282862663269, 0.17020513117313385, 0.1781819760799408, 0.18615880608558655, 0.1941356509923935, 0.20211249589920044, 0.2100893259048462, 0.21806617081165314, 0.2260430008172989, 0.23401984572410583, 0.2419966757297516, 0.24997352063655853, 0.2579503655433655, 0.26592719554901123, 0.27390405535697937, 0.2818808853626251, 0.2898577153682709, 0.2978345453739166, 0.30581140518188477, 0.3137882351875305, 0.32176506519317627]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 10.0, 2.0, 14.0, 13.0, 11.0, 16.0, 21.0, 19.0, 25.0, 15.0, 28.0, 26.0, 27.0, 46.0, 56.0, 48.0, 58.0, 52.0, 41.0, 44.0, 47.0, 46.0, 35.0, 37.0, 22.0, 35.0, 36.0, 26.0, 16.0, 25.0, 16.0, 11.0, 9.0, 12.0, 12.0, 12.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357970237731934, -0.15804588794708252, -0.1525120735168457, -0.1469782590866089, -0.14144444465637207, -0.13591064512729645, -0.13037683069705963, -0.12484301626682281, -0.119309201836586, -0.11377538740634918, -0.10824157297611237, -0.10270776599645615, -0.09717395156621933, -0.09164013713598251, -0.0861063301563263, -0.08057251572608948, -0.07503870129585266, -0.06950488686561584, -0.06397107243537903, -0.05843726545572281, -0.05290345102548599, -0.047369636595249176, -0.04183582589030266, -0.03630201518535614, -0.030768200755119324, -0.025234388187527657, -0.01970057561993599, -0.014166763052344322, -0.008632950484752655, -0.003099137917160988, 0.0024346746504306793, 0.007968485355377197, 0.013502299785614014, 0.01903611235320568, 0.024569924920797348, 0.030103737488389015, 0.03563755005598068, 0.0411713644862175, 0.04670517519116402, 0.052238985896110535, 0.05777280032634735, 0.06330661475658417, 0.06884042918682098, 0.0743742361664772, 0.07990805059671402, 0.08544186502695084, 0.09097567200660706, 0.09650948643684387, 0.10204330086708069, 0.1075771152973175, 0.11311092972755432, 0.11864473670721054, 0.12417855113744736, 0.12971235811710358, 0.1352461725473404, 0.1407799869775772, 0.14631380140781403, 0.15184761583805084, 0.15738143026828766, 0.16291524469852448, 0.1684490442276001, 0.17398285865783691, 0.17951667308807373, 0.18505048751831055, 0.19058430194854736]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 2.0, 8.0, 4.0, 6.0, 7.0, 12.0, 14.0, 15.0, 26.0, 97.0, 197.0, 4193578.0, 141.0, 62.0, 22.0, 16.0, 10.0, 10.0, 8.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0020580291748046875, -0.001988232135772705, -0.0019184350967407227, -0.0018486380577087402, -0.0017788410186767578, -0.0017090439796447754, -0.001639246940612793, -0.0015694499015808105, -0.0014996528625488281, -0.0014298558235168457, -0.0013600587844848633, -0.0012902617454528809, -0.0012204647064208984, -0.001150667667388916, -0.0010808706283569336, -0.0010110735893249512, -0.0009412765502929688, -0.0008714795112609863, -0.0008016824722290039, -0.0007318854331970215, -0.0006620883941650391, -0.0005922913551330566, -0.0005224943161010742, -0.0004526972770690918, -0.0003829002380371094, -0.00031310319900512695, -0.00024330615997314453, -0.0001735091209411621, -0.00010371208190917969, -3.3915042877197266e-05, 3.5881996154785156e-05, 0.00010567903518676758, 0.00017547607421875, 0.0002452731132507324, 0.00031507015228271484, 0.00038486719131469727, 0.0004546642303466797, 0.0005244612693786621, 0.0005942583084106445, 0.000664055347442627, 0.0007338523864746094, 0.0008036494255065918, 0.0008734464645385742, 0.0009432435035705566, 0.001013040542602539, 0.0010828375816345215, 0.001152634620666504, 0.0012224316596984863, 0.0012922286987304688, 0.0013620257377624512, 0.0014318227767944336, 0.001501619815826416, 0.0015714168548583984, 0.0016412138938903809, 0.0017110109329223633, 0.0017808079719543457, 0.0018506050109863281, 0.0019204020500183105, 0.001990199089050293, 0.0020599961280822754, 0.002129793167114258, 0.0021995902061462402, 0.0022693872451782227, 0.002339184284210205, 0.0024089813232421875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 6.0, 8.0, 7.0, 9.0, 11.0, 18.0, 24.0, 76.0, 176.0, 292.0, 174.0, 79.0, 20.0, 15.0, 13.0, 9.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015411376953125, -0.014962434768676758, -0.014513492584228516, -0.014064550399780273, -0.013615608215332031, -0.013166666030883789, -0.012717723846435547, -0.012268781661987305, -0.011819839477539062, -0.01137089729309082, -0.010921955108642578, -0.010473012924194336, -0.010024070739746094, -0.009575128555297852, -0.00912618637084961, -0.008677244186401367, -0.008228302001953125, -0.007779359817504883, -0.007330417633056641, -0.0068814754486083984, -0.006432533264160156, -0.005983591079711914, -0.005534648895263672, -0.00508570671081543, -0.0046367645263671875, -0.004187822341918945, -0.003738880157470703, -0.003289937973022461, -0.0028409957885742188, -0.0023920536041259766, -0.0019431114196777344, -0.0014941692352294922, -0.00104522705078125, -0.0005962848663330078, -0.00014734268188476562, 0.00030159950256347656, 0.0007505416870117188, 0.001199483871459961, 0.0016484260559082031, 0.0020973682403564453, 0.0025463104248046875, 0.0029952526092529297, 0.003444194793701172, 0.003893136978149414, 0.004342079162597656, 0.0047910213470458984, 0.005239963531494141, 0.005688905715942383, 0.006137847900390625, 0.006586790084838867, 0.007035732269287109, 0.0074846744537353516, 0.007933616638183594, 0.008382558822631836, 0.008831501007080078, 0.00928044319152832, 0.009729385375976562, 0.010178327560424805, 0.010627269744873047, 0.011076211929321289, 0.011525154113769531, 0.011974096298217773, 0.012423038482666016, 0.012871980667114258, 0.0133209228515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 20.0, 26.0, 46.0, 66.0, 114.0, 93.0, 93.0, 4193380.0, 111.0, 101.0, 108.0, 62.0, 35.0, 18.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007624626159667969, -0.0007400959730148315, -0.0007177293300628662, -0.0006953626871109009, -0.0006729960441589355, -0.0006506294012069702, -0.0006282627582550049, -0.0006058961153030396, -0.0005835294723510742, -0.0005611628293991089, -0.0005387961864471436, -0.0005164295434951782, -0.0004940629005432129, -0.00047169625759124756, -0.0004493296146392822, -0.0004269629716873169, -0.00040459632873535156, -0.00038222968578338623, -0.0003598630428314209, -0.00033749639987945557, -0.00031512975692749023, -0.0002927631139755249, -0.00027039647102355957, -0.00024802982807159424, -0.0002256631851196289, -0.00020329654216766357, -0.00018092989921569824, -0.0001585632562637329, -0.00013619661331176758, -0.00011382997035980225, -9.146332740783691e-05, -6.909668445587158e-05, -4.673004150390625e-05, -2.4363398551940918e-05, -1.996755599975586e-06, 2.0369887351989746e-05, 4.273653030395508e-05, 6.510317325592041e-05, 8.746981620788574e-05, 0.00010983645915985107, 0.0001322031021118164, 0.00015456974506378174, 0.00017693638801574707, 0.0001993030309677124, 0.00022166967391967773, 0.00024403631687164307, 0.0002664029598236084, 0.00028876960277557373, 0.00031113624572753906, 0.0003335028886795044, 0.0003558695316314697, 0.00037823617458343506, 0.0004006028175354004, 0.0004229694604873657, 0.00044533610343933105, 0.0004677027463912964, 0.0004900693893432617, 0.000512436032295227, 0.0005348026752471924, 0.0005571693181991577, 0.000579535961151123, 0.0006019026041030884, 0.0006242692470550537, 0.000646635890007019, 0.0006690025329589844]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4095.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, 2.7958303689956665e-06, 5.949288606643677e-06, 9.102746844291687e-06, 1.2256205081939697e-05, 1.5409663319587708e-05, 1.8563121557235718e-05, 2.1716579794883728e-05, 2.4870038032531738e-05, 2.802349627017975e-05, 3.117695450782776e-05, 3.433041274547577e-05, 3.748387098312378e-05, 4.063732922077179e-05, 4.37907874584198e-05, 4.694424569606781e-05, 5.009770393371582e-05, 5.325116217136383e-05, 5.640462040901184e-05, 5.955807864665985e-05, 6.271153688430786e-05, 6.586499512195587e-05, 6.901845335960388e-05, 7.217191159725189e-05, 7.53253698348999e-05, 7.847882807254791e-05, 8.163228631019592e-05, 8.478574454784393e-05, 8.793920278549194e-05, 9.109266102313995e-05, 9.424611926078796e-05, 9.739957749843597e-05, 0.00010055303573608398, 0.000103706493973732, 0.00010685995221138, 0.00011001341044902802, 0.00011316686868667603, 0.00011632032692432404, 0.00011947378516197205, 0.00012262724339962006, 0.00012578070163726807, 0.00012893415987491608, 0.0001320876181125641, 0.0001352410763502121, 0.0001383945345878601, 0.00014154799282550812, 0.00014470145106315613, 0.00014785490930080414, 0.00015100836753845215, 0.00015416182577610016, 0.00015731528401374817, 0.00016046874225139618, 0.0001636222004890442, 0.0001667756587266922, 0.0001699291169643402, 0.00017308257520198822, 0.00017623603343963623, 0.00017938949167728424, 0.00018254294991493225, 0.00018569640815258026, 0.00018884986639022827, 0.00019200332462787628, 0.0001951567828655243, 0.0001983102411031723, 0.0002014636993408203]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1002.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012502116151154041, -0.0011965295998379588, -0.0011428474681451917, -0.0010891654528677464, -0.0010354833211749792, -0.000981801305897534, -0.0009281192324124277, -0.0008744371589273214, -0.0008207551436498761, -0.0007670730701647699, -0.0007133909966796637, -0.0006597089814022183, -0.0006060269079171121, -0.0005523448344320059, -0.0004986627609468997, -0.0004449807165656239, -0.0003912986139766872, -0.00033761654049158096, -0.0002839344961103052, -0.00023025242262519896, -0.00017657036369200796, -0.00012288830475881696, -6.920623127371073e-05, -1.5524186892434955e-05, 3.8157886592671275e-05, 9.183994552586228e-05, 0.00014552200445905328, 0.0001992040779441595, 0.00025288615142926574, 0.0003065681958105415, 0.00036025026929564774, 0.0004139323136769235, 0.00046761438716202974, 0.000521296460647136, 0.0005749785341322422, 0.0006286605494096875, 0.0006823426228947937, 0.0007360246963799, 0.0007897067698650062, 0.0008433888433501124, 0.0008970708586275578, 0.000950752932112664, 0.0010044350055977702, 0.0010581170208752155, 0.0011117991525679827, 0.001165481167845428, 0.0012191631831228733, 0.0012728453148156404, 0.0013265274465084076, 0.001380209461785853, 0.00143389159347862, 0.0014875736087560654, 0.0015412557404488325, 0.0015949377557262778, 0.0016486197710037231, 0.0017023019026964903, 0.0017559839179739356, 0.001809665933251381, 0.001863348064944148, 0.0019170300802215934, 0.0019707120954990387, 0.002024394227191806, 0.002078076358884573, 0.0021317582577466965, 0.0021854403894394636]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 11.0, 17.0, 31.0, 82.0, 156.0, 192.0, 174.0, 133.0, 103.0, 43.0, 26.0, 13.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017642974853515625, -0.00016728229820728302, -0.0001581348478794098, -0.00014898739755153656, -0.00013983994722366333, -0.0001306924968957901, -0.00012154504656791687, -0.00011239759624004364, -0.00010325014591217041, -9.410269558429718e-05, -8.495524525642395e-05, -7.580779492855072e-05, -6.666034460067749e-05, -5.751289427280426e-05, -4.836544394493103e-05, -3.92179936170578e-05, -3.007054328918457e-05, -2.092309296131134e-05, -1.177564263343811e-05, -2.6281923055648804e-06, 6.51925802230835e-06, 1.566670835018158e-05, 2.481415867805481e-05, 3.396160900592804e-05, 4.310905933380127e-05, 5.22565096616745e-05, 6.140395998954773e-05, 7.055141031742096e-05, 7.969886064529419e-05, 8.884631097316742e-05, 9.799376130104065e-05, 0.00010714121162891388, 0.00011628866195678711, 0.00012543611228466034, 0.00013458356261253357, 0.0001437310129404068, 0.00015287846326828003, 0.00016202591359615326, 0.0001711733639240265, 0.00018032081425189972, 0.00018946826457977295, 0.00019861571490764618, 0.0002077631652355194, 0.00021691061556339264, 0.00022605806589126587, 0.0002352055162191391, 0.00024435296654701233, 0.00025350041687488556, 0.0002626478672027588, 0.000271795317530632, 0.00028094276785850525, 0.0002900902181863785, 0.0002992376685142517, 0.00030838511884212494, 0.00031753256916999817, 0.0003266800194978714, 0.00033582746982574463, 0.00034497492015361786, 0.0003541223704814911, 0.0003632698208093643, 0.00037241727113723755, 0.0003815647214651108, 0.000390712171792984, 0.00039985962212085724, 0.00040900707244873047]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 3.0, 7.0, 2.0, 10.0, 9.0, 17.0, 30.0, 27.0, 50.0, 57.0, 94.0, 133.0, 193.0, 289.0, 529.0, 881.0, 1822.0, 4622.0, 19322.0, 940231.0, 65824.0, 8488.0, 2826.0, 1315.0, 645.0, 384.0, 237.0, 148.0, 104.0, 72.0, 38.0, 31.0, 25.0, 22.0, 15.0, 14.0, 3.0, 7.0, 6.0, 6.0, 4.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.037109375, -0.03597593307495117, -0.034842491149902344, -0.033709049224853516, -0.03257560729980469, -0.03144216537475586, -0.03030872344970703, -0.029175281524658203, -0.028041839599609375, -0.026908397674560547, -0.02577495574951172, -0.02464151382446289, -0.023508071899414062, -0.022374629974365234, -0.021241188049316406, -0.020107746124267578, -0.01897430419921875, -0.017840862274169922, -0.016707420349121094, -0.015573978424072266, -0.014440536499023438, -0.01330709457397461, -0.012173652648925781, -0.011040210723876953, -0.009906768798828125, -0.008773326873779297, -0.007639884948730469, -0.006506443023681641, -0.0053730010986328125, -0.004239559173583984, -0.0031061172485351562, -0.001972675323486328, -0.0008392333984375, 0.0002942085266113281, 0.0014276504516601562, 0.0025610923767089844, 0.0036945343017578125, 0.004827976226806641, 0.005961418151855469, 0.007094860076904297, 0.008228302001953125, 0.009361743927001953, 0.010495185852050781, 0.01162862777709961, 0.012762069702148438, 0.013895511627197266, 0.015028953552246094, 0.016162395477294922, 0.01729583740234375, 0.018429279327392578, 0.019562721252441406, 0.020696163177490234, 0.021829605102539062, 0.02296304702758789, 0.02409648895263672, 0.025229930877685547, 0.026363372802734375, 0.027496814727783203, 0.02863025665283203, 0.02976369857788086, 0.030897140502929688, 0.032030582427978516, 0.033164024353027344, 0.03429746627807617, 0.035430908203125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 6.0, 8.0, 7.0, 9.0, 11.0, 18.0, 24.0, 76.0, 176.0, 292.0, 174.0, 79.0, 20.0, 15.0, 13.0, 9.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015411376953125, -0.014962434768676758, -0.014513492584228516, -0.014064550399780273, -0.013615608215332031, -0.013166666030883789, -0.012717723846435547, -0.012268781661987305, -0.011819839477539062, -0.01137089729309082, -0.010921955108642578, -0.010473012924194336, -0.010024070739746094, -0.009575128555297852, -0.00912618637084961, -0.008677244186401367, -0.008228302001953125, -0.007779359817504883, -0.007330417633056641, -0.0068814754486083984, -0.006432533264160156, -0.005983591079711914, -0.005534648895263672, -0.00508570671081543, -0.0046367645263671875, -0.004187822341918945, -0.003738880157470703, -0.003289937973022461, -0.0028409957885742188, -0.0023920536041259766, -0.0019431114196777344, -0.0014941692352294922, -0.00104522705078125, -0.0005962848663330078, -0.00014734268188476562, 0.00030159950256347656, 0.0007505416870117188, 0.001199483871459961, 0.0016484260559082031, 0.0020973682403564453, 0.0025463104248046875, 0.0029952526092529297, 0.003444194793701172, 0.003893136978149414, 0.004342079162597656, 0.0047910213470458984, 0.005239963531494141, 0.005688905715942383, 0.006137847900390625, 0.006586790084838867, 0.007035732269287109, 0.0074846744537353516, 0.007933616638183594, 0.008382558822631836, 0.008831501007080078, 0.00928044319152832, 0.009729385375976562, 0.010178327560424805, 0.010627269744873047, 0.011076211929321289, 0.011525154113769531, 0.011974096298217773, 0.012423038482666016, 0.012871980667114258, 0.0133209228515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 6.0, 5.0, 10.0, 10.0, 16.0, 18.0, 26.0, 20.0, 34.0, 52.0, 65.0, 77.0, 128.0, 177.0, 250.0, 469.0, 1082.0, 3567.0, 1002224.0, 36716.0, 1751.0, 731.0, 329.0, 227.0, 139.0, 102.0, 83.0, 55.0, 46.0, 29.0, 28.0, 18.0, 10.0, 11.0, 7.0, 12.0, 6.0, 10.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.058319091796875, -0.05668830871582031, -0.055057525634765625, -0.05342674255371094, -0.05179595947265625, -0.05016517639160156, -0.048534393310546875, -0.04690361022949219, -0.0452728271484375, -0.04364204406738281, -0.042011260986328125, -0.04038047790527344, -0.03874969482421875, -0.03711891174316406, -0.035488128662109375, -0.03385734558105469, -0.0322265625, -0.030595779418945312, -0.028964996337890625, -0.027334213256835938, -0.02570343017578125, -0.024072647094726562, -0.022441864013671875, -0.020811080932617188, -0.0191802978515625, -0.017549514770507812, -0.015918731689453125, -0.014287948608398438, -0.01265716552734375, -0.011026382446289062, -0.009395599365234375, -0.0077648162841796875, -0.006134033203125, -0.0045032501220703125, -0.002872467041015625, -0.0012416839599609375, 0.00038909912109375, 0.0020198822021484375, 0.003650665283203125, 0.0052814483642578125, 0.0069122314453125, 0.008543014526367188, 0.010173797607421875, 0.011804580688476562, 0.01343536376953125, 0.015066146850585938, 0.016696929931640625, 0.018327713012695312, 0.01995849609375, 0.021589279174804688, 0.023220062255859375, 0.024850845336914062, 0.02648162841796875, 0.028112411499023438, 0.029743194580078125, 0.03137397766113281, 0.0330047607421875, 0.03463554382324219, 0.036266326904296875, 0.03789710998535156, 0.03952789306640625, 0.04115867614746094, 0.042789459228515625, 0.04442024230957031, 0.046051025390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 6.0, 4.0, 10.0, 10.0, 14.0, 17.0, 21.0, 15.0, 18.0, 28.0, 32.0, 30.0, 31.0, 46.0, 35.0, 47.0, 48.0, 39.0, 47.0, 45.0, 46.0, 52.0, 43.0, 44.0, 35.0, 35.0, 34.0, 25.0, 31.0, 19.0, 22.0, 13.0, 7.0, 11.0, 7.0, 12.0, 6.0, 9.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0399169921875, -0.03880023956298828, -0.03768348693847656, -0.036566734313964844, -0.035449981689453125, -0.034333229064941406, -0.03321647644042969, -0.03209972381591797, -0.03098297119140625, -0.02986621856689453, -0.028749465942382812, -0.027632713317871094, -0.026515960693359375, -0.025399208068847656, -0.024282455444335938, -0.02316570281982422, -0.0220489501953125, -0.02093219757080078, -0.019815444946289062, -0.018698692321777344, -0.017581939697265625, -0.016465187072753906, -0.015348434448242188, -0.014231681823730469, -0.01311492919921875, -0.011998176574707031, -0.010881423950195312, -0.009764671325683594, -0.008647918701171875, -0.007531166076660156, -0.0064144134521484375, -0.005297660827636719, -0.004180908203125, -0.0030641555786132812, -0.0019474029541015625, -0.0008306503295898438, 0.000286102294921875, 0.0014028549194335938, 0.0025196075439453125, 0.0036363601684570312, 0.00475311279296875, 0.005869865417480469, 0.0069866180419921875, 0.008103370666503906, 0.009220123291015625, 0.010336875915527344, 0.011453628540039062, 0.012570381164550781, 0.0136871337890625, 0.014803886413574219, 0.015920639038085938, 0.017037391662597656, 0.018154144287109375, 0.019270896911621094, 0.020387649536132812, 0.02150440216064453, 0.02262115478515625, 0.02373790740966797, 0.024854660034179688, 0.025971412658691406, 0.027088165283203125, 0.028204917907714844, 0.029321670532226562, 0.03043842315673828, 0.03155517578125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 6.0, 6.0, 10.0, 19.0, 34.0, 76.0, 168.0, 339.0, 925.0, 3793.0, 29545.0, 978812.0, 29317.0, 3870.0, 995.0, 318.0, 146.0, 64.0, 42.0, 22.0, 15.0, 12.0, 7.0, 5.0, 0.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2695789337158203e-05, -1.2279488146305084e-05, -1.1863186955451965e-05, -1.1446885764598846e-05, -1.1030584573745728e-05, -1.0614283382892609e-05, -1.019798219203949e-05, -9.781681001186371e-06, -9.365379810333252e-06, -8.949078619480133e-06, -8.532777428627014e-06, -8.116476237773895e-06, -7.700175046920776e-06, -7.2838738560676575e-06, -6.8675726652145386e-06, -6.45127147436142e-06, -6.034970283508301e-06, -5.618669092655182e-06, -5.202367901802063e-06, -4.786066710948944e-06, -4.369765520095825e-06, -3.953464329242706e-06, -3.5371631383895874e-06, -3.1208619475364685e-06, -2.7045607566833496e-06, -2.2882595658302307e-06, -1.8719583749771118e-06, -1.455657184123993e-06, -1.039355993270874e-06, -6.230548024177551e-07, -2.0675361156463623e-07, 2.0954757928848267e-07, 6.258487701416016e-07, 1.0421499609947205e-06, 1.4584511518478394e-06, 1.8747523427009583e-06, 2.291053533554077e-06, 2.707354724407196e-06, 3.123655915260315e-06, 3.539957106113434e-06, 3.956258296966553e-06, 4.372559487819672e-06, 4.7888606786727905e-06, 5.2051618695259094e-06, 5.621463060379028e-06, 6.037764251232147e-06, 6.454065442085266e-06, 6.870366632938385e-06, 7.286667823791504e-06, 7.702969014644623e-06, 8.119270205497742e-06, 8.53557139635086e-06, 8.95187258720398e-06, 9.368173778057098e-06, 9.784474968910217e-06, 1.0200776159763336e-05, 1.0617077350616455e-05, 1.1033378541469574e-05, 1.1449679732322693e-05, 1.1865980923175812e-05, 1.228228211402893e-05, 1.269858330488205e-05, 1.3114884495735168e-05, 1.3531185686588287e-05, 1.3947486877441406e-05]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 11.0, 17.0, 43.0, 31.0, 40.0, 72.0, 140.0, 163.0, 132.0, 114.0, 80.0, 50.0, 25.0, 21.0, 15.0, 13.0, 7.0, 5.0, 3.0, 1.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.357929229736328e-06, -9.043142199516296e-06, -8.728355169296265e-06, -8.413568139076233e-06, -8.098781108856201e-06, -7.78399407863617e-06, -7.469207048416138e-06, -7.154420018196106e-06, -6.839632987976074e-06, -6.5248459577560425e-06, -6.210058927536011e-06, -5.895271897315979e-06, -5.580484867095947e-06, -5.2656978368759155e-06, -4.950910806655884e-06, -4.636123776435852e-06, -4.32133674621582e-06, -4.0065497159957886e-06, -3.691762685775757e-06, -3.376975655555725e-06, -3.0621886253356934e-06, -2.7474015951156616e-06, -2.43261456489563e-06, -2.117827534675598e-06, -1.8030405044555664e-06, -1.4882534742355347e-06, -1.173466444015503e-06, -8.586794137954712e-07, -5.438923835754395e-07, -2.2910535335540771e-07, 8.568167686462402e-08, 4.0046870708465576e-07, 7.152557373046875e-07, 1.0300427675247192e-06, 1.344829797744751e-06, 1.6596168279647827e-06, 1.9744038581848145e-06, 2.289190888404846e-06, 2.603977918624878e-06, 2.9187649488449097e-06, 3.2335519790649414e-06, 3.548339009284973e-06, 3.863126039505005e-06, 4.177913069725037e-06, 4.492700099945068e-06, 4.8074871301651e-06, 5.122274160385132e-06, 5.4370611906051636e-06, 5.751848220825195e-06, 6.066635251045227e-06, 6.381422281265259e-06, 6.6962093114852905e-06, 7.010996341705322e-06, 7.325783371925354e-06, 7.640570402145386e-06, 7.955357432365417e-06, 8.27014446258545e-06, 8.584931492805481e-06, 8.899718523025513e-06, 9.214505553245544e-06, 9.529292583465576e-06, 9.844079613685608e-06, 1.015886664390564e-05, 1.0473653674125671e-05, 1.0788440704345703e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 8.0, 10.0, 11.0, 17.0, 15.0, 38.0, 41.0, 66.0, 136.0, 209.0, 505.0, 2506.0, 1038942.0, 4787.0, 648.0, 244.0, 126.0, 85.0, 44.0, 24.0, 27.0, 11.0, 13.0, 11.0, 8.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8371810913085938e-05, -2.741347998380661e-05, -2.6455149054527283e-05, -2.5496818125247955e-05, -2.4538487195968628e-05, -2.35801562666893e-05, -2.2621825337409973e-05, -2.1663494408130646e-05, -2.070516347885132e-05, -1.974683254957199e-05, -1.8788501620292664e-05, -1.7830170691013336e-05, -1.687183976173401e-05, -1.591350883245468e-05, -1.4955177903175354e-05, -1.3996846973896027e-05, -1.30385160446167e-05, -1.2080185115337372e-05, -1.1121854186058044e-05, -1.0163523256778717e-05, -9.20519232749939e-06, -8.246861398220062e-06, -7.288530468940735e-06, -6.3301995396614075e-06, -5.37186861038208e-06, -4.413537681102753e-06, -3.4552067518234253e-06, -2.496875822544098e-06, -1.5385448932647705e-06, -5.802139639854431e-07, 3.781169652938843e-07, 1.3364478945732117e-06, 2.294778823852539e-06, 3.2531097531318665e-06, 4.211440682411194e-06, 5.169771611690521e-06, 6.128102540969849e-06, 7.086433470249176e-06, 8.044764399528503e-06, 9.00309532880783e-06, 9.961426258087158e-06, 1.0919757187366486e-05, 1.1878088116645813e-05, 1.283641904592514e-05, 1.3794749975204468e-05, 1.4753080904483795e-05, 1.5711411833763123e-05, 1.666974276304245e-05, 1.7628073692321777e-05, 1.8586404621601105e-05, 1.9544735550880432e-05, 2.050306648015976e-05, 2.1461397409439087e-05, 2.2419728338718414e-05, 2.3378059267997742e-05, 2.433639019727707e-05, 2.5294721126556396e-05, 2.6253052055835724e-05, 2.721138298511505e-05, 2.816971391439438e-05, 2.9128044843673706e-05, 3.0086375772953033e-05, 3.104470670223236e-05, 3.200303763151169e-05, 3.2961368560791016e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 5.0, 6.0, 7.0, 11.0, 9.0, 17.0, 21.0, 19.0, 51.0, 44.0, 46.0, 72.0, 349.0, 91.0, 58.0, 53.0, 25.0, 28.0, 21.0, 11.0, 10.0, 9.0, 10.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9431114196777344e-05, -1.8775463104248047e-05, -1.811981201171875e-05, -1.7464160919189453e-05, -1.6808509826660156e-05, -1.615285873413086e-05, -1.5497207641601562e-05, -1.4841556549072266e-05, -1.4185905456542969e-05, -1.3530254364013672e-05, -1.2874603271484375e-05, -1.2218952178955078e-05, -1.1563301086425781e-05, -1.0907649993896484e-05, -1.0251998901367188e-05, -9.59634780883789e-06, -8.940696716308594e-06, -8.285045623779297e-06, -7.62939453125e-06, -6.973743438720703e-06, -6.318092346191406e-06, -5.662441253662109e-06, -5.0067901611328125e-06, -4.351139068603516e-06, -3.6954879760742188e-06, -3.039836883544922e-06, -2.384185791015625e-06, -1.7285346984863281e-06, -1.0728836059570312e-06, -4.172325134277344e-07, 2.384185791015625e-07, 8.940696716308594e-07, 1.5497207641601562e-06, 2.205371856689453e-06, 2.86102294921875e-06, 3.516674041748047e-06, 4.172325134277344e-06, 4.827976226806641e-06, 5.4836273193359375e-06, 6.139278411865234e-06, 6.794929504394531e-06, 7.450580596923828e-06, 8.106231689453125e-06, 8.761882781982422e-06, 9.417533874511719e-06, 1.0073184967041016e-05, 1.0728836059570312e-05, 1.138448715209961e-05, 1.2040138244628906e-05, 1.2695789337158203e-05, 1.33514404296875e-05, 1.4007091522216797e-05, 1.4662742614746094e-05, 1.531839370727539e-05, 1.5974044799804688e-05, 1.6629695892333984e-05, 1.728534698486328e-05, 1.7940998077392578e-05, 1.8596649169921875e-05, 1.9252300262451172e-05, 1.990795135498047e-05, 2.0563602447509766e-05, 2.1219253540039062e-05, 2.187490463256836e-05, 2.2530555725097656e-05]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 41.0, 959.0, 17.0], "bins": [-1.3814324140548706, -1.359308123588562, -1.337183952331543, -1.3150596618652344, -1.2929354906082153, -1.2708112001419067, -1.2486870288848877, -1.226562738418579, -1.20443856716156, -1.1823142766952515, -1.1601901054382324, -1.1380658149719238, -1.1159416437149048, -1.0938173532485962, -1.0716931819915771, -1.0495688915252686, -1.02744460105896, -1.0053203105926514, -0.9831961393356323, -0.9610719084739685, -0.9389476776123047, -0.9168234467506409, -0.894699215888977, -0.8725749254226685, -0.8504507541656494, -0.8283265233039856, -0.8062022924423218, -0.784078061580658, -0.7619538307189941, -0.7398295998573303, -0.7177053689956665, -0.6955810785293579, -0.6734568476676941, -0.6513326168060303, -0.6292083859443665, -0.6070841550827026, -0.5849599242210388, -0.562835693359375, -0.5407114028930664, -0.5185872316360474, -0.49646297097206116, -0.47433874011039734, -0.4522145092487335, -0.4300902485847473, -0.4079660177230835, -0.3858417868614197, -0.36371755599975586, -0.34159332513809204, -0.3194690942764282, -0.2973448634147644, -0.2752206325531006, -0.25309640169143677, -0.23097215592861176, -0.20884792506694794, -0.18672367930412292, -0.1645994484424591, -0.1424752175807953, -0.12035098671913147, -0.09822674840688705, -0.07610251009464264, -0.05397827923297882, -0.031854048371315, -0.00972980260848999, 0.012394428253173828, 0.03451865166425705]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 3.0, 6.0, 6.0, 6.0, 10.0, 9.0, 4.0, 12.0, 14.0, 15.0, 21.0, 29.0, 25.0, 31.0, 31.0, 39.0, 45.0, 44.0, 36.0, 62.0, 71.0, 50.0, 48.0, 46.0, 43.0, 47.0, 36.0, 39.0, 32.0, 24.0, 18.0, 18.0, 20.0, 14.0, 7.0, 6.0, 5.0, 2.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.16391116380691528, -0.15799196064472198, -0.15207277238368988, -0.14615356922149658, -0.14023438096046448, -0.13431517779827118, -0.12839597463607788, -0.12247677892446518, -0.11655758321285248, -0.11063838750123978, -0.10471919178962708, -0.09879998862743378, -0.09288079291582108, -0.08696159720420837, -0.08104239404201508, -0.07512319833040237, -0.06920400261878967, -0.06328480690717697, -0.05736560747027397, -0.05144640803337097, -0.04552721232175827, -0.03960801661014557, -0.03368881717324257, -0.02776961773633957, -0.021850422024726868, -0.015931224450469017, -0.010012026876211166, -0.004092829301953316, 0.001826368272304535, 0.0077455658465623856, 0.013664763420820236, 0.019583962857723236, 0.025503158569335938, 0.03142235428094864, 0.03734155371785164, 0.04326075315475464, 0.04917994886636734, 0.05509914457798004, 0.06101834401488304, 0.06693754345178604, 0.07285673916339874, 0.07877593487501144, 0.08469513058662415, 0.09061433374881744, 0.09653352946043015, 0.10245272517204285, 0.10837192833423615, 0.11429112404584885, 0.12021031975746155, 0.12612952291965485, 0.13204871118068695, 0.13796791434288025, 0.14388710260391235, 0.14980630576610565, 0.15572550892829895, 0.16164469718933105, 0.16756390035152435, 0.17348310351371765, 0.17940229177474976, 0.18532149493694305, 0.19124069809913635, 0.19715988636016846, 0.20307908952236176, 0.20899829268455505, 0.21491748094558716]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 10.0, 6.0, 10.0, 13.0, 12.0, 11.0, 27.0, 22.0, 31.0, 36.0, 155.0, 341.0, 4192780.0, 426.0, 135.0, 69.0, 37.0, 22.0, 23.0, 10.0, 14.0, 10.0, 7.0, 8.0, 6.0, 6.0, 7.0, 5.0, 4.0, 7.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0], "bins": [-0.002178192138671875, -0.00210493803024292, -0.002031683921813965, -0.0019584298133850098, -0.0018851757049560547, -0.0018119215965270996, -0.0017386674880981445, -0.0016654133796691895, -0.0015921592712402344, -0.0015189051628112793, -0.0014456510543823242, -0.0013723969459533691, -0.001299142837524414, -0.001225888729095459, -0.001152634620666504, -0.0010793805122375488, -0.0010061264038085938, -0.0009328722953796387, -0.0008596181869506836, -0.0007863640785217285, -0.0007131099700927734, -0.0006398558616638184, -0.0005666017532348633, -0.0004933476448059082, -0.0004200935363769531, -0.00034683942794799805, -0.00027358531951904297, -0.0002003312110900879, -0.0001270771026611328, -5.3822994232177734e-05, 1.9431114196777344e-05, 9.268522262573242e-05, 0.0001659393310546875, 0.00023919343948364258, 0.00031244754791259766, 0.00038570165634155273, 0.0004589557647705078, 0.0005322098731994629, 0.000605463981628418, 0.000678718090057373, 0.0007519721984863281, 0.0008252263069152832, 0.0008984804153442383, 0.0009717345237731934, 0.0010449886322021484, 0.0011182427406311035, 0.0011914968490600586, 0.0012647509574890137, 0.0013380050659179688, 0.0014112591743469238, 0.001484513282775879, 0.001557767391204834, 0.001631021499633789, 0.0017042756080627441, 0.0017775297164916992, 0.0018507838249206543, 0.0019240379333496094, 0.0019972920417785645, 0.0020705461502075195, 0.0021438002586364746, 0.0022170543670654297, 0.0022903084754943848, 0.00236356258392334, 0.002436816692352295, 0.00251007080078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 2.0, 5.0, 7.0, 7.0, 10.0, 10.0, 19.0, 36.0, 71.0, 181.0, 289.0, 170.0, 77.0, 19.0, 15.0, 11.0, 12.0, 7.0, 6.0, 5.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01532745361328125, -0.014880061149597168, -0.014432668685913086, -0.013985276222229004, -0.013537883758544922, -0.01309049129486084, -0.012643098831176758, -0.012195706367492676, -0.011748313903808594, -0.011300921440124512, -0.01085352897644043, -0.010406136512756348, -0.009958744049072266, -0.009511351585388184, -0.009063959121704102, -0.00861656665802002, -0.008169174194335938, -0.0077217817306518555, -0.0072743892669677734, -0.006826996803283691, -0.006379604339599609, -0.005932211875915527, -0.005484819412231445, -0.005037426948547363, -0.004590034484863281, -0.004142642021179199, -0.003695249557495117, -0.003247857093811035, -0.002800464630126953, -0.002353072166442871, -0.001905679702758789, -0.001458287239074707, -0.001010894775390625, -0.000563502311706543, -0.00011610984802246094, 0.0003312826156616211, 0.0007786750793457031, 0.0012260675430297852, 0.0016734600067138672, 0.0021208524703979492, 0.0025682449340820312, 0.0030156373977661133, 0.0034630298614501953, 0.003910422325134277, 0.004357814788818359, 0.004805207252502441, 0.0052525997161865234, 0.0056999921798706055, 0.0061473846435546875, 0.0065947771072387695, 0.0070421695709228516, 0.007489562034606934, 0.007936954498291016, 0.008384346961975098, 0.00883173942565918, 0.009279131889343262, 0.009726524353027344, 0.010173916816711426, 0.010621309280395508, 0.01106870174407959, 0.011516094207763672, 0.011963486671447754, 0.012410879135131836, 0.012858271598815918, 0.0133056640625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 16.0, 33.0, 49.0, 84.0, 97.0, 224.0, 4192306.0, 953.0, 178.0, 123.0, 102.0, 61.0, 27.0, 16.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015439987182617188, -0.0014886707067489624, -0.001433342695236206, -0.0013780146837234497, -0.0013226866722106934, -0.001267358660697937, -0.0012120306491851807, -0.0011567026376724243, -0.001101374626159668, -0.0010460466146469116, -0.0009907186031341553, -0.0009353905916213989, -0.0008800625801086426, -0.0008247345685958862, -0.0007694065570831299, -0.0007140785455703735, -0.0006587505340576172, -0.0006034225225448608, -0.0005480945110321045, -0.0004927664995193481, -0.0004374384880065918, -0.00038211047649383545, -0.0003267824649810791, -0.00027145445346832275, -0.0002161264419555664, -0.00016079843044281006, -0.00010547041893005371, -5.014240741729736e-05, 5.185604095458984e-06, 6.051361560821533e-05, 0.00011584162712097168, 0.00017116963863372803, 0.00022649765014648438, 0.0002818256616592407, 0.00033715367317199707, 0.0003924816846847534, 0.00044780969619750977, 0.0005031377077102661, 0.0005584657192230225, 0.0006137937307357788, 0.0006691217422485352, 0.0007244497537612915, 0.0007797777652740479, 0.0008351057767868042, 0.0008904337882995605, 0.0009457617998123169, 0.0010010898113250732, 0.0010564178228378296, 0.001111745834350586, 0.0011670738458633423, 0.0012224018573760986, 0.001277729868888855, 0.0013330578804016113, 0.0013883858919143677, 0.001443713903427124, 0.0014990419149398804, 0.0015543699264526367, 0.001609697937965393, 0.0016650259494781494, 0.0017203539609909058, 0.0017756819725036621, 0.0018310099840164185, 0.0018863379955291748, 0.0019416660070419312, 0.0019969940185546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4090.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005674362182617188, -0.0005564577877521515, -0.0005454793572425842, -0.000534500926733017, -0.0005235224962234497, -0.0005125440657138824, -0.0005015656352043152, -0.0004905872046947479, -0.00047960877418518066, -0.0004686303436756134, -0.00045765191316604614, -0.0004466734826564789, -0.0004356950521469116, -0.00042471662163734436, -0.0004137381911277771, -0.00040275976061820984, -0.0003917813301086426, -0.0003808028995990753, -0.00036982446908950806, -0.0003588460385799408, -0.00034786760807037354, -0.0003368891775608063, -0.000325910747051239, -0.00031493231654167175, -0.0003039538860321045, -0.00029297545552253723, -0.00028199702501296997, -0.0002710185945034027, -0.00026004016399383545, -0.0002490617334842682, -0.00023808330297470093, -0.00022710487246513367, -0.0002161264419555664, -0.00020514801144599915, -0.00019416958093643188, -0.00018319115042686462, -0.00017221271991729736, -0.0001612342894077301, -0.00015025585889816284, -0.00013927742838859558, -0.00012829899787902832, -0.00011732056736946106, -0.0001063421368598938, -9.536370635032654e-05, -8.438527584075928e-05, -7.340684533119202e-05, -6.242841482162476e-05, -5.1449984312057495e-05, -4.0471553802490234e-05, -2.9493123292922974e-05, -1.8514692783355713e-05, -7.536262273788452e-06, 3.4421682357788086e-06, 1.442059874534607e-05, 2.539902925491333e-05, 3.637745976448059e-05, 4.735589027404785e-05, 5.833432078361511e-05, 6.931275129318237e-05, 8.029118180274963e-05, 9.12696123123169e-05, 0.00010224804282188416, 0.00011322647333145142, 0.00012420490384101868, 0.00013518333435058594]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 85.0, 920.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007186708971858025, -0.0006677109631709754, -0.0006167510291561484, -0.0005657911533489823, -0.0005148311611264944, -0.00046387125621549785, -0.0004129113513045013, -0.0003619514172896743, -0.00031099148327484727, -0.00026003154926002026, -0.00020907162979710847, -0.0001581117103341967, -0.00010715177631936967, -5.619184230454266e-05, -5.2319373935461044e-06, 4.572799662128091e-05, 9.668793063610792e-05, 0.00014764786465093493, 0.00019860778411384672, 0.0002495677035767585, 0.0003005276375915855, 0.00035148757160641253, 0.0004024474765174091, 0.0004534074105322361, 0.0005043673445470631, 0.0005553272785618901, 0.0006062872125767171, 0.0006572471465915442, 0.0007082070223987103, 0.0007591670146211982, 0.0008101268904283643, 0.0008610868244431913, 0.0009120467584580183, 0.0009630066924728453, 0.0010139666264876723, 0.0010649265022948384, 0.0011158864945173264, 0.0011668463703244925, 0.0012178062461316586, 0.0012687662383541465, 0.0013197262305766344, 0.0013706861063838005, 0.0014216460986062884, 0.0014726059744134545, 0.0015235659666359425, 0.0015745258424431086, 0.0016254857182502747, 0.0016764457104727626, 0.0017274055862799287, 0.0017783654620870948, 0.0018293254543095827, 0.0018802853301167488, 0.0019312453223392367, 0.0019822053145617247, 0.0020331651903688908, 0.002084125066176057, 0.002135084941983223, 0.002186044817790389, 0.002237004693597555, 0.002287964802235365, 0.002338924678042531, 0.002389884553849697, 0.002440844429656863, 0.0024918043054640293, 0.002542764414101839]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 13.0, 34.0, 46.0, 93.0, 127.0, 184.0, 164.0, 120.0, 101.0, 60.0, 25.0, 10.0, 10.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009229779243469238, -0.0009011449292302132, -0.0008793119341135025, -0.0008574789389967918, -0.0008356459438800812, -0.0008138129487633705, -0.0007919799536466599, -0.0007701469585299492, -0.0007483139634132385, -0.0007264809682965279, -0.0007046479731798172, -0.0006828149780631065, -0.0006609819829463959, -0.0006391489878296852, -0.0006173159927129745, -0.0005954829975962639, -0.0005736500024795532, -0.0005518170073628426, -0.0005299840122461319, -0.0005081510171294212, -0.00048631802201271057, -0.0004644850268959999, -0.00044265203177928925, -0.0004208190366625786, -0.0003989860415458679, -0.00037715304642915726, -0.0003553200513124466, -0.00033348705619573593, -0.00031165406107902527, -0.0002898210659623146, -0.00026798807084560394, -0.0002461550757288933, -0.00022432208061218262, -0.00020248908549547195, -0.0001806560903787613, -0.00015882309526205063, -0.00013699010014533997, -0.0001151571050286293, -9.332410991191864e-05, -7.149111479520798e-05, -4.9658119678497314e-05, -2.782512456178665e-05, -5.992129445075989e-06, 1.5840865671634674e-05, 3.767386078834534e-05, 5.9506855905056e-05, 8.133985102176666e-05, 0.00010317284613847733, 0.000125005841255188, 0.00014683883637189865, 0.00016867183148860931, 0.00019050482660531998, 0.00021233782172203064, 0.0002341708168387413, 0.00025600381195545197, 0.00027783680707216263, 0.0002996698021888733, 0.00032150279730558395, 0.0003433357924222946, 0.0003651687875390053, 0.00038700178265571594, 0.0004088347777724266, 0.00043066777288913727, 0.00045250076800584793, 0.0004743337631225586]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 7.0, 11.0, 4.0, 13.0, 21.0, 15.0, 32.0, 30.0, 57.0, 80.0, 109.0, 150.0, 218.0, 381.0, 560.0, 998.0, 1840.0, 3916.0, 10821.0, 75711.0, 916932.0, 23889.0, 6506.0, 2699.0, 1377.0, 786.0, 491.0, 254.0, 202.0, 139.0, 69.0, 65.0, 57.0, 36.0, 16.0, 9.0, 11.0, 8.0, 9.0, 11.0, 8.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.041778564453125, -0.04055929183959961, -0.03934001922607422, -0.03812074661254883, -0.03690147399902344, -0.03568220138549805, -0.034462928771972656, -0.033243656158447266, -0.032024383544921875, -0.030805110931396484, -0.029585838317871094, -0.028366565704345703, -0.027147293090820312, -0.025928020477294922, -0.02470874786376953, -0.02348947525024414, -0.02227020263671875, -0.02105093002319336, -0.01983165740966797, -0.018612384796142578, -0.017393112182617188, -0.016173839569091797, -0.014954566955566406, -0.013735294342041016, -0.012516021728515625, -0.011296749114990234, -0.010077476501464844, -0.008858203887939453, -0.0076389312744140625, -0.006419658660888672, -0.005200386047363281, -0.003981113433837891, -0.0027618408203125, -0.0015425682067871094, -0.00032329559326171875, 0.0008959770202636719, 0.0021152496337890625, 0.003334522247314453, 0.004553794860839844, 0.005773067474365234, 0.006992340087890625, 0.008211612701416016, 0.009430885314941406, 0.010650157928466797, 0.011869430541992188, 0.013088703155517578, 0.014307975769042969, 0.01552724838256836, 0.01674652099609375, 0.01796579360961914, 0.01918506622314453, 0.020404338836669922, 0.021623611450195312, 0.022842884063720703, 0.024062156677246094, 0.025281429290771484, 0.026500701904296875, 0.027719974517822266, 0.028939247131347656, 0.030158519744873047, 0.03137779235839844, 0.03259706497192383, 0.03381633758544922, 0.03503561019897461, 0.0362548828125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 2.0, 5.0, 7.0, 7.0, 10.0, 10.0, 19.0, 36.0, 71.0, 181.0, 289.0, 170.0, 77.0, 19.0, 15.0, 11.0, 12.0, 7.0, 6.0, 5.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01532745361328125, -0.014880061149597168, -0.014432668685913086, -0.013985276222229004, -0.013537883758544922, -0.01309049129486084, -0.012643098831176758, -0.012195706367492676, -0.011748313903808594, -0.011300921440124512, -0.01085352897644043, -0.010406136512756348, -0.009958744049072266, -0.009511351585388184, -0.009063959121704102, -0.00861656665802002, -0.008169174194335938, -0.0077217817306518555, -0.0072743892669677734, -0.006826996803283691, -0.006379604339599609, -0.005932211875915527, -0.005484819412231445, -0.005037426948547363, -0.004590034484863281, -0.004142642021179199, -0.003695249557495117, -0.003247857093811035, -0.002800464630126953, -0.002353072166442871, -0.001905679702758789, -0.001458287239074707, -0.001010894775390625, -0.000563502311706543, -0.00011610984802246094, 0.0003312826156616211, 0.0007786750793457031, 0.0012260675430297852, 0.0016734600067138672, 0.0021208524703979492, 0.0025682449340820312, 0.0030156373977661133, 0.0034630298614501953, 0.003910422325134277, 0.004357814788818359, 0.004805207252502441, 0.0052525997161865234, 0.0056999921798706055, 0.0061473846435546875, 0.0065947771072387695, 0.0070421695709228516, 0.007489562034606934, 0.007936954498291016, 0.008384346961975098, 0.00883173942565918, 0.009279131889343262, 0.009726524353027344, 0.010173916816711426, 0.010621309280395508, 0.01106870174407959, 0.011516094207763672, 0.011963486671447754, 0.012410879135131836, 0.012858271598815918, 0.0133056640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 12.0, 3.0, 10.0, 8.0, 12.0, 14.0, 17.0, 22.0, 17.0, 22.0, 36.0, 36.0, 48.0, 70.0, 101.0, 180.0, 402.0, 848.0, 2015.0, 32153.0, 1005614.0, 4214.0, 1300.0, 582.0, 282.0, 137.0, 89.0, 51.0, 44.0, 36.0, 27.0, 25.0, 20.0, 17.0, 17.0, 15.0, 7.0, 12.0, 4.0, 7.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.043182373046875, -0.04170656204223633, -0.040230751037597656, -0.038754940032958984, -0.03727912902832031, -0.03580331802368164, -0.03432750701904297, -0.0328516960144043, -0.031375885009765625, -0.029900074005126953, -0.02842426300048828, -0.02694845199584961, -0.025472640991210938, -0.023996829986572266, -0.022521018981933594, -0.021045207977294922, -0.01956939697265625, -0.018093585968017578, -0.016617774963378906, -0.015141963958740234, -0.013666152954101562, -0.01219034194946289, -0.010714530944824219, -0.009238719940185547, -0.007762908935546875, -0.006287097930908203, -0.004811286926269531, -0.0033354759216308594, -0.0018596649169921875, -0.0003838539123535156, 0.0010919570922851562, 0.002567768096923828, 0.0040435791015625, 0.005519390106201172, 0.006995201110839844, 0.008471012115478516, 0.009946823120117188, 0.01142263412475586, 0.012898445129394531, 0.014374256134033203, 0.015850067138671875, 0.017325878143310547, 0.01880168914794922, 0.02027750015258789, 0.021753311157226562, 0.023229122161865234, 0.024704933166503906, 0.026180744171142578, 0.02765655517578125, 0.029132366180419922, 0.030608177185058594, 0.032083988189697266, 0.03355979919433594, 0.03503561019897461, 0.03651142120361328, 0.03798723220825195, 0.039463043212890625, 0.0409388542175293, 0.04241466522216797, 0.04389047622680664, 0.04536628723144531, 0.046842098236083984, 0.048317909240722656, 0.04979372024536133, 0.05126953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 12.0, 4.0, 9.0, 8.0, 12.0, 15.0, 16.0, 22.0, 16.0, 24.0, 29.0, 30.0, 29.0, 36.0, 33.0, 22.0, 46.0, 28.0, 36.0, 44.0, 46.0, 40.0, 33.0, 41.0, 25.0, 39.0, 33.0, 31.0, 36.0, 29.0, 27.0, 24.0, 19.0, 18.0, 17.0, 15.0, 7.0, 12.0, 4.0, 7.0, 5.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.025634765625, -0.024758577346801758, -0.023882389068603516, -0.023006200790405273, -0.02213001251220703, -0.02125382423400879, -0.020377635955810547, -0.019501447677612305, -0.018625259399414062, -0.01774907112121582, -0.016872882843017578, -0.015996694564819336, -0.015120506286621094, -0.014244318008422852, -0.01336812973022461, -0.012491941452026367, -0.011615753173828125, -0.010739564895629883, -0.00986337661743164, -0.008987188339233398, -0.008111000061035156, -0.007234811782836914, -0.006358623504638672, -0.00548243522644043, -0.0046062469482421875, -0.0037300586700439453, -0.002853870391845703, -0.001977682113647461, -0.0011014938354492188, -0.00022530555725097656, 0.0006508827209472656, 0.0015270709991455078, 0.00240325927734375, 0.003279447555541992, 0.004155635833740234, 0.0050318241119384766, 0.005908012390136719, 0.006784200668334961, 0.007660388946533203, 0.008536577224731445, 0.009412765502929688, 0.01028895378112793, 0.011165142059326172, 0.012041330337524414, 0.012917518615722656, 0.013793706893920898, 0.01466989517211914, 0.015546083450317383, 0.016422271728515625, 0.017298460006713867, 0.01817464828491211, 0.01905083656311035, 0.019927024841308594, 0.020803213119506836, 0.021679401397705078, 0.02255558967590332, 0.023431777954101562, 0.024307966232299805, 0.025184154510498047, 0.02606034278869629, 0.02693653106689453, 0.027812719345092773, 0.028688907623291016, 0.029565095901489258, 0.0304412841796875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 4.0, 11.0, 12.0, 17.0, 10.0, 33.0, 42.0, 42.0, 73.0, 161.0, 196.0, 344.0, 981.0, 1970.0, 5414.0, 52990.0, 923864.0, 48956.0, 9517.0, 1969.0, 845.0, 458.0, 192.0, 114.0, 76.0, 76.0, 32.0, 31.0, 34.0, 23.0, 12.0, 16.0, 7.0, 7.0, 7.0, 4.0, 0.0, 7.0, 0.0, 1.0, 1.0], "bins": [-7.808208465576172e-06, -7.6107680797576904e-06, -7.413327693939209e-06, -7.2158873081207275e-06, -7.018446922302246e-06, -6.821006536483765e-06, -6.623566150665283e-06, -6.426125764846802e-06, -6.22868537902832e-06, -6.031244993209839e-06, -5.833804607391357e-06, -5.636364221572876e-06, -5.4389238357543945e-06, -5.241483449935913e-06, -5.044043064117432e-06, -4.84660267829895e-06, -4.649162292480469e-06, -4.451721906661987e-06, -4.254281520843506e-06, -4.056841135025024e-06, -3.859400749206543e-06, -3.6619603633880615e-06, -3.46451997756958e-06, -3.2670795917510986e-06, -3.069639205932617e-06, -2.8721988201141357e-06, -2.6747584342956543e-06, -2.477318048477173e-06, -2.2798776626586914e-06, -2.08243727684021e-06, -1.8849968910217285e-06, -1.687556505203247e-06, -1.4901161193847656e-06, -1.2926757335662842e-06, -1.0952353477478027e-06, -8.977949619293213e-07, -7.003545761108398e-07, -5.029141902923584e-07, -3.0547380447387695e-07, -1.0803341865539551e-07, 8.940696716308594e-08, 2.868473529815674e-07, 4.842877388000488e-07, 6.817281246185303e-07, 8.791685104370117e-07, 1.0766088962554932e-06, 1.2740492820739746e-06, 1.471489667892456e-06, 1.6689300537109375e-06, 1.866370439529419e-06, 2.0638108253479004e-06, 2.261251211166382e-06, 2.4586915969848633e-06, 2.6561319828033447e-06, 2.853572368621826e-06, 3.0510127544403076e-06, 3.248453140258789e-06, 3.4458935260772705e-06, 3.643333911895752e-06, 3.840774297714233e-06, 4.038214683532715e-06, 4.235655069351196e-06, 4.433095455169678e-06, 4.630535840988159e-06, 4.827976226806641e-06]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 4.0, 8.0, 9.0, 7.0, 7.0, 10.0, 16.0, 13.0, 18.0, 23.0, 37.0, 60.0, 43.0, 52.0, 84.0, 68.0, 92.0, 85.0, 63.0, 42.0, 57.0, 38.0, 24.0, 30.0, 12.0, 25.0, 14.0, 11.0, 12.0, 10.0, 10.0, 9.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.516674041748047e-06, -3.376975655555725e-06, -3.2372772693634033e-06, -3.0975788831710815e-06, -2.9578804969787598e-06, -2.818182110786438e-06, -2.678483724594116e-06, -2.5387853384017944e-06, -2.3990869522094727e-06, -2.259388566017151e-06, -2.119690179824829e-06, -1.9799917936325073e-06, -1.8402934074401855e-06, -1.7005950212478638e-06, -1.560896635055542e-06, -1.4211982488632202e-06, -1.2814998626708984e-06, -1.1418014764785767e-06, -1.0021030902862549e-06, -8.624047040939331e-07, -7.227063179016113e-07, -5.830079317092896e-07, -4.4330954551696777e-07, -3.03611159324646e-07, -1.6391277313232422e-07, -2.421438694000244e-08, 1.1548399925231934e-07, 2.551823854446411e-07, 3.948807716369629e-07, 5.345791578292847e-07, 6.742775440216064e-07, 8.139759302139282e-07, 9.5367431640625e-07, 1.0933727025985718e-06, 1.2330710887908936e-06, 1.3727694749832153e-06, 1.5124678611755371e-06, 1.6521662473678589e-06, 1.7918646335601807e-06, 1.9315630197525024e-06, 2.0712614059448242e-06, 2.210959792137146e-06, 2.3506581783294678e-06, 2.4903565645217896e-06, 2.6300549507141113e-06, 2.769753336906433e-06, 2.909451723098755e-06, 3.0491501092910767e-06, 3.1888484954833984e-06, 3.3285468816757202e-06, 3.468245267868042e-06, 3.6079436540603638e-06, 3.7476420402526855e-06, 3.887340426445007e-06, 4.027038812637329e-06, 4.166737198829651e-06, 4.306435585021973e-06, 4.4461339712142944e-06, 4.585832357406616e-06, 4.725530743598938e-06, 4.86522912979126e-06, 5.0049275159835815e-06, 5.144625902175903e-06, 5.284324288368225e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 7.0, 12.0, 13.0, 13.0, 16.0, 18.0, 38.0, 80.0, 108.0, 253.0, 685.0, 4193.0, 1038851.0, 3096.0, 594.0, 263.0, 112.0, 53.0, 33.0, 21.0, 18.0, 12.0, 10.0, 7.0, 9.0, 5.0, 5.0, 8.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1278858184814453e-05, -2.067815512418747e-05, -2.0077452063560486e-05, -1.9476749002933502e-05, -1.887604594230652e-05, -1.8275342881679535e-05, -1.767463982105255e-05, -1.7073936760425568e-05, -1.6473233699798584e-05, -1.58725306391716e-05, -1.5271827578544617e-05, -1.4671124517917633e-05, -1.407042145729065e-05, -1.3469718396663666e-05, -1.2869015336036682e-05, -1.2268312275409698e-05, -1.1667609214782715e-05, -1.1066906154155731e-05, -1.0466203093528748e-05, -9.865500032901764e-06, -9.26479697227478e-06, -8.664093911647797e-06, -8.063390851020813e-06, -7.462687790393829e-06, -6.861984729766846e-06, -6.261281669139862e-06, -5.660578608512878e-06, -5.059875547885895e-06, -4.459172487258911e-06, -3.8584694266319275e-06, -3.257766366004944e-06, -2.65706330537796e-06, -2.0563602447509766e-06, -1.455657184123993e-06, -8.549541234970093e-07, -2.5425106287002563e-07, 3.46451997756958e-07, 9.471550583839417e-07, 1.5478581190109253e-06, 2.148561179637909e-06, 2.7492642402648926e-06, 3.3499673008918762e-06, 3.95067036151886e-06, 4.5513734221458435e-06, 5.152076482772827e-06, 5.752779543399811e-06, 6.3534826040267944e-06, 6.954185664653778e-06, 7.554888725280762e-06, 8.155591785907745e-06, 8.756294846534729e-06, 9.356997907161713e-06, 9.957700967788696e-06, 1.055840402841568e-05, 1.1159107089042664e-05, 1.1759810149669647e-05, 1.2360513210296631e-05, 1.2961216270923615e-05, 1.3561919331550598e-05, 1.4162622392177582e-05, 1.4763325452804565e-05, 1.536402851343155e-05, 1.5964731574058533e-05, 1.6565434634685516e-05, 1.71661376953125e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 11.0, 9.0, 12.0, 15.0, 12.0, 22.0, 29.0, 22.0, 42.0, 54.0, 58.0, 378.0, 49.0, 50.0, 43.0, 39.0, 25.0, 22.0, 14.0, 14.0, 10.0, 10.0, 6.0, 8.0, 6.0, 5.0, 7.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2576580047607422e-05, -1.2220814824104309e-05, -1.1865049600601196e-05, -1.1509284377098083e-05, -1.115351915359497e-05, -1.0797753930091858e-05, -1.0441988706588745e-05, -1.0086223483085632e-05, -9.73045825958252e-06, -9.374693036079407e-06, -9.018927812576294e-06, -8.663162589073181e-06, -8.307397365570068e-06, -7.951632142066956e-06, -7.595866918563843e-06, -7.24010169506073e-06, -6.884336471557617e-06, -6.528571248054504e-06, -6.172806024551392e-06, -5.817040801048279e-06, -5.461275577545166e-06, -5.105510354042053e-06, -4.7497451305389404e-06, -4.393979907035828e-06, -4.038214683532715e-06, -3.682449460029602e-06, -3.3266842365264893e-06, -2.9709190130233765e-06, -2.6151537895202637e-06, -2.259388566017151e-06, -1.903623342514038e-06, -1.5478581190109253e-06, -1.1920928955078125e-06, -8.363276720046997e-07, -4.805624485015869e-07, -1.2479722499847412e-07, 2.3096799850463867e-07, 5.867332220077515e-07, 9.424984455108643e-07, 1.298263669013977e-06, 1.6540288925170898e-06, 2.0097941160202026e-06, 2.3655593395233154e-06, 2.7213245630264282e-06, 3.077089786529541e-06, 3.432855010032654e-06, 3.7886202335357666e-06, 4.144385457038879e-06, 4.500150680541992e-06, 4.855915904045105e-06, 5.211681127548218e-06, 5.5674463510513306e-06, 5.923211574554443e-06, 6.278976798057556e-06, 6.634742021560669e-06, 6.990507245063782e-06, 7.3462724685668945e-06, 7.702037692070007e-06, 8.05780291557312e-06, 8.413568139076233e-06, 8.769333362579346e-06, 9.125098586082458e-06, 9.480863809585571e-06, 9.836629033088684e-06, 1.0192394256591797e-05]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 14.0, 50.0, 445.0, 446.0, 48.0, 6.0, 2.0], "bins": [-0.3506965637207031, -0.34485143423080444, -0.33900633454322815, -0.33316123485565186, -0.3273161053657532, -0.3214709758758545, -0.3156258761882782, -0.3097807765007019, -0.3039356470108032, -0.29809051752090454, -0.29224541783332825, -0.28640031814575195, -0.28055518865585327, -0.2747100591659546, -0.2688649594783783, -0.263019859790802, -0.2571747303009033, -0.25132960081100464, -0.24548450112342834, -0.23963938653469086, -0.23379427194595337, -0.22794915735721588, -0.2221040427684784, -0.2162589281797409, -0.21041381359100342, -0.20456869900226593, -0.19872358441352844, -0.19287846982479095, -0.18703335523605347, -0.18118824064731598, -0.1753431260585785, -0.169498011469841, -0.16365289688110352, -0.15780778229236603, -0.15196266770362854, -0.14611755311489105, -0.14027243852615356, -0.13442732393741608, -0.1285822093486786, -0.1227370947599411, -0.11689198017120361, -0.11104686558246613, -0.10520175099372864, -0.09935663640499115, -0.09351152181625366, -0.08766640722751617, -0.08182129263877869, -0.0759761780500412, -0.07013106346130371, -0.06428594887256622, -0.058440834283828735, -0.05259571969509125, -0.04675060510635376, -0.04090549051761627, -0.035060375928878784, -0.029215261340141296, -0.02337014488875866, -0.01752503030002117, -0.011679915711283684, -0.005834801122546196, 1.0313466191291809e-05, 0.00585542805492878, 0.011700542643666267, 0.017545657232403755, 0.023390771821141243]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 8.0, 10.0, 15.0, 15.0, 15.0, 17.0, 19.0, 25.0, 30.0, 35.0, 38.0, 59.0, 42.0, 56.0, 56.0, 60.0, 62.0, 50.0, 42.0, 63.0, 39.0, 45.0, 44.0, 32.0, 24.0, 24.0, 15.0, 17.0, 8.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15005552768707275, -0.14446653425693512, -0.1388775259256363, -0.13328853249549866, -0.12769952416419983, -0.1221105307340622, -0.11652152985334396, -0.11093252897262573, -0.1053435280919075, -0.09975452721118927, -0.09416552633047104, -0.08857652544975281, -0.08298753201961517, -0.07739852368831635, -0.07180953025817871, -0.06622052937746048, -0.06063152849674225, -0.05504252761602402, -0.049453526735305786, -0.04386452957987785, -0.03827552869915962, -0.03268652781844139, -0.027097530663013458, -0.021508529782295227, -0.015919528901576996, -0.01033052895218134, -0.004741529002785683, 0.0008474700152873993, 0.0064364708960056305, 0.012025471776723862, 0.017614468932151794, 0.023203469812870026, 0.028792470693588257, 0.03438147157430649, 0.03997047245502472, 0.04555946961045265, 0.05114847049117088, 0.056737471371889114, 0.06232646852731705, 0.06791546940803528, 0.07350447028875351, 0.07909347116947174, 0.08468247205018997, 0.0902714729309082, 0.09586046636104584, 0.10144947469234467, 0.1070384681224823, 0.11262746900320053, 0.11821646988391876, 0.123805470764637, 0.12939447164535522, 0.13498346507549286, 0.1405724734067917, 0.14616146683692932, 0.15175047516822815, 0.15733946859836578, 0.16292846202850342, 0.16851745545864105, 0.17410646378993988, 0.17969545722007751, 0.18528446555137634, 0.19087345898151398, 0.1964624524116516, 0.20205146074295044, 0.20764046907424927]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 2.0, 8.0, 4.0, 8.0, 9.0, 13.0, 12.0, 16.0, 42.0, 119.0, 274.0, 4193501.0, 122.0, 48.0, 18.0, 16.0, 7.0, 13.0, 7.0, 1.0, 5.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0011272430419921875, -0.0010886043310165405, -0.0010499656200408936, -0.0010113269090652466, -0.0009726881980895996, -0.0009340494871139526, -0.0008954107761383057, -0.0008567720651626587, -0.0008181333541870117, -0.0007794946432113647, -0.0007408559322357178, -0.0007022172212600708, -0.0006635785102844238, -0.0006249397993087769, -0.0005863010883331299, -0.0005476623773574829, -0.0005090236663818359, -0.00047038495540618896, -0.000431746244430542, -0.000393107533454895, -0.00035446882247924805, -0.0003158301115036011, -0.0002771914005279541, -0.00023855268955230713, -0.00019991397857666016, -0.00016127526760101318, -0.0001226365566253662, -8.399784564971924e-05, -4.5359134674072266e-05, -6.720423698425293e-06, 3.191828727722168e-05, 7.055699825286865e-05, 0.00010919570922851562, 0.0001478344202041626, 0.00018647313117980957, 0.00022511184215545654, 0.0002637505531311035, 0.0003023892641067505, 0.00034102797508239746, 0.00037966668605804443, 0.0004183053970336914, 0.0004569441080093384, 0.0004955828189849854, 0.0005342215299606323, 0.0005728602409362793, 0.0006114989519119263, 0.0006501376628875732, 0.0006887763738632202, 0.0007274150848388672, 0.0007660537958145142, 0.0008046925067901611, 0.0008433312177658081, 0.0008819699287414551, 0.000920608639717102, 0.000959247350692749, 0.000997886061668396, 0.001036524772644043, 0.00107516348361969, 0.001113802194595337, 0.0011524409055709839, 0.0011910796165466309, 0.0012297183275222778, 0.0012683570384979248, 0.0013069957494735718, 0.0013456344604492188]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 2.0, 5.0, 7.0, 6.0, 11.0, 12.0, 16.0, 36.0, 73.0, 182.0, 287.0, 169.0, 79.0, 18.0, 16.0, 12.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01531219482421875, -0.014865279197692871, -0.014418363571166992, -0.013971447944641113, -0.013524532318115234, -0.013077616691589355, -0.012630701065063477, -0.012183785438537598, -0.011736869812011719, -0.01128995418548584, -0.010843038558959961, -0.010396122932434082, -0.009949207305908203, -0.009502291679382324, -0.009055376052856445, -0.008608460426330566, -0.008161544799804688, -0.007714629173278809, -0.00726771354675293, -0.006820797920227051, -0.006373882293701172, -0.005926966667175293, -0.005480051040649414, -0.005033135414123535, -0.004586219787597656, -0.004139304161071777, -0.0036923885345458984, -0.0032454729080200195, -0.0027985572814941406, -0.0023516416549682617, -0.0019047260284423828, -0.001457810401916504, -0.001010894775390625, -0.0005639791488647461, -0.00011706352233886719, 0.0003298521041870117, 0.0007767677307128906, 0.0012236833572387695, 0.0016705989837646484, 0.0021175146102905273, 0.0025644302368164062, 0.003011345863342285, 0.003458261489868164, 0.003905177116394043, 0.004352092742919922, 0.004799008369445801, 0.00524592399597168, 0.005692839622497559, 0.0061397552490234375, 0.006586670875549316, 0.007033586502075195, 0.007480502128601074, 0.007927417755126953, 0.008374333381652832, 0.008821249008178711, 0.00926816463470459, 0.009715080261230469, 0.010161995887756348, 0.010608911514282227, 0.011055827140808105, 0.011502742767333984, 0.011949658393859863, 0.012396574020385742, 0.012843489646911621, 0.0132904052734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 9.0, 19.0, 48.0, 86.0, 119.0, 137.0, 4193412.0, 143.0, 110.0, 79.0, 57.0, 34.0, 20.0, 10.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0052337646484375, -0.005111336708068848, -0.004988908767700195, -0.004866480827331543, -0.004744052886962891, -0.004621624946594238, -0.004499197006225586, -0.004376769065856934, -0.004254341125488281, -0.004131913185119629, -0.0040094852447509766, -0.0038870573043823242, -0.003764629364013672, -0.0036422014236450195, -0.003519773483276367, -0.003397345542907715, -0.0032749176025390625, -0.00315248966217041, -0.003030061721801758, -0.0029076337814331055, -0.002785205841064453, -0.0026627779006958008, -0.0025403499603271484, -0.002417922019958496, -0.0022954940795898438, -0.0021730661392211914, -0.002050638198852539, -0.0019282102584838867, -0.0018057823181152344, -0.001683354377746582, -0.0015609264373779297, -0.0014384984970092773, -0.001316070556640625, -0.0011936426162719727, -0.0010712146759033203, -0.000948786735534668, -0.0008263587951660156, -0.0007039308547973633, -0.0005815029144287109, -0.0004590749740600586, -0.00033664703369140625, -0.0002142190933227539, -9.179115295410156e-05, 3.063678741455078e-05, 0.00015306472778320312, 0.00027549266815185547, 0.0003979206085205078, 0.0005203485488891602, 0.0006427764892578125, 0.0007652044296264648, 0.0008876323699951172, 0.0010100603103637695, 0.0011324882507324219, 0.0012549161911010742, 0.0013773441314697266, 0.001499772071838379, 0.0016222000122070312, 0.0017446279525756836, 0.001867055892944336, 0.0019894838333129883, 0.0021119117736816406, 0.002234339714050293, 0.0023567676544189453, 0.0024791955947875977, 0.00260162353515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4095.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-06, 1.2765638530254364e-05, 3.0001625418663025e-05, 4.7237612307071686e-05, 6.447359919548035e-05, 8.170958608388901e-05, 9.894557297229767e-05, 0.00011618155986070633, 0.000133417546749115, 0.00015065353363752365, 0.0001678895205259323, 0.00018512550741434097, 0.00020236149430274963, 0.0002195974811911583, 0.00023683346807956696, 0.0002540694549679756, 0.0002713054418563843, 0.00028854142874479294, 0.0003057774156332016, 0.00032301340252161026, 0.0003402493894100189, 0.0003574853762984276, 0.00037472136318683624, 0.0003919573500752449, 0.00040919333696365356, 0.0004264293238520622, 0.0004436653107404709, 0.00046090129762887955, 0.0004781372845172882, 0.0004953732714056969, 0.0005126092582941055, 0.0005298452451825142, 0.0005470812320709229, 0.0005643172189593315, 0.0005815532058477402, 0.0005987891927361488, 0.0006160251796245575, 0.0006332611665129662, 0.0006504971534013748, 0.0006677331402897835, 0.0006849691271781921, 0.0007022051140666008, 0.0007194411009550095, 0.0007366770878434181, 0.0007539130747318268, 0.0007711490616202354, 0.0007883850485086441, 0.0008056210353970528, 0.0008228570222854614, 0.0008400930091738701, 0.0008573289960622787, 0.0008745649829506874, 0.0008918009698390961, 0.0009090369567275047, 0.0009262729436159134, 0.000943508930504322, 0.0009607449173927307, 0.0009779809042811394, 0.000995216891169548, 0.0010124528780579567, 0.0010296888649463654, 0.001046924851834774, 0.0010641608387231827, 0.0010813968256115913, 0.0010986328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 10.0, 991.0, 10.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004412984009832144, -0.004280544817447662, -0.004148106090724468, -0.004015666898339987, -0.0038832281716167927, -0.0037507889792323112, -0.0036183500196784735, -0.0034859110601246357, -0.003353472100570798, -0.00322103314101696, -0.0030885941814631224, -0.0029561552219092846, -0.002823716029524803, -0.002691277302801609, -0.0025588381104171276, -0.00242639915086329, -0.002293960191309452, -0.0021615212317556143, -0.0020290822722017765, -0.001896643196232617, -0.0017642042366787791, -0.0016317652771249413, -0.0014993262011557817, -0.001366887241601944, -0.0012344482820481062, -0.0011020093224942684, -0.0009695703047327697, -0.000837131286971271, -0.0007046923274174333, -0.0005722533678635955, -0.0004398143501020968, -0.0003073753323405981, -0.00017493590712547302, -4.249691846780479e-05, 8.994207018986344e-05, 0.00022238105884753168, 0.0003548200475051999, 0.0004872590070590377, 0.0006196980248205364, 0.0007521370425820351, 0.0008845760021358728, 0.0010170149616897106, 0.0011494539212435484, 0.001281892997212708, 0.0014143319567665458, 0.0015467709163203835, 0.0016792099922895432, 0.001811648951843381, 0.0019440879113972187, 0.0020765268709510565, 0.0022089658305048943, 0.002341404790058732, 0.00247384374961257, 0.0026062829419970512, 0.002738721901550889, 0.002871160861104727, 0.0030035998206585646, 0.0031360387802124023, 0.00326847773976624, 0.003400916699320078, 0.0035333558917045593, 0.0036657946184277534, 0.003798233810812235, 0.003930673003196716, 0.00406311172991991]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 14.0, 22.0, 82.0, 143.0, 181.0, 198.0, 173.0, 90.0, 55.0, 15.0, 7.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009084939956665039, -0.000858621671795845, -0.0008087493479251862, -0.0007588770240545273, -0.0007090047001838684, -0.0006591323763132095, -0.0006092600524425507, -0.0005593877285718918, -0.0005095154047012329, -0.00045964308083057404, -0.00040977075695991516, -0.0003598984330892563, -0.0003100261092185974, -0.00026015378534793854, -0.00021028146147727966, -0.0001604091376066208, -0.00011053681373596191, -6.066448986530304e-05, -1.0792165994644165e-05, 3.908015787601471e-05, 8.895248174667358e-05, 0.00013882480561733246, 0.00018869712948799133, 0.0002385694533586502, 0.0002884417772293091, 0.00033831410109996796, 0.00038818642497062683, 0.0004380587488412857, 0.0004879310727119446, 0.0005378033965826035, 0.0005876757204532623, 0.0006375480443239212, 0.0006874203681945801, 0.000737292692065239, 0.0007871650159358978, 0.0008370373398065567, 0.0008869096636772156, 0.0009367819875478745, 0.0009866543114185333, 0.0010365266352891922, 0.001086398959159851, 0.00113627128303051, 0.0011861436069011688, 0.0012360159307718277, 0.0012858882546424866, 0.0013357605785131454, 0.0013856329023838043, 0.0014355052262544632, 0.001485377550125122, 0.001535249873995781, 0.0015851221978664398, 0.0016349945217370987, 0.0016848668456077576, 0.0017347391694784164, 0.0017846114933490753, 0.0018344838172197342, 0.001884356141090393, 0.001934228464961052, 0.001984100788831711, 0.0020339731127023697, 0.0020838454365730286, 0.0021337177604436874, 0.0021835900843143463, 0.002233462408185005, 0.002283334732055664]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 7.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 6.0, 10.0, 7.0, 13.0, 25.0, 27.0, 48.0, 84.0, 151.0, 312.0, 819.0, 2406.0, 11707.0, 960226.0, 64346.0, 5757.0, 1461.0, 566.0, 253.0, 120.0, 59.0, 45.0, 30.0, 10.0, 12.0, 12.0, 3.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.054656982421875, -0.05282258987426758, -0.050988197326660156, -0.049153804779052734, -0.04731941223144531, -0.04548501968383789, -0.04365062713623047, -0.04181623458862305, -0.039981842041015625, -0.0381474494934082, -0.03631305694580078, -0.03447866439819336, -0.03264427185058594, -0.030809879302978516, -0.028975486755371094, -0.027141094207763672, -0.02530670166015625, -0.023472309112548828, -0.021637916564941406, -0.019803524017333984, -0.017969131469726562, -0.01613473892211914, -0.014300346374511719, -0.012465953826904297, -0.010631561279296875, -0.008797168731689453, -0.006962776184082031, -0.005128383636474609, -0.0032939910888671875, -0.0014595985412597656, 0.00037479400634765625, 0.002209186553955078, 0.0040435791015625, 0.005877971649169922, 0.007712364196777344, 0.009546756744384766, 0.011381149291992188, 0.01321554183959961, 0.015049934387207031, 0.016884326934814453, 0.018718719482421875, 0.020553112030029297, 0.02238750457763672, 0.02422189712524414, 0.026056289672851562, 0.027890682220458984, 0.029725074768066406, 0.03155946731567383, 0.03339385986328125, 0.03522825241088867, 0.037062644958496094, 0.038897037506103516, 0.04073143005371094, 0.04256582260131836, 0.04440021514892578, 0.0462346076965332, 0.048069000244140625, 0.04990339279174805, 0.05173778533935547, 0.05357217788696289, 0.05540657043457031, 0.057240962982177734, 0.059075355529785156, 0.06090974807739258, 0.062744140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 2.0, 5.0, 7.0, 6.0, 11.0, 12.0, 16.0, 36.0, 73.0, 182.0, 287.0, 169.0, 79.0, 18.0, 16.0, 12.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01531219482421875, -0.014865279197692871, -0.014418363571166992, -0.013971447944641113, -0.013524532318115234, -0.013077616691589355, -0.012630701065063477, -0.012183785438537598, -0.011736869812011719, -0.01128995418548584, -0.010843038558959961, -0.010396122932434082, -0.009949207305908203, -0.009502291679382324, -0.009055376052856445, -0.008608460426330566, -0.008161544799804688, -0.007714629173278809, -0.00726771354675293, -0.006820797920227051, -0.006373882293701172, -0.005926966667175293, -0.005480051040649414, -0.005033135414123535, -0.004586219787597656, -0.004139304161071777, -0.0036923885345458984, -0.0032454729080200195, -0.0027985572814941406, -0.0023516416549682617, -0.0019047260284423828, -0.001457810401916504, -0.001010894775390625, -0.0005639791488647461, -0.00011706352233886719, 0.0003298521041870117, 0.0007767677307128906, 0.0012236833572387695, 0.0016705989837646484, 0.0021175146102905273, 0.0025644302368164062, 0.003011345863342285, 0.003458261489868164, 0.003905177116394043, 0.004352092742919922, 0.004799008369445801, 0.00524592399597168, 0.005692839622497559, 0.0061397552490234375, 0.006586670875549316, 0.007033586502075195, 0.007480502128601074, 0.007927417755126953, 0.008374333381652832, 0.008821249008178711, 0.00926816463470459, 0.009715080261230469, 0.010161995887756348, 0.010608911514282227, 0.011055827140808105, 0.011502742767333984, 0.011949658393859863, 0.012396574020385742, 0.012843489646911621, 0.0132904052734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 5.0, 6.0, 6.0, 11.0, 7.0, 11.0, 14.0, 21.0, 10.0, 25.0, 24.0, 25.0, 38.0, 39.0, 49.0, 79.0, 176.0, 347.0, 790.0, 2515.0, 641604.0, 398634.0, 2429.0, 779.0, 342.0, 166.0, 92.0, 46.0, 30.0, 36.0, 30.0, 20.0, 22.0, 18.0, 12.0, 12.0, 15.0, 13.0, 4.0, 8.0, 6.0, 9.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.042449951171875, -0.0411229133605957, -0.039795875549316406, -0.03846883773803711, -0.03714179992675781, -0.035814762115478516, -0.03448772430419922, -0.03316068649291992, -0.031833648681640625, -0.030506610870361328, -0.02917957305908203, -0.027852535247802734, -0.026525497436523438, -0.02519845962524414, -0.023871421813964844, -0.022544384002685547, -0.02121734619140625, -0.019890308380126953, -0.018563270568847656, -0.01723623275756836, -0.015909194946289062, -0.014582157135009766, -0.013255119323730469, -0.011928081512451172, -0.010601043701171875, -0.009274005889892578, -0.007946968078613281, -0.006619930267333984, -0.0052928924560546875, -0.003965854644775391, -0.0026388168334960938, -0.0013117790222167969, 1.52587890625e-05, 0.0013422966003417969, 0.0026693344116210938, 0.003996372222900391, 0.0053234100341796875, 0.006650447845458984, 0.007977485656738281, 0.009304523468017578, 0.010631561279296875, 0.011958599090576172, 0.013285636901855469, 0.014612674713134766, 0.015939712524414062, 0.01726675033569336, 0.018593788146972656, 0.019920825958251953, 0.02124786376953125, 0.022574901580810547, 0.023901939392089844, 0.02522897720336914, 0.026556015014648438, 0.027883052825927734, 0.02921009063720703, 0.030537128448486328, 0.031864166259765625, 0.03319120407104492, 0.03451824188232422, 0.035845279693603516, 0.03717231750488281, 0.03849935531616211, 0.039826393127441406, 0.0411534309387207, 0.04248046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 5.0, 7.0, 6.0, 10.0, 8.0, 11.0, 13.0, 21.0, 10.0, 25.0, 24.0, 27.0, 35.0, 32.0, 33.0, 28.0, 31.0, 44.0, 30.0, 43.0, 40.0, 46.0, 32.0, 39.0, 42.0, 36.0, 37.0, 26.0, 26.0, 37.0, 30.0, 21.0, 21.0, 18.0, 13.0, 11.0, 14.0, 14.0, 4.0, 8.0, 6.0, 9.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.0263824462890625, -0.025557279586791992, -0.024732112884521484, -0.023906946182250977, -0.02308177947998047, -0.02225661277770996, -0.021431446075439453, -0.020606279373168945, -0.019781112670898438, -0.01895594596862793, -0.018130779266357422, -0.017305612564086914, -0.016480445861816406, -0.0156552791595459, -0.01483011245727539, -0.014004945755004883, -0.013179779052734375, -0.012354612350463867, -0.01152944564819336, -0.010704278945922852, -0.009879112243652344, -0.009053945541381836, -0.008228778839111328, -0.00740361213684082, -0.0065784454345703125, -0.005753278732299805, -0.004928112030029297, -0.004102945327758789, -0.0032777786254882812, -0.0024526119232177734, -0.0016274452209472656, -0.0008022785186767578, 2.288818359375e-05, 0.0008480548858642578, 0.0016732215881347656, 0.0024983882904052734, 0.0033235549926757812, 0.004148721694946289, 0.004973888397216797, 0.005799055099487305, 0.0066242218017578125, 0.00744938850402832, 0.008274555206298828, 0.009099721908569336, 0.009924888610839844, 0.010750055313110352, 0.01157522201538086, 0.012400388717651367, 0.013225555419921875, 0.014050722122192383, 0.01487588882446289, 0.0157010555267334, 0.016526222229003906, 0.017351388931274414, 0.018176555633544922, 0.01900172233581543, 0.019826889038085938, 0.020652055740356445, 0.021477222442626953, 0.02230238914489746, 0.02312755584716797, 0.023952722549438477, 0.024777889251708984, 0.025603055953979492, 0.02642822265625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 6.0, 4.0, 8.0, 14.0, 21.0, 16.0, 29.0, 44.0, 70.0, 99.0, 178.0, 310.0, 735.0, 2189.0, 10327.0, 854326.0, 170036.0, 6475.0, 2171.0, 704.0, 308.0, 153.0, 104.0, 59.0, 66.0, 27.0, 23.0, 11.0, 11.0, 4.0, 8.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.761882781982422e-06, -8.469447493553162e-06, -8.177012205123901e-06, -7.884576916694641e-06, -7.592141628265381e-06, -7.299706339836121e-06, -7.00727105140686e-06, -6.7148357629776e-06, -6.42240047454834e-06, -6.12996518611908e-06, -5.837529897689819e-06, -5.545094609260559e-06, -5.252659320831299e-06, -4.9602240324020386e-06, -4.667788743972778e-06, -4.375353455543518e-06, -4.082918167114258e-06, -3.7904828786849976e-06, -3.4980475902557373e-06, -3.205612301826477e-06, -2.913177013397217e-06, -2.6207417249679565e-06, -2.3283064365386963e-06, -2.035871148109436e-06, -1.7434358596801758e-06, -1.4510005712509155e-06, -1.1585652828216553e-06, -8.66129994392395e-07, -5.736947059631348e-07, -2.812594175338745e-07, 1.1175870895385742e-08, 3.03611159324646e-07, 5.960464477539062e-07, 8.884817361831665e-07, 1.1809170246124268e-06, 1.473352313041687e-06, 1.7657876014709473e-06, 2.0582228899002075e-06, 2.3506581783294678e-06, 2.643093466758728e-06, 2.9355287551879883e-06, 3.2279640436172485e-06, 3.520399332046509e-06, 3.812834620475769e-06, 4.105269908905029e-06, 4.3977051973342896e-06, 4.69014048576355e-06, 4.98257577419281e-06, 5.27501106262207e-06, 5.5674463510513306e-06, 5.859881639480591e-06, 6.152316927909851e-06, 6.444752216339111e-06, 6.737187504768372e-06, 7.029622793197632e-06, 7.322058081626892e-06, 7.614493370056152e-06, 7.906928658485413e-06, 8.199363946914673e-06, 8.491799235343933e-06, 8.784234523773193e-06, 9.076669812202454e-06, 9.369105100631714e-06, 9.661540389060974e-06, 9.953975677490234e-06]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 9.0, 6.0, 8.0, 18.0, 17.0, 23.0, 37.0, 47.0, 36.0, 76.0, 38.0, 75.0, 73.0, 84.0, 65.0, 50.0, 67.0, 35.0, 65.0, 37.0, 24.0, 27.0, 15.0, 21.0, 16.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.112720489501953e-06, -3.959052264690399e-06, -3.8053840398788452e-06, -3.6517158150672913e-06, -3.4980475902557373e-06, -3.3443793654441833e-06, -3.1907111406326294e-06, -3.0370429158210754e-06, -2.8833746910095215e-06, -2.7297064661979675e-06, -2.5760382413864136e-06, -2.4223700165748596e-06, -2.2687017917633057e-06, -2.1150335669517517e-06, -1.9613653421401978e-06, -1.8076971173286438e-06, -1.6540288925170898e-06, -1.5003606677055359e-06, -1.346692442893982e-06, -1.193024218082428e-06, -1.039355993270874e-06, -8.856877684593201e-07, -7.320195436477661e-07, -5.783513188362122e-07, -4.246830940246582e-07, -2.7101486921310425e-07, -1.1734664440155029e-07, 3.632158041000366e-08, 1.8998980522155762e-07, 3.4365803003311157e-07, 4.973262548446655e-07, 6.509944796562195e-07, 8.046627044677734e-07, 9.583309292793274e-07, 1.1119991540908813e-06, 1.2656673789024353e-06, 1.4193356037139893e-06, 1.5730038285255432e-06, 1.7266720533370972e-06, 1.8803402781486511e-06, 2.034008502960205e-06, 2.187676727771759e-06, 2.341344952583313e-06, 2.495013177394867e-06, 2.648681402206421e-06, 2.802349627017975e-06, 2.956017851829529e-06, 3.1096860766410828e-06, 3.2633543014526367e-06, 3.4170225262641907e-06, 3.5706907510757446e-06, 3.7243589758872986e-06, 3.8780272006988525e-06, 4.0316954255104065e-06, 4.1853636503219604e-06, 4.339031875133514e-06, 4.492700099945068e-06, 4.646368324756622e-06, 4.800036549568176e-06, 4.95370477437973e-06, 5.107372999191284e-06, 5.261041224002838e-06, 5.414709448814392e-06, 5.568377673625946e-06, 5.7220458984375e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 18.0, 32.0, 34.0, 65.0, 155.0, 610.0, 1031175.0, 15767.0, 408.0, 122.0, 69.0, 36.0, 20.0, 4.0, 4.0, 2.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.796815872192383e-05, -3.684777766466141e-05, -3.572739660739899e-05, -3.4607015550136566e-05, -3.3486634492874146e-05, -3.2366253435611725e-05, -3.1245872378349304e-05, -3.0125491321086884e-05, -2.9005110263824463e-05, -2.7884729206562042e-05, -2.676434814929962e-05, -2.56439670920372e-05, -2.452358603477478e-05, -2.340320497751236e-05, -2.228282392024994e-05, -2.116244286298752e-05, -2.0042061805725098e-05, -1.8921680748462677e-05, -1.7801299691200256e-05, -1.6680918633937836e-05, -1.5560537576675415e-05, -1.4440156519412994e-05, -1.3319775462150574e-05, -1.2199394404888153e-05, -1.1079013347625732e-05, -9.958632290363312e-06, -8.838251233100891e-06, -7.71787017583847e-06, -6.59748911857605e-06, -5.477108061313629e-06, -4.3567270040512085e-06, -3.236345946788788e-06, -2.115964889526367e-06, -9.955838322639465e-07, 1.2479722499847412e-07, 1.2451782822608948e-06, 2.3655593395233154e-06, 3.485940396785736e-06, 4.606321454048157e-06, 5.726702511310577e-06, 6.847083568572998e-06, 7.967464625835419e-06, 9.08784568309784e-06, 1.020822674036026e-05, 1.132860779762268e-05, 1.2448988854885101e-05, 1.3569369912147522e-05, 1.4689750969409943e-05, 1.5810132026672363e-05, 1.6930513083934784e-05, 1.8050894141197205e-05, 1.9171275198459625e-05, 2.0291656255722046e-05, 2.1412037312984467e-05, 2.2532418370246887e-05, 2.3652799427509308e-05, 2.477318048477173e-05, 2.589356154203415e-05, 2.701394259929657e-05, 2.813432365655899e-05, 2.925470471382141e-05, 3.0375085771083832e-05, 3.149546682834625e-05, 3.261584788560867e-05, 3.3736228942871094e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 12.0, 19.0, 16.0, 35.0, 42.0, 68.0, 485.0, 106.0, 73.0, 46.0, 35.0, 16.0, 11.0, 2.0, 3.0, 1.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3603439331054688e-05, -2.290681004524231e-05, -2.221018075942993e-05, -2.1513551473617554e-05, -2.0816922187805176e-05, -2.0120292901992798e-05, -1.942366361618042e-05, -1.8727034330368042e-05, -1.8030405044555664e-05, -1.7333775758743286e-05, -1.6637146472930908e-05, -1.594051718711853e-05, -1.5243887901306152e-05, -1.4547258615493774e-05, -1.3850629329681396e-05, -1.3154000043869019e-05, -1.245737075805664e-05, -1.1760741472244263e-05, -1.1064112186431885e-05, -1.0367482900619507e-05, -9.670853614807129e-06, -8.974224328994751e-06, -8.277595043182373e-06, -7.580965757369995e-06, -6.884336471557617e-06, -6.187707185745239e-06, -5.491077899932861e-06, -4.794448614120483e-06, -4.0978193283081055e-06, -3.4011900424957275e-06, -2.7045607566833496e-06, -2.0079314708709717e-06, -1.3113021850585938e-06, -6.146728992462158e-07, 8.195638656616211e-08, 7.7858567237854e-07, 1.475214958190918e-06, 2.171844244003296e-06, 2.868473529815674e-06, 3.5651028156280518e-06, 4.26173210144043e-06, 4.958361387252808e-06, 5.6549906730651855e-06, 6.3516199588775635e-06, 7.048249244689941e-06, 7.74487853050232e-06, 8.441507816314697e-06, 9.138137102127075e-06, 9.834766387939453e-06, 1.0531395673751831e-05, 1.1228024959564209e-05, 1.1924654245376587e-05, 1.2621283531188965e-05, 1.3317912817001343e-05, 1.401454210281372e-05, 1.4711171388626099e-05, 1.5407800674438477e-05, 1.6104429960250854e-05, 1.6801059246063232e-05, 1.749768853187561e-05, 1.8194317817687988e-05, 1.8890947103500366e-05, 1.9587576389312744e-05, 2.0284205675125122e-05, 2.09808349609375e-05]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 12.0, 956.0, 50.0], "bins": [-1.4032156467437744, -1.3808462619781494, -1.3584768772125244, -1.3361074924468994, -1.3137381076812744, -1.2913687229156494, -1.2689993381500244, -1.2466299533843994, -1.2242605686187744, -1.2018911838531494, -1.1795217990875244, -1.1571524143218994, -1.1347830295562744, -1.1124136447906494, -1.0900442600250244, -1.0676748752593994, -1.0453054904937744, -1.0229361057281494, -1.0005667209625244, -0.9781973361968994, -0.9558279514312744, -0.9334585666656494, -0.9110891819000244, -0.8887197971343994, -0.8663503527641296, -0.8439809679985046, -0.8216115832328796, -0.7992421984672546, -0.7768728137016296, -0.7545034289360046, -0.7321340441703796, -0.7097646594047546, -0.6873952150344849, -0.6650258302688599, -0.6426564455032349, -0.6202870607376099, -0.5979176759719849, -0.5755482912063599, -0.5531789064407349, -0.5308095216751099, -0.5084401369094849, -0.48607075214385986, -0.46370136737823486, -0.44133198261260986, -0.41896259784698486, -0.39659321308135986, -0.37422382831573486, -0.35185444355010986, -0.32948505878448486, -0.30711567401885986, -0.28474628925323486, -0.26237690448760986, -0.24000751972198486, -0.21763813495635986, -0.19526873528957367, -0.17289935052394867, -0.15052996575832367, -0.12816058099269867, -0.10579119622707367, -0.08342180401086807, -0.06105241924524307, -0.03868303447961807, -0.016313642263412476, 0.006055742502212524, 0.028425127267837524]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 10.0, 5.0, 7.0, 9.0, 12.0, 24.0, 35.0, 28.0, 43.0, 41.0, 54.0, 53.0, 64.0, 82.0, 93.0, 85.0, 64.0, 58.0, 52.0, 43.0, 33.0, 30.0, 22.0, 14.0, 12.0, 20.0, 8.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20088762044906616, -0.19381478428840637, -0.18674196302890778, -0.17966912686824799, -0.1725962907075882, -0.1655234694480896, -0.1584506332874298, -0.15137779712677002, -0.14430496096611023, -0.13723212480545044, -0.13015930354595184, -0.12308646738529205, -0.11601363122463226, -0.10894080251455307, -0.10186797380447388, -0.09479513764381409, -0.08772231638431549, -0.0806494876742363, -0.07357665151357651, -0.06650382280349731, -0.05943099036812782, -0.05235815793275833, -0.04528532922267914, -0.03821249678730965, -0.031139664351940155, -0.024066831916570663, -0.01699400134384632, -0.009921170771121979, -0.002848338335752487, 0.004224494099617004, 0.011297322809696198, 0.01837015524506569, 0.02544298768043518, 0.03251582011580467, 0.039588652551174164, 0.04666148126125336, 0.05373431369662285, 0.06080714613199234, 0.06787997484207153, 0.07495281100273132, 0.08202563971281052, 0.08909846842288971, 0.0961713045835495, 0.10324413329362869, 0.11031696200370789, 0.11738979816436768, 0.12446262687444687, 0.13153545558452606, 0.13860829174518585, 0.14568112790584564, 0.15275394916534424, 0.15982678532600403, 0.16689962148666382, 0.1739724576473236, 0.1810452789068222, 0.188118115067482, 0.1951909363269806, 0.20226377248764038, 0.20933659374713898, 0.21640942990779877, 0.22348226606845856, 0.23055508732795715, 0.23762792348861694, 0.24470075964927673, 0.2517735958099365]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 8.0, 7.0, 6.0, 4.0, 0.0, 6.0, 6.0, 16.0, 23.0, 10.0, 20.0, 31.0, 24.0, 28.0, 53.0, 63.0, 94.0, 122.0, 384.0, 981.0, 4188650.0, 2520.0, 515.0, 221.0, 121.0, 72.0, 63.0, 33.0, 36.0, 25.0, 15.0, 23.0, 11.0, 12.0, 15.0, 9.0, 8.0, 13.0, 6.0, 4.0, 5.0, 8.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0], "bins": [-0.0022335052490234375, -0.002158612012863159, -0.002083718776702881, -0.0020088255405426025, -0.0019339323043823242, -0.001859039068222046, -0.0017841458320617676, -0.0017092525959014893, -0.001634359359741211, -0.0015594661235809326, -0.0014845728874206543, -0.001409679651260376, -0.0013347864151000977, -0.0012598931789398193, -0.001184999942779541, -0.0011101067066192627, -0.0010352134704589844, -0.0009603202342987061, -0.0008854269981384277, -0.0008105337619781494, -0.0007356405258178711, -0.0006607472896575928, -0.0005858540534973145, -0.0005109608173370361, -0.0004360675811767578, -0.0003611743450164795, -0.00028628110885620117, -0.00021138787269592285, -0.00013649463653564453, -6.160140037536621e-05, 1.329183578491211e-05, 8.818507194519043e-05, 0.00016307830810546875, 0.00023797154426574707, 0.0003128647804260254, 0.0003877580165863037, 0.00046265125274658203, 0.0005375444889068604, 0.0006124377250671387, 0.000687330961227417, 0.0007622241973876953, 0.0008371174335479736, 0.000912010669708252, 0.0009869039058685303, 0.0010617971420288086, 0.001136690378189087, 0.0012115836143493652, 0.0012864768505096436, 0.0013613700866699219, 0.0014362633228302002, 0.0015111565589904785, 0.0015860497951507568, 0.0016609430313110352, 0.0017358362674713135, 0.0018107295036315918, 0.0018856227397918701, 0.0019605159759521484, 0.0020354092121124268, 0.002110302448272705, 0.0021851956844329834, 0.0022600889205932617, 0.00233498215675354, 0.0024098753929138184, 0.0024847686290740967, 0.002559661865234375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 6.0, 12.0, 12.0, 16.0, 35.0, 76.0, 180.0, 287.0, 168.0, 79.0, 20.0, 15.0, 12.0, 11.0, 6.0, 6.0, 5.0, 7.0, 2.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0152740478515625, -0.014828205108642578, -0.014382362365722656, -0.013936519622802734, -0.013490676879882812, -0.01304483413696289, -0.012598991394042969, -0.012153148651123047, -0.011707305908203125, -0.011261463165283203, -0.010815620422363281, -0.01036977767944336, -0.009923934936523438, -0.009478092193603516, -0.009032249450683594, -0.008586406707763672, -0.00814056396484375, -0.007694721221923828, -0.007248878479003906, -0.006803035736083984, -0.0063571929931640625, -0.005911350250244141, -0.005465507507324219, -0.005019664764404297, -0.004573822021484375, -0.004127979278564453, -0.0036821365356445312, -0.0032362937927246094, -0.0027904510498046875, -0.0023446083068847656, -0.0018987655639648438, -0.0014529228210449219, -0.001007080078125, -0.0005612373352050781, -0.00011539459228515625, 0.0003304481506347656, 0.0007762908935546875, 0.0012221336364746094, 0.0016679763793945312, 0.002113819122314453, 0.002559661865234375, 0.003005504608154297, 0.0034513473510742188, 0.0038971900939941406, 0.0043430328369140625, 0.004788875579833984, 0.005234718322753906, 0.005680561065673828, 0.00612640380859375, 0.006572246551513672, 0.007018089294433594, 0.007463932037353516, 0.007909774780273438, 0.00835561752319336, 0.008801460266113281, 0.009247303009033203, 0.009693145751953125, 0.010138988494873047, 0.010584831237792969, 0.01103067398071289, 0.011476516723632812, 0.011922359466552734, 0.012368202209472656, 0.012814044952392578, 0.0132598876953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 11.0, 19.0, 48.0, 106.0, 188.0, 463.0, 1304.0, 4183296.0, 7034.0, 1103.0, 388.0, 173.0, 82.0, 36.0, 19.0, 12.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003284454345703125, -0.003206104040145874, -0.003127753734588623, -0.003049403429031372, -0.002971053123474121, -0.00289270281791687, -0.002814352512359619, -0.002736002206802368, -0.002657651901245117, -0.002579301595687866, -0.0025009512901306152, -0.0024226009845733643, -0.0023442506790161133, -0.0022659003734588623, -0.0021875500679016113, -0.0021091997623443604, -0.0020308494567871094, -0.0019524991512298584, -0.0018741488456726074, -0.0017957985401153564, -0.0017174482345581055, -0.0016390979290008545, -0.0015607476234436035, -0.0014823973178863525, -0.0014040470123291016, -0.0013256967067718506, -0.0012473464012145996, -0.0011689960956573486, -0.0010906457901000977, -0.0010122954845428467, -0.0009339451789855957, -0.0008555948734283447, -0.0007772445678710938, -0.0006988942623138428, -0.0006205439567565918, -0.0005421936511993408, -0.00046384334564208984, -0.00038549304008483887, -0.0003071427345275879, -0.00022879242897033691, -0.00015044212341308594, -7.209181785583496e-05, 6.258487701416016e-06, 8.460879325866699e-05, 0.00016295909881591797, 0.00024130940437316895, 0.0003196597099304199, 0.0003980100154876709, 0.0004763603210449219, 0.0005547106266021729, 0.0006330609321594238, 0.0007114112377166748, 0.0007897615432739258, 0.0008681118488311768, 0.0009464621543884277, 0.0010248124599456787, 0.0011031627655029297, 0.0011815130710601807, 0.0012598633766174316, 0.0013382136821746826, 0.0014165639877319336, 0.0014949142932891846, 0.0015732645988464355, 0.0016516149044036865, 0.0017299652099609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4054.0, 23.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006580352783203125, -0.0006280094385147095, -0.0005979835987091064, -0.0005679577589035034, -0.0005379319190979004, -0.0005079060792922974, -0.00047788023948669434, -0.0004478543996810913, -0.0004178285598754883, -0.00038780272006988525, -0.0003577768802642822, -0.0003277510404586792, -0.00029772520065307617, -0.00026769936084747314, -0.00023767352104187012, -0.0002076476812362671, -0.00017762184143066406, -0.00014759600162506104, -0.00011757016181945801, -8.754432201385498e-05, -5.751848220825195e-05, -2.7492642402648926e-05, 2.5331974029541016e-06, 3.255903720855713e-05, 6.258487701416016e-05, 9.261071681976318e-05, 0.0001226365566253662, 0.00015266239643096924, 0.00018268823623657227, 0.0002127140760421753, 0.00024273991584777832, 0.00027276575565338135, 0.0003027915954589844, 0.0003328174352645874, 0.00036284327507019043, 0.00039286911487579346, 0.0004228949546813965, 0.0004529207944869995, 0.00048294663429260254, 0.0005129724740982056, 0.0005429983139038086, 0.0005730241537094116, 0.0006030499935150146, 0.0006330758333206177, 0.0006631016731262207, 0.0006931275129318237, 0.0007231533527374268, 0.0007531791925430298, 0.0007832050323486328, 0.0008132308721542358, 0.0008432567119598389, 0.0008732825517654419, 0.0009033083915710449, 0.000933334231376648, 0.000963360071182251, 0.000993385910987854, 0.001023411750793457, 0.00105343759059906, 0.001083463430404663, 0.0011134892702102661, 0.0011435151100158691, 0.0011735409498214722, 0.0012035667896270752, 0.0012335926294326782, 0.0012636184692382812]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 35.0, 833.0, 133.0, 8.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.004044258035719395, -0.003970435354858637, -0.0038966129068285227, -0.003822790225967765, -0.003748967545107007, -0.003675145097076893, -0.003601322416216135, -0.003527499735355377, -0.003453677287325263, -0.003379854606464505, -0.003306032158434391, -0.003232209477573633, -0.0031583867967128754, -0.003084564348682761, -0.0030107416678220034, -0.002936919219791889, -0.0028630965389311314, -0.0027892738580703735, -0.0027154514100402594, -0.0026416287291795015, -0.0025678060483187437, -0.0024939836002886295, -0.0024201609194278717, -0.002346338238567114, -0.002272515557706356, -0.0021986928768455982, -0.002124870428815484, -0.0020510477479547262, -0.0019772250670939684, -0.0019034026190638542, -0.0018295799382030964, -0.0017557573737576604, -0.0016819348093122244, -0.0016081122448667884, -0.0015342895640060306, -0.0014604669995605946, -0.0013866444351151586, -0.0013128218706697226, -0.0012389991898089647, -0.0011651766253635287, -0.0010913540609180927, -0.0010175314964726567, -0.0009437088738195598, -0.0008698862511664629, -0.0007960636867210269, -0.00072224106406793, -0.0006484184414148331, -0.0005745958769693971, -0.0005007731961086392, -0.0004269506025593728, -0.0003531280090101063, -0.0002793053863570094, -0.00020548279280774295, -0.0001316601992584765, -5.783757660537958e-05, 1.598498784005642e-05, 8.980761049315333e-05, 0.0001636302040424198, 0.00023745281214360148, 0.00031127542024478316, 0.0003850980137940496, 0.0004589206073433161, 0.000532743229996413, 0.000606565794441849, 0.0006803884170949459]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 10.0, 10.0, 16.0, 13.0, 25.0, 36.0, 41.0, 38.0, 59.0, 81.0, 106.0, 98.0, 94.0, 63.0, 71.0, 57.0, 44.0, 40.0, 27.0, 16.0, 17.0, 12.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011906623840332031, -0.0011424385011196136, -0.0010942146182060242, -0.0010459907352924347, -0.0009977668523788452, -0.0009495429694652557, -0.0009013190865516663, -0.0008530952036380768, -0.0008048713207244873, -0.0007566474378108978, -0.0007084235548973083, -0.0006601996719837189, -0.0006119757890701294, -0.0005637519061565399, -0.0005155280232429504, -0.00046730414032936096, -0.0004190802574157715, -0.000370856374502182, -0.00032263249158859253, -0.00027440860867500305, -0.00022618472576141357, -0.0001779608428478241, -0.00012973695993423462, -8.151307702064514e-05, -3.3289194107055664e-05, 1.4934688806533813e-05, 6.315857172012329e-05, 0.00011138245463371277, 0.00015960633754730225, 0.00020783022046089172, 0.0002560541033744812, 0.0003042779862880707, 0.00035250186920166016, 0.00040072575211524963, 0.0004489496350288391, 0.0004971735179424286, 0.0005453974008560181, 0.0005936212837696075, 0.000641845166683197, 0.0006900690495967865, 0.000738292932510376, 0.0007865168154239655, 0.0008347406983375549, 0.0008829645812511444, 0.0009311884641647339, 0.0009794123470783234, 0.0010276362299919128, 0.0010758601129055023, 0.0011240839958190918, 0.0011723078787326813, 0.0012205317616462708, 0.0012687556445598602, 0.0013169795274734497, 0.0013652034103870392, 0.0014134272933006287, 0.0014616511762142181, 0.0015098750591278076, 0.001558098942041397, 0.0016063228249549866, 0.001654546707868576, 0.0017027705907821655, 0.001750994473695755, 0.0017992183566093445, 0.001847442239522934, 0.0018956661224365234]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 5.0, 4.0, 6.0, 8.0, 16.0, 16.0, 15.0, 20.0, 42.0, 55.0, 80.0, 103.0, 162.0, 329.0, 629.0, 1255.0, 3148.0, 9977.0, 94080.0, 912470.0, 17974.0, 4546.0, 1687.0, 781.0, 420.0, 243.0, 134.0, 92.0, 76.0, 39.0, 31.0, 27.0, 20.0, 12.0, 9.0, 5.0, 6.0, 10.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.037872314453125, -0.03676462173461914, -0.03565692901611328, -0.03454923629760742, -0.03344154357910156, -0.0323338508605957, -0.031226158142089844, -0.030118465423583984, -0.029010772705078125, -0.027903079986572266, -0.026795387268066406, -0.025687694549560547, -0.024580001831054688, -0.023472309112548828, -0.02236461639404297, -0.02125692367553711, -0.02014923095703125, -0.01904153823852539, -0.01793384552001953, -0.016826152801513672, -0.015718460083007812, -0.014610767364501953, -0.013503074645996094, -0.012395381927490234, -0.011287689208984375, -0.010179996490478516, -0.009072303771972656, -0.007964611053466797, -0.0068569183349609375, -0.005749225616455078, -0.004641532897949219, -0.0035338401794433594, -0.0024261474609375, -0.0013184547424316406, -0.00021076202392578125, 0.0008969306945800781, 0.0020046234130859375, 0.003112316131591797, 0.004220008850097656, 0.005327701568603516, 0.006435394287109375, 0.007543087005615234, 0.008650779724121094, 0.009758472442626953, 0.010866165161132812, 0.011973857879638672, 0.013081550598144531, 0.01418924331665039, 0.01529693603515625, 0.01640462875366211, 0.01751232147216797, 0.018620014190673828, 0.019727706909179688, 0.020835399627685547, 0.021943092346191406, 0.023050785064697266, 0.024158477783203125, 0.025266170501708984, 0.026373863220214844, 0.027481555938720703, 0.028589248657226562, 0.029696941375732422, 0.03080463409423828, 0.03191232681274414, 0.03302001953125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 6.0, 12.0, 12.0, 16.0, 35.0, 76.0, 180.0, 287.0, 168.0, 79.0, 20.0, 15.0, 12.0, 11.0, 6.0, 6.0, 5.0, 7.0, 2.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0152740478515625, -0.014828205108642578, -0.014382362365722656, -0.013936519622802734, -0.013490676879882812, -0.01304483413696289, -0.012598991394042969, -0.012153148651123047, -0.011707305908203125, -0.011261463165283203, -0.010815620422363281, -0.01036977767944336, -0.009923934936523438, -0.009478092193603516, -0.009032249450683594, -0.008586406707763672, -0.00814056396484375, -0.007694721221923828, -0.007248878479003906, -0.006803035736083984, -0.0063571929931640625, -0.005911350250244141, -0.005465507507324219, -0.005019664764404297, -0.004573822021484375, -0.004127979278564453, -0.0036821365356445312, -0.0032362937927246094, -0.0027904510498046875, -0.0023446083068847656, -0.0018987655639648438, -0.0014529228210449219, -0.001007080078125, -0.0005612373352050781, -0.00011539459228515625, 0.0003304481506347656, 0.0007762908935546875, 0.0012221336364746094, 0.0016679763793945312, 0.002113819122314453, 0.002559661865234375, 0.003005504608154297, 0.0034513473510742188, 0.0038971900939941406, 0.0043430328369140625, 0.004788875579833984, 0.005234718322753906, 0.005680561065673828, 0.00612640380859375, 0.006572246551513672, 0.007018089294433594, 0.007463932037353516, 0.007909774780273438, 0.00835561752319336, 0.008801460266113281, 0.009247303009033203, 0.009693145751953125, 0.010138988494873047, 0.010584831237792969, 0.01103067398071289, 0.011476516723632812, 0.011922359466552734, 0.012368202209472656, 0.012814044952392578, 0.0132598876953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 3.0, 8.0, 6.0, 12.0, 13.0, 21.0, 20.0, 21.0, 36.0, 31.0, 26.0, 48.0, 84.0, 152.0, 368.0, 935.0, 4307.0, 1017606.0, 22239.0, 1465.0, 526.0, 210.0, 99.0, 59.0, 43.0, 29.0, 30.0, 29.0, 23.0, 20.0, 13.0, 12.0, 20.0, 4.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050628662109375, -0.04897928237915039, -0.04732990264892578, -0.04568052291870117, -0.04403114318847656, -0.04238176345825195, -0.040732383728027344, -0.039083003997802734, -0.037433624267578125, -0.035784244537353516, -0.034134864807128906, -0.0324854850769043, -0.030836105346679688, -0.029186725616455078, -0.02753734588623047, -0.02588796615600586, -0.02423858642578125, -0.02258920669555664, -0.02093982696533203, -0.019290447235107422, -0.017641067504882812, -0.015991687774658203, -0.014342308044433594, -0.012692928314208984, -0.011043548583984375, -0.009394168853759766, -0.007744789123535156, -0.006095409393310547, -0.0044460296630859375, -0.002796649932861328, -0.0011472702026367188, 0.0005021095275878906, 0.0021514892578125, 0.0038008689880371094, 0.005450248718261719, 0.007099628448486328, 0.008749008178710938, 0.010398387908935547, 0.012047767639160156, 0.013697147369384766, 0.015346527099609375, 0.016995906829833984, 0.018645286560058594, 0.020294666290283203, 0.021944046020507812, 0.023593425750732422, 0.02524280548095703, 0.02689218521118164, 0.02854156494140625, 0.03019094467163086, 0.03184032440185547, 0.03348970413208008, 0.03513908386230469, 0.0367884635925293, 0.038437843322753906, 0.040087223052978516, 0.041736602783203125, 0.043385982513427734, 0.045035362243652344, 0.04668474197387695, 0.04833412170410156, 0.04998350143432617, 0.05163288116455078, 0.05328226089477539, 0.054931640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 3.0, 8.0, 6.0, 12.0, 12.0, 22.0, 20.0, 19.0, 38.0, 29.0, 22.0, 35.0, 36.0, 39.0, 40.0, 48.0, 56.0, 44.0, 49.0, 53.0, 42.0, 41.0, 38.0, 40.0, 37.0, 27.0, 29.0, 28.0, 23.0, 21.0, 13.0, 12.0, 20.0, 4.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028411865234375, -0.027486562728881836, -0.026561260223388672, -0.025635957717895508, -0.024710655212402344, -0.02378535270690918, -0.022860050201416016, -0.02193474769592285, -0.021009445190429688, -0.020084142684936523, -0.01915884017944336, -0.018233537673950195, -0.01730823516845703, -0.016382932662963867, -0.015457630157470703, -0.014532327651977539, -0.013607025146484375, -0.012681722640991211, -0.011756420135498047, -0.010831117630004883, -0.009905815124511719, -0.008980512619018555, -0.00805521011352539, -0.0071299076080322266, -0.0062046051025390625, -0.0052793025970458984, -0.004354000091552734, -0.0034286975860595703, -0.0025033950805664062, -0.0015780925750732422, -0.0006527900695800781, 0.00027251243591308594, 0.00119781494140625, 0.002123117446899414, 0.003048419952392578, 0.003973722457885742, 0.004899024963378906, 0.00582432746887207, 0.006749629974365234, 0.0076749324798583984, 0.008600234985351562, 0.009525537490844727, 0.01045083999633789, 0.011376142501831055, 0.012301445007324219, 0.013226747512817383, 0.014152050018310547, 0.015077352523803711, 0.016002655029296875, 0.01692795753479004, 0.017853260040283203, 0.018778562545776367, 0.01970386505126953, 0.020629167556762695, 0.02155447006225586, 0.022479772567749023, 0.023405075073242188, 0.02433037757873535, 0.025255680084228516, 0.02618098258972168, 0.027106285095214844, 0.028031587600708008, 0.028956890106201172, 0.029882192611694336, 0.0308074951171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 11.0, 7.0, 14.0, 23.0, 28.0, 53.0, 111.0, 214.0, 855.0, 4844.0, 853485.0, 184269.0, 3466.0, 765.0, 177.0, 82.0, 52.0, 23.0, 18.0, 23.0, 16.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3649463653564453e-05, -1.3221986591815948e-05, -1.2794509530067444e-05, -1.236703246831894e-05, -1.1939555406570435e-05, -1.151207834482193e-05, -1.1084601283073425e-05, -1.065712422132492e-05, -1.0229647159576416e-05, -9.802170097827911e-06, -9.374693036079407e-06, -8.947215974330902e-06, -8.519738912582397e-06, -8.092261850833893e-06, -7.664784789085388e-06, -7.2373077273368835e-06, -6.809830665588379e-06, -6.382353603839874e-06, -5.95487654209137e-06, -5.527399480342865e-06, -5.09992241859436e-06, -4.672445356845856e-06, -4.244968295097351e-06, -3.8174912333488464e-06, -3.390014171600342e-06, -2.962537109851837e-06, -2.5350600481033325e-06, -2.107582986354828e-06, -1.6801059246063232e-06, -1.2526288628578186e-06, -8.25151801109314e-07, -3.976747393608093e-07, 2.9802322387695312e-08, 4.5727938413619995e-07, 8.847564458847046e-07, 1.3122335076332092e-06, 1.7397105693817139e-06, 2.1671876311302185e-06, 2.594664692878723e-06, 3.0221417546272278e-06, 3.4496188163757324e-06, 3.877095878124237e-06, 4.304572939872742e-06, 4.732050001621246e-06, 5.159527063369751e-06, 5.587004125118256e-06, 6.01448118686676e-06, 6.441958248615265e-06, 6.8694353103637695e-06, 7.296912372112274e-06, 7.724389433860779e-06, 8.151866495609283e-06, 8.579343557357788e-06, 9.006820619106293e-06, 9.434297680854797e-06, 9.861774742603302e-06, 1.0289251804351807e-05, 1.0716728866100311e-05, 1.1144205927848816e-05, 1.157168298959732e-05, 1.1999160051345825e-05, 1.242663711309433e-05, 1.2854114174842834e-05, 1.3281591236591339e-05, 1.3709068298339844e-05]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 7.0, 9.0, 11.0, 9.0, 16.0, 18.0, 31.0, 29.0, 51.0, 82.0, 95.0, 84.0, 138.0, 102.0, 71.0, 75.0, 37.0, 36.0, 21.0, 21.0, 7.0, 9.0, 10.0, 12.0, 8.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.616115570068359e-06, -6.410293281078339e-06, -6.204470992088318e-06, -5.998648703098297e-06, -5.792826414108276e-06, -5.587004125118256e-06, -5.381181836128235e-06, -5.175359547138214e-06, -4.969537258148193e-06, -4.763714969158173e-06, -4.557892680168152e-06, -4.352070391178131e-06, -4.14624810218811e-06, -3.94042581319809e-06, -3.734603524208069e-06, -3.528781235218048e-06, -3.3229589462280273e-06, -3.1171366572380066e-06, -2.911314368247986e-06, -2.705492079257965e-06, -2.4996697902679443e-06, -2.2938475012779236e-06, -2.088025212287903e-06, -1.882202923297882e-06, -1.6763806343078613e-06, -1.4705583453178406e-06, -1.2647360563278198e-06, -1.058913767337799e-06, -8.530914783477783e-07, -6.472691893577576e-07, -4.414469003677368e-07, -2.3562461137771606e-07, -2.9802322387695312e-08, 1.7601996660232544e-07, 3.818422555923462e-07, 5.876645445823669e-07, 7.934868335723877e-07, 9.993091225624084e-07, 1.2051314115524292e-06, 1.41095370054245e-06, 1.6167759895324707e-06, 1.8225982785224915e-06, 2.028420567512512e-06, 2.234242856502533e-06, 2.4400651454925537e-06, 2.6458874344825745e-06, 2.8517097234725952e-06, 3.057532012462616e-06, 3.2633543014526367e-06, 3.4691765904426575e-06, 3.6749988794326782e-06, 3.880821168422699e-06, 4.08664345741272e-06, 4.2924657464027405e-06, 4.498288035392761e-06, 4.704110324382782e-06, 4.909932613372803e-06, 5.1157549023628235e-06, 5.321577191352844e-06, 5.527399480342865e-06, 5.733221769332886e-06, 5.9390440583229065e-06, 6.144866347312927e-06, 6.350688636302948e-06, 6.556510925292969e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 12.0, 10.0, 7.0, 11.0, 17.0, 37.0, 54.0, 179.0, 601.0, 111355.0, 935243.0, 668.0, 172.0, 61.0, 45.0, 22.0, 14.0, 8.0, 9.0, 5.0, 10.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5928020477294922e-05, -2.480205148458481e-05, -2.3676082491874695e-05, -2.255011349916458e-05, -2.1424144506454468e-05, -2.0298175513744354e-05, -1.917220652103424e-05, -1.8046237528324127e-05, -1.6920268535614014e-05, -1.57942995429039e-05, -1.4668330550193787e-05, -1.3542361557483673e-05, -1.241639256477356e-05, -1.1290423572063446e-05, -1.0164454579353333e-05, -9.038485586643219e-06, -7.912516593933105e-06, -6.786547601222992e-06, -5.660578608512878e-06, -4.534609615802765e-06, -3.4086406230926514e-06, -2.282671630382538e-06, -1.1567026376724243e-06, -3.073364496231079e-08, 1.0952353477478027e-06, 2.2212043404579163e-06, 3.3471733331680298e-06, 4.473142325878143e-06, 5.599111318588257e-06, 6.72508031129837e-06, 7.851049304008484e-06, 8.977018296718597e-06, 1.0102987289428711e-05, 1.1228956282138824e-05, 1.2354925274848938e-05, 1.3480894267559052e-05, 1.4606863260269165e-05, 1.573283225297928e-05, 1.6858801245689392e-05, 1.7984770238399506e-05, 1.911073923110962e-05, 2.0236708223819733e-05, 2.1362677216529846e-05, 2.248864620923996e-05, 2.3614615201950073e-05, 2.4740584194660187e-05, 2.58665531873703e-05, 2.6992522180080414e-05, 2.8118491172790527e-05, 2.924446016550064e-05, 3.0370429158210754e-05, 3.149639815092087e-05, 3.262236714363098e-05, 3.3748336136341095e-05, 3.487430512905121e-05, 3.600027412176132e-05, 3.7126243114471436e-05, 3.825221210718155e-05, 3.937818109989166e-05, 4.0504150092601776e-05, 4.163011908531189e-05, 4.2756088078022e-05, 4.388205707073212e-05, 4.500802606344223e-05, 4.6133995056152344e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 10.0, 8.0, 7.0, 10.0, 12.0, 25.0, 18.0, 43.0, 75.0, 95.0, 476.0, 58.0, 40.0, 28.0, 29.0, 18.0, 10.0, 7.0, 7.0, 4.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4543533325195312e-05, -1.3912096619606018e-05, -1.3280659914016724e-05, -1.264922320842743e-05, -1.2017786502838135e-05, -1.138634979724884e-05, -1.0754913091659546e-05, -1.0123476386070251e-05, -9.492039680480957e-06, -8.860602974891663e-06, -8.229166269302368e-06, -7.597729563713074e-06, -6.966292858123779e-06, -6.334856152534485e-06, -5.7034194469451904e-06, -5.071982741355896e-06, -4.4405460357666016e-06, -3.809109330177307e-06, -3.1776726245880127e-06, -2.5462359189987183e-06, -1.914799213409424e-06, -1.2833625078201294e-06, -6.51925802230835e-07, -2.0489096641540527e-08, 6.109476089477539e-07, 1.2423843145370483e-06, 1.8738210201263428e-06, 2.505257725715637e-06, 3.1366944313049316e-06, 3.768131136894226e-06, 4.3995678424835205e-06, 5.031004548072815e-06, 5.662441253662109e-06, 6.293877959251404e-06, 6.925314664840698e-06, 7.556751370429993e-06, 8.188188076019287e-06, 8.819624781608582e-06, 9.451061487197876e-06, 1.008249819278717e-05, 1.0713934898376465e-05, 1.134537160396576e-05, 1.1976808309555054e-05, 1.2608245015144348e-05, 1.3239681720733643e-05, 1.3871118426322937e-05, 1.4502555131912231e-05, 1.5133991837501526e-05, 1.576542854309082e-05, 1.6396865248680115e-05, 1.702830195426941e-05, 1.7659738659858704e-05, 1.8291175365447998e-05, 1.8922612071037292e-05, 1.9554048776626587e-05, 2.018548548221588e-05, 2.0816922187805176e-05, 2.144835889339447e-05, 2.2079795598983765e-05, 2.271123230457306e-05, 2.3342669010162354e-05, 2.3974105715751648e-05, 2.4605542421340942e-05, 2.5236979126930237e-05, 2.586841583251953e-05]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 5.0, 20.0, 215.0, 729.0, 40.0, 4.0, 2.0, 1.0], "bins": [-0.4111841917037964, -0.40424156188964844, -0.3972989618778229, -0.3903563320636749, -0.38341373205184937, -0.3764711022377014, -0.36952847242355347, -0.3625858724117279, -0.35564324259757996, -0.348700612783432, -0.34175801277160645, -0.3348153829574585, -0.32787275314331055, -0.320930153131485, -0.31398752331733704, -0.3070449233055115, -0.3001022934913635, -0.2931596636772156, -0.28621706366539, -0.27927443385124207, -0.2723318338394165, -0.26538920402526855, -0.2584465742111206, -0.25150397419929504, -0.2445613443851471, -0.23761872947216034, -0.23067611455917358, -0.22373348474502563, -0.21679086983203888, -0.20984825491905212, -0.20290562510490417, -0.19596301019191742, -0.18902039527893066, -0.1820777803659439, -0.17513516545295715, -0.1681925356388092, -0.16124992072582245, -0.1543073058128357, -0.14736467599868774, -0.140422061085701, -0.13347944617271423, -0.12653683125972748, -0.11959420889616013, -0.11265158653259277, -0.10570897161960602, -0.09876635670661926, -0.09182373434305191, -0.08488111197948456, -0.0779384970664978, -0.07099588215351105, -0.0640532597899437, -0.05711064115166664, -0.05016802251338959, -0.043225403875112534, -0.03628278523683548, -0.029340166598558426, -0.02239755168557167, -0.015454933047294617, -0.008512314409017563, -0.001569695770740509, 0.005372922867536545, 0.012315541505813599, 0.019258160144090652, 0.026200778782367706, 0.03314339742064476]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 7.0, 2.0, 2.0, 6.0, 9.0, 9.0, 14.0, 11.0, 21.0, 14.0, 17.0, 25.0, 25.0, 25.0, 30.0, 31.0, 49.0, 42.0, 35.0, 68.0, 53.0, 54.0, 60.0, 48.0, 46.0, 50.0, 40.0, 30.0, 35.0, 34.0, 21.0, 20.0, 19.0, 14.0, 13.0, 5.0, 3.0, 8.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10456359386444092, -0.1002875566482544, -0.09601151198148727, -0.09173547476530075, -0.08745943009853363, -0.0831833928823471, -0.07890735566616058, -0.07463131844997406, -0.07035527378320694, -0.06607923656702042, -0.061803191900253296, -0.05752715468406677, -0.05325111374258995, -0.04897507280111313, -0.044699035584926605, -0.04042299464344978, -0.03614695370197296, -0.03187091276049614, -0.027594873681664467, -0.023318834602832794, -0.019042793661355972, -0.01476675271987915, -0.010490713641047478, -0.006214674562215805, -0.0019386336207389832, 0.002337406389415264, 0.006613446399569511, 0.010889486409723759, 0.015165526419878006, 0.019441567361354828, 0.0237176064401865, 0.027993645519018173, 0.032269686460494995, 0.03654572740197182, 0.04082176834344864, 0.04509780555963516, 0.049373846501111984, 0.053649887442588806, 0.05792592465877533, 0.06220196560025215, 0.06647800654172897, 0.0707540437579155, 0.07503008842468262, 0.07930612564086914, 0.08358216285705566, 0.08785820752382278, 0.09213424474000931, 0.09641028940677643, 0.10068632662296295, 0.10496236383914948, 0.1092384085059166, 0.11351444572210312, 0.11779049038887024, 0.12206652760505676, 0.1263425648212433, 0.1306186020374298, 0.13489463925361633, 0.13917067646980286, 0.14344671368598938, 0.1477227658033371, 0.15199880301952362, 0.15627484023571014, 0.16055087745189667, 0.1648269146680832, 0.1691029667854309]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 1.0, 2.0, 6.0, 7.0, 7.0, 7.0, 12.0, 15.0, 21.0, 21.0, 23.0, 31.0, 46.0, 47.0, 92.0, 116.0, 220.0, 453.0, 1255.0, 52026.0, 4136978.0, 1758.0, 475.0, 228.0, 128.0, 68.0, 54.0, 45.0, 33.0, 25.0, 17.0, 11.0, 12.0, 11.0, 6.0, 4.0, 5.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.15865707397460938, -0.15386199951171875, -0.14906692504882812, -0.1442718505859375, -0.13947677612304688, -0.13468170166015625, -0.12988662719726562, -0.125091552734375, -0.12029647827148438, -0.11550140380859375, -0.11070632934570312, -0.1059112548828125, -0.10111618041992188, -0.09632110595703125, -0.09152603149414062, -0.08673095703125, -0.08193588256835938, -0.07714080810546875, -0.07234573364257812, -0.0675506591796875, -0.06275558471679688, -0.05796051025390625, -0.053165435791015625, -0.048370361328125, -0.043575286865234375, -0.03878021240234375, -0.033985137939453125, -0.0291900634765625, -0.024394989013671875, -0.01959991455078125, -0.014804840087890625, -0.010009765625, -0.005214691162109375, -0.00041961669921875, 0.004375457763671875, 0.0091705322265625, 0.013965606689453125, 0.01876068115234375, 0.023555755615234375, 0.028350830078125, 0.033145904541015625, 0.03794097900390625, 0.042736053466796875, 0.0475311279296875, 0.052326202392578125, 0.05712127685546875, 0.061916351318359375, 0.06671142578125, 0.07150650024414062, 0.07630157470703125, 0.08109664916992188, 0.0858917236328125, 0.09068679809570312, 0.09548187255859375, 0.10027694702148438, 0.105072021484375, 0.10986709594726562, 0.11466217041015625, 0.11945724487304688, 0.1242523193359375, 0.12904739379882812, 0.13384246826171875, 0.13863754272460938, 0.1434326171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 4.0, 5.0, 7.0, 12.0, 12.0, 18.0, 40.0, 78.0, 206.0, 277.0, 159.0, 65.0, 19.0, 15.0, 13.0, 10.0, 6.0, 5.0, 8.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01520538330078125, -0.014760255813598633, -0.014315128326416016, -0.013870000839233398, -0.013424873352050781, -0.012979745864868164, -0.012534618377685547, -0.01208949089050293, -0.011644363403320312, -0.011199235916137695, -0.010754108428955078, -0.010308980941772461, -0.009863853454589844, -0.009418725967407227, -0.00897359848022461, -0.008528470993041992, -0.008083343505859375, -0.007638216018676758, -0.007193088531494141, -0.0067479610443115234, -0.006302833557128906, -0.005857706069946289, -0.005412578582763672, -0.004967451095581055, -0.0045223236083984375, -0.00407719612121582, -0.003632068634033203, -0.003186941146850586, -0.0027418136596679688, -0.0022966861724853516, -0.0018515586853027344, -0.0014064311981201172, -0.0009613037109375, -0.0005161762237548828, -7.104873657226562e-05, 0.00037407875061035156, 0.0008192062377929688, 0.001264333724975586, 0.0017094612121582031, 0.0021545886993408203, 0.0025997161865234375, 0.0030448436737060547, 0.003489971160888672, 0.003935098648071289, 0.004380226135253906, 0.0048253536224365234, 0.005270481109619141, 0.005715608596801758, 0.006160736083984375, 0.006605863571166992, 0.007050991058349609, 0.0074961185455322266, 0.007941246032714844, 0.008386373519897461, 0.008831501007080078, 0.009276628494262695, 0.009721755981445312, 0.01016688346862793, 0.010612010955810547, 0.011057138442993164, 0.011502265930175781, 0.011947393417358398, 0.012392520904541016, 0.012837648391723633, 0.01328277587890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 9.0, 8.0, 14.0, 16.0, 18.0, 33.0, 36.0, 52.0, 80.0, 148.0, 639.0, 5418.0, 4130820.0, 54168.0, 2111.0, 328.0, 99.0, 55.0, 37.0, 38.0, 29.0, 22.0, 17.0, 18.0, 11.0, 8.0, 7.0, 6.0, 2.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.045745849609375, -0.04426145553588867, -0.042777061462402344, -0.041292667388916016, -0.03980827331542969, -0.03832387924194336, -0.03683948516845703, -0.0353550910949707, -0.033870697021484375, -0.03238630294799805, -0.03090190887451172, -0.02941751480102539, -0.027933120727539062, -0.026448726654052734, -0.024964332580566406, -0.023479938507080078, -0.02199554443359375, -0.020511150360107422, -0.019026756286621094, -0.017542362213134766, -0.016057968139648438, -0.01457357406616211, -0.013089179992675781, -0.011604785919189453, -0.010120391845703125, -0.008635997772216797, -0.007151603698730469, -0.005667209625244141, -0.0041828155517578125, -0.0026984214782714844, -0.0012140274047851562, 0.0002703666687011719, 0.0017547607421875, 0.003239154815673828, 0.004723548889160156, 0.006207942962646484, 0.0076923370361328125, 0.00917673110961914, 0.010661125183105469, 0.012145519256591797, 0.013629913330078125, 0.015114307403564453, 0.01659870147705078, 0.01808309555053711, 0.019567489624023438, 0.021051883697509766, 0.022536277770996094, 0.024020671844482422, 0.02550506591796875, 0.026989459991455078, 0.028473854064941406, 0.029958248138427734, 0.03144264221191406, 0.03292703628540039, 0.03441143035888672, 0.03589582443237305, 0.037380218505859375, 0.0388646125793457, 0.04034900665283203, 0.04183340072631836, 0.04331779479980469, 0.044802188873291016, 0.046286582946777344, 0.04777097702026367, 0.04925537109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 5.0, 8.0, 11.0, 8.0, 10.0, 22.0, 88.0, 250.0, 1091.0, 2056.0, 311.0, 94.0, 38.0, 13.0, 9.0, 6.0, 9.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.025054931640625, -0.02432107925415039, -0.02358722686767578, -0.022853374481201172, -0.022119522094726562, -0.021385669708251953, -0.020651817321777344, -0.019917964935302734, -0.019184112548828125, -0.018450260162353516, -0.017716407775878906, -0.016982555389404297, -0.016248703002929688, -0.015514850616455078, -0.014780998229980469, -0.01404714584350586, -0.01331329345703125, -0.01257944107055664, -0.011845588684082031, -0.011111736297607422, -0.010377883911132812, -0.009644031524658203, -0.008910179138183594, -0.008176326751708984, -0.007442474365234375, -0.006708621978759766, -0.005974769592285156, -0.005240917205810547, -0.0045070648193359375, -0.003773212432861328, -0.0030393600463867188, -0.0023055076599121094, -0.0015716552734375, -0.0008378028869628906, -0.00010395050048828125, 0.0006299018859863281, 0.0013637542724609375, 0.002097606658935547, 0.0028314590454101562, 0.0035653114318847656, 0.004299163818359375, 0.005033016204833984, 0.005766868591308594, 0.006500720977783203, 0.0072345733642578125, 0.007968425750732422, 0.008702278137207031, 0.00943613052368164, 0.01016998291015625, 0.01090383529663086, 0.011637687683105469, 0.012371540069580078, 0.013105392456054688, 0.013839244842529297, 0.014573097229003906, 0.015306949615478516, 0.016040802001953125, 0.016774654388427734, 0.017508506774902344, 0.018242359161376953, 0.018976211547851562, 0.019710063934326172, 0.02044391632080078, 0.02117776870727539, 0.02191162109375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 12.0, 743.0, 260.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11418446153402328, -0.10598792880773544, -0.0977913960814476, -0.08959487080574036, -0.08139833807945251, -0.07320180535316467, -0.06500527262687683, -0.05680873990058899, -0.04861220717430115, -0.040415674448013306, -0.032219141721725464, -0.02402261272072792, -0.01582607999444008, -0.007629547268152237, 0.0005669817328453064, 0.008763514459133148, 0.01696004718542099, 0.025156579911708832, 0.033353112637996674, 0.04154964163899422, 0.04974617436528206, 0.0579427070915699, 0.06613923609256744, 0.07433576881885529, 0.08253230154514313, 0.09072883427143097, 0.09892536699771881, 0.10712189972400665, 0.1153184324502945, 0.12351496517658234, 0.13171148300170898, 0.13990801572799683, 0.14810457825660706, 0.1563011109828949, 0.16449764370918274, 0.17269417643547058, 0.18089070916175842, 0.18908724188804626, 0.1972837746143341, 0.20548030734062195, 0.2136768400669098, 0.22187337279319763, 0.23006990551948547, 0.23826643824577332, 0.24646297097206116, 0.254659503698349, 0.26285603642463684, 0.2710525691509247, 0.27924907207489014, 0.287445604801178, 0.2956421375274658, 0.30383867025375366, 0.3120352029800415, 0.32023173570632935, 0.3284282684326172, 0.33662480115890503, 0.34482133388519287, 0.3530178666114807, 0.36121439933776855, 0.3694109320640564, 0.37760746479034424, 0.3858039975166321, 0.3940005302429199, 0.40219706296920776, 0.4103935956954956]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 10.0, 5.0, 7.0, 6.0, 14.0, 18.0, 15.0, 20.0, 18.0, 25.0, 30.0, 28.0, 32.0, 39.0, 41.0, 44.0, 35.0, 38.0, 47.0, 58.0, 49.0, 49.0, 46.0, 42.0, 47.0, 35.0, 34.0, 33.0, 14.0, 18.0, 25.0, 17.0, 11.0, 9.0, 9.0, 7.0, 3.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05383265018463135, -0.05201491340994835, -0.05019717663526535, -0.04837943986058235, -0.04656170308589935, -0.044743966311216354, -0.042926229536533356, -0.04110849276185036, -0.03929075598716736, -0.03747301921248436, -0.03565528243780136, -0.03383754566311836, -0.032019808888435364, -0.030202072113752365, -0.028384335339069366, -0.026566598564386368, -0.02474886178970337, -0.02293112501502037, -0.021113388240337372, -0.019295651465654373, -0.017477914690971375, -0.015660177916288376, -0.013842441141605377, -0.012024704366922379, -0.01020696759223938, -0.008389230817556381, -0.006571494042873383, -0.004753757268190384, -0.0029360204935073853, -0.0011182837188243866, 0.0006994530558586121, 0.0025171898305416107, 0.004334926605224609, 0.006152663379907608, 0.007970400154590607, 0.009788136929273605, 0.011605873703956604, 0.013423610478639603, 0.015241347253322601, 0.0170590840280056, 0.0188768208026886, 0.020694557577371597, 0.022512294352054596, 0.024330031126737595, 0.026147767901420593, 0.027965504676103592, 0.02978324145078659, 0.03160097822546959, 0.03341871500015259, 0.03523645177483559, 0.037054188549518585, 0.038871925324201584, 0.04068966209888458, 0.04250739887356758, 0.04432513564825058, 0.04614287242293358, 0.04796060919761658, 0.049778345972299576, 0.051596082746982574, 0.05341381952166557, 0.05523155629634857, 0.05704929307103157, 0.05886702984571457, 0.06068476662039757, 0.06250250339508057]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 11.0, 13.0, 22.0, 25.0, 18.0, 20.0, 44.0, 53.0, 69.0, 102.0, 137.0, 156.0, 274.0, 358.0, 550.0, 798.0, 1300.0, 2337.0, 4993.0, 15911.0, 747332.0, 249048.0, 14093.0, 4733.0, 2308.0, 1285.0, 846.0, 518.0, 353.0, 222.0, 154.0, 139.0, 94.0, 64.0, 36.0, 33.0, 21.0, 23.0, 15.0, 11.0, 5.0, 5.0, 10.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0631103515625, -0.061003684997558594, -0.05889701843261719, -0.05679035186767578, -0.054683685302734375, -0.05257701873779297, -0.05047035217285156, -0.048363685607910156, -0.04625701904296875, -0.044150352478027344, -0.04204368591308594, -0.03993701934814453, -0.037830352783203125, -0.03572368621826172, -0.03361701965332031, -0.031510353088378906, -0.0294036865234375, -0.027297019958496094, -0.025190353393554688, -0.02308368682861328, -0.020977020263671875, -0.01887035369873047, -0.016763687133789062, -0.014657020568847656, -0.01255035400390625, -0.010443687438964844, -0.008337020874023438, -0.006230354309082031, -0.004123687744140625, -0.0020170211791992188, 8.96453857421875e-05, 0.0021963119506835938, 0.004302978515625, 0.006409645080566406, 0.008516311645507812, 0.010622978210449219, 0.012729644775390625, 0.014836311340332031, 0.016942977905273438, 0.019049644470214844, 0.02115631103515625, 0.023262977600097656, 0.025369644165039062, 0.02747631072998047, 0.029582977294921875, 0.03168964385986328, 0.03379631042480469, 0.035902976989746094, 0.0380096435546875, 0.040116310119628906, 0.04222297668457031, 0.04432964324951172, 0.046436309814453125, 0.04854297637939453, 0.05064964294433594, 0.052756309509277344, 0.05486297607421875, 0.056969642639160156, 0.05907630920410156, 0.06118297576904297, 0.06328964233398438, 0.06539630889892578, 0.06750297546386719, 0.0696096420288086, 0.07171630859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 2.0, 5.0, 6.0, 6.0, 12.0, 12.0, 18.0, 38.0, 75.0, 199.0, 280.0, 165.0, 67.0, 19.0, 15.0, 14.0, 9.0, 7.0, 5.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01519012451171875, -0.014745831489562988, -0.014301538467407227, -0.013857245445251465, -0.013412952423095703, -0.012968659400939941, -0.01252436637878418, -0.012080073356628418, -0.011635780334472656, -0.011191487312316895, -0.010747194290161133, -0.010302901268005371, -0.00985860824584961, -0.009414315223693848, -0.008970022201538086, -0.008525729179382324, -0.008081436157226562, -0.007637143135070801, -0.007192850112915039, -0.006748557090759277, -0.006304264068603516, -0.005859971046447754, -0.005415678024291992, -0.0049713850021362305, -0.004527091979980469, -0.004082798957824707, -0.0036385059356689453, -0.0031942129135131836, -0.002749919891357422, -0.00230562686920166, -0.0018613338470458984, -0.0014170408248901367, -0.000972747802734375, -0.0005284547805786133, -8.416175842285156e-05, 0.00036013126373291016, 0.0008044242858886719, 0.0012487173080444336, 0.0016930103302001953, 0.002137303352355957, 0.0025815963745117188, 0.0030258893966674805, 0.003470182418823242, 0.003914475440979004, 0.004358768463134766, 0.004803061485290527, 0.005247354507446289, 0.005691647529602051, 0.0061359405517578125, 0.006580233573913574, 0.007024526596069336, 0.007468819618225098, 0.00791311264038086, 0.008357405662536621, 0.008801698684692383, 0.009245991706848145, 0.009690284729003906, 0.010134577751159668, 0.01057887077331543, 0.011023163795471191, 0.011467456817626953, 0.011911749839782715, 0.012356042861938477, 0.012800335884094238, 0.01324462890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 8.0, 12.0, 18.0, 10.0, 13.0, 24.0, 29.0, 35.0, 49.0, 67.0, 76.0, 70.0, 120.0, 172.0, 270.0, 407.0, 788.0, 2243.0, 77426.0, 959479.0, 4584.0, 1002.0, 516.0, 320.0, 184.0, 140.0, 104.0, 66.0, 60.0, 45.0, 33.0, 44.0, 28.0, 22.0, 20.0, 15.0, 7.0, 11.0, 2.0, 8.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.059295654296875, -0.057393550872802734, -0.05549144744873047, -0.0535893440246582, -0.05168724060058594, -0.04978513717651367, -0.047883033752441406, -0.04598093032836914, -0.044078826904296875, -0.04217672348022461, -0.040274620056152344, -0.03837251663208008, -0.03647041320800781, -0.03456830978393555, -0.03266620635986328, -0.030764102935791016, -0.02886199951171875, -0.026959896087646484, -0.02505779266357422, -0.023155689239501953, -0.021253585815429688, -0.019351482391357422, -0.017449378967285156, -0.01554727554321289, -0.013645172119140625, -0.01174306869506836, -0.009840965270996094, -0.007938861846923828, -0.0060367584228515625, -0.004134654998779297, -0.0022325515747070312, -0.0003304481506347656, 0.0015716552734375, 0.0034737586975097656, 0.005375862121582031, 0.007277965545654297, 0.009180068969726562, 0.011082172393798828, 0.012984275817871094, 0.01488637924194336, 0.016788482666015625, 0.01869058609008789, 0.020592689514160156, 0.022494792938232422, 0.024396896362304688, 0.026298999786376953, 0.02820110321044922, 0.030103206634521484, 0.03200531005859375, 0.033907413482666016, 0.03580951690673828, 0.03771162033081055, 0.03961372375488281, 0.04151582717895508, 0.043417930603027344, 0.04532003402709961, 0.047222137451171875, 0.04912424087524414, 0.051026344299316406, 0.05292844772338867, 0.05483055114746094, 0.0567326545715332, 0.05863475799560547, 0.060536861419677734, 0.06243896484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 7.0, 7.0, 11.0, 12.0, 6.0, 8.0, 16.0, 16.0, 18.0, 22.0, 31.0, 25.0, 24.0, 31.0, 39.0, 34.0, 54.0, 42.0, 43.0, 35.0, 39.0, 56.0, 43.0, 45.0, 37.0, 38.0, 35.0, 32.0, 22.0, 19.0, 23.0, 18.0, 22.0, 18.0, 13.0, 12.0, 11.0, 6.0, 9.0, 2.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0260467529296875, -0.025211572647094727, -0.024376392364501953, -0.02354121208190918, -0.022706031799316406, -0.021870851516723633, -0.02103567123413086, -0.020200490951538086, -0.019365310668945312, -0.01853013038635254, -0.017694950103759766, -0.016859769821166992, -0.01602458953857422, -0.015189409255981445, -0.014354228973388672, -0.013519048690795898, -0.012683868408203125, -0.011848688125610352, -0.011013507843017578, -0.010178327560424805, -0.009343147277832031, -0.008507966995239258, -0.007672786712646484, -0.006837606430053711, -0.0060024261474609375, -0.005167245864868164, -0.004332065582275391, -0.003496885299682617, -0.0026617050170898438, -0.0018265247344970703, -0.0009913444519042969, -0.00015616416931152344, 0.00067901611328125, 0.0015141963958740234, 0.002349376678466797, 0.0031845569610595703, 0.004019737243652344, 0.004854917526245117, 0.005690097808837891, 0.006525278091430664, 0.0073604583740234375, 0.008195638656616211, 0.009030818939208984, 0.009865999221801758, 0.010701179504394531, 0.011536359786987305, 0.012371540069580078, 0.013206720352172852, 0.014041900634765625, 0.014877080917358398, 0.015712261199951172, 0.016547441482543945, 0.01738262176513672, 0.018217802047729492, 0.019052982330322266, 0.01988816261291504, 0.020723342895507812, 0.021558523178100586, 0.02239370346069336, 0.023228883743286133, 0.024064064025878906, 0.02489924430847168, 0.025734424591064453, 0.026569604873657227, 0.02740478515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 15.0, 10.0, 18.0, 28.0, 50.0, 69.0, 124.0, 234.0, 553.0, 1557.0, 7168.0, 963003.0, 69474.0, 4251.0, 1120.0, 387.0, 172.0, 113.0, 79.0, 42.0, 34.0, 10.0, 8.0, 13.0, 4.0, 3.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.733966827392578e-05, -5.5480748414993286e-05, -5.362182855606079e-05, -5.1762908697128296e-05, -4.99039888381958e-05, -4.8045068979263306e-05, -4.618614912033081e-05, -4.4327229261398315e-05, -4.246830940246582e-05, -4.0609389543533325e-05, -3.875046968460083e-05, -3.6891549825668335e-05, -3.503262996673584e-05, -3.3173710107803345e-05, -3.131479024887085e-05, -2.9455870389938354e-05, -2.759695053100586e-05, -2.5738030672073364e-05, -2.387911081314087e-05, -2.2020190954208374e-05, -2.016127109527588e-05, -1.8302351236343384e-05, -1.644343137741089e-05, -1.4584511518478394e-05, -1.2725591659545898e-05, -1.0866671800613403e-05, -9.007751941680908e-06, -7.148832082748413e-06, -5.289912223815918e-06, -3.430992364883423e-06, -1.5720725059509277e-06, 2.868473529815674e-07, 2.1457672119140625e-06, 4.004687070846558e-06, 5.863606929779053e-06, 7.722526788711548e-06, 9.581446647644043e-06, 1.1440366506576538e-05, 1.3299286365509033e-05, 1.5158206224441528e-05, 1.7017126083374023e-05, 1.887604594230652e-05, 2.0734965801239014e-05, 2.259388566017151e-05, 2.4452805519104004e-05, 2.63117253780365e-05, 2.8170645236968994e-05, 3.002956509590149e-05, 3.1888484954833984e-05, 3.374740481376648e-05, 3.5606324672698975e-05, 3.746524453163147e-05, 3.9324164390563965e-05, 4.118308424949646e-05, 4.3042004108428955e-05, 4.490092396736145e-05, 4.6759843826293945e-05, 4.861876368522644e-05, 5.0477683544158936e-05, 5.233660340309143e-05, 5.4195523262023926e-05, 5.605444312095642e-05, 5.7913362979888916e-05, 5.977228283882141e-05, 6.16312026977539e-05]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 3.0, 6.0, 4.0, 11.0, 13.0, 18.0, 23.0, 35.0, 50.0, 75.0, 139.0, 225.0, 133.0, 88.0, 55.0, 29.0, 21.0, 19.0, 16.0, 10.0, 10.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1517276763916016e-05, -2.0891427993774414e-05, -2.0265579223632812e-05, -1.963973045349121e-05, -1.901388168334961e-05, -1.8388032913208008e-05, -1.7762184143066406e-05, -1.7136335372924805e-05, -1.6510486602783203e-05, -1.58846378326416e-05, -1.52587890625e-05, -1.4632940292358398e-05, -1.4007091522216797e-05, -1.3381242752075195e-05, -1.2755393981933594e-05, -1.2129545211791992e-05, -1.150369644165039e-05, -1.0877847671508789e-05, -1.0251998901367188e-05, -9.626150131225586e-06, -9.000301361083984e-06, -8.374452590942383e-06, -7.748603820800781e-06, -7.12275505065918e-06, -6.496906280517578e-06, -5.8710575103759766e-06, -5.245208740234375e-06, -4.6193599700927734e-06, -3.993511199951172e-06, -3.3676624298095703e-06, -2.7418136596679688e-06, -2.115964889526367e-06, -1.4901161193847656e-06, -8.642673492431641e-07, -2.384185791015625e-07, 3.8743019104003906e-07, 1.0132789611816406e-06, 1.6391277313232422e-06, 2.2649765014648438e-06, 2.8908252716064453e-06, 3.516674041748047e-06, 4.1425228118896484e-06, 4.76837158203125e-06, 5.3942203521728516e-06, 6.020069122314453e-06, 6.645917892456055e-06, 7.271766662597656e-06, 7.897615432739258e-06, 8.52346420288086e-06, 9.149312973022461e-06, 9.775161743164062e-06, 1.0401010513305664e-05, 1.1026859283447266e-05, 1.1652708053588867e-05, 1.2278556823730469e-05, 1.290440559387207e-05, 1.3530254364013672e-05, 1.4156103134155273e-05, 1.4781951904296875e-05, 1.5407800674438477e-05, 1.6033649444580078e-05, 1.665949821472168e-05, 1.728534698486328e-05, 1.7911195755004883e-05, 1.8537044525146484e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 4.0, 15.0, 14.0, 15.0, 19.0, 28.0, 52.0, 92.0, 122.0, 259.0, 635.0, 8907.0, 1035424.0, 2009.0, 426.0, 211.0, 99.0, 52.0, 36.0, 39.0, 19.0, 18.0, 20.0, 6.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8710575103759766e-05, -5.647912621498108e-05, -5.424767732620239e-05, -5.2016228437423706e-05, -4.978477954864502e-05, -4.755333065986633e-05, -4.5321881771087646e-05, -4.309043288230896e-05, -4.0858983993530273e-05, -3.862753510475159e-05, -3.63960862159729e-05, -3.4164637327194214e-05, -3.193318843841553e-05, -2.970173954963684e-05, -2.7470290660858154e-05, -2.5238841772079468e-05, -2.300739288330078e-05, -2.0775943994522095e-05, -1.8544495105743408e-05, -1.631304621696472e-05, -1.4081597328186035e-05, -1.1850148439407349e-05, -9.618699550628662e-06, -7.387250661849976e-06, -5.155801773071289e-06, -2.9243528842926025e-06, -6.92903995513916e-07, 1.5385448932647705e-06, 3.769993782043457e-06, 6.0014426708221436e-06, 8.23289155960083e-06, 1.0464340448379517e-05, 1.2695789337158203e-05, 1.492723822593689e-05, 1.7158687114715576e-05, 1.9390136003494263e-05, 2.162158489227295e-05, 2.3853033781051636e-05, 2.6084482669830322e-05, 2.831593155860901e-05, 3.0547380447387695e-05, 3.277882933616638e-05, 3.501027822494507e-05, 3.7241727113723755e-05, 3.947317600250244e-05, 4.170462489128113e-05, 4.3936073780059814e-05, 4.61675226688385e-05, 4.839897155761719e-05, 5.0630420446395874e-05, 5.286186933517456e-05, 5.509331822395325e-05, 5.7324767112731934e-05, 5.955621600151062e-05, 6.17876648902893e-05, 6.401911377906799e-05, 6.625056266784668e-05, 6.848201155662537e-05, 7.071346044540405e-05, 7.294490933418274e-05, 7.517635822296143e-05, 7.740780711174011e-05, 7.96392560005188e-05, 8.187070488929749e-05, 8.410215377807617e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 4.0, 6.0, 7.0, 8.0, 7.0, 4.0, 20.0, 19.0, 24.0, 32.0, 48.0, 64.0, 94.0, 341.0, 95.0, 52.0, 40.0, 27.0, 16.0, 17.0, 14.0, 16.0, 10.0, 6.0, 9.0, 2.0, 5.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1219253540039062e-05, -2.0310282707214355e-05, -1.940131187438965e-05, -1.849234104156494e-05, -1.7583370208740234e-05, -1.6674399375915527e-05, -1.576542854309082e-05, -1.4856457710266113e-05, -1.3947486877441406e-05, -1.30385160446167e-05, -1.2129545211791992e-05, -1.1220574378967285e-05, -1.0311603546142578e-05, -9.402632713317871e-06, -8.493661880493164e-06, -7.584691047668457e-06, -6.67572021484375e-06, -5.766749382019043e-06, -4.857778549194336e-06, -3.948807716369629e-06, -3.039836883544922e-06, -2.130866050720215e-06, -1.2218952178955078e-06, -3.129243850708008e-07, 5.960464477539062e-07, 1.5050172805786133e-06, 2.4139881134033203e-06, 3.3229589462280273e-06, 4.231929779052734e-06, 5.140900611877441e-06, 6.0498714447021484e-06, 6.9588422775268555e-06, 7.867813110351562e-06, 8.77678394317627e-06, 9.685754776000977e-06, 1.0594725608825684e-05, 1.150369644165039e-05, 1.2412667274475098e-05, 1.3321638107299805e-05, 1.4230608940124512e-05, 1.5139579772949219e-05, 1.6048550605773926e-05, 1.6957521438598633e-05, 1.786649227142334e-05, 1.8775463104248047e-05, 1.9684433937072754e-05, 2.059340476989746e-05, 2.1502375602722168e-05, 2.2411346435546875e-05, 2.3320317268371582e-05, 2.422928810119629e-05, 2.5138258934020996e-05, 2.6047229766845703e-05, 2.695620059967041e-05, 2.7865171432495117e-05, 2.8774142265319824e-05, 2.968311309814453e-05, 3.059208393096924e-05, 3.1501054763793945e-05, 3.241002559661865e-05, 3.331899642944336e-05, 3.4227967262268066e-05, 3.5136938095092773e-05, 3.604590892791748e-05, 3.695487976074219e-05]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 36.0, 963.0, 16.0, 0.0, 0.0, 1.0], "bins": [-1.3189458847045898, -1.296772837638855, -1.2745997905731201, -1.2524266242980957, -1.2302535772323608, -1.208080530166626, -1.1859074831008911, -1.1637344360351562, -1.1415613889694214, -1.1193883419036865, -1.0972152948379517, -1.0750422477722168, -1.0528690814971924, -1.0306960344314575, -1.0085229873657227, -0.9863499402999878, -0.9641768336296082, -0.9420037865638733, -0.9198306798934937, -0.8976576328277588, -0.8754845857620239, -0.8533115386962891, -0.8311384320259094, -0.8089653849601746, -0.7867922782897949, -0.7646192312240601, -0.7424461245536804, -0.7202730774879456, -0.6981000304222107, -0.675926923751831, -0.6537538766860962, -0.6315808296203613, -0.6094077825546265, -0.5872347354888916, -0.565061628818512, -0.5428885817527771, -0.5207155346870422, -0.498542457818985, -0.47636938095092773, -0.45419633388519287, -0.43202322721481323, -0.409850150346756, -0.3876771032810211, -0.36550402641296387, -0.343330979347229, -0.32115790247917175, -0.2989848256111145, -0.27681177854537964, -0.2546387314796448, -0.23246566951274872, -0.21029260754585266, -0.1881195306777954, -0.16594646871089935, -0.1437734067440033, -0.12160032987594604, -0.09942726790904999, -0.07725419104099274, -0.05508112534880638, -0.032908059656620026, -0.010734990239143372, 0.011438071727752686, 0.03361113369464874, 0.055784210562705994, 0.07795727252960205, 0.10013033449649811]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 9.0, 8.0, 9.0, 14.0, 16.0, 12.0, 23.0, 19.0, 30.0, 34.0, 38.0, 37.0, 56.0, 50.0, 68.0, 63.0, 59.0, 65.0, 55.0, 44.0, 34.0, 45.0, 24.0, 32.0, 19.0, 17.0, 16.0, 15.0, 14.0, 12.0, 9.0, 3.0, 7.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.13214337825775146, -0.1281299889087677, -0.12411660701036453, -0.12010322511196136, -0.1160898357629776, -0.11207645386457443, -0.10806307196617126, -0.1040496826171875, -0.10003630071878433, -0.09602291882038116, -0.0920095294713974, -0.08799614757299423, -0.08398276567459106, -0.0799693763256073, -0.07595599442720413, -0.07194261252880096, -0.0679292231798172, -0.06391584128141403, -0.05990245193243027, -0.0558890700340271, -0.05187568441033363, -0.04786229878664017, -0.043848916888237, -0.03983553126454353, -0.03582214564085007, -0.0318087600171566, -0.027795376256108284, -0.023781992495059967, -0.0197686068713665, -0.015755221247673035, -0.011741837486624718, -0.007728453725576401, -0.0037150681018829346, 0.000298316590487957, 0.004311701282858849, 0.00832508597522974, 0.012338470667600632, 0.016351856291294098, 0.020365240052342415, 0.024378623813390732, 0.028392009437084198, 0.032405395060777664, 0.03641878068447113, 0.0404321625828743, 0.044445548206567764, 0.04845893383026123, 0.0524723157286644, 0.056485701352357864, 0.06049908697605133, 0.0645124688744545, 0.06852585822343826, 0.07253924012184143, 0.0765526294708252, 0.08056601136922836, 0.08457939326763153, 0.0885927826166153, 0.09260616451501846, 0.09661954641342163, 0.1006329357624054, 0.10464631766080856, 0.10865969955921173, 0.1126730889081955, 0.11668647080659866, 0.12069985270500183, 0.1247132420539856]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 4.0, 9.0, 8.0, 9.0, 10.0, 11.0, 18.0, 28.0, 29.0, 52.0, 96.0, 285.0, 95905.0, 4097154.0, 339.0, 108.0, 52.0, 38.0, 20.0, 25.0, 16.0, 9.0, 11.0, 3.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.15155029296875, -4.0257568359375, -3.89996337890625, -3.774169921875, -3.64837646484375, -3.5225830078125, -3.39678955078125, -3.27099609375, -3.14520263671875, -3.0194091796875, -2.89361572265625, -2.767822265625, -2.64202880859375, -2.5162353515625, -2.39044189453125, -2.2646484375, -2.13885498046875, -2.0130615234375, -1.88726806640625, -1.761474609375, -1.63568115234375, -1.5098876953125, -1.38409423828125, -1.25830078125, -1.13250732421875, -1.0067138671875, -0.88092041015625, -0.755126953125, -0.62933349609375, -0.5035400390625, -0.37774658203125, -0.251953125, -0.12615966796875, -0.0003662109375, 0.12542724609375, 0.251220703125, 0.37701416015625, 0.5028076171875, 0.62860107421875, 0.75439453125, 0.88018798828125, 1.0059814453125, 1.13177490234375, 1.257568359375, 1.38336181640625, 1.5091552734375, 1.63494873046875, 1.7607421875, 1.88653564453125, 2.0123291015625, 2.13812255859375, 2.263916015625, 2.38970947265625, 2.5155029296875, 2.64129638671875, 2.76708984375, 2.89288330078125, 3.0186767578125, 3.14447021484375, 3.270263671875, 3.39605712890625, 3.5218505859375, 3.64764404296875, 3.7734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 6.0, 7.0, 12.0, 10.0, 20.0, 36.0, 76.0, 188.0, 287.0, 166.0, 71.0, 18.0, 16.0, 14.0, 10.0, 6.0, 6.0, 7.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01519012451171875, -0.01474618911743164, -0.014302253723144531, -0.013858318328857422, -0.013414382934570312, -0.012970447540283203, -0.012526512145996094, -0.012082576751708984, -0.011638641357421875, -0.011194705963134766, -0.010750770568847656, -0.010306835174560547, -0.009862899780273438, -0.009418964385986328, -0.008975028991699219, -0.00853109359741211, -0.008087158203125, -0.007643222808837891, -0.007199287414550781, -0.006755352020263672, -0.0063114166259765625, -0.005867481231689453, -0.005423545837402344, -0.004979610443115234, -0.004535675048828125, -0.004091739654541016, -0.0036478042602539062, -0.003203868865966797, -0.0027599334716796875, -0.002315998077392578, -0.0018720626831054688, -0.0014281272888183594, -0.00098419189453125, -0.0005402565002441406, -9.632110595703125e-05, 0.0003476142883300781, 0.0007915496826171875, 0.0012354850769042969, 0.0016794204711914062, 0.0021233558654785156, 0.002567291259765625, 0.0030112266540527344, 0.0034551620483398438, 0.003899097442626953, 0.0043430328369140625, 0.004786968231201172, 0.005230903625488281, 0.005674839019775391, 0.0061187744140625, 0.006562709808349609, 0.007006645202636719, 0.007450580596923828, 0.007894515991210938, 0.008338451385498047, 0.008782386779785156, 0.009226322174072266, 0.009670257568359375, 0.010114192962646484, 0.010558128356933594, 0.011002063751220703, 0.011445999145507812, 0.011889934539794922, 0.012333869934082031, 0.01277780532836914, 0.01322174072265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 3.0, 9.0, 10.0, 14.0, 24.0, 37.0, 52.0, 89.0, 166.0, 387.0, 877.0, 2880.0, 15440.0, 4137858.0, 30417.0, 3909.0, 1147.0, 453.0, 195.0, 122.0, 66.0, 35.0, 19.0, 14.0, 21.0, 9.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.083984375, -0.08124256134033203, -0.07850074768066406, -0.0757589340209961, -0.07301712036132812, -0.07027530670166016, -0.06753349304199219, -0.06479167938232422, -0.06204986572265625, -0.05930805206298828, -0.05656623840332031, -0.053824424743652344, -0.051082611083984375, -0.048340797424316406, -0.04559898376464844, -0.04285717010498047, -0.0401153564453125, -0.03737354278564453, -0.03463172912597656, -0.031889915466308594, -0.029148101806640625, -0.026406288146972656, -0.023664474487304688, -0.02092266082763672, -0.01818084716796875, -0.015439033508300781, -0.012697219848632812, -0.009955406188964844, -0.007213592529296875, -0.004471778869628906, -0.0017299652099609375, 0.0010118484497070312, 0.003753662109375, 0.006495475769042969, 0.009237289428710938, 0.011979103088378906, 0.014720916748046875, 0.017462730407714844, 0.020204544067382812, 0.02294635772705078, 0.02568817138671875, 0.02842998504638672, 0.031171798706054688, 0.033913612365722656, 0.036655426025390625, 0.039397239685058594, 0.04213905334472656, 0.04488086700439453, 0.0476226806640625, 0.05036449432373047, 0.05310630798339844, 0.055848121643066406, 0.058589935302734375, 0.061331748962402344, 0.06407356262207031, 0.06681537628173828, 0.06955718994140625, 0.07229900360107422, 0.07504081726074219, 0.07778263092041016, 0.08052444458007812, 0.0832662582397461, 0.08600807189941406, 0.08874988555908203, 0.09149169921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 3.0, 3.0, 5.0, 11.0, 6.0, 9.0, 13.0, 25.0, 71.0, 379.0, 3144.0, 240.0, 69.0, 27.0, 15.0, 8.0, 5.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.024444580078125, -0.023772239685058594, -0.023099899291992188, -0.02242755889892578, -0.021755218505859375, -0.02108287811279297, -0.020410537719726562, -0.019738197326660156, -0.01906585693359375, -0.018393516540527344, -0.017721176147460938, -0.01704883575439453, -0.016376495361328125, -0.01570415496826172, -0.015031814575195312, -0.014359474182128906, -0.0136871337890625, -0.013014793395996094, -0.012342453002929688, -0.011670112609863281, -0.010997772216796875, -0.010325431823730469, -0.009653091430664062, -0.008980751037597656, -0.00830841064453125, -0.007636070251464844, -0.0069637298583984375, -0.006291389465332031, -0.005619049072265625, -0.004946708679199219, -0.0042743682861328125, -0.0036020278930664062, -0.0029296875, -0.0022573471069335938, -0.0015850067138671875, -0.0009126663208007812, -0.000240325927734375, 0.00043201446533203125, 0.0011043548583984375, 0.0017766952514648438, 0.00244903564453125, 0.0031213760375976562, 0.0037937164306640625, 0.004466056823730469, 0.005138397216796875, 0.005810737609863281, 0.0064830780029296875, 0.007155418395996094, 0.0078277587890625, 0.008500099182128906, 0.009172439575195312, 0.009844779968261719, 0.010517120361328125, 0.011189460754394531, 0.011861801147460938, 0.012534141540527344, 0.01320648193359375, 0.013878822326660156, 0.014551162719726562, 0.015223503112792969, 0.015895843505859375, 0.01656818389892578, 0.017240524291992188, 0.017912864685058594, 0.018585205078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 546.0, 282.0, 86.0, 45.0, 13.0, 11.0, 13.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10803594440221786, -0.07928316295146942, -0.05053038150072098, -0.021777600049972534, 0.006975181400775909, 0.035727955400943756, 0.0644807443022728, 0.09323353320360184, 0.12198630720376968, 0.15073908865451813, 0.17949187755584717, 0.20824465155601501, 0.23699742555618286, 0.2657501995563507, 0.29450300335884094, 0.3232557773590088, 0.35200855135917664, 0.3807613253593445, 0.4095141291618347, 0.43826690316200256, 0.4670196771621704, 0.49577245116233826, 0.5245252251625061, 0.5532780289649963, 0.5820308327674866, 0.6107836365699768, 0.6395363807678223, 0.6682891845703125, 0.6970419883728027, 0.7257947325706482, 0.7545475363731384, 0.7833002805709839, 0.8120530843734741, 0.8408058881759644, 0.8695586323738098, 0.8983114361763, 0.9270641803741455, 0.9558169841766357, 0.984569787979126, 1.0133225917816162, 1.0420753955841064, 1.0708281993865967, 1.099581003189087, 1.1283336877822876, 1.1570864915847778, 1.185839295387268, 1.2145920991897583, 1.2433449029922485, 1.2720975875854492, 1.3008503913879395, 1.3296031951904297, 1.3583558797836304, 1.3871086835861206, 1.4158614873886108, 1.444614291191101, 1.4733670949935913, 1.502119779586792, 1.5308725833892822, 1.5596253871917725, 1.5883780717849731, 1.6171308755874634, 1.6458836793899536, 1.6746364831924438, 1.703389286994934, 1.7321420907974243]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 5.0, 8.0, 10.0, 13.0, 12.0, 21.0, 23.0, 34.0, 42.0, 45.0, 48.0, 72.0, 76.0, 78.0, 87.0, 75.0, 72.0, 53.0, 52.0, 34.0, 32.0, 30.0, 20.0, 15.0, 9.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.17775225639343262, -0.17252172529697418, -0.16729119420051575, -0.1620606780052185, -0.15683014690876007, -0.15159961581230164, -0.1463690847158432, -0.14113855361938477, -0.13590803742408752, -0.1306775063276291, -0.12544697523117065, -0.12021645158529282, -0.11498592793941498, -0.10975539684295654, -0.10452486574649811, -0.09929433465003967, -0.09406380355358124, -0.0888332724571228, -0.08360274881124496, -0.07837221771478653, -0.07314169406890869, -0.06791116297245026, -0.06268063187599182, -0.057450104504823685, -0.05221957713365555, -0.04698904976248741, -0.041758522391319275, -0.03652799129486084, -0.0312974639236927, -0.026066936552524567, -0.02083640545606613, -0.015605878084897995, -0.010375350713729858, -0.005144822411239147, 8.570589125156403e-05, 0.00531623512506485, 0.010546762496232986, 0.015777289867401123, 0.021007820963859558, 0.026238348335027695, 0.03146887570619583, 0.03669940307736397, 0.041929930448532104, 0.04716046154499054, 0.052390988916158676, 0.05762151628732681, 0.06285204738378525, 0.06808257102966309, 0.07331310212612152, 0.07854363322257996, 0.0837741568684578, 0.08900468796491623, 0.09423521161079407, 0.0994657427072525, 0.10469627380371094, 0.10992680490016937, 0.11515732854604721, 0.12038785964250565, 0.12561838328838348, 0.13084891438484192, 0.13607944548130035, 0.1413099765777588, 0.14654049277305603, 0.15177102386951447, 0.1570015549659729]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 7.0, 12.0, 13.0, 12.0, 21.0, 40.0, 86.0, 132.0, 266.0, 560.0, 1357.0, 3632.0, 14866.0, 908167.0, 106130.0, 8983.0, 2481.0, 901.0, 381.0, 192.0, 111.0, 71.0, 36.0, 34.0, 8.0, 15.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.137451171875, -0.13350582122802734, -0.1295604705810547, -0.12561511993408203, -0.12166976928710938, -0.11772441864013672, -0.11377906799316406, -0.1098337173461914, -0.10588836669921875, -0.1019430160522461, -0.09799766540527344, -0.09405231475830078, -0.09010696411132812, -0.08616161346435547, -0.08221626281738281, -0.07827091217041016, -0.0743255615234375, -0.07038021087646484, -0.06643486022949219, -0.06248950958251953, -0.058544158935546875, -0.05459880828857422, -0.05065345764160156, -0.046708106994628906, -0.04276275634765625, -0.038817405700683594, -0.03487205505371094, -0.03092670440673828, -0.026981353759765625, -0.02303600311279297, -0.019090652465820312, -0.015145301818847656, -0.011199951171875, -0.007254600524902344, -0.0033092498779296875, 0.0006361007690429688, 0.004581451416015625, 0.008526802062988281, 0.012472152709960938, 0.016417503356933594, 0.02036285400390625, 0.024308204650878906, 0.028253555297851562, 0.03219890594482422, 0.036144256591796875, 0.04008960723876953, 0.04403495788574219, 0.047980308532714844, 0.0519256591796875, 0.055871009826660156, 0.05981636047363281, 0.06376171112060547, 0.06770706176757812, 0.07165241241455078, 0.07559776306152344, 0.0795431137084961, 0.08348846435546875, 0.0874338150024414, 0.09137916564941406, 0.09532451629638672, 0.09926986694335938, 0.10321521759033203, 0.10716056823730469, 0.11110591888427734, 0.11505126953125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 14.0, 16.0, 25.0, 53.0, 115.0, 221.0, 246.0, 119.0, 54.0, 23.0, 16.0, 12.0, 8.0, 12.0, 2.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01549530029296875, -0.015050768852233887, -0.014606237411499023, -0.01416170597076416, -0.013717174530029297, -0.013272643089294434, -0.01282811164855957, -0.012383580207824707, -0.011939048767089844, -0.01149451732635498, -0.011049985885620117, -0.010605454444885254, -0.01016092300415039, -0.009716391563415527, -0.009271860122680664, -0.0088273286819458, -0.008382797241210938, -0.007938265800476074, -0.007493734359741211, -0.007049202919006348, -0.006604671478271484, -0.006160140037536621, -0.005715608596801758, -0.0052710771560668945, -0.004826545715332031, -0.004382014274597168, -0.003937482833862305, -0.0034929513931274414, -0.003048419952392578, -0.002603888511657715, -0.0021593570709228516, -0.0017148256301879883, -0.001270294189453125, -0.0008257627487182617, -0.00038123130798339844, 6.330013275146484e-05, 0.0005078315734863281, 0.0009523630142211914, 0.0013968944549560547, 0.001841425895690918, 0.0022859573364257812, 0.0027304887771606445, 0.003175020217895508, 0.003619551658630371, 0.004064083099365234, 0.004508614540100098, 0.004953145980834961, 0.005397677421569824, 0.0058422088623046875, 0.006286740303039551, 0.006731271743774414, 0.007175803184509277, 0.007620334625244141, 0.008064866065979004, 0.008509397506713867, 0.00895392894744873, 0.009398460388183594, 0.009842991828918457, 0.01028752326965332, 0.010732054710388184, 0.011176586151123047, 0.01162111759185791, 0.012065649032592773, 0.012510180473327637, 0.0129547119140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 14.0, 10.0, 8.0, 21.0, 16.0, 28.0, 30.0, 54.0, 68.0, 123.0, 117.0, 214.0, 345.0, 521.0, 1049.0, 2042.0, 5014.0, 15478.0, 68752.0, 764549.0, 151111.0, 25703.0, 7454.0, 2770.0, 1202.0, 620.0, 391.0, 263.0, 169.0, 108.0, 88.0, 52.0, 53.0, 26.0, 20.0, 24.0, 9.0, 8.0, 8.0, 11.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04937744140625, -0.0478668212890625, -0.046356201171875, -0.0448455810546875, -0.0433349609375, -0.0418243408203125, -0.040313720703125, -0.0388031005859375, -0.03729248046875, -0.0357818603515625, -0.034271240234375, -0.0327606201171875, -0.03125, -0.0297393798828125, -0.028228759765625, -0.0267181396484375, -0.02520751953125, -0.0236968994140625, -0.022186279296875, -0.0206756591796875, -0.0191650390625, -0.0176544189453125, -0.016143798828125, -0.0146331787109375, -0.01312255859375, -0.0116119384765625, -0.010101318359375, -0.0085906982421875, -0.007080078125, -0.0055694580078125, -0.004058837890625, -0.0025482177734375, -0.00103759765625, 0.0004730224609375, 0.001983642578125, 0.0034942626953125, 0.0050048828125, 0.0065155029296875, 0.008026123046875, 0.0095367431640625, 0.01104736328125, 0.0125579833984375, 0.014068603515625, 0.0155792236328125, 0.01708984375, 0.0186004638671875, 0.020111083984375, 0.0216217041015625, 0.02313232421875, 0.0246429443359375, 0.026153564453125, 0.0276641845703125, 0.0291748046875, 0.0306854248046875, 0.032196044921875, 0.0337066650390625, 0.03521728515625, 0.0367279052734375, 0.038238525390625, 0.0397491455078125, 0.041259765625, 0.0427703857421875, 0.044281005859375, 0.0457916259765625, 0.04730224609375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 9.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 22.0, 12.0, 18.0, 26.0, 29.0, 44.0, 33.0, 38.0, 26.0, 41.0, 47.0, 45.0, 42.0, 57.0, 46.0, 57.0, 57.0, 43.0, 37.0, 31.0, 30.0, 32.0, 24.0, 31.0, 23.0, 16.0, 16.0, 13.0, 7.0, 9.0, 7.0, 4.0, 7.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0218048095703125, -0.0209043025970459, -0.020003795623779297, -0.019103288650512695, -0.018202781677246094, -0.017302274703979492, -0.01640176773071289, -0.015501260757446289, -0.014600753784179688, -0.013700246810913086, -0.012799739837646484, -0.011899232864379883, -0.010998725891113281, -0.01009821891784668, -0.009197711944580078, -0.008297204971313477, -0.007396697998046875, -0.0064961910247802734, -0.005595684051513672, -0.00469517707824707, -0.0037946701049804688, -0.002894163131713867, -0.0019936561584472656, -0.001093149185180664, -0.0001926422119140625, 0.0007078647613525391, 0.0016083717346191406, 0.002508878707885742, 0.0034093856811523438, 0.004309892654418945, 0.005210399627685547, 0.0061109066009521484, 0.00701141357421875, 0.007911920547485352, 0.008812427520751953, 0.009712934494018555, 0.010613441467285156, 0.011513948440551758, 0.01241445541381836, 0.013314962387084961, 0.014215469360351562, 0.015115976333618164, 0.016016483306884766, 0.016916990280151367, 0.01781749725341797, 0.01871800422668457, 0.019618511199951172, 0.020519018173217773, 0.021419525146484375, 0.022320032119750977, 0.023220539093017578, 0.02412104606628418, 0.02502155303955078, 0.025922060012817383, 0.026822566986083984, 0.027723073959350586, 0.028623580932617188, 0.02952408790588379, 0.03042459487915039, 0.03132510185241699, 0.032225608825683594, 0.033126115798950195, 0.0340266227722168, 0.0349271297454834, 0.03582763671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 2.0, 9.0, 10.0, 30.0, 70.0, 140.0, 274.0, 719.0, 2360.0, 14891.0, 771997.0, 244063.0, 10885.0, 1952.0, 630.0, 265.0, 101.0, 67.0, 25.0, 17.0, 7.0, 6.0, 2.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0044403076171875, -0.004301249980926514, -0.004162192344665527, -0.004023134708404541, -0.0038840770721435547, -0.0037450194358825684, -0.003605961799621582, -0.0034669041633605957, -0.0033278465270996094, -0.003188788890838623, -0.0030497312545776367, -0.0029106736183166504, -0.002771615982055664, -0.0026325583457946777, -0.0024935007095336914, -0.002354443073272705, -0.0022153854370117188, -0.0020763278007507324, -0.001937270164489746, -0.0017982125282287598, -0.0016591548919677734, -0.0015200972557067871, -0.0013810396194458008, -0.0012419819831848145, -0.0011029243469238281, -0.0009638667106628418, -0.0008248090744018555, -0.0006857514381408691, -0.0005466938018798828, -0.0004076361656188965, -0.00026857852935791016, -0.00012952089309692383, 9.5367431640625e-06, 0.00014859437942504883, 0.00028765201568603516, 0.0004267096519470215, 0.0005657672882080078, 0.0007048249244689941, 0.0008438825607299805, 0.0009829401969909668, 0.0011219978332519531, 0.0012610554695129395, 0.0014001131057739258, 0.0015391707420349121, 0.0016782283782958984, 0.0018172860145568848, 0.001956343650817871, 0.0020954012870788574, 0.0022344589233398438, 0.00237351655960083, 0.0025125741958618164, 0.0026516318321228027, 0.002790689468383789, 0.0029297471046447754, 0.0030688047409057617, 0.003207862377166748, 0.0033469200134277344, 0.0034859776496887207, 0.003625035285949707, 0.0037640929222106934, 0.0039031505584716797, 0.004042208194732666, 0.004181265830993652, 0.004320323467254639, 0.004459381103515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 5.0, 15.0, 112.0, 825.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001628398895263672, -0.00015778280794620514, -0.0001527257263660431, -0.00014766864478588104, -0.000142611563205719, -0.00013755448162555695, -0.0001324974000453949, -0.00012744031846523285, -0.0001223832368850708, -0.00011732615530490875, -0.0001122690737247467, -0.00010721199214458466, -0.00010215491056442261, -9.709782898426056e-05, -9.204074740409851e-05, -8.698366582393646e-05, -8.192658424377441e-05, -7.686950266361237e-05, -7.181242108345032e-05, -6.675533950328827e-05, -6.169825792312622e-05, -5.664117634296417e-05, -5.1584094762802124e-05, -4.6527013182640076e-05, -4.146993160247803e-05, -3.641285002231598e-05, -3.135576844215393e-05, -2.6298686861991882e-05, -2.1241605281829834e-05, -1.6184523701667786e-05, -1.1127442121505737e-05, -6.070360541343689e-06, -1.0132789611816406e-06, 4.043802618980408e-06, 9.100884199142456e-06, 1.4157965779304504e-05, 1.9215047359466553e-05, 2.42721289396286e-05, 2.932921051979065e-05, 3.43862920999527e-05, 3.9443373680114746e-05, 4.4500455260276794e-05, 4.955753684043884e-05, 5.461461842060089e-05, 5.967170000076294e-05, 6.472878158092499e-05, 6.978586316108704e-05, 7.484294474124908e-05, 7.990002632141113e-05, 8.495710790157318e-05, 9.001418948173523e-05, 9.507127106189728e-05, 0.00010012835264205933, 0.00010518543422222137, 0.00011024251580238342, 0.00011529959738254547, 0.00012035667896270752, 0.00012541376054286957, 0.00013047084212303162, 0.00013552792370319366, 0.0001405850052833557, 0.00014564208686351776, 0.0001506991684436798, 0.00015575625002384186, 0.0001608133316040039]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 7.0, 12.0, 18.0, 23.0, 30.0, 49.0, 88.0, 168.0, 289.0, 719.0, 2067.0, 9582.0, 162628.0, 852911.0, 15433.0, 2790.0, 893.0, 389.0, 185.0, 104.0, 76.0, 37.0, 18.0, 12.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00411224365234375, -0.003988087177276611, -0.0038639307022094727, -0.003739774227142334, -0.0036156177520751953, -0.0034914612770080566, -0.003367304801940918, -0.0032431483268737793, -0.0031189918518066406, -0.002994835376739502, -0.0028706789016723633, -0.0027465224266052246, -0.002622365951538086, -0.0024982094764709473, -0.0023740530014038086, -0.00224989652633667, -0.0021257400512695312, -0.0020015835762023926, -0.001877427101135254, -0.0017532706260681152, -0.0016291141510009766, -0.0015049576759338379, -0.0013808012008666992, -0.0012566447257995605, -0.0011324882507324219, -0.0010083317756652832, -0.0008841753005981445, -0.0007600188255310059, -0.0006358623504638672, -0.0005117058753967285, -0.00038754940032958984, -0.00026339292526245117, -0.0001392364501953125, -1.5079975128173828e-05, 0.00010907649993896484, 0.00023323297500610352, 0.0003573894500732422, 0.00048154592514038086, 0.0006057024002075195, 0.0007298588752746582, 0.0008540153503417969, 0.0009781718254089355, 0.0011023283004760742, 0.0012264847755432129, 0.0013506412506103516, 0.0014747977256774902, 0.001598954200744629, 0.0017231106758117676, 0.0018472671508789062, 0.001971423625946045, 0.0020955801010131836, 0.0022197365760803223, 0.002343893051147461, 0.0024680495262145996, 0.0025922060012817383, 0.002716362476348877, 0.0028405189514160156, 0.0029646754264831543, 0.003088831901550293, 0.0032129883766174316, 0.0033371448516845703, 0.003461301326751709, 0.0035854578018188477, 0.0037096142768859863, 0.003833770751953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 21.0, 19.0, 19.0, 27.0, 41.0, 64.0, 101.0, 132.0, 172.0, 119.0, 66.0, 46.0, 49.0, 30.0, 25.0, 18.0, 11.0, 11.0, 8.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016765594482421875, -0.0016101300716400146, -0.0015437006950378418, -0.001477271318435669, -0.001410841941833496, -0.0013444125652313232, -0.0012779831886291504, -0.0012115538120269775, -0.0011451244354248047, -0.0010786950588226318, -0.001012265682220459, -0.0009458363056182861, -0.0008794069290161133, -0.0008129775524139404, -0.0007465481758117676, -0.0006801187992095947, -0.0006136894226074219, -0.000547260046005249, -0.00048083066940307617, -0.0004144012928009033, -0.00034797191619873047, -0.0002815425395965576, -0.00021511316299438477, -0.00014868378639221191, -8.225440979003906e-05, -1.582503318786621e-05, 5.060434341430664e-05, 0.00011703372001647949, 0.00018346309661865234, 0.0002498924732208252, 0.00031632184982299805, 0.0003827512264251709, 0.00044918060302734375, 0.0005156099796295166, 0.0005820393562316895, 0.0006484687328338623, 0.0007148981094360352, 0.000781327486038208, 0.0008477568626403809, 0.0009141862392425537, 0.0009806156158447266, 0.0010470449924468994, 0.0011134743690490723, 0.0011799037456512451, 0.001246333122253418, 0.0013127624988555908, 0.0013791918754577637, 0.0014456212520599365, 0.0015120506286621094, 0.0015784800052642822, 0.001644909381866455, 0.001711338758468628, 0.0017777681350708008, 0.0018441975116729736, 0.0019106268882751465, 0.0019770562648773193, 0.002043485641479492, 0.002109915018081665, 0.002176344394683838, 0.0022427737712860107, 0.0023092031478881836, 0.0023756325244903564, 0.0024420619010925293, 0.002508491277694702, 0.002574920654296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 8.0, 8.0, 15.0, 23.0, 38.0, 87.0, 216.0, 320.0, 147.0, 54.0, 32.0, 15.0, 10.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24901744723320007, -0.24101783335208893, -0.23301821947097778, -0.22501862049102783, -0.2170190066099167, -0.20901939272880554, -0.2010197937488556, -0.19302017986774445, -0.1850205659866333, -0.17702095210552216, -0.169021338224411, -0.16102173924446106, -0.15302212536334991, -0.14502251148223877, -0.13702291250228882, -0.12902329862117767, -0.12102368474006653, -0.11302407085895538, -0.10502446442842484, -0.09702485799789429, -0.08902524411678314, -0.081025630235672, -0.07302602380514145, -0.0650264173746109, -0.057026803493499756, -0.04902719333767891, -0.04102758318185806, -0.033027973026037216, -0.02502836287021637, -0.017028752714395523, -0.009029142558574677, -0.00102953240275383, 0.006970047950744629, 0.014969658106565475, 0.022969268262386322, 0.03096887841820717, 0.038968488574028015, 0.04696809872984886, 0.05496770888566971, 0.06296731531620026, 0.0709669291973114, 0.07896654307842255, 0.0869661495089531, 0.09496575593948364, 0.10296536982059479, 0.11096498370170593, 0.11896459013223648, 0.12696419656276703, 0.13496381044387817, 0.14296342432498932, 0.15096303820610046, 0.15896263718605042, 0.16696225106716156, 0.1749618649482727, 0.18296146392822266, 0.1909610778093338, 0.19896069169044495, 0.2069603055715561, 0.21495991945266724, 0.2229595184326172, 0.23095913231372833, 0.23895874619483948, 0.24695834517478943, 0.25495797395706177, 0.2629575729370117]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 3.0, 10.0, 6.0, 7.0, 17.0, 16.0, 19.0, 15.0, 31.0, 19.0, 39.0, 30.0, 43.0, 43.0, 56.0, 67.0, 65.0, 65.0, 57.0, 60.0, 33.0, 33.0, 46.0, 33.0, 31.0, 28.0, 15.0, 18.0, 15.0, 16.0, 13.0, 9.0, 7.0, 11.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1345527172088623, -0.13073469698429108, -0.12691669166088104, -0.12309867143630981, -0.11928065866231918, -0.11546264588832855, -0.11164462566375732, -0.1078266128897667, -0.10400860011577606, -0.10019058734178543, -0.0963725745677948, -0.09255455434322357, -0.08873654156923294, -0.08491852879524231, -0.08110050857067108, -0.07728249579668045, -0.07346448302268982, -0.06964647024869919, -0.06582845747470856, -0.06201043725013733, -0.0581924244761467, -0.05437441170215607, -0.05055639520287514, -0.04673837870359421, -0.04292036592960358, -0.039102353155612946, -0.035284336656332016, -0.031466320157051086, -0.027648307383060455, -0.023830292746424675, -0.020012278109788895, -0.016194263473153114, -0.012376248836517334, -0.008558234199881554, -0.004740219563245773, -0.000922204926609993, 0.0028958097100257874, 0.006713824346661568, 0.010531838983297348, 0.014349853619933128, 0.01816786825656891, 0.02198588289320469, 0.02580389752984047, 0.02962191216647625, 0.03343992680311203, 0.03725793957710266, 0.04107595607638359, 0.04489397257566452, 0.04871198534965515, 0.05252999812364578, 0.05634801462292671, 0.06016603112220764, 0.06398404389619827, 0.0678020566701889, 0.07162007689476013, 0.07543808966875076, 0.0792561024427414, 0.08307411521673203, 0.08689212799072266, 0.09071014821529388, 0.09452816098928452, 0.09834617376327515, 0.10216419398784637, 0.105982206761837, 0.10980021953582764]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 12.0, 4.0, 7.0, 3.0, 7.0, 12.0, 28.0, 28.0, 55.0, 96.0, 225.0, 846.0, 4191751.0, 733.0, 235.0, 91.0, 54.0, 27.0, 16.0, 11.0, 9.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.424560546875, -0.41257476806640625, -0.4005889892578125, -0.38860321044921875, -0.376617431640625, -0.36463165283203125, -0.3526458740234375, -0.34066009521484375, -0.32867431640625, -0.31668853759765625, -0.3047027587890625, -0.29271697998046875, -0.280731201171875, -0.26874542236328125, -0.2567596435546875, -0.24477386474609375, -0.2327880859375, -0.22080230712890625, -0.2088165283203125, -0.19683074951171875, -0.184844970703125, -0.17285919189453125, -0.1608734130859375, -0.14888763427734375, -0.13690185546875, -0.12491607666015625, -0.1129302978515625, -0.10094451904296875, -0.088958740234375, -0.07697296142578125, -0.0649871826171875, -0.05300140380859375, -0.041015625, -0.02902984619140625, -0.0170440673828125, -0.00505828857421875, 0.006927490234375, 0.01891326904296875, 0.0308990478515625, 0.04288482666015625, 0.05487060546875, 0.06685638427734375, 0.0788421630859375, 0.09082794189453125, 0.102813720703125, 0.11479949951171875, 0.1267852783203125, 0.13877105712890625, 0.1507568359375, 0.16274261474609375, 0.1747283935546875, 0.18671417236328125, 0.198699951171875, 0.21068572998046875, 0.2226715087890625, 0.23465728759765625, 0.24664306640625, 0.25862884521484375, 0.2706146240234375, 0.28260040283203125, 0.294586181640625, 0.30657196044921875, 0.3185577392578125, 0.33054351806640625, 0.342529296875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 5.0, 4.0, 4.0, 3.0, 4.0, 4.0, 5.0, 12.0, 15.0, 36.0, 53.0, 109.0, 155.0, 193.0, 153.0, 99.0, 50.0, 37.0, 13.0, 8.0, 12.0, 3.0, 4.0, 4.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0153961181640625, -0.014971375465393066, -0.014546632766723633, -0.0141218900680542, -0.013697147369384766, -0.013272404670715332, -0.012847661972045898, -0.012422919273376465, -0.011998176574707031, -0.011573433876037598, -0.011148691177368164, -0.01072394847869873, -0.010299205780029297, -0.009874463081359863, -0.00944972038269043, -0.009024977684020996, -0.008600234985351562, -0.008175492286682129, -0.007750749588012695, -0.007326006889343262, -0.006901264190673828, -0.0064765214920043945, -0.006051778793334961, -0.005627036094665527, -0.005202293395996094, -0.00477755069732666, -0.0043528079986572266, -0.003928065299987793, -0.0035033226013183594, -0.0030785799026489258, -0.002653837203979492, -0.0022290945053100586, -0.001804351806640625, -0.0013796091079711914, -0.0009548664093017578, -0.0005301237106323242, -0.00010538101196289062, 0.00031936168670654297, 0.0007441043853759766, 0.0011688470840454102, 0.0015935897827148438, 0.0020183324813842773, 0.002443075180053711, 0.0028678178787231445, 0.003292560577392578, 0.0037173032760620117, 0.004142045974731445, 0.004566788673400879, 0.0049915313720703125, 0.005416274070739746, 0.00584101676940918, 0.006265759468078613, 0.006690502166748047, 0.0071152448654174805, 0.007539987564086914, 0.007964730262756348, 0.008389472961425781, 0.008814215660095215, 0.009238958358764648, 0.009663701057434082, 0.010088443756103516, 0.01051318645477295, 0.010937929153442383, 0.011362671852111816, 0.01178741455078125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 13.0, 9.0, 17.0, 45.0, 50.0, 89.0, 159.0, 256.0, 429.0, 806.0, 1564.0, 3567.0, 9055.0, 30687.0, 719494.0, 3369073.0, 39883.0, 10989.0, 4278.0, 1833.0, 948.0, 450.0, 232.0, 136.0, 80.0, 56.0, 26.0, 21.0, 9.0, 6.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0201416015625, -0.019626379013061523, -0.019111156463623047, -0.01859593391418457, -0.018080711364746094, -0.017565488815307617, -0.01705026626586914, -0.016535043716430664, -0.016019821166992188, -0.015504598617553711, -0.014989376068115234, -0.014474153518676758, -0.013958930969238281, -0.013443708419799805, -0.012928485870361328, -0.012413263320922852, -0.011898040771484375, -0.011382818222045898, -0.010867595672607422, -0.010352373123168945, -0.009837150573730469, -0.009321928024291992, -0.008806705474853516, -0.008291482925415039, -0.0077762603759765625, -0.007261037826538086, -0.006745815277099609, -0.006230592727661133, -0.005715370178222656, -0.00520014762878418, -0.004684925079345703, -0.0041697025299072266, -0.00365447998046875, -0.0031392574310302734, -0.002624034881591797, -0.0021088123321533203, -0.0015935897827148438, -0.0010783672332763672, -0.0005631446838378906, -4.792213439941406e-05, 0.0004673004150390625, 0.000982522964477539, 0.0014977455139160156, 0.002012968063354492, 0.0025281906127929688, 0.0030434131622314453, 0.003558635711669922, 0.0040738582611083984, 0.004589080810546875, 0.0051043033599853516, 0.005619525909423828, 0.006134748458862305, 0.006649971008300781, 0.007165193557739258, 0.007680416107177734, 0.008195638656616211, 0.008710861206054688, 0.009226083755493164, 0.00974130630493164, 0.010256528854370117, 0.010771751403808594, 0.01128697395324707, 0.011802196502685547, 0.012317419052124023, 0.0128326416015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 10.0, 10.0, 15.0, 13.0, 23.0, 32.0, 67.0, 157.0, 665.0, 1887.0, 808.0, 180.0, 51.0, 23.0, 23.0, 19.0, 6.0, 14.0, 7.0, 7.0, 2.0, 5.0, 5.0, 6.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184173583984375, -0.01791369915008545, -0.0174100399017334, -0.016906380653381348, -0.016402721405029297, -0.015899062156677246, -0.015395402908325195, -0.014891743659973145, -0.014388084411621094, -0.013884425163269043, -0.013380765914916992, -0.012877106666564941, -0.01237344741821289, -0.01186978816986084, -0.011366128921508789, -0.010862469673156738, -0.010358810424804688, -0.009855151176452637, -0.009351491928100586, -0.008847832679748535, -0.008344173431396484, -0.007840514183044434, -0.007336854934692383, -0.006833195686340332, -0.006329536437988281, -0.0058258771896362305, -0.00532221794128418, -0.004818558692932129, -0.004314899444580078, -0.0038112401962280273, -0.0033075809478759766, -0.0028039216995239258, -0.002300262451171875, -0.0017966032028198242, -0.0012929439544677734, -0.0007892847061157227, -0.0002856254577636719, 0.0002180337905883789, 0.0007216930389404297, 0.0012253522872924805, 0.0017290115356445312, 0.002232670783996582, 0.002736330032348633, 0.0032399892807006836, 0.0037436485290527344, 0.004247307777404785, 0.004750967025756836, 0.005254626274108887, 0.0057582855224609375, 0.006261944770812988, 0.006765604019165039, 0.00726926326751709, 0.007772922515869141, 0.008276581764221191, 0.008780241012573242, 0.009283900260925293, 0.009787559509277344, 0.010291218757629395, 0.010794878005981445, 0.011298537254333496, 0.011802196502685547, 0.012305855751037598, 0.012809514999389648, 0.0133131742477417, 0.01381683349609375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 13.0, 20.0, 32.0, 79.0, 133.0, 229.0, 162.0, 95.0, 67.0, 57.0, 26.0, 22.0, 21.0, 8.0, 7.0, 9.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08664816617965698, -0.0833834707736969, -0.08011876791715622, -0.07685407251119614, -0.07358937710523605, -0.07032467424869537, -0.06705997884273529, -0.06379528343677521, -0.060530584305524826, -0.057265885174274445, -0.05400118976831436, -0.05073649063706398, -0.0474717915058136, -0.044207096099853516, -0.040942396968603134, -0.03767769783735275, -0.03441300243139267, -0.031148305162787437, -0.027883607894182205, -0.024618908762931824, -0.02135421149432659, -0.01808951422572136, -0.014824815094470978, -0.011560117825865746, -0.008295420557260513, -0.005030722822993994, -0.0017660250887274742, 0.0014986731112003326, 0.004763370379805565, 0.008028067648410797, 0.011292766779661179, 0.01455746404826641, 0.01782216876745224, 0.021086866036057472, 0.024351563304662704, 0.027616262435913086, 0.030880959704518318, 0.03414565697312355, 0.03741035610437393, 0.040675051510334015, 0.043939750641584396, 0.04720444977283478, 0.05046914517879486, 0.05373384431004524, 0.056998543441295624, 0.06026323884725571, 0.06352794170379639, 0.06679263710975647, 0.07005733251571655, 0.07332202792167664, 0.07658673077821732, 0.0798514261841774, 0.08311612159013748, 0.08638082444667816, 0.08964551985263824, 0.09291021525859833, 0.09617491066455841, 0.0994396060705185, 0.10270430892705917, 0.10596900433301926, 0.10923369973897934, 0.11249840259552002, 0.1157630980014801, 0.11902779340744019, 0.12229249626398087]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 2.0, 7.0, 15.0, 13.0, 17.0, 20.0, 20.0, 18.0, 25.0, 33.0, 37.0, 35.0, 50.0, 44.0, 51.0, 61.0, 59.0, 60.0, 55.0, 41.0, 35.0, 47.0, 24.0, 35.0, 27.0, 30.0, 17.0, 19.0, 19.0, 17.0, 11.0, 10.0, 10.0, 7.0, 8.0, 6.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.05677533149719238, -0.054933320730924606, -0.05309130996465683, -0.05124930292367935, -0.049407292157411575, -0.0475652813911438, -0.04572327435016632, -0.043881263583898544, -0.04203925281763077, -0.04019724205136299, -0.038355231285095215, -0.03651322424411774, -0.03467121347784996, -0.032829202711582184, -0.030987193807959557, -0.02914518490433693, -0.027303174138069153, -0.025461163371801376, -0.02361915446817875, -0.021777145564556122, -0.019935134798288345, -0.01809312403202057, -0.01625111512839794, -0.01440910529345274, -0.012567095458507538, -0.010725085623562336, -0.008883075788617134, -0.007041065953671932, -0.00519905611872673, -0.0033570462837815285, -0.0015150364488363266, 0.0003269733861088753, 0.002168983221054077, 0.004010993055999279, 0.005853002890944481, 0.007695012725889683, 0.009537022560834885, 0.011379032395780087, 0.013221042230725288, 0.01506305206567049, 0.016905061900615692, 0.01874707266688347, 0.020589081570506096, 0.022431090474128723, 0.0242731012403965, 0.026115112006664276, 0.027957120910286903, 0.02979912981390953, 0.03164114058017731, 0.033483151346445084, 0.03532516211271286, 0.03716716915369034, 0.039009179919958115, 0.04085119068622589, 0.04269319772720337, 0.044535208493471146, 0.04637721925973892, 0.0482192300260067, 0.050061240792274475, 0.05190324783325195, 0.05374525859951973, 0.055587269365787506, 0.057429276406764984, 0.05927128717303276, 0.06111329793930054]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 7.0, 8.0, 8.0, 11.0, 16.0, 16.0, 28.0, 36.0, 42.0, 63.0, 78.0, 94.0, 130.0, 171.0, 267.0, 396.0, 609.0, 961.0, 1701.0, 3157.0, 7346.0, 22804.0, 154407.0, 768083.0, 62120.0, 14108.0, 5301.0, 2537.0, 1396.0, 913.0, 542.0, 366.0, 247.0, 151.0, 124.0, 86.0, 65.0, 45.0, 28.0, 20.0, 15.0, 15.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 1.0], "bins": [-0.02508544921875, -0.024374961853027344, -0.023664474487304688, -0.02295398712158203, -0.022243499755859375, -0.02153301239013672, -0.020822525024414062, -0.020112037658691406, -0.01940155029296875, -0.018691062927246094, -0.017980575561523438, -0.01727008819580078, -0.016559600830078125, -0.01584911346435547, -0.015138626098632812, -0.014428138732910156, -0.0137176513671875, -0.013007164001464844, -0.012296676635742188, -0.011586189270019531, -0.010875701904296875, -0.010165214538574219, -0.009454727172851562, -0.008744239807128906, -0.00803375244140625, -0.007323265075683594, -0.0066127777099609375, -0.005902290344238281, -0.005191802978515625, -0.004481315612792969, -0.0037708282470703125, -0.0030603408813476562, -0.002349853515625, -0.0016393661499023438, -0.0009288787841796875, -0.00021839141845703125, 0.000492095947265625, 0.0012025833129882812, 0.0019130706787109375, 0.0026235580444335938, 0.00333404541015625, 0.004044532775878906, 0.0047550201416015625, 0.005465507507324219, 0.006175994873046875, 0.006886482238769531, 0.0075969696044921875, 0.008307456970214844, 0.0090179443359375, 0.009728431701660156, 0.010438919067382812, 0.011149406433105469, 0.011859893798828125, 0.012570381164550781, 0.013280868530273438, 0.013991355895996094, 0.01470184326171875, 0.015412330627441406, 0.016122817993164062, 0.01683330535888672, 0.017543792724609375, 0.01825428009033203, 0.018964767456054688, 0.019675254821777344, 0.0203857421875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 7.0, 7.0, 9.0, 21.0, 43.0, 68.0, 97.0, 133.0, 173.0, 137.0, 121.0, 57.0, 32.0, 30.0, 11.0, 5.0, 11.0, 3.0, 1.0, 8.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01459503173828125, -0.014193058013916016, -0.013791084289550781, -0.013389110565185547, -0.012987136840820312, -0.012585163116455078, -0.012183189392089844, -0.01178121566772461, -0.011379241943359375, -0.01097726821899414, -0.010575294494628906, -0.010173320770263672, -0.009771347045898438, -0.009369373321533203, -0.008967399597167969, -0.008565425872802734, -0.0081634521484375, -0.007761478424072266, -0.007359504699707031, -0.006957530975341797, -0.0065555572509765625, -0.006153583526611328, -0.005751609802246094, -0.005349636077880859, -0.004947662353515625, -0.004545688629150391, -0.004143714904785156, -0.003741741180419922, -0.0033397674560546875, -0.002937793731689453, -0.0025358200073242188, -0.0021338462829589844, -0.00173187255859375, -0.0013298988342285156, -0.0009279251098632812, -0.0005259513854980469, -0.0001239776611328125, 0.0002779960632324219, 0.0006799697875976562, 0.0010819435119628906, 0.001483917236328125, 0.0018858909606933594, 0.0022878646850585938, 0.002689838409423828, 0.0030918121337890625, 0.003493785858154297, 0.0038957595825195312, 0.004297733306884766, 0.00469970703125, 0.005101680755615234, 0.005503654479980469, 0.005905628204345703, 0.0063076019287109375, 0.006709575653076172, 0.007111549377441406, 0.007513523101806641, 0.007915496826171875, 0.00831747055053711, 0.008719444274902344, 0.009121417999267578, 0.009523391723632812, 0.009925365447998047, 0.010327339172363281, 0.010729312896728516, 0.01113128662109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 6.0, 8.0, 8.0, 6.0, 13.0, 24.0, 26.0, 26.0, 35.0, 49.0, 79.0, 103.0, 150.0, 187.0, 278.0, 415.0, 586.0, 1042.0, 1966.0, 4158.0, 11453.0, 45105.0, 396370.0, 515362.0, 49361.0, 12211.0, 4392.0, 2031.0, 1077.0, 603.0, 405.0, 284.0, 171.0, 129.0, 107.0, 74.0, 55.0, 47.0, 33.0, 22.0, 19.0, 19.0, 12.0, 11.0, 16.0, 6.0, 11.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.0177459716796875, -0.01719188690185547, -0.016637802124023438, -0.016083717346191406, -0.015529632568359375, -0.014975547790527344, -0.014421463012695312, -0.013867378234863281, -0.01331329345703125, -0.012759208679199219, -0.012205123901367188, -0.011651039123535156, -0.011096954345703125, -0.010542869567871094, -0.009988784790039062, -0.009434700012207031, -0.008880615234375, -0.008326530456542969, -0.0077724456787109375, -0.007218360900878906, -0.006664276123046875, -0.006110191345214844, -0.0055561065673828125, -0.005002021789550781, -0.00444793701171875, -0.0038938522338867188, -0.0033397674560546875, -0.0027856826782226562, -0.002231597900390625, -0.0016775131225585938, -0.0011234283447265625, -0.0005693435668945312, -1.52587890625e-05, 0.0005388259887695312, 0.0010929107666015625, 0.0016469955444335938, 0.002201080322265625, 0.0027551651000976562, 0.0033092498779296875, 0.0038633346557617188, 0.00441741943359375, 0.004971504211425781, 0.0055255889892578125, 0.006079673767089844, 0.006633758544921875, 0.007187843322753906, 0.0077419281005859375, 0.008296012878417969, 0.00885009765625, 0.009404182434082031, 0.009958267211914062, 0.010512351989746094, 0.011066436767578125, 0.011620521545410156, 0.012174606323242188, 0.012728691101074219, 0.01328277587890625, 0.013836860656738281, 0.014390945434570312, 0.014945030212402344, 0.015499114990234375, 0.016053199768066406, 0.016607284545898438, 0.01716136932373047, 0.0177154541015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 11.0, 8.0, 8.0, 8.0, 10.0, 15.0, 14.0, 26.0, 12.0, 17.0, 24.0, 37.0, 34.0, 33.0, 42.0, 30.0, 34.0, 37.0, 38.0, 39.0, 49.0, 30.0, 53.0, 42.0, 35.0, 37.0, 33.0, 31.0, 29.0, 34.0, 24.0, 18.0, 8.0, 18.0, 8.0, 10.0, 13.0, 7.0, 6.0, 11.0, 6.0, 2.0, 2.0, 3.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.01934814453125, -0.018675804138183594, -0.018003463745117188, -0.01733112335205078, -0.016658782958984375, -0.01598644256591797, -0.015314102172851562, -0.014641761779785156, -0.01396942138671875, -0.013297080993652344, -0.012624740600585938, -0.011952400207519531, -0.011280059814453125, -0.010607719421386719, -0.009935379028320312, -0.009263038635253906, -0.0085906982421875, -0.007918357849121094, -0.0072460174560546875, -0.006573677062988281, -0.005901336669921875, -0.005228996276855469, -0.0045566558837890625, -0.0038843154907226562, -0.00321197509765625, -0.0025396347045898438, -0.0018672943115234375, -0.0011949539184570312, -0.000522613525390625, 0.00014972686767578125, 0.0008220672607421875, 0.0014944076538085938, 0.002166748046875, 0.0028390884399414062, 0.0035114288330078125, 0.004183769226074219, 0.004856109619140625, 0.005528450012207031, 0.0062007904052734375, 0.006873130798339844, 0.00754547119140625, 0.008217811584472656, 0.008890151977539062, 0.009562492370605469, 0.010234832763671875, 0.010907173156738281, 0.011579513549804688, 0.012251853942871094, 0.0129241943359375, 0.013596534729003906, 0.014268875122070312, 0.014941215515136719, 0.015613555908203125, 0.01628589630126953, 0.016958236694335938, 0.017630577087402344, 0.01830291748046875, 0.018975257873535156, 0.019647598266601562, 0.02031993865966797, 0.020992279052734375, 0.02166461944580078, 0.022336959838867188, 0.023009300231933594, 0.023681640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 11.0, 14.0, 16.0, 28.0, 53.0, 129.0, 283.0, 797.0, 2364.0, 9059.0, 80079.0, 919155.0, 28639.0, 5411.0, 1559.0, 516.0, 190.0, 100.0, 46.0, 34.0, 19.0, 7.0, 14.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00518035888671875, -0.005014955997467041, -0.004849553108215332, -0.004684150218963623, -0.004518747329711914, -0.004353344440460205, -0.004187941551208496, -0.004022538661956787, -0.003857135772705078, -0.003691732883453369, -0.00352632999420166, -0.003360927104949951, -0.003195524215698242, -0.003030121326446533, -0.0028647184371948242, -0.0026993155479431152, -0.0025339126586914062, -0.0023685097694396973, -0.0022031068801879883, -0.0020377039909362793, -0.0018723011016845703, -0.0017068982124328613, -0.0015414953231811523, -0.0013760924339294434, -0.0012106895446777344, -0.0010452866554260254, -0.0008798837661743164, -0.0007144808769226074, -0.0005490779876708984, -0.00038367509841918945, -0.00021827220916748047, -5.2869319915771484e-05, 0.0001125335693359375, 0.0002779364585876465, 0.00044333934783935547, 0.0006087422370910645, 0.0007741451263427734, 0.0009395480155944824, 0.0011049509048461914, 0.0012703537940979004, 0.0014357566833496094, 0.0016011595726013184, 0.0017665624618530273, 0.0019319653511047363, 0.0020973682403564453, 0.0022627711296081543, 0.0024281740188598633, 0.0025935769081115723, 0.0027589797973632812, 0.0029243826866149902, 0.0030897855758666992, 0.003255188465118408, 0.003420591354370117, 0.003585994243621826, 0.003751397132873535, 0.003916800022125244, 0.004082202911376953, 0.004247605800628662, 0.004413008689880371, 0.00457841157913208, 0.004743814468383789, 0.004909217357635498, 0.005074620246887207, 0.005240023136138916, 0.005405426025390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 2.0, 8.0, 8.0, 6.0, 22.0, 20.0, 24.0, 29.0, 32.0, 45.0, 54.0, 39.0, 80.0, 49.0, 35.0, 73.0, 45.0, 42.0, 63.0, 40.0, 33.0, 42.0, 27.0, 38.0, 29.0, 17.0, 26.0, 14.0, 9.0, 11.0, 6.0, 8.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.291534423828125e-06, -4.150904715061188e-06, -4.0102750062942505e-06, -3.869645297527313e-06, -3.729015588760376e-06, -3.5883858799934387e-06, -3.4477561712265015e-06, -3.307126462459564e-06, -3.166496753692627e-06, -3.0258670449256897e-06, -2.8852373361587524e-06, -2.744607627391815e-06, -2.603977918624878e-06, -2.4633482098579407e-06, -2.3227185010910034e-06, -2.182088792324066e-06, -2.041459083557129e-06, -1.9008293747901917e-06, -1.7601996660232544e-06, -1.6195699572563171e-06, -1.4789402484893799e-06, -1.3383105397224426e-06, -1.1976808309555054e-06, -1.0570511221885681e-06, -9.164214134216309e-07, -7.757917046546936e-07, -6.351619958877563e-07, -4.945322871208191e-07, -3.5390257835388184e-07, -2.1327286958694458e-07, -7.264316082000732e-08, 6.798654794692993e-08, 2.086162567138672e-07, 3.4924596548080444e-07, 4.898756742477417e-07, 6.30505383014679e-07, 7.711350917816162e-07, 9.117648005485535e-07, 1.0523945093154907e-06, 1.193024218082428e-06, 1.3336539268493652e-06, 1.4742836356163025e-06, 1.6149133443832397e-06, 1.755543053150177e-06, 1.8961727619171143e-06, 2.0368024706840515e-06, 2.1774321794509888e-06, 2.318061888217926e-06, 2.4586915969848633e-06, 2.5993213057518005e-06, 2.739951014518738e-06, 2.880580723285675e-06, 3.0212104320526123e-06, 3.1618401408195496e-06, 3.302469849586487e-06, 3.443099558353424e-06, 3.5837292671203613e-06, 3.7243589758872986e-06, 3.864988684654236e-06, 4.005618393421173e-06, 4.14624810218811e-06, 4.286877810955048e-06, 4.427507519721985e-06, 4.568137228488922e-06, 4.708766937255859e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 9.0, 18.0, 11.0, 15.0, 26.0, 51.0, 64.0, 114.0, 176.0, 357.0, 768.0, 1988.0, 6871.0, 47978.0, 934424.0, 45318.0, 6820.0, 1941.0, 723.0, 361.0, 178.0, 107.0, 75.0, 51.0, 29.0, 22.0, 15.0, 7.0, 10.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0062103271484375, -0.006048977375030518, -0.005887627601623535, -0.005726277828216553, -0.00556492805480957, -0.005403578281402588, -0.0052422285079956055, -0.005080878734588623, -0.004919528961181641, -0.004758179187774658, -0.004596829414367676, -0.004435479640960693, -0.004274129867553711, -0.0041127800941467285, -0.003951430320739746, -0.0037900805473327637, -0.0036287307739257812, -0.003467381000518799, -0.0033060312271118164, -0.003144681453704834, -0.0029833316802978516, -0.002821981906890869, -0.0026606321334838867, -0.0024992823600769043, -0.002337932586669922, -0.0021765828132629395, -0.002015233039855957, -0.0018538832664489746, -0.0016925334930419922, -0.0015311837196350098, -0.0013698339462280273, -0.001208484172821045, -0.0010471343994140625, -0.0008857846260070801, -0.0007244348526000977, -0.0005630850791931152, -0.0004017353057861328, -0.0002403855323791504, -7.903575897216797e-05, 8.231401443481445e-05, 0.00024366378784179688, 0.0004050135612487793, 0.0005663633346557617, 0.0007277131080627441, 0.0008890628814697266, 0.001050412654876709, 0.0012117624282836914, 0.0013731122016906738, 0.0015344619750976562, 0.0016958117485046387, 0.001857161521911621, 0.0020185112953186035, 0.002179861068725586, 0.0023412108421325684, 0.0025025606155395508, 0.002663910388946533, 0.0028252601623535156, 0.002986609935760498, 0.0031479597091674805, 0.003309309482574463, 0.0034706592559814453, 0.0036320090293884277, 0.00379335880279541, 0.003954708576202393, 0.004116058349609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 8.0, 6.0, 10.0, 19.0, 17.0, 12.0, 28.0, 50.0, 58.0, 90.0, 94.0, 117.0, 115.0, 84.0, 63.0, 49.0, 33.0, 18.0, 20.0, 10.0, 11.0, 12.0, 8.0, 5.0, 5.0, 4.0, 4.0, 6.0, 4.0, 2.0, 8.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.00460052490234375, -0.004481256008148193, -0.004361987113952637, -0.00424271821975708, -0.0041234493255615234, -0.004004180431365967, -0.00388491153717041, -0.0037656426429748535, -0.003646373748779297, -0.0035271048545837402, -0.0034078359603881836, -0.003288567066192627, -0.0031692981719970703, -0.0030500292778015137, -0.002930760383605957, -0.0028114914894104004, -0.0026922225952148438, -0.002572953701019287, -0.0024536848068237305, -0.002334415912628174, -0.002215147018432617, -0.0020958781242370605, -0.001976609230041504, -0.0018573403358459473, -0.0017380714416503906, -0.001618802547454834, -0.0014995336532592773, -0.0013802647590637207, -0.001260995864868164, -0.0011417269706726074, -0.0010224580764770508, -0.0009031891822814941, -0.0007839202880859375, -0.0006646513938903809, -0.0005453824996948242, -0.0004261136054992676, -0.00030684471130371094, -0.0001875758171081543, -6.830692291259766e-05, 5.0961971282958984e-05, 0.00017023086547851562, 0.00028949975967407227, 0.0004087686538696289, 0.0005280375480651855, 0.0006473064422607422, 0.0007665753364562988, 0.0008858442306518555, 0.0010051131248474121, 0.0011243820190429688, 0.0012436509132385254, 0.001362919807434082, 0.0014821887016296387, 0.0016014575958251953, 0.001720726490020752, 0.0018399953842163086, 0.0019592642784118652, 0.002078533172607422, 0.0021978020668029785, 0.002317070960998535, 0.002436339855194092, 0.0025556087493896484, 0.002674877643585205, 0.0027941465377807617, 0.0029134154319763184, 0.003032684326171875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 9.0, 16.0, 44.0, 154.0, 457.0, 209.0, 79.0, 17.0, 10.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17986637353897095, -0.17224445939064026, -0.16462256014347076, -0.15700064599514008, -0.1493787318468094, -0.1417568325996399, -0.1341349184513092, -0.12651300430297852, -0.11889109760522842, -0.11126919090747833, -0.10364727675914764, -0.09602537006139755, -0.08840346336364746, -0.08078154921531677, -0.07315964251756668, -0.06553773581981659, -0.0579158216714859, -0.05029391124844551, -0.04267200082540512, -0.03505009412765503, -0.02742818370461464, -0.01980627328157425, -0.012184366583824158, -0.004562456160783768, 0.0030594542622566223, 0.010681363753974438, 0.018303273245692253, 0.025925181806087494, 0.033547092229127884, 0.041169002652168274, 0.048790909349918365, 0.056412819772958755, 0.06403473019599915, 0.07165663689374924, 0.07927855104207993, 0.08690045773983002, 0.0945223718881607, 0.1021442785859108, 0.10976618528366089, 0.11738809943199158, 0.12501001358032227, 0.13263192772865295, 0.14025382697582245, 0.14787574112415314, 0.15549765527248383, 0.16311955451965332, 0.170741468667984, 0.1783633828163147, 0.1859852820634842, 0.19360719621181488, 0.20122909545898438, 0.20885100960731506, 0.21647292375564575, 0.22409483790397644, 0.23171673715114594, 0.23933865129947662, 0.24696055054664612, 0.2545824646949768, 0.2622043788433075, 0.2698262929916382, 0.2774481773376465, 0.2850700914859772, 0.29269200563430786, 0.30031391978263855, 0.30793583393096924]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 11.0, 10.0, 8.0, 6.0, 22.0, 13.0, 20.0, 21.0, 32.0, 34.0, 34.0, 39.0, 43.0, 40.0, 59.0, 66.0, 93.0, 67.0, 58.0, 54.0, 32.0, 30.0, 37.0, 30.0, 28.0, 28.0, 14.0, 19.0, 9.0, 7.0, 5.0, 11.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10372227430343628, -0.10031667351722717, -0.09691108018159866, -0.09350547939538956, -0.09009988605976105, -0.08669428527355194, -0.08328868448734283, -0.07988308370113373, -0.07647749036550522, -0.07307188957929611, -0.0696662962436676, -0.0662606954574585, -0.06285509467124939, -0.05944950133562088, -0.056043900549411774, -0.052638303488492966, -0.04923270642757416, -0.04582710936665535, -0.04242151230573654, -0.039015911519527435, -0.03561031445860863, -0.03220471739768982, -0.028799118474125862, -0.025393519550561905, -0.021987922489643097, -0.01858232542872429, -0.015176726505160332, -0.011771128512918949, -0.008365530520677567, -0.0049599334597587585, -0.0015543345361948013, 0.0018512643873691559, 0.005256861448287964, 0.008662459440529346, 0.012068057432770729, 0.015473655425012112, 0.018879253417253494, 0.022284850478172302, 0.02569044940173626, 0.029096048325300217, 0.032501645386219025, 0.03590724244713783, 0.03931283950805664, 0.04271844029426575, 0.046124037355184555, 0.04952963441610336, 0.05293523520231247, 0.05634083226323128, 0.059746429324150085, 0.06315203011035919, 0.0665576234459877, 0.06996322423219681, 0.07336881756782532, 0.07677441835403442, 0.08018001914024353, 0.08358561992645264, 0.08699121326208115, 0.09039681404829025, 0.09380240738391876, 0.09720800817012787, 0.10061360895633698, 0.10401920229196548, 0.10742480307817459, 0.1108303964138031, 0.11423599720001221]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 5.0, 15.0, 17.0, 32.0, 39.0, 57.0, 88.0, 136.0, 221.0, 391.0, 736.0, 1698.0, 4984.0, 19167.0, 125593.0, 2648132.0, 1265164.0, 90215.0, 22518.0, 8309.0, 3605.0, 1733.0, 797.0, 355.0, 124.0, 52.0, 34.0, 13.0, 7.0, 13.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007747650146484375, -0.007548511028289795, -0.007349371910095215, -0.007150232791900635, -0.006951093673706055, -0.006751954555511475, -0.0065528154373168945, -0.0063536763191223145, -0.006154537200927734, -0.005955398082733154, -0.005756258964538574, -0.005557119846343994, -0.005357980728149414, -0.005158841609954834, -0.004959702491760254, -0.004760563373565674, -0.004561424255371094, -0.004362285137176514, -0.004163146018981934, -0.0039640069007873535, -0.0037648677825927734, -0.0035657286643981934, -0.0033665895462036133, -0.003167450428009033, -0.002968311309814453, -0.002769172191619873, -0.002570033073425293, -0.002370893955230713, -0.002171754837036133, -0.0019726157188415527, -0.0017734766006469727, -0.0015743374824523926, -0.0013751983642578125, -0.0011760592460632324, -0.0009769201278686523, -0.0007777810096740723, -0.0005786418914794922, -0.0003795027732849121, -0.00018036365509033203, 1.8775463104248047e-05, 0.00021791458129882812, 0.0004170536994934082, 0.0006161928176879883, 0.0008153319358825684, 0.0010144710540771484, 0.0012136101722717285, 0.0014127492904663086, 0.0016118884086608887, 0.0018110275268554688, 0.002010166645050049, 0.002209305763244629, 0.002408444881439209, 0.002607583999633789, 0.002806723117828369, 0.0030058622360229492, 0.0032050013542175293, 0.0034041404724121094, 0.0036032795906066895, 0.0038024187088012695, 0.00400155782699585, 0.00420069694519043, 0.00439983606338501, 0.00459897518157959, 0.00479811429977417, 0.00499725341796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 16.0, 22.0, 33.0, 36.0, 73.0, 85.0, 104.0, 122.0, 121.0, 97.0, 81.0, 73.0, 35.0, 22.0, 17.0, 12.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014068603515625, -0.013693451881408691, -0.013318300247192383, -0.012943148612976074, -0.012567996978759766, -0.012192845344543457, -0.011817693710327148, -0.01144254207611084, -0.011067390441894531, -0.010692238807678223, -0.010317087173461914, -0.009941935539245605, -0.009566783905029297, -0.009191632270812988, -0.00881648063659668, -0.008441329002380371, -0.008066177368164062, -0.007691025733947754, -0.007315874099731445, -0.006940722465515137, -0.006565570831298828, -0.0061904191970825195, -0.005815267562866211, -0.005440115928649902, -0.005064964294433594, -0.004689812660217285, -0.0043146610260009766, -0.003939509391784668, -0.0035643577575683594, -0.0031892061233520508, -0.002814054489135742, -0.0024389028549194336, -0.002063751220703125, -0.0016885995864868164, -0.0013134479522705078, -0.0009382963180541992, -0.0005631446838378906, -0.00018799304962158203, 0.00018715858459472656, 0.0005623102188110352, 0.0009374618530273438, 0.0013126134872436523, 0.001687765121459961, 0.0020629167556762695, 0.002438068389892578, 0.0028132200241088867, 0.0031883716583251953, 0.003563523292541504, 0.0039386749267578125, 0.004313826560974121, 0.00468897819519043, 0.005064129829406738, 0.005439281463623047, 0.0058144330978393555, 0.006189584732055664, 0.006564736366271973, 0.006939888000488281, 0.00731503963470459, 0.0076901912689208984, 0.008065342903137207, 0.008440494537353516, 0.008815646171569824, 0.009190797805786133, 0.009565949440002441, 0.00994110107421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 2.0, 4.0, 7.0, 8.0, 13.0, 24.0, 34.0, 58.0, 87.0, 150.0, 295.0, 620.0, 1258.0, 3010.0, 9960.0, 61238.0, 3955022.0, 140960.0, 14350.0, 3698.0, 1522.0, 702.0, 459.0, 284.0, 196.0, 91.0, 75.0, 47.0, 33.0, 21.0, 8.0, 10.0, 12.0, 6.0, 2.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01119232177734375, -0.010859489440917969, -0.010526657104492188, -0.010193824768066406, -0.009860992431640625, -0.009528160095214844, -0.009195327758789062, -0.008862495422363281, -0.0085296630859375, -0.008196830749511719, -0.007863998413085938, -0.007531166076660156, -0.007198333740234375, -0.006865501403808594, -0.0065326690673828125, -0.006199836730957031, -0.00586700439453125, -0.005534172058105469, -0.0052013397216796875, -0.004868507385253906, -0.004535675048828125, -0.004202842712402344, -0.0038700103759765625, -0.0035371780395507812, -0.003204345703125, -0.0028715133666992188, -0.0025386810302734375, -0.0022058486938476562, -0.001873016357421875, -0.0015401840209960938, -0.0012073516845703125, -0.0008745193481445312, -0.00054168701171875, -0.00020885467529296875, 0.0001239776611328125, 0.00045680999755859375, 0.000789642333984375, 0.0011224746704101562, 0.0014553070068359375, 0.0017881393432617188, 0.0021209716796875, 0.0024538040161132812, 0.0027866363525390625, 0.0031194686889648438, 0.003452301025390625, 0.0037851333618164062, 0.0041179656982421875, 0.004450798034667969, 0.00478363037109375, 0.005116462707519531, 0.0054492950439453125, 0.005782127380371094, 0.006114959716796875, 0.006447792053222656, 0.0067806243896484375, 0.007113456726074219, 0.0074462890625, 0.007779121398925781, 0.008111953735351562, 0.008444786071777344, 0.008777618408203125, 0.009110450744628906, 0.009443283081054688, 0.009776115417480469, 0.01010894775390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 2.0, 8.0, 13.0, 10.0, 19.0, 33.0, 49.0, 124.0, 564.0, 1577.0, 1117.0, 331.0, 84.0, 37.0, 25.0, 21.0, 13.0, 13.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0117950439453125, -0.011399149894714355, -0.011003255844116211, -0.010607361793518066, -0.010211467742919922, -0.009815573692321777, -0.009419679641723633, -0.009023785591125488, -0.008627891540527344, -0.0082319974899292, -0.007836103439331055, -0.00744020938873291, -0.007044315338134766, -0.006648421287536621, -0.0062525272369384766, -0.005856633186340332, -0.0054607391357421875, -0.005064845085144043, -0.0046689510345458984, -0.004273056983947754, -0.0038771629333496094, -0.003481268882751465, -0.0030853748321533203, -0.0026894807815551758, -0.0022935867309570312, -0.0018976926803588867, -0.0015017986297607422, -0.0011059045791625977, -0.0007100105285644531, -0.0003141164779663086, 8.177757263183594e-05, 0.00047767162322998047, 0.000873565673828125, 0.0012694597244262695, 0.001665353775024414, 0.0020612478256225586, 0.002457141876220703, 0.0028530359268188477, 0.003248929977416992, 0.0036448240280151367, 0.004040718078613281, 0.004436612129211426, 0.00483250617980957, 0.005228400230407715, 0.005624294281005859, 0.006020188331604004, 0.0064160823822021484, 0.006811976432800293, 0.0072078704833984375, 0.007603764533996582, 0.007999658584594727, 0.008395552635192871, 0.008791446685791016, 0.00918734073638916, 0.009583234786987305, 0.00997912883758545, 0.010375022888183594, 0.010770916938781738, 0.011166810989379883, 0.011562705039978027, 0.011958599090576172, 0.012354493141174316, 0.012750387191772461, 0.013146281242370605, 0.01354217529296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 5.0, 7.0, 11.0, 21.0, 53.0, 153.0, 290.0, 234.0, 120.0, 48.0, 28.0, 15.0, 7.0, 4.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06490784883499146, -0.06255923211574554, -0.06021061912178993, -0.05786200240254402, -0.05551338940858841, -0.0531647726893425, -0.05081615597009659, -0.048467542976140976, -0.046118929982185364, -0.04377031326293945, -0.04142170026898384, -0.03907308354973793, -0.03672447055578232, -0.03437585383653641, -0.0320272371172905, -0.029678624123334885, -0.027330007404088974, -0.024981392547488213, -0.02263277769088745, -0.02028416097164154, -0.01793554797768593, -0.015586932189762592, -0.013238316401839256, -0.010889701545238495, -0.008541086688637733, -0.006192471832036972, -0.0038438565097749233, -0.0014952411875128746, 0.0008533736690878868, 0.0032019885256886482, 0.005550604313611984, 0.007899219170212746, 0.010247834026813507, 0.012596448883414268, 0.01494506374001503, 0.01729368045926094, 0.019642293453216553, 0.021990910172462463, 0.024339525029063225, 0.026688139885663986, 0.029036754742264748, 0.03138536959886551, 0.03373398631811142, 0.03608259931206703, 0.03843121603131294, 0.040779829025268555, 0.043128445744514465, 0.045477062463760376, 0.04782567545771599, 0.0501742921769619, 0.05252290517091751, 0.05487152189016342, 0.057220134884119034, 0.059568751603364944, 0.06191736459732056, 0.06426598131656647, 0.06661459803581238, 0.06896321475505829, 0.0713118314743042, 0.07366044074296951, 0.07600905746221542, 0.07835767418146133, 0.08070629090070724, 0.08305490016937256, 0.08540351688861847]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 3.0, 8.0, 9.0, 13.0, 14.0, 14.0, 27.0, 35.0, 39.0, 36.0, 55.0, 65.0, 61.0, 59.0, 66.0, 74.0, 59.0, 58.0, 48.0, 56.0, 50.0, 30.0, 40.0, 24.0, 9.0, 8.0, 11.0, 10.0, 4.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.06639635562896729, -0.06474145501852036, -0.06308656185865402, -0.06143166124820709, -0.05977676436305046, -0.05812186747789383, -0.0564669668674469, -0.05481206998229027, -0.053157173097133636, -0.051502276211977005, -0.049847379326820374, -0.048192478716373444, -0.04653758183121681, -0.04488268494606018, -0.04322778433561325, -0.04157288745045662, -0.03991799056529999, -0.038263093680143356, -0.036608196794986725, -0.034953296184539795, -0.03329839929938316, -0.03164350241422653, -0.02998860366642475, -0.02833370491862297, -0.02667880803346634, -0.025023911148309708, -0.023369012400507927, -0.021714113652706146, -0.020059216767549515, -0.018404319882392883, -0.016749421134591103, -0.015094523318111897, -0.01343962550163269, -0.011784727685153484, -0.010129829868674278, -0.008474932052195072, -0.006820034235715866, -0.00516513641923666, -0.003510238602757454, -0.0018553407862782478, -0.00020044296979904175, 0.0014544548466801643, 0.0031093526631593704, 0.0047642504796385765, 0.006419148296117783, 0.008074046112596989, 0.009728943929076195, 0.0113838417455554, 0.013038739562034607, 0.014693637378513813, 0.01634853519499302, 0.0180034339427948, 0.01965833082795143, 0.021313227713108063, 0.022968126460909843, 0.024623025208711624, 0.026277922093868256, 0.027932818979024887, 0.029587717726826668, 0.03124261647462845, 0.03289751335978508, 0.03455241024494171, 0.03620731085538864, 0.03786220774054527, 0.039517104625701904]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 11.0, 17.0, 17.0, 20.0, 32.0, 66.0, 87.0, 137.0, 221.0, 362.0, 607.0, 1180.0, 2365.0, 5656.0, 17005.0, 76593.0, 516897.0, 353798.0, 51488.0, 12726.0, 4556.0, 2039.0, 1077.0, 571.0, 335.0, 208.0, 149.0, 97.0, 65.0, 43.0, 41.0, 26.0, 14.0, 5.0, 10.0, 5.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.01139068603515625, -0.01109004020690918, -0.01078939437866211, -0.010488748550415039, -0.010188102722167969, -0.009887456893920898, -0.009586811065673828, -0.009286165237426758, -0.008985519409179688, -0.008684873580932617, -0.008384227752685547, -0.008083581924438477, -0.007782936096191406, -0.007482290267944336, -0.007181644439697266, -0.006880998611450195, -0.006580352783203125, -0.006279706954956055, -0.005979061126708984, -0.005678415298461914, -0.005377769470214844, -0.0050771236419677734, -0.004776477813720703, -0.004475831985473633, -0.0041751861572265625, -0.003874540328979492, -0.003573894500732422, -0.0032732486724853516, -0.0029726028442382812, -0.002671957015991211, -0.0023713111877441406, -0.0020706653594970703, -0.00177001953125, -0.0014693737030029297, -0.0011687278747558594, -0.0008680820465087891, -0.0005674362182617188, -0.00026679039001464844, 3.3855438232421875e-05, 0.0003345012664794922, 0.0006351470947265625, 0.0009357929229736328, 0.0012364387512207031, 0.0015370845794677734, 0.0018377304077148438, 0.002138376235961914, 0.0024390220642089844, 0.0027396678924560547, 0.003040313720703125, 0.0033409595489501953, 0.0036416053771972656, 0.003942251205444336, 0.004242897033691406, 0.0045435428619384766, 0.004844188690185547, 0.005144834518432617, 0.0054454803466796875, 0.005746126174926758, 0.006046772003173828, 0.0063474178314208984, 0.006648063659667969, 0.006948709487915039, 0.007249355316162109, 0.00755000114440918, 0.00785064697265625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 9.0, 12.0, 12.0, 31.0, 36.0, 53.0, 76.0, 100.0, 102.0, 111.0, 119.0, 88.0, 86.0, 48.0, 29.0, 27.0, 21.0, 6.0, 7.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0134735107421875, -0.013110876083374023, -0.012748241424560547, -0.01238560676574707, -0.012022972106933594, -0.011660337448120117, -0.01129770278930664, -0.010935068130493164, -0.010572433471679688, -0.010209798812866211, -0.009847164154052734, -0.009484529495239258, -0.009121894836425781, -0.008759260177612305, -0.008396625518798828, -0.008033990859985352, -0.007671356201171875, -0.0073087215423583984, -0.006946086883544922, -0.006583452224731445, -0.006220817565917969, -0.005858182907104492, -0.005495548248291016, -0.005132913589477539, -0.0047702789306640625, -0.004407644271850586, -0.004045009613037109, -0.003682374954223633, -0.0033197402954101562, -0.0029571056365966797, -0.002594470977783203, -0.0022318363189697266, -0.00186920166015625, -0.0015065670013427734, -0.0011439323425292969, -0.0007812976837158203, -0.00041866302490234375, -5.602836608886719e-05, 0.0003066062927246094, 0.0006692409515380859, 0.0010318756103515625, 0.001394510269165039, 0.0017571449279785156, 0.002119779586791992, 0.0024824142456054688, 0.0028450489044189453, 0.003207683563232422, 0.0035703182220458984, 0.003932952880859375, 0.0042955875396728516, 0.004658222198486328, 0.005020856857299805, 0.005383491516113281, 0.005746126174926758, 0.006108760833740234, 0.006471395492553711, 0.0068340301513671875, 0.007196664810180664, 0.007559299468994141, 0.007921934127807617, 0.008284568786621094, 0.00864720344543457, 0.009009838104248047, 0.009372472763061523, 0.009735107421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 11.0, 22.0, 18.0, 30.0, 50.0, 55.0, 86.0, 123.0, 167.0, 319.0, 489.0, 887.0, 1860.0, 6263.0, 49319.0, 833358.0, 138931.0, 11049.0, 2819.0, 1082.0, 598.0, 319.0, 216.0, 140.0, 96.0, 69.0, 44.0, 39.0, 23.0, 20.0, 12.0, 10.0, 9.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.021697998046875, -0.021053552627563477, -0.020409107208251953, -0.01976466178894043, -0.019120216369628906, -0.018475770950317383, -0.01783132553100586, -0.017186880111694336, -0.016542434692382812, -0.01589798927307129, -0.015253543853759766, -0.014609098434448242, -0.013964653015136719, -0.013320207595825195, -0.012675762176513672, -0.012031316757202148, -0.011386871337890625, -0.010742425918579102, -0.010097980499267578, -0.009453535079956055, -0.008809089660644531, -0.008164644241333008, -0.007520198822021484, -0.006875753402709961, -0.0062313079833984375, -0.005586862564086914, -0.004942417144775391, -0.004297971725463867, -0.0036535263061523438, -0.0030090808868408203, -0.002364635467529297, -0.0017201900482177734, -0.00107574462890625, -0.00043129920959472656, 0.00021314620971679688, 0.0008575916290283203, 0.0015020370483398438, 0.002146482467651367, 0.0027909278869628906, 0.003435373306274414, 0.0040798187255859375, 0.004724264144897461, 0.005368709564208984, 0.006013154983520508, 0.006657600402832031, 0.007302045822143555, 0.007946491241455078, 0.008590936660766602, 0.009235382080078125, 0.009879827499389648, 0.010524272918701172, 0.011168718338012695, 0.011813163757324219, 0.012457609176635742, 0.013102054595947266, 0.013746500015258789, 0.014390945434570312, 0.015035390853881836, 0.01567983627319336, 0.016324281692504883, 0.016968727111816406, 0.01761317253112793, 0.018257617950439453, 0.018902063369750977, 0.0195465087890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 12.0, 8.0, 16.0, 6.0, 18.0, 25.0, 25.0, 32.0, 33.0, 32.0, 41.0, 47.0, 50.0, 51.0, 50.0, 72.0, 59.0, 57.0, 54.0, 54.0, 50.0, 39.0, 32.0, 29.0, 24.0, 8.0, 16.0, 12.0, 15.0, 7.0, 5.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0310516357421875, -0.030171632766723633, -0.029291629791259766, -0.0284116268157959, -0.02753162384033203, -0.026651620864868164, -0.025771617889404297, -0.02489161491394043, -0.024011611938476562, -0.023131608963012695, -0.022251605987548828, -0.02137160301208496, -0.020491600036621094, -0.019611597061157227, -0.01873159408569336, -0.017851591110229492, -0.016971588134765625, -0.016091585159301758, -0.01521158218383789, -0.014331579208374023, -0.013451576232910156, -0.012571573257446289, -0.011691570281982422, -0.010811567306518555, -0.009931564331054688, -0.00905156135559082, -0.008171558380126953, -0.007291555404663086, -0.006411552429199219, -0.0055315494537353516, -0.004651546478271484, -0.003771543502807617, -0.00289154052734375, -0.002011537551879883, -0.0011315345764160156, -0.00025153160095214844, 0.0006284713745117188, 0.001508474349975586, 0.002388477325439453, 0.0032684803009033203, 0.0041484832763671875, 0.005028486251831055, 0.005908489227294922, 0.006788492202758789, 0.007668495178222656, 0.008548498153686523, 0.00942850112915039, 0.010308504104614258, 0.011188507080078125, 0.012068510055541992, 0.01294851303100586, 0.013828516006469727, 0.014708518981933594, 0.015588521957397461, 0.016468524932861328, 0.017348527908325195, 0.018228530883789062, 0.01910853385925293, 0.019988536834716797, 0.020868539810180664, 0.02174854278564453, 0.0226285457611084, 0.023508548736572266, 0.024388551712036133, 0.0252685546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 7.0, 10.0, 17.0, 24.0, 40.0, 67.0, 131.0, 259.0, 691.0, 2631.0, 15167.0, 271095.0, 727627.0, 25405.0, 3825.0, 917.0, 312.0, 144.0, 58.0, 52.0, 20.0, 10.0, 11.0, 15.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0040740966796875, -0.003958076238632202, -0.0038420557975769043, -0.0037260353565216064, -0.0036100149154663086, -0.0034939944744110107, -0.003377974033355713, -0.003261953592300415, -0.003145933151245117, -0.0030299127101898193, -0.0029138922691345215, -0.0027978718280792236, -0.0026818513870239258, -0.002565830945968628, -0.00244981050491333, -0.0023337900638580322, -0.0022177696228027344, -0.0021017491817474365, -0.0019857287406921387, -0.0018697082996368408, -0.001753687858581543, -0.0016376674175262451, -0.0015216469764709473, -0.0014056265354156494, -0.0012896060943603516, -0.0011735856533050537, -0.0010575652122497559, -0.000941544771194458, -0.0008255243301391602, -0.0007095038890838623, -0.0005934834480285645, -0.0004774630069732666, -0.00036144256591796875, -0.0002454221248626709, -0.00012940168380737305, -1.3381242752075195e-05, 0.00010263919830322266, 0.0002186596393585205, 0.00033468008041381836, 0.0004507005214691162, 0.0005667209625244141, 0.0006827414035797119, 0.0007987618446350098, 0.0009147822856903076, 0.0010308027267456055, 0.0011468231678009033, 0.0012628436088562012, 0.001378864049911499, 0.0014948844909667969, 0.0016109049320220947, 0.0017269253730773926, 0.0018429458141326904, 0.0019589662551879883, 0.002074986696243286, 0.002191007137298584, 0.002307027578353882, 0.0024230480194091797, 0.0025390684604644775, 0.0026550889015197754, 0.0027711093425750732, 0.002887129783630371, 0.003003150224685669, 0.003119170665740967, 0.0032351911067962646, 0.0033512115478515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 10.0, 12.0, 11.0, 26.0, 33.0, 30.0, 67.0, 68.0, 61.0, 87.0, 63.0, 67.0, 92.0, 39.0, 85.0, 59.0, 30.0, 31.0, 30.0, 14.0, 21.0, 11.0, 9.0, 9.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.52346420288086e-06, -8.306466042995453e-06, -8.089467883110046e-06, -7.87246972322464e-06, -7.655471563339233e-06, -7.438473403453827e-06, -7.22147524356842e-06, -7.004477083683014e-06, -6.787478923797607e-06, -6.570480763912201e-06, -6.3534826040267944e-06, -6.136484444141388e-06, -5.9194862842559814e-06, -5.702488124370575e-06, -5.4854899644851685e-06, -5.268491804599762e-06, -5.0514936447143555e-06, -4.834495484828949e-06, -4.6174973249435425e-06, -4.400499165058136e-06, -4.1835010051727295e-06, -3.966502845287323e-06, -3.7495046854019165e-06, -3.53250652551651e-06, -3.3155083656311035e-06, -3.098510205745697e-06, -2.8815120458602905e-06, -2.664513885974884e-06, -2.4475157260894775e-06, -2.230517566204071e-06, -2.0135194063186646e-06, -1.796521246433258e-06, -1.5795230865478516e-06, -1.362524926662445e-06, -1.1455267667770386e-06, -9.285286068916321e-07, -7.115304470062256e-07, -4.945322871208191e-07, -2.775341272354126e-07, -6.05359673500061e-08, 1.564621925354004e-07, 3.734603524208069e-07, 5.904585123062134e-07, 8.074566721916199e-07, 1.0244548320770264e-06, 1.2414529919624329e-06, 1.4584511518478394e-06, 1.6754493117332458e-06, 1.8924474716186523e-06, 2.109445631504059e-06, 2.3264437913894653e-06, 2.543441951274872e-06, 2.7604401111602783e-06, 2.977438271045685e-06, 3.1944364309310913e-06, 3.411434590816498e-06, 3.6284327507019043e-06, 3.845430910587311e-06, 4.062429070472717e-06, 4.279427230358124e-06, 4.49642539024353e-06, 4.713423550128937e-06, 4.930421710014343e-06, 5.14741986989975e-06, 5.364418029785156e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 0.0, 6.0, 9.0, 5.0, 10.0, 9.0, 10.0, 21.0, 32.0, 42.0, 61.0, 104.0, 149.0, 288.0, 511.0, 1167.0, 2810.0, 8760.0, 47769.0, 707846.0, 245990.0, 23597.0, 5609.0, 1904.0, 814.0, 402.0, 228.0, 147.0, 85.0, 52.0, 35.0, 20.0, 17.0, 11.0, 6.0, 5.0, 6.0, 3.0, 5.0, 7.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0026397705078125, -0.002563953399658203, -0.0024881362915039062, -0.0024123191833496094, -0.0023365020751953125, -0.0022606849670410156, -0.0021848678588867188, -0.002109050750732422, -0.002033233642578125, -0.001957416534423828, -0.0018815994262695312, -0.0018057823181152344, -0.0017299652099609375, -0.0016541481018066406, -0.0015783309936523438, -0.0015025138854980469, -0.00142669677734375, -0.0013508796691894531, -0.0012750625610351562, -0.0011992454528808594, -0.0011234283447265625, -0.0010476112365722656, -0.0009717941284179688, -0.0008959770202636719, -0.000820159912109375, -0.0007443428039550781, -0.0006685256958007812, -0.0005927085876464844, -0.0005168914794921875, -0.0004410743713378906, -0.00036525726318359375, -0.0002894401550292969, -0.000213623046875, -0.00013780593872070312, -6.198883056640625e-05, 1.3828277587890625e-05, 8.96453857421875e-05, 0.00016546249389648438, 0.00024127960205078125, 0.0003170967102050781, 0.000392913818359375, 0.0004687309265136719, 0.0005445480346679688, 0.0006203651428222656, 0.0006961822509765625, 0.0007719993591308594, 0.0008478164672851562, 0.0009236335754394531, 0.00099945068359375, 0.0010752677917480469, 0.0011510848999023438, 0.0012269020080566406, 0.0013027191162109375, 0.0013785362243652344, 0.0014543533325195312, 0.0015301704406738281, 0.001605987548828125, 0.0016818046569824219, 0.0017576217651367188, 0.0018334388732910156, 0.0019092559814453125, 0.0019850730895996094, 0.0020608901977539062, 0.002136707305908203, 0.0022125244140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 7.0, 7.0, 10.0, 9.0, 13.0, 19.0, 30.0, 23.0, 34.0, 59.0, 53.0, 87.0, 71.0, 95.0, 104.0, 80.0, 72.0, 55.0, 32.0, 33.0, 14.0, 17.0, 14.0, 9.0, 13.0, 8.0, 7.0, 3.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.002960205078125, -0.0028723180294036865, -0.002784430980682373, -0.0026965439319610596, -0.002608656883239746, -0.0025207698345184326, -0.002432882785797119, -0.0023449957370758057, -0.002257108688354492, -0.0021692216396331787, -0.0020813345909118652, -0.0019934475421905518, -0.0019055604934692383, -0.0018176734447479248, -0.0017297863960266113, -0.0016418993473052979, -0.0015540122985839844, -0.001466125249862671, -0.0013782382011413574, -0.001290351152420044, -0.0012024641036987305, -0.001114577054977417, -0.0010266900062561035, -0.00093880295753479, -0.0008509159088134766, -0.0007630288600921631, -0.0006751418113708496, -0.0005872547626495361, -0.0004993677139282227, -0.0004114806652069092, -0.0003235936164855957, -0.00023570656776428223, -0.00014781951904296875, -5.9932470321655273e-05, 2.7954578399658203e-05, 0.00011584162712097168, 0.00020372867584228516, 0.00029161572456359863, 0.0003795027732849121, 0.0004673898220062256, 0.0005552768707275391, 0.0006431639194488525, 0.000731050968170166, 0.0008189380168914795, 0.000906825065612793, 0.0009947121143341064, 0.00108259916305542, 0.0011704862117767334, 0.0012583732604980469, 0.0013462603092193604, 0.0014341473579406738, 0.0015220344066619873, 0.0016099214553833008, 0.0016978085041046143, 0.0017856955528259277, 0.0018735826015472412, 0.0019614696502685547, 0.002049356698989868, 0.0021372437477111816, 0.002225130796432495, 0.0023130178451538086, 0.002400904893875122, 0.0024887919425964355, 0.002576678991317749, 0.0026645660400390625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 9.0, 13.0, 16.0, 46.0, 111.0, 180.0, 313.0, 188.0, 56.0, 33.0, 12.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09691417962312698, -0.0934278592467308, -0.08994154632091522, -0.08645522594451904, -0.08296890556812286, -0.07948258519172668, -0.0759962648153305, -0.07250995188951492, -0.06902363151311874, -0.06553731113672256, -0.062050994485616684, -0.0585646778345108, -0.055078357458114624, -0.051592037081718445, -0.048105720430612564, -0.04461940377950668, -0.041133083403110504, -0.037646763026714325, -0.034160446375608444, -0.030674127861857414, -0.027187809348106384, -0.023701490834355354, -0.020215172320604324, -0.016728853806853294, -0.013242535293102264, -0.009756216779351234, -0.0062698982656002045, -0.0027835797518491745, 0.0007027387619018555, 0.0041890572756528854, 0.007675375789403915, 0.011161694303154945, 0.014648005366325378, 0.01813432388007641, 0.02162064239382744, 0.02510696090757847, 0.0285932794213295, 0.03207959979772568, 0.03556591644883156, 0.03905223309993744, 0.04253855347633362, 0.0460248738527298, 0.04951119050383568, 0.05299750715494156, 0.05648382753133774, 0.05997014790773392, 0.0634564608335495, 0.06694278120994568, 0.07042910158634186, 0.07391542196273804, 0.07740174233913422, 0.0808880552649498, 0.08437437564134598, 0.08786069601774216, 0.09134700894355774, 0.09483332931995392, 0.0983196496963501, 0.10180597007274628, 0.10529229044914246, 0.10877860337495804, 0.11226492375135422, 0.1157512441277504, 0.11923755705356598, 0.12272387742996216, 0.12621019780635834]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 3.0, 4.0, 6.0, 10.0, 3.0, 12.0, 15.0, 11.0, 15.0, 20.0, 25.0, 32.0, 32.0, 31.0, 33.0, 46.0, 46.0, 42.0, 76.0, 78.0, 68.0, 44.0, 47.0, 34.0, 34.0, 27.0, 37.0, 26.0, 31.0, 23.0, 16.0, 19.0, 12.0, 8.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09674960374832153, -0.09375861287117004, -0.09076762199401855, -0.08777663111686707, -0.08478564023971558, -0.08179464191198349, -0.078803651034832, -0.07581266015768051, -0.07282166928052902, -0.06983067840337753, -0.06683968752622604, -0.06384869664907455, -0.06085770204663277, -0.05786671116948128, -0.05487571656703949, -0.051884725689888, -0.04889373481273651, -0.04590274393558502, -0.04291175305843353, -0.039920758455991745, -0.036929767578840256, -0.033938776701688766, -0.030947783961892128, -0.02795679122209549, -0.024965800344944, -0.02197480946779251, -0.018983816727995872, -0.015992823988199234, -0.013001833111047745, -0.010010841302573681, -0.007019849494099617, -0.0040288567543029785, -0.0010378658771514893, 0.0019531259313225746, 0.0049441177397966385, 0.007935109548270702, 0.010926101356744766, 0.01391709316521883, 0.016908084973692894, 0.019899077713489532, 0.02289006859064102, 0.02588105946779251, 0.02887205220758915, 0.03186304494738579, 0.03485403582453728, 0.037845026701688766, 0.040836021304130554, 0.04382701218128204, 0.04681800305843353, 0.04980899393558502, 0.05279998481273651, 0.0557909794151783, 0.05878197029232979, 0.06177296116948128, 0.06476395577192307, 0.06775494664907455, 0.07074593752622604, 0.07373692840337753, 0.07672791928052902, 0.07971891015768051, 0.0827099084854126, 0.08570089936256409, 0.08869189023971558, 0.09168288111686707, 0.09467387199401855]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 13.0, 12.0, 18.0, 23.0, 29.0, 43.0, 40.0, 85.0, 111.0, 177.0, 270.0, 489.0, 1106.0, 3542.0, 12836.0, 81001.0, 1429064.0, 2471430.0, 147398.0, 27727.0, 10145.0, 4359.0, 2290.0, 1188.0, 427.0, 176.0, 96.0, 54.0, 38.0, 25.0, 16.0, 15.0, 7.0, 9.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00720977783203125, -0.007015585899353027, -0.006821393966674805, -0.006627202033996582, -0.006433010101318359, -0.006238818168640137, -0.006044626235961914, -0.005850434303283691, -0.005656242370605469, -0.005462050437927246, -0.0052678585052490234, -0.005073666572570801, -0.004879474639892578, -0.0046852827072143555, -0.004491090774536133, -0.00429689884185791, -0.0041027069091796875, -0.003908514976501465, -0.003714323043823242, -0.0035201311111450195, -0.003325939178466797, -0.0031317472457885742, -0.0029375553131103516, -0.002743363380432129, -0.0025491714477539062, -0.0023549795150756836, -0.002160787582397461, -0.0019665956497192383, -0.0017724037170410156, -0.001578211784362793, -0.0013840198516845703, -0.0011898279190063477, -0.000995635986328125, -0.0008014440536499023, -0.0006072521209716797, -0.00041306018829345703, -0.00021886825561523438, -2.467632293701172e-05, 0.00016951560974121094, 0.0003637075424194336, 0.0005578994750976562, 0.0007520914077758789, 0.0009462833404541016, 0.0011404752731323242, 0.0013346672058105469, 0.0015288591384887695, 0.0017230510711669922, 0.0019172430038452148, 0.0021114349365234375, 0.00230562686920166, 0.002499818801879883, 0.0026940107345581055, 0.002888202667236328, 0.0030823945999145508, 0.0032765865325927734, 0.003470778465270996, 0.0036649703979492188, 0.0038591623306274414, 0.004053354263305664, 0.004247546195983887, 0.004441738128662109, 0.004635930061340332, 0.004830121994018555, 0.005024313926696777, 0.005218505859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 10.0, 15.0, 25.0, 36.0, 49.0, 62.0, 71.0, 93.0, 123.0, 111.0, 104.0, 91.0, 65.0, 39.0, 31.0, 23.0, 14.0, 12.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01348876953125, -0.013149619102478027, -0.012810468673706055, -0.012471318244934082, -0.01213216781616211, -0.011793017387390137, -0.011453866958618164, -0.011114716529846191, -0.010775566101074219, -0.010436415672302246, -0.010097265243530273, -0.0097581148147583, -0.009418964385986328, -0.009079813957214355, -0.008740663528442383, -0.00840151309967041, -0.008062362670898438, -0.007723212242126465, -0.007384061813354492, -0.0070449113845825195, -0.006705760955810547, -0.006366610527038574, -0.0060274600982666016, -0.005688309669494629, -0.005349159240722656, -0.005010008811950684, -0.004670858383178711, -0.004331707954406738, -0.003992557525634766, -0.003653407096862793, -0.0033142566680908203, -0.0029751062393188477, -0.002635955810546875, -0.0022968053817749023, -0.0019576549530029297, -0.001618504524230957, -0.0012793540954589844, -0.0009402036666870117, -0.0006010532379150391, -0.0002619028091430664, 7.724761962890625e-05, 0.0004163980484008789, 0.0007555484771728516, 0.0010946989059448242, 0.0014338493347167969, 0.0017729997634887695, 0.002112150192260742, 0.002451300621032715, 0.0027904510498046875, 0.00312960147857666, 0.003468751907348633, 0.0038079023361206055, 0.004147052764892578, 0.004486203193664551, 0.0048253536224365234, 0.005164504051208496, 0.005503654479980469, 0.005842804908752441, 0.006181955337524414, 0.006521105766296387, 0.006860256195068359, 0.007199406623840332, 0.007538557052612305, 0.007877707481384277, 0.00821685791015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 11.0, 16.0, 25.0, 24.0, 48.0, 92.0, 176.0, 407.0, 1143.0, 6010.0, 139997.0, 4019522.0, 22354.0, 2857.0, 806.0, 379.0, 199.0, 94.0, 57.0, 28.0, 18.0, 10.0, 10.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01380157470703125, -0.013345479965209961, -0.012889385223388672, -0.012433290481567383, -0.011977195739746094, -0.011521100997924805, -0.011065006256103516, -0.010608911514282227, -0.010152816772460938, -0.009696722030639648, -0.00924062728881836, -0.00878453254699707, -0.008328437805175781, -0.007872343063354492, -0.007416248321533203, -0.006960153579711914, -0.006504058837890625, -0.006047964096069336, -0.005591869354248047, -0.005135774612426758, -0.004679679870605469, -0.00422358512878418, -0.0037674903869628906, -0.0033113956451416016, -0.0028553009033203125, -0.0023992061614990234, -0.0019431114196777344, -0.0014870166778564453, -0.0010309219360351562, -0.0005748271942138672, -0.00011873245239257812, 0.00033736228942871094, 0.00079345703125, 0.001249551773071289, 0.0017056465148925781, 0.002161741256713867, 0.0026178359985351562, 0.0030739307403564453, 0.0035300254821777344, 0.0039861202239990234, 0.0044422149658203125, 0.0048983097076416016, 0.005354404449462891, 0.00581049919128418, 0.006266593933105469, 0.006722688674926758, 0.007178783416748047, 0.007634878158569336, 0.008090972900390625, 0.008547067642211914, 0.009003162384033203, 0.009459257125854492, 0.009915351867675781, 0.01037144660949707, 0.01082754135131836, 0.011283636093139648, 0.011739730834960938, 0.012195825576782227, 0.012651920318603516, 0.013108015060424805, 0.013564109802246094, 0.014020204544067383, 0.014476299285888672, 0.014932394027709961, 0.01538848876953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 5.0, 7.0, 7.0, 10.0, 20.0, 66.0, 237.0, 992.0, 1692.0, 745.0, 161.0, 49.0, 32.0, 15.0, 10.0, 11.0, 3.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0090789794921875, -0.00863504409790039, -0.008191108703613281, -0.007747173309326172, -0.0073032379150390625, -0.006859302520751953, -0.006415367126464844, -0.005971431732177734, -0.005527496337890625, -0.005083560943603516, -0.004639625549316406, -0.004195690155029297, -0.0037517547607421875, -0.003307819366455078, -0.0028638839721679688, -0.0024199485778808594, -0.00197601318359375, -0.0015320777893066406, -0.0010881423950195312, -0.0006442070007324219, -0.0002002716064453125, 0.00024366378784179688, 0.0006875991821289062, 0.0011315345764160156, 0.001575469970703125, 0.0020194053649902344, 0.0024633407592773438, 0.002907276153564453, 0.0033512115478515625, 0.003795146942138672, 0.004239082336425781, 0.004683017730712891, 0.005126953125, 0.005570888519287109, 0.006014823913574219, 0.006458759307861328, 0.0069026947021484375, 0.007346630096435547, 0.007790565490722656, 0.008234500885009766, 0.008678436279296875, 0.009122371673583984, 0.009566307067871094, 0.010010242462158203, 0.010454177856445312, 0.010898113250732422, 0.011342048645019531, 0.01178598403930664, 0.01222991943359375, 0.01267385482788086, 0.013117790222167969, 0.013561725616455078, 0.014005661010742188, 0.014449596405029297, 0.014893531799316406, 0.015337467193603516, 0.015781402587890625, 0.016225337982177734, 0.016669273376464844, 0.017113208770751953, 0.017557144165039062, 0.018001079559326172, 0.01844501495361328, 0.01888895034790039, 0.0193328857421875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 8.0, 51.0, 309.0, 457.0, 111.0, 36.0, 12.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0705290138721466, -0.0658613070845604, -0.06119360029697418, -0.05652588978409767, -0.05185818299651146, -0.04719047620892525, -0.04252276569604874, -0.037855058908462524, -0.03318735212087631, -0.0285196453332901, -0.02385193668305874, -0.019184228032827377, -0.014516521245241165, -0.009848814457654953, -0.005181105807423592, -0.0005133971571922302, 0.004154309630393982, 0.008822017349302769, 0.013489725068211555, 0.018157433718442917, 0.02282514050602913, 0.02749284729361534, 0.03216055780649185, 0.036828264594078064, 0.041495971381664276, 0.04616367816925049, 0.0508313849568367, 0.05549909546971321, 0.06016680225729942, 0.06483450531959534, 0.06950221955776215, 0.07416992634534836, 0.07883763313293457, 0.08350533992052078, 0.088173046708107, 0.0928407534956932, 0.09750846028327942, 0.10217617452144623, 0.10684388130903244, 0.11151158809661865, 0.11617929488420486, 0.12084700167179108, 0.12551471590995789, 0.1301824152469635, 0.1348501294851303, 0.13951782882213593, 0.14418554306030273, 0.14885324239730835, 0.15352095663547516, 0.15818867087364197, 0.16285637021064758, 0.1675240844488144, 0.17219178378582, 0.17685949802398682, 0.18152719736099243, 0.18619491159915924, 0.19086262583732605, 0.19553034007549286, 0.20019803941249847, 0.20486575365066528, 0.2095334529876709, 0.2142011672258377, 0.21886886656284332, 0.22353658080101013, 0.22820428013801575]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 7.0, 9.0, 11.0, 22.0, 24.0, 23.0, 36.0, 46.0, 48.0, 61.0, 72.0, 67.0, 75.0, 67.0, 68.0, 62.0, 55.0, 49.0, 42.0, 47.0, 33.0, 17.0, 19.0, 10.0, 14.0, 7.0, 8.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05067718029022217, -0.049203068017959595, -0.04772895574569702, -0.04625484347343445, -0.044780731201171875, -0.0433066189289093, -0.04183250665664673, -0.040358394384384155, -0.03888428211212158, -0.03741016983985901, -0.035936057567596436, -0.03446194529533386, -0.03298783302307129, -0.031513720750808716, -0.030039608478546143, -0.02856549620628357, -0.027091383934020996, -0.025617271661758423, -0.02414315938949585, -0.022669047117233276, -0.021194934844970703, -0.01972082257270813, -0.018246710300445557, -0.016772598028182983, -0.01529848575592041, -0.013824373483657837, -0.012350261211395264, -0.01087614893913269, -0.009402036666870117, -0.007927924394607544, -0.006453812122344971, -0.0049796998500823975, -0.0035055875778198242, -0.002031475305557251, -0.0005573630332946777, 0.0009167492389678955, 0.0023908615112304688, 0.003864973783493042, 0.005339086055755615, 0.0068131983280181885, 0.008287310600280762, 0.009761422872543335, 0.011235535144805908, 0.012709647417068481, 0.014183759689331055, 0.015657871961593628, 0.0171319842338562, 0.018606096506118774, 0.020080208778381348, 0.02155432105064392, 0.023028433322906494, 0.024502545595169067, 0.02597665786743164, 0.027450770139694214, 0.028924882411956787, 0.03039899468421936, 0.031873106956481934, 0.03334721922874451, 0.03482133150100708, 0.03629544377326965, 0.03776955604553223, 0.0392436683177948, 0.04071778059005737, 0.042191892862319946, 0.04366600513458252]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 7.0, 8.0, 9.0, 14.0, 23.0, 21.0, 25.0, 28.0, 45.0, 59.0, 87.0, 139.0, 177.0, 255.0, 381.0, 527.0, 885.0, 1537.0, 2997.0, 6621.0, 17979.0, 60983.0, 250028.0, 477317.0, 163457.0, 40934.0, 13087.0, 5065.0, 2418.0, 1247.0, 745.0, 463.0, 283.0, 229.0, 129.0, 91.0, 76.0, 45.0, 35.0, 23.0, 29.0, 9.0, 11.0, 8.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.006378173828125, -0.0061869025230407715, -0.005995631217956543, -0.0058043599128723145, -0.005613088607788086, -0.005421817302703857, -0.005230545997619629, -0.0050392746925354, -0.004848003387451172, -0.004656732082366943, -0.004465460777282715, -0.004274189472198486, -0.004082918167114258, -0.0038916468620300293, -0.0037003755569458008, -0.0035091042518615723, -0.0033178329467773438, -0.0031265616416931152, -0.0029352903366088867, -0.002744019031524658, -0.0025527477264404297, -0.002361476421356201, -0.0021702051162719727, -0.001978933811187744, -0.0017876625061035156, -0.0015963912010192871, -0.0014051198959350586, -0.00121384859085083, -0.0010225772857666016, -0.000831305980682373, -0.0006400346755981445, -0.000448763370513916, -0.0002574920654296875, -6.622076034545898e-05, 0.00012505054473876953, 0.00031632184982299805, 0.0005075931549072266, 0.0006988644599914551, 0.0008901357650756836, 0.0010814070701599121, 0.0012726783752441406, 0.0014639496803283691, 0.0016552209854125977, 0.0018464922904968262, 0.0020377635955810547, 0.002229034900665283, 0.0024203062057495117, 0.0026115775108337402, 0.0028028488159179688, 0.0029941201210021973, 0.0031853914260864258, 0.0033766627311706543, 0.003567934036254883, 0.0037592053413391113, 0.00395047664642334, 0.004141747951507568, 0.004333019256591797, 0.004524290561676025, 0.004715561866760254, 0.004906833171844482, 0.005098104476928711, 0.0052893757820129395, 0.005480647087097168, 0.0056719183921813965, 0.005863189697265625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 9.0, 16.0, 26.0, 36.0, 49.0, 78.0, 74.0, 95.0, 109.0, 111.0, 98.0, 104.0, 71.0, 31.0, 30.0, 18.0, 12.0, 11.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01348114013671875, -0.013149142265319824, -0.012817144393920898, -0.012485146522521973, -0.012153148651123047, -0.011821150779724121, -0.011489152908325195, -0.01115715503692627, -0.010825157165527344, -0.010493159294128418, -0.010161161422729492, -0.009829163551330566, -0.00949716567993164, -0.009165167808532715, -0.008833169937133789, -0.008501172065734863, -0.008169174194335938, -0.007837176322937012, -0.007505178451538086, -0.00717318058013916, -0.006841182708740234, -0.006509184837341309, -0.006177186965942383, -0.005845189094543457, -0.005513191223144531, -0.0051811933517456055, -0.00484919548034668, -0.004517197608947754, -0.004185199737548828, -0.0038532018661499023, -0.0035212039947509766, -0.0031892061233520508, -0.002857208251953125, -0.0025252103805541992, -0.0021932125091552734, -0.0018612146377563477, -0.0015292167663574219, -0.001197218894958496, -0.0008652210235595703, -0.0005332231521606445, -0.00020122528076171875, 0.00013077259063720703, 0.0004627704620361328, 0.0007947683334350586, 0.0011267662048339844, 0.0014587640762329102, 0.001790761947631836, 0.0021227598190307617, 0.0024547576904296875, 0.0027867555618286133, 0.003118753433227539, 0.003450751304626465, 0.0037827491760253906, 0.004114747047424316, 0.004446744918823242, 0.004778742790222168, 0.005110740661621094, 0.0054427385330200195, 0.005774736404418945, 0.006106734275817871, 0.006438732147216797, 0.006770730018615723, 0.0071027278900146484, 0.007434725761413574, 0.0077667236328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 8.0, 18.0, 22.0, 23.0, 34.0, 49.0, 80.0, 131.0, 237.0, 476.0, 994.0, 2397.0, 7521.0, 33828.0, 197468.0, 638011.0, 134321.0, 23643.0, 5588.0, 1924.0, 802.0, 388.0, 227.0, 134.0, 80.0, 53.0, 34.0, 15.0, 18.0, 10.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00833892822265625, -0.008045196533203125, -0.00775146484375, -0.007457733154296875, -0.00716400146484375, -0.006870269775390625, -0.0065765380859375, -0.006282806396484375, -0.00598907470703125, -0.005695343017578125, -0.005401611328125, -0.005107879638671875, -0.00481414794921875, -0.004520416259765625, -0.0042266845703125, -0.003932952880859375, -0.00363922119140625, -0.003345489501953125, -0.0030517578125, -0.002758026123046875, -0.00246429443359375, -0.002170562744140625, -0.0018768310546875, -0.001583099365234375, -0.00128936767578125, -0.000995635986328125, -0.000701904296875, -0.000408172607421875, -0.00011444091796875, 0.000179290771484375, 0.0004730224609375, 0.000766754150390625, 0.00106048583984375, 0.001354217529296875, 0.00164794921875, 0.001941680908203125, 0.00223541259765625, 0.002529144287109375, 0.0028228759765625, 0.003116607666015625, 0.00341033935546875, 0.003704071044921875, 0.003997802734375, 0.004291534423828125, 0.00458526611328125, 0.004878997802734375, 0.0051727294921875, 0.005466461181640625, 0.00576019287109375, 0.006053924560546875, 0.00634765625, 0.006641387939453125, 0.00693511962890625, 0.007228851318359375, 0.0075225830078125, 0.007816314697265625, 0.00811004638671875, 0.008403778076171875, 0.008697509765625, 0.008991241455078125, 0.00928497314453125, 0.009578704833984375, 0.0098724365234375, 0.010166168212890625, 0.01045989990234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 12.0, 15.0, 18.0, 20.0, 21.0, 18.0, 28.0, 27.0, 33.0, 25.0, 40.0, 36.0, 35.0, 44.0, 32.0, 44.0, 47.0, 52.0, 50.0, 40.0, 39.0, 39.0, 41.0, 33.0, 31.0, 30.0, 26.0, 21.0, 21.0, 14.0, 17.0, 13.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0190582275390625, -0.01848149299621582, -0.01790475845336914, -0.01732802391052246, -0.01675128936767578, -0.0161745548248291, -0.015597820281982422, -0.015021085739135742, -0.014444351196289062, -0.013867616653442383, -0.013290882110595703, -0.012714147567749023, -0.012137413024902344, -0.011560678482055664, -0.010983943939208984, -0.010407209396362305, -0.009830474853515625, -0.009253740310668945, -0.008677005767822266, -0.008100271224975586, -0.007523536682128906, -0.0069468021392822266, -0.006370067596435547, -0.005793333053588867, -0.0052165985107421875, -0.004639863967895508, -0.004063129425048828, -0.0034863948822021484, -0.0029096603393554688, -0.002332925796508789, -0.0017561912536621094, -0.0011794567108154297, -0.00060272216796875, -2.5987625122070312e-05, 0.0005507469177246094, 0.001127481460571289, 0.0017042160034179688, 0.0022809505462646484, 0.002857685089111328, 0.003434419631958008, 0.0040111541748046875, 0.004587888717651367, 0.005164623260498047, 0.0057413578033447266, 0.006318092346191406, 0.006894826889038086, 0.007471561431884766, 0.008048295974731445, 0.008625030517578125, 0.009201765060424805, 0.009778499603271484, 0.010355234146118164, 0.010931968688964844, 0.011508703231811523, 0.012085437774658203, 0.012662172317504883, 0.013238906860351562, 0.013815641403198242, 0.014392375946044922, 0.014969110488891602, 0.015545845031738281, 0.01612257957458496, 0.01669931411743164, 0.01727604866027832, 0.017852783203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 8.0, 6.0, 13.0, 14.0, 17.0, 16.0, 23.0, 44.0, 60.0, 69.0, 131.0, 208.0, 336.0, 552.0, 1009.0, 1991.0, 4027.0, 9334.0, 23613.0, 79037.0, 591523.0, 253355.0, 51536.0, 17512.0, 7250.0, 3176.0, 1602.0, 806.0, 451.0, 276.0, 194.0, 102.0, 76.0, 46.0, 37.0, 19.0, 19.0, 10.0, 13.0, 7.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.0021572113037109375, -0.002091526985168457, -0.0020258426666259766, -0.001960158348083496, -0.0018944740295410156, -0.0018287897109985352, -0.0017631053924560547, -0.0016974210739135742, -0.0016317367553710938, -0.0015660524368286133, -0.0015003681182861328, -0.0014346837997436523, -0.0013689994812011719, -0.0013033151626586914, -0.001237630844116211, -0.0011719465255737305, -0.00110626220703125, -0.0010405778884887695, -0.0009748935699462891, -0.0009092092514038086, -0.0008435249328613281, -0.0007778406143188477, -0.0007121562957763672, -0.0006464719772338867, -0.0005807876586914062, -0.0005151033401489258, -0.0004494190216064453, -0.00038373470306396484, -0.0003180503845214844, -0.0002523660659790039, -0.00018668174743652344, -0.00012099742889404297, -5.53131103515625e-05, 1.0371208190917969e-05, 7.605552673339844e-05, 0.0001417398452758789, 0.00020742416381835938, 0.00027310848236083984, 0.0003387928009033203, 0.0004044771194458008, 0.00047016143798828125, 0.0005358457565307617, 0.0006015300750732422, 0.0006672143936157227, 0.0007328987121582031, 0.0007985830307006836, 0.0008642673492431641, 0.0009299516677856445, 0.000995635986328125, 0.0010613203048706055, 0.001127004623413086, 0.0011926889419555664, 0.0012583732604980469, 0.0013240575790405273, 0.0013897418975830078, 0.0014554262161254883, 0.0015211105346679688, 0.0015867948532104492, 0.0016524791717529297, 0.0017181634902954102, 0.0017838478088378906, 0.001849532127380371, 0.0019152164459228516, 0.001980900764465332, 0.0020465850830078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 11.0, 8.0, 14.0, 16.0, 22.0, 13.0, 27.0, 17.0, 9.0, 41.0, 36.0, 16.0, 43.0, 33.0, 16.0, 45.0, 46.0, 29.0, 52.0, 44.0, 42.0, 26.0, 47.0, 44.0, 22.0, 43.0, 49.0, 12.0, 29.0, 17.0, 13.0, 27.0, 12.0, 8.0, 7.0, 11.0, 8.0, 7.0, 8.0, 8.0, 1.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.2782554626464844e-06, -3.1776726245880127e-06, -3.077089786529541e-06, -2.9765069484710693e-06, -2.8759241104125977e-06, -2.775341272354126e-06, -2.6747584342956543e-06, -2.5741755962371826e-06, -2.473592758178711e-06, -2.3730099201202393e-06, -2.2724270820617676e-06, -2.171844244003296e-06, -2.0712614059448242e-06, -1.9706785678863525e-06, -1.8700957298278809e-06, -1.7695128917694092e-06, -1.6689300537109375e-06, -1.5683472156524658e-06, -1.4677643775939941e-06, -1.3671815395355225e-06, -1.2665987014770508e-06, -1.166015863418579e-06, -1.0654330253601074e-06, -9.648501873016357e-07, -8.642673492431641e-07, -7.636845111846924e-07, -6.631016731262207e-07, -5.62518835067749e-07, -4.6193599700927734e-07, -3.6135315895080566e-07, -2.60770320892334e-07, -1.601874828338623e-07, -5.960464477539063e-08, 4.0978193283081055e-08, 1.4156103134155273e-07, 2.421438694000244e-07, 3.427267074584961e-07, 4.4330954551696777e-07, 5.438923835754395e-07, 6.444752216339111e-07, 7.450580596923828e-07, 8.456408977508545e-07, 9.462237358093262e-07, 1.0468065738677979e-06, 1.1473894119262695e-06, 1.2479722499847412e-06, 1.3485550880432129e-06, 1.4491379261016846e-06, 1.5497207641601562e-06, 1.650303602218628e-06, 1.7508864402770996e-06, 1.8514692783355713e-06, 1.952052116394043e-06, 2.0526349544525146e-06, 2.1532177925109863e-06, 2.253800630569458e-06, 2.3543834686279297e-06, 2.4549663066864014e-06, 2.555549144744873e-06, 2.6561319828033447e-06, 2.7567148208618164e-06, 2.857297658920288e-06, 2.9578804969787598e-06, 3.0584633350372314e-06, 3.159046173095703e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 8.0, 10.0, 14.0, 21.0, 28.0, 24.0, 57.0, 93.0, 152.0, 272.0, 659.0, 1424.0, 3898.0, 13638.0, 74142.0, 720978.0, 195909.0, 26839.0, 6374.0, 2192.0, 877.0, 416.0, 197.0, 121.0, 63.0, 42.0, 29.0, 20.0, 18.0, 12.0, 6.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0026264190673828125, -0.0025409162044525146, -0.002455413341522217, -0.002369910478591919, -0.002284407615661621, -0.0021989047527313232, -0.0021134018898010254, -0.0020278990268707275, -0.0019423961639404297, -0.0018568933010101318, -0.001771390438079834, -0.0016858875751495361, -0.0016003847122192383, -0.0015148818492889404, -0.0014293789863586426, -0.0013438761234283447, -0.0012583732604980469, -0.001172870397567749, -0.0010873675346374512, -0.0010018646717071533, -0.0009163618087768555, -0.0008308589458465576, -0.0007453560829162598, -0.0006598532199859619, -0.0005743503570556641, -0.0004888474941253662, -0.00040334463119506836, -0.0003178417682647705, -0.00023233890533447266, -0.0001468360424041748, -6.133317947387695e-05, 2.41696834564209e-05, 0.00010967254638671875, 0.0001951754093170166, 0.00028067827224731445, 0.0003661811351776123, 0.00045168399810791016, 0.000537186861038208, 0.0006226897239685059, 0.0007081925868988037, 0.0007936954498291016, 0.0008791983127593994, 0.0009647011756896973, 0.0010502040386199951, 0.001135706901550293, 0.0012212097644805908, 0.0013067126274108887, 0.0013922154903411865, 0.0014777183532714844, 0.0015632212162017822, 0.00164872407913208, 0.001734226942062378, 0.0018197298049926758, 0.0019052326679229736, 0.0019907355308532715, 0.0020762383937835693, 0.002161741256713867, 0.002247244119644165, 0.002332746982574463, 0.0024182498455047607, 0.0025037527084350586, 0.0025892555713653564, 0.0026747584342956543, 0.002760261297225952, 0.00284576416015625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 7.0, 14.0, 28.0, 26.0, 36.0, 62.0, 75.0, 102.0, 136.0, 125.0, 105.0, 80.0, 64.0, 47.0, 31.0, 19.0, 9.0, 4.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044097900390625, -0.004275918006896973, -0.004142045974731445, -0.004008173942565918, -0.0038743019104003906, -0.0037404298782348633, -0.003606557846069336, -0.0034726858139038086, -0.0033388137817382812, -0.003204941749572754, -0.0030710697174072266, -0.0029371976852416992, -0.002803325653076172, -0.0026694536209106445, -0.002535581588745117, -0.00240170955657959, -0.0022678375244140625, -0.002133965492248535, -0.002000093460083008, -0.0018662214279174805, -0.0017323493957519531, -0.0015984773635864258, -0.0014646053314208984, -0.001330733299255371, -0.0011968612670898438, -0.0010629892349243164, -0.0009291172027587891, -0.0007952451705932617, -0.0006613731384277344, -0.000527501106262207, -0.0003936290740966797, -0.00025975704193115234, -0.000125885009765625, 7.987022399902344e-06, 0.0001418590545654297, 0.00027573108673095703, 0.0004096031188964844, 0.0005434751510620117, 0.0006773471832275391, 0.0008112192153930664, 0.0009450912475585938, 0.001078963279724121, 0.0012128353118896484, 0.0013467073440551758, 0.0014805793762207031, 0.0016144514083862305, 0.0017483234405517578, 0.0018821954727172852, 0.0020160675048828125, 0.00214993953704834, 0.002283811569213867, 0.0024176836013793945, 0.002551555633544922, 0.0026854276657104492, 0.0028192996978759766, 0.002953171730041504, 0.0030870437622070312, 0.0032209157943725586, 0.003354787826538086, 0.0034886598587036133, 0.0036225318908691406, 0.003756403923034668, 0.0038902759552001953, 0.004024147987365723, 0.00415802001953125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 14.0, 14.0, 37.0, 60.0, 208.0, 367.0, 198.0, 62.0, 18.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.143324077129364, -0.14003857970237732, -0.13675309717655182, -0.13346759974956512, -0.13018210232257843, -0.12689660489559174, -0.12361112236976624, -0.12032562494277954, -0.11704012751579285, -0.11375463753938675, -0.11046914011240005, -0.10718365013599396, -0.10389815270900726, -0.10061266273260117, -0.09732717275619507, -0.09404167532920837, -0.09075618535280228, -0.08747069537639618, -0.08418519794940948, -0.08089970797300339, -0.0776142105460167, -0.0743287205696106, -0.0710432231426239, -0.0677577331662178, -0.0644722431898117, -0.06118674948811531, -0.057901255786418915, -0.05461576581001282, -0.05133026838302612, -0.048044778406620026, -0.04475928470492363, -0.041473791003227234, -0.03818829357624054, -0.034902799874544144, -0.03161730617284775, -0.0283318143337965, -0.025046320632100105, -0.02176082693040371, -0.018475335091352463, -0.015189841389656067, -0.011904347687959671, -0.008618853986263275, -0.005333361215889454, -0.0020478684455156326, 0.0012376252561807632, 0.004523118957877159, 0.007808610796928406, 0.011094104498624802, 0.014379598200321198, 0.017665091902017593, 0.02095058560371399, 0.024236077442765236, 0.027521571144461632, 0.030807064846158028, 0.034092556685209274, 0.03737805038690567, 0.040663544088602066, 0.04394903779029846, 0.04723453149199486, 0.050520025193691254, 0.05380551517009735, 0.057091012597084045, 0.06037650257349014, 0.06366199254989624, 0.06694748997688293]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 6.0, 8.0, 7.0, 7.0, 12.0, 15.0, 18.0, 26.0, 24.0, 27.0, 28.0, 29.0, 40.0, 46.0, 49.0, 59.0, 88.0, 73.0, 77.0, 50.0, 31.0, 29.0, 32.0, 33.0, 26.0, 20.0, 16.0, 17.0, 14.0, 10.0, 15.0, 10.0, 4.0, 10.0, 6.0, 4.0, 5.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.07070803642272949, -0.06848625838756561, -0.06626448035240173, -0.06404269486665726, -0.06182091683149338, -0.0595991387963295, -0.05737735703587532, -0.05515557527542114, -0.05293379724025726, -0.050712019205093384, -0.048490237444639206, -0.04626845568418503, -0.04404667764902115, -0.04182489961385727, -0.03960311785340309, -0.037381336092948914, -0.035159558057785034, -0.032937780022621155, -0.030715998262166977, -0.02849421836435795, -0.02627243846654892, -0.02405065856873989, -0.021828878670930862, -0.019607098773121834, -0.017385318875312805, -0.015163538977503777, -0.012941759079694748, -0.01071997918188572, -0.00849819928407669, -0.006276419386267662, -0.004054639488458633, -0.0018328595906496048, 0.00038892030715942383, 0.0026107002049684525, 0.004832480102777481, 0.00705426000058651, 0.009276039898395538, 0.011497819796204567, 0.013719599694013596, 0.015941379591822624, 0.018163159489631653, 0.02038493938744068, 0.02260671928524971, 0.02482849918305874, 0.027050279080867767, 0.029272058978676796, 0.031493838876485825, 0.03371562063694, 0.03593739867210388, 0.03815917670726776, 0.04038095846772194, 0.04260274022817612, 0.044824518263339996, 0.047046296298503876, 0.049268078058958054, 0.05148985981941223, 0.05371163785457611, 0.05593341588973999, 0.05815519765019417, 0.060376979410648346, 0.06259875744581223, 0.0648205354809761, 0.06704232096672058, 0.06926409900188446, 0.07148587703704834]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 13.0, 20.0, 32.0, 34.0, 75.0, 148.0, 333.0, 933.0, 7109.0, 258755.0, 3771485.0, 132904.0, 16259.0, 4481.0, 1233.0, 278.0, 64.0, 42.0, 25.0, 16.0, 8.0, 7.0, 2.0, 2.0, 1.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01087188720703125, -0.01055610179901123, -0.010240316390991211, -0.009924530982971191, -0.009608745574951172, -0.009292960166931152, -0.008977174758911133, -0.008661389350891113, -0.008345603942871094, -0.008029818534851074, -0.007714033126831055, -0.007398247718811035, -0.007082462310791016, -0.006766676902770996, -0.0064508914947509766, -0.006135106086730957, -0.0058193206787109375, -0.005503535270690918, -0.0051877498626708984, -0.004871964454650879, -0.004556179046630859, -0.00424039363861084, -0.00392460823059082, -0.0036088228225708008, -0.0032930374145507812, -0.0029772520065307617, -0.002661466598510742, -0.0023456811904907227, -0.002029895782470703, -0.0017141103744506836, -0.001398324966430664, -0.0010825395584106445, -0.000766754150390625, -0.00045096874237060547, -0.00013518333435058594, 0.0001806020736694336, 0.0004963874816894531, 0.0008121728897094727, 0.0011279582977294922, 0.0014437437057495117, 0.0017595291137695312, 0.0020753145217895508, 0.0023910999298095703, 0.00270688533782959, 0.0030226707458496094, 0.003338456153869629, 0.0036542415618896484, 0.003970026969909668, 0.0042858123779296875, 0.004601597785949707, 0.0049173831939697266, 0.005233168601989746, 0.005548954010009766, 0.005864739418029785, 0.006180524826049805, 0.006496310234069824, 0.006812095642089844, 0.007127881050109863, 0.007443666458129883, 0.007759451866149902, 0.008075237274169922, 0.008391022682189941, 0.008706808090209961, 0.00902259349822998, 0.00933837890625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 7.0, 13.0, 26.0, 37.0, 52.0, 59.0, 87.0, 110.0, 117.0, 115.0, 95.0, 74.0, 64.0, 47.0, 27.0, 15.0, 16.0, 16.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01348114013671875, -0.013149023056030273, -0.012816905975341797, -0.01248478889465332, -0.012152671813964844, -0.011820554733276367, -0.01148843765258789, -0.011156320571899414, -0.010824203491210938, -0.010492086410522461, -0.010159969329833984, -0.009827852249145508, -0.009495735168457031, -0.009163618087768555, -0.008831501007080078, -0.008499383926391602, -0.008167266845703125, -0.007835149765014648, -0.007503032684326172, -0.007170915603637695, -0.006838798522949219, -0.006506681442260742, -0.006174564361572266, -0.005842447280883789, -0.0055103302001953125, -0.005178213119506836, -0.004846096038818359, -0.004513978958129883, -0.004181861877441406, -0.0038497447967529297, -0.003517627716064453, -0.0031855106353759766, -0.0028533935546875, -0.0025212764739990234, -0.002189159393310547, -0.0018570423126220703, -0.0015249252319335938, -0.0011928081512451172, -0.0008606910705566406, -0.0005285739898681641, -0.0001964569091796875, 0.00013566017150878906, 0.0004677772521972656, 0.0007998943328857422, 0.0011320114135742188, 0.0014641284942626953, 0.0017962455749511719, 0.0021283626556396484, 0.002460479736328125, 0.0027925968170166016, 0.003124713897705078, 0.0034568309783935547, 0.0037889480590820312, 0.004121065139770508, 0.004453182220458984, 0.004785299301147461, 0.0051174163818359375, 0.005449533462524414, 0.005781650543212891, 0.006113767623901367, 0.006445884704589844, 0.00677800178527832, 0.007110118865966797, 0.0074422359466552734, 0.00777435302734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 15.0, 26.0, 63.0, 131.0, 182.0, 278.0, 3683.0, 4188731.0, 611.0, 232.0, 160.0, 94.0, 50.0, 16.0, 11.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06011962890625, -0.058136940002441406, -0.05615425109863281, -0.05417156219482422, -0.052188873291015625, -0.05020618438720703, -0.04822349548339844, -0.046240806579589844, -0.04425811767578125, -0.042275428771972656, -0.04029273986816406, -0.03831005096435547, -0.036327362060546875, -0.03434467315673828, -0.03236198425292969, -0.030379295349121094, -0.0283966064453125, -0.026413917541503906, -0.024431228637695312, -0.02244853973388672, -0.020465850830078125, -0.01848316192626953, -0.016500473022460938, -0.014517784118652344, -0.01253509521484375, -0.010552406311035156, -0.008569717407226562, -0.006587028503417969, -0.004604339599609375, -0.0026216506958007812, -0.0006389617919921875, 0.0013437271118164062, 0.003326416015625, 0.005309104919433594, 0.0072917938232421875, 0.009274482727050781, 0.011257171630859375, 0.013239860534667969, 0.015222549438476562, 0.017205238342285156, 0.01918792724609375, 0.021170616149902344, 0.023153305053710938, 0.02513599395751953, 0.027118682861328125, 0.02910137176513672, 0.031084060668945312, 0.033066749572753906, 0.0350494384765625, 0.037032127380371094, 0.03901481628417969, 0.04099750518798828, 0.042980194091796875, 0.04496288299560547, 0.04694557189941406, 0.048928260803222656, 0.05091094970703125, 0.052893638610839844, 0.05487632751464844, 0.05685901641845703, 0.058841705322265625, 0.06082439422607422, 0.06280708312988281, 0.0647897720336914, 0.0667724609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 10.0, 47.0, 1657.0, 2278.0, 65.0, 20.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045166015625, -0.04398059844970703, -0.04279518127441406, -0.041609764099121094, -0.040424346923828125, -0.039238929748535156, -0.03805351257324219, -0.03686809539794922, -0.03568267822265625, -0.03449726104736328, -0.03331184387207031, -0.032126426696777344, -0.030941009521484375, -0.029755592346191406, -0.028570175170898438, -0.02738475799560547, -0.0261993408203125, -0.02501392364501953, -0.023828506469726562, -0.022643089294433594, -0.021457672119140625, -0.020272254943847656, -0.019086837768554688, -0.01790142059326172, -0.01671600341796875, -0.015530586242675781, -0.014345169067382812, -0.013159751892089844, -0.011974334716796875, -0.010788917541503906, -0.009603500366210938, -0.008418083190917969, -0.007232666015625, -0.006047248840332031, -0.0048618316650390625, -0.0036764144897460938, -0.002490997314453125, -0.0013055801391601562, -0.0001201629638671875, 0.0010652542114257812, 0.00225067138671875, 0.0034360885620117188, 0.0046215057373046875, 0.005806922912597656, 0.006992340087890625, 0.008177757263183594, 0.009363174438476562, 0.010548591613769531, 0.0117340087890625, 0.012919425964355469, 0.014104843139648438, 0.015290260314941406, 0.016475677490234375, 0.017661094665527344, 0.018846511840820312, 0.02003192901611328, 0.02121734619140625, 0.02240276336669922, 0.023588180541992188, 0.024773597717285156, 0.025959014892578125, 0.027144432067871094, 0.028329849243164062, 0.02951526641845703, 0.03070068359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 8.0, 14.0, 24.0, 40.0, 84.0, 145.0, 229.0, 189.0, 116.0, 68.0, 32.0, 23.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05415951833128929, -0.05221942812204361, -0.05027933791279793, -0.048339247703552246, -0.04639916121959686, -0.04445907101035118, -0.0425189808011055, -0.04057889059185982, -0.038638800382614136, -0.036698710173368454, -0.03475861996412277, -0.03281853348016739, -0.030878443270921707, -0.028938353061676025, -0.026998262852430344, -0.025058172643184662, -0.02311808615922928, -0.021177995949983597, -0.019237907603383064, -0.017297817394137383, -0.015357728116214275, -0.013417638838291168, -0.011477548629045486, -0.00953745935112238, -0.007597370073199272, -0.005657280795276165, -0.0037171910516917706, -0.001777101308107376, 0.00016298796981573105, 0.002103077247738838, 0.00404316745698452, 0.005983256734907627, 0.007923342287540436, 0.009863431565463543, 0.01180352084338665, 0.013743611052632332, 0.015683699399232864, 0.017623789608478546, 0.019563879817724228, 0.02150397002696991, 0.023444058373570442, 0.025384148582816124, 0.027324236929416656, 0.029264327138662338, 0.03120441734790802, 0.0331445038318634, 0.035084597766399384, 0.03702468425035477, 0.03896477445960045, 0.04090486466884613, 0.04284495487809181, 0.044785045087337494, 0.04672513157129288, 0.04866522178053856, 0.05060531198978424, 0.05254540219902992, 0.054485492408275604, 0.056425582617521286, 0.05836567282676697, 0.06030575931072235, 0.06224584951996803, 0.06418593972921371, 0.0661260336637497, 0.06806612014770508, 0.07000620663166046]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 5.0, 7.0, 10.0, 11.0, 10.0, 13.0, 13.0, 18.0, 20.0, 21.0, 29.0, 25.0, 26.0, 34.0, 24.0, 28.0, 27.0, 29.0, 28.0, 22.0, 24.0, 42.0, 37.0, 28.0, 40.0, 40.0, 36.0, 25.0, 44.0, 30.0, 32.0, 21.0, 22.0, 27.0, 21.0, 20.0, 25.0, 18.0, 10.0, 8.0, 12.0, 11.0, 7.0, 8.0, 3.0, 5.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.030307292938232422, -0.029374143108725548, -0.028440993279218674, -0.0275078434497118, -0.026574693620204926, -0.02564154379069805, -0.024708393961191177, -0.023775244131684303, -0.02284209430217743, -0.021908944472670555, -0.02097579464316368, -0.020042644813656807, -0.019109494984149933, -0.01817634515464306, -0.017243195325136185, -0.01631004549562931, -0.015376895666122437, -0.014443745836615562, -0.013510596007108688, -0.012577446177601814, -0.01164429634809494, -0.010711146518588066, -0.009777996689081192, -0.008844846859574318, -0.007911697030067444, -0.00697854720056057, -0.006045397371053696, -0.005112247541546822, -0.0041790977120399475, -0.0032459478825330734, -0.0023127980530261993, -0.0013796482235193253, -0.00044649839401245117, 0.0004866514354944229, 0.001419801265001297, 0.002352951094508171, 0.003286100924015045, 0.004219250753521919, 0.005152400583028793, 0.006085550412535667, 0.0070187002420425415, 0.007951850071549416, 0.00888499990105629, 0.009818149730563164, 0.010751299560070038, 0.011684449389576912, 0.012617599219083786, 0.01355074904859066, 0.014483898878097534, 0.015417048707604408, 0.016350198537111282, 0.017283348366618156, 0.01821649819612503, 0.019149648025631905, 0.02008279785513878, 0.021015947684645653, 0.021949097514152527, 0.0228822473436594, 0.023815397173166275, 0.02474854700267315, 0.025681696832180023, 0.026614846661686897, 0.02754799649119377, 0.028481146320700645, 0.02941429615020752]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 10.0, 15.0, 19.0, 31.0, 35.0, 44.0, 63.0, 80.0, 105.0, 153.0, 219.0, 288.0, 525.0, 815.0, 1285.0, 2589.0, 5788.0, 14164.0, 44475.0, 169004.0, 481641.0, 234684.0, 59929.0, 18334.0, 6985.0, 3076.0, 1632.0, 874.0, 576.0, 324.0, 215.0, 167.0, 96.0, 82.0, 57.0, 42.0, 32.0, 25.0, 21.0, 14.0, 12.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.0069122314453125, -0.006718158721923828, -0.006524085998535156, -0.006330013275146484, -0.0061359405517578125, -0.005941867828369141, -0.005747795104980469, -0.005553722381591797, -0.005359649658203125, -0.005165576934814453, -0.004971504211425781, -0.004777431488037109, -0.0045833587646484375, -0.004389286041259766, -0.004195213317871094, -0.004001140594482422, -0.00380706787109375, -0.003612995147705078, -0.0034189224243164062, -0.0032248497009277344, -0.0030307769775390625, -0.0028367042541503906, -0.0026426315307617188, -0.002448558807373047, -0.002254486083984375, -0.002060413360595703, -0.0018663406372070312, -0.0016722679138183594, -0.0014781951904296875, -0.0012841224670410156, -0.0010900497436523438, -0.0008959770202636719, -0.000701904296875, -0.0005078315734863281, -0.00031375885009765625, -0.00011968612670898438, 7.43865966796875e-05, 0.0002684593200683594, 0.00046253204345703125, 0.0006566047668457031, 0.000850677490234375, 0.0010447502136230469, 0.0012388229370117188, 0.0014328956604003906, 0.0016269683837890625, 0.0018210411071777344, 0.0020151138305664062, 0.002209186553955078, 0.00240325927734375, 0.002597332000732422, 0.0027914047241210938, 0.0029854774475097656, 0.0031795501708984375, 0.0033736228942871094, 0.0035676956176757812, 0.003761768341064453, 0.003955841064453125, 0.004149913787841797, 0.004343986511230469, 0.004538059234619141, 0.0047321319580078125, 0.004926204681396484, 0.005120277404785156, 0.005314350128173828, 0.0055084228515625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 15.0, 19.0, 23.0, 36.0, 50.0, 74.0, 88.0, 93.0, 117.0, 105.0, 99.0, 63.0, 72.0, 41.0, 33.0, 22.0, 14.0, 9.0, 10.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01345062255859375, -0.013126730918884277, -0.012802839279174805, -0.012478947639465332, -0.01215505599975586, -0.011831164360046387, -0.011507272720336914, -0.011183381080627441, -0.010859489440917969, -0.010535597801208496, -0.010211706161499023, -0.00988781452178955, -0.009563922882080078, -0.009240031242370605, -0.008916139602661133, -0.00859224796295166, -0.008268356323242188, -0.007944464683532715, -0.007620573043823242, -0.0072966814041137695, -0.006972789764404297, -0.006648898124694824, -0.0063250064849853516, -0.006001114845275879, -0.005677223205566406, -0.005353331565856934, -0.005029439926147461, -0.004705548286437988, -0.004381656646728516, -0.004057765007019043, -0.0037338733673095703, -0.0034099817276000977, -0.003086090087890625, -0.0027621984481811523, -0.0024383068084716797, -0.002114415168762207, -0.0017905235290527344, -0.0014666318893432617, -0.001142740249633789, -0.0008188486099243164, -0.0004949569702148438, -0.0001710653305053711, 0.00015282630920410156, 0.0004767179489135742, 0.0008006095886230469, 0.0011245012283325195, 0.0014483928680419922, 0.0017722845077514648, 0.0020961761474609375, 0.00242006778717041, 0.002743959426879883, 0.0030678510665893555, 0.003391742706298828, 0.0037156343460083008, 0.0040395259857177734, 0.004363417625427246, 0.004687309265136719, 0.005011200904846191, 0.005335092544555664, 0.005658984184265137, 0.005982875823974609, 0.006306767463684082, 0.006630659103393555, 0.006954550743103027, 0.0072784423828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 15.0, 14.0, 20.0, 16.0, 29.0, 39.0, 52.0, 65.0, 65.0, 97.0, 139.0, 166.0, 188.0, 320.0, 476.0, 787.0, 1520.0, 4011.0, 13605.0, 67910.0, 574061.0, 313220.0, 53258.0, 11390.0, 3398.0, 1459.0, 722.0, 429.0, 300.0, 188.0, 128.0, 96.0, 88.0, 61.0, 50.0, 31.0, 30.0, 24.0, 12.0, 13.0, 9.0, 5.0, 10.0, 6.0, 0.0, 4.0, 4.0, 3.0, 0.0, 4.0, 3.0], "bins": [-0.00945281982421875, -0.009174227714538574, -0.008895635604858398, -0.008617043495178223, -0.008338451385498047, -0.008059859275817871, -0.007781267166137695, -0.0075026750564575195, -0.007224082946777344, -0.006945490837097168, -0.006666898727416992, -0.006388306617736816, -0.006109714508056641, -0.005831122398376465, -0.005552530288696289, -0.005273938179016113, -0.0049953460693359375, -0.004716753959655762, -0.004438161849975586, -0.00415956974029541, -0.0038809776306152344, -0.0036023855209350586, -0.003323793411254883, -0.003045201301574707, -0.0027666091918945312, -0.0024880170822143555, -0.0022094249725341797, -0.001930832862854004, -0.0016522407531738281, -0.0013736486434936523, -0.0010950565338134766, -0.0008164644241333008, -0.000537872314453125, -0.0002592802047729492, 1.9311904907226562e-05, 0.00029790401458740234, 0.0005764961242675781, 0.0008550882339477539, 0.0011336803436279297, 0.0014122724533081055, 0.0016908645629882812, 0.001969456672668457, 0.002248048782348633, 0.0025266408920288086, 0.0028052330017089844, 0.00308382511138916, 0.003362417221069336, 0.0036410093307495117, 0.0039196014404296875, 0.004198193550109863, 0.004476785659790039, 0.004755377769470215, 0.005033969879150391, 0.005312561988830566, 0.005591154098510742, 0.005869746208190918, 0.006148338317871094, 0.0064269304275512695, 0.006705522537231445, 0.006984114646911621, 0.007262706756591797, 0.007541298866271973, 0.007819890975952148, 0.008098483085632324, 0.0083770751953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 4.0, 3.0, 10.0, 12.0, 8.0, 16.0, 12.0, 24.0, 17.0, 32.0, 21.0, 42.0, 33.0, 44.0, 42.0, 48.0, 42.0, 40.0, 53.0, 49.0, 42.0, 36.0, 38.0, 36.0, 30.0, 36.0, 38.0, 32.0, 27.0, 24.0, 15.0, 22.0, 7.0, 11.0, 10.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0174407958984375, -0.016884326934814453, -0.016327857971191406, -0.01577138900756836, -0.015214920043945312, -0.014658451080322266, -0.014101982116699219, -0.013545513153076172, -0.012989044189453125, -0.012432575225830078, -0.011876106262207031, -0.011319637298583984, -0.010763168334960938, -0.01020669937133789, -0.009650230407714844, -0.009093761444091797, -0.00853729248046875, -0.007980823516845703, -0.007424354553222656, -0.006867885589599609, -0.0063114166259765625, -0.005754947662353516, -0.005198478698730469, -0.004642009735107422, -0.004085540771484375, -0.003529071807861328, -0.0029726028442382812, -0.0024161338806152344, -0.0018596649169921875, -0.0013031959533691406, -0.0007467269897460938, -0.00019025802612304688, 0.0003662109375, 0.0009226799011230469, 0.0014791488647460938, 0.0020356178283691406, 0.0025920867919921875, 0.0031485557556152344, 0.0037050247192382812, 0.004261493682861328, 0.004817962646484375, 0.005374431610107422, 0.005930900573730469, 0.006487369537353516, 0.0070438385009765625, 0.007600307464599609, 0.008156776428222656, 0.008713245391845703, 0.00926971435546875, 0.009826183319091797, 0.010382652282714844, 0.01093912124633789, 0.011495590209960938, 0.012052059173583984, 0.012608528137207031, 0.013164997100830078, 0.013721466064453125, 0.014277935028076172, 0.014834403991699219, 0.015390872955322266, 0.015947341918945312, 0.01650381088256836, 0.017060279846191406, 0.017616748809814453, 0.0181732177734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 11.0, 11.0, 11.0, 24.0, 39.0, 50.0, 104.0, 187.0, 264.0, 467.0, 786.0, 1535.0, 3646.0, 9628.0, 36009.0, 211004.0, 686329.0, 71809.0, 16497.0, 5368.0, 2238.0, 1021.0, 574.0, 330.0, 207.0, 140.0, 75.0, 50.0, 44.0, 14.0, 14.0, 8.0, 9.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.002288818359375, -0.0022155046463012695, -0.002142190933227539, -0.0020688772201538086, -0.001995563507080078, -0.0019222497940063477, -0.0018489360809326172, -0.0017756223678588867, -0.0017023086547851562, -0.0016289949417114258, -0.0015556812286376953, -0.0014823675155639648, -0.0014090538024902344, -0.001335740089416504, -0.0012624263763427734, -0.001189112663269043, -0.0011157989501953125, -0.001042485237121582, -0.0009691715240478516, -0.0008958578109741211, -0.0008225440979003906, -0.0007492303848266602, -0.0006759166717529297, -0.0006026029586791992, -0.0005292892456054688, -0.0004559755325317383, -0.0003826618194580078, -0.00030934810638427734, -0.00023603439331054688, -0.0001627206802368164, -8.940696716308594e-05, -1.609325408935547e-05, 5.7220458984375e-05, 0.00013053417205810547, 0.00020384788513183594, 0.0002771615982055664, 0.0003504753112792969, 0.00042378902435302734, 0.0004971027374267578, 0.0005704164505004883, 0.0006437301635742188, 0.0007170438766479492, 0.0007903575897216797, 0.0008636713027954102, 0.0009369850158691406, 0.001010298728942871, 0.0010836124420166016, 0.001156926155090332, 0.0012302398681640625, 0.001303553581237793, 0.0013768672943115234, 0.001450181007385254, 0.0015234947204589844, 0.0015968084335327148, 0.0016701221466064453, 0.0017434358596801758, 0.0018167495727539062, 0.0018900632858276367, 0.001963376998901367, 0.0020366907119750977, 0.002110004425048828, 0.0021833181381225586, 0.002256631851196289, 0.0023299455642700195, 0.00240325927734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 2.0, 8.0, 15.0, 17.0, 10.0, 18.0, 22.0, 27.0, 31.0, 36.0, 35.0, 37.0, 37.0, 52.0, 42.0, 53.0, 81.0, 52.0, 45.0, 38.0, 40.0, 44.0, 42.0, 59.0, 22.0, 19.0, 18.0, 19.0, 13.0, 17.0, 11.0, 7.0, 8.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.589557647705078e-06, -4.4619664549827576e-06, -4.334375262260437e-06, -4.2067840695381165e-06, -4.079192876815796e-06, -3.951601684093475e-06, -3.824010491371155e-06, -3.6964192986488342e-06, -3.5688281059265137e-06, -3.441236913204193e-06, -3.3136457204818726e-06, -3.186054527759552e-06, -3.0584633350372314e-06, -2.930872142314911e-06, -2.8032809495925903e-06, -2.6756897568702698e-06, -2.5480985641479492e-06, -2.4205073714256287e-06, -2.292916178703308e-06, -2.1653249859809875e-06, -2.037733793258667e-06, -1.9101426005363464e-06, -1.7825514078140259e-06, -1.6549602150917053e-06, -1.5273690223693848e-06, -1.3997778296470642e-06, -1.2721866369247437e-06, -1.144595444202423e-06, -1.0170042514801025e-06, -8.89413058757782e-07, -7.618218660354614e-07, -6.342306733131409e-07, -5.066394805908203e-07, -3.7904828786849976e-07, -2.514570951461792e-07, -1.2386590242385864e-07, 3.725290298461914e-09, 1.3131648302078247e-07, 2.5890767574310303e-07, 3.864988684654236e-07, 5.140900611877441e-07, 6.416812539100647e-07, 7.692724466323853e-07, 8.968636393547058e-07, 1.0244548320770264e-06, 1.152046024799347e-06, 1.2796372175216675e-06, 1.407228410243988e-06, 1.5348196029663086e-06, 1.6624107956886292e-06, 1.7900019884109497e-06, 1.9175931811332703e-06, 2.045184373855591e-06, 2.1727755665779114e-06, 2.300366759300232e-06, 2.4279579520225525e-06, 2.555549144744873e-06, 2.6831403374671936e-06, 2.810731530189514e-06, 2.9383227229118347e-06, 3.0659139156341553e-06, 3.193505108356476e-06, 3.3210963010787964e-06, 3.448687493801117e-06, 3.5762786865234375e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 12.0, 7.0, 15.0, 37.0, 50.0, 50.0, 133.0, 191.0, 397.0, 802.0, 1833.0, 5031.0, 18538.0, 92992.0, 730283.0, 159242.0, 27282.0, 7087.0, 2477.0, 1014.0, 449.0, 251.0, 135.0, 89.0, 30.0, 45.0, 22.0, 18.0, 11.0, 11.0, 8.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002201080322265625, -0.0021336376667022705, -0.002066195011138916, -0.0019987523555755615, -0.001931309700012207, -0.0018638670444488525, -0.001796424388885498, -0.0017289817333221436, -0.001661539077758789, -0.0015940964221954346, -0.00152665376663208, -0.0014592111110687256, -0.001391768455505371, -0.0013243257999420166, -0.0012568831443786621, -0.0011894404888153076, -0.0011219978332519531, -0.0010545551776885986, -0.0009871125221252441, -0.0009196698665618896, -0.0008522272109985352, -0.0007847845554351807, -0.0007173418998718262, -0.0006498992443084717, -0.0005824565887451172, -0.0005150139331817627, -0.0004475712776184082, -0.0003801286220550537, -0.0003126859664916992, -0.0002452433109283447, -0.00017780065536499023, -0.00011035799980163574, -4.291534423828125e-05, 2.4527311325073242e-05, 9.196996688842773e-05, 0.00015941262245178223, 0.00022685527801513672, 0.0002942979335784912, 0.0003617405891418457, 0.0004291832447052002, 0.0004966259002685547, 0.0005640685558319092, 0.0006315112113952637, 0.0006989538669586182, 0.0007663965225219727, 0.0008338391780853271, 0.0009012818336486816, 0.0009687244892120361, 0.0010361671447753906, 0.0011036098003387451, 0.0011710524559020996, 0.001238495111465454, 0.0013059377670288086, 0.001373380422592163, 0.0014408230781555176, 0.001508265733718872, 0.0015757083892822266, 0.001643151044845581, 0.0017105937004089355, 0.00177803635597229, 0.0018454790115356445, 0.001912921667098999, 0.0019803643226623535, 0.002047806978225708, 0.0021152496337890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 8.0, 8.0, 12.0, 11.0, 18.0, 23.0, 18.0, 25.0, 43.0, 49.0, 51.0, 50.0, 60.0, 60.0, 60.0, 62.0, 64.0, 52.0, 51.0, 41.0, 38.0, 27.0, 30.0, 26.0, 17.0, 17.0, 12.0, 8.0, 8.0, 6.0, 5.0, 2.0, 7.0, 8.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.0013790130615234375, -0.0013235509395599365, -0.0012680888175964355, -0.0012126266956329346, -0.0011571645736694336, -0.0011017024517059326, -0.0010462403297424316, -0.0009907782077789307, -0.0009353160858154297, -0.0008798539638519287, -0.0008243918418884277, -0.0007689297199249268, -0.0007134675979614258, -0.0006580054759979248, -0.0006025433540344238, -0.0005470812320709229, -0.0004916191101074219, -0.0004361569881439209, -0.0003806948661804199, -0.00032523274421691895, -0.00026977062225341797, -0.000214308500289917, -0.00015884637832641602, -0.00010338425636291504, -4.792213439941406e-05, 7.539987564086914e-06, 6.300210952758789e-05, 0.00011846423149108887, 0.00017392635345458984, 0.00022938847541809082, 0.0002848505973815918, 0.0003403127193450928, 0.00039577484130859375, 0.0004512369632720947, 0.0005066990852355957, 0.0005621612071990967, 0.0006176233291625977, 0.0006730854511260986, 0.0007285475730895996, 0.0007840096950531006, 0.0008394718170166016, 0.0008949339389801025, 0.0009503960609436035, 0.0010058581829071045, 0.0010613203048706055, 0.0011167824268341064, 0.0011722445487976074, 0.0012277066707611084, 0.0012831687927246094, 0.0013386309146881104, 0.0013940930366516113, 0.0014495551586151123, 0.0015050172805786133, 0.0015604794025421143, 0.0016159415245056152, 0.0016714036464691162, 0.0017268657684326172, 0.0017823278903961182, 0.0018377900123596191, 0.0018932521343231201, 0.001948714256286621, 0.002004176378250122, 0.002059638500213623, 0.002115100622177124, 0.002170562744140625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 16.0, 26.0, 76.0, 138.0, 296.0, 288.0, 93.0, 27.0, 12.0, 10.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.14450019598007202, -0.14166796207427979, -0.13883571326732635, -0.13600347936153412, -0.13317124545574188, -0.13033899664878845, -0.12750676274299622, -0.12467452883720398, -0.12184228748083115, -0.11901004612445831, -0.11617781221866608, -0.11334557086229324, -0.11051332950592041, -0.10768109560012817, -0.10484885424375534, -0.10201661288738251, -0.09918437898159027, -0.09635213762521744, -0.0935199037194252, -0.09068766236305237, -0.08785542845726013, -0.0850231871008873, -0.08219094574451447, -0.07935871183872223, -0.0765264704823494, -0.07369422912597656, -0.07086199522018433, -0.06802975386381149, -0.06519751250743866, -0.06236527860164642, -0.05953303724527359, -0.056700799614191055, -0.053868554532527924, -0.05103631690144539, -0.048204079270362854, -0.04537183791399002, -0.042539600282907486, -0.03970736265182495, -0.03687512129545212, -0.03404288366436958, -0.03121064603328705, -0.028378408402204514, -0.02554616890847683, -0.022713929414749146, -0.01988169178366661, -0.017049454152584076, -0.014217214658856392, -0.011384975165128708, -0.008552737534046173, -0.005720498971641064, -0.0028882604092359543, -5.602184683084488e-05, 0.0027762167155742645, 0.005608455277979374, 0.008440693840384483, 0.011272933334112167, 0.014105170965194702, 0.016937408596277237, 0.01976964809000492, 0.022601887583732605, 0.02543412521481514, 0.028266362845897675, 0.03109860233962536, 0.03393084183335304, 0.03676307946443558]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 11.0, 6.0, 15.0, 11.0, 11.0, 14.0, 22.0, 28.0, 30.0, 30.0, 23.0, 26.0, 36.0, 43.0, 53.0, 68.0, 96.0, 93.0, 61.0, 50.0, 28.0, 28.0, 21.0, 26.0, 19.0, 18.0, 29.0, 15.0, 10.0, 13.0, 4.0, 8.0, 6.0, 11.0, 7.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06246751546859741, -0.060436688363552094, -0.058405857533216476, -0.05637502670288086, -0.05434419959783554, -0.05231337249279022, -0.050282541662454605, -0.04825171083211899, -0.04622088372707367, -0.04419005662202835, -0.042159225791692734, -0.04012839496135712, -0.0380975678563118, -0.03606674075126648, -0.03403590992093086, -0.032005079090595245, -0.029974251985549927, -0.02794342301785946, -0.02591259405016899, -0.023881765082478523, -0.021850936114788055, -0.019820107147097588, -0.01778927817940712, -0.015758449211716652, -0.013727620244026184, -0.011696791276335716, -0.009665962308645248, -0.007635133340954781, -0.005604304373264313, -0.003573475405573845, -0.001542646437883377, 0.00048818252980709076, 0.0025190114974975586, 0.004549840465188026, 0.006580669432878494, 0.008611498400568962, 0.01064232736825943, 0.012673156335949898, 0.014703985303640366, 0.016734814271330833, 0.0187656432390213, 0.02079647220671177, 0.022827301174402237, 0.024858130142092705, 0.026888959109783173, 0.02891978807747364, 0.03095061704516411, 0.032981447875499725, 0.035012274980545044, 0.03704310208559036, 0.03907393291592598, 0.0411047637462616, 0.043135590851306915, 0.045166417956352234, 0.04719724878668785, 0.04922807961702347, 0.05125890672206879, 0.053289733827114105, 0.05532056465744972, 0.05735139548778534, 0.05938222259283066, 0.06141304969787598, 0.06344388425350189, 0.06547471135854721, 0.06750553846359253]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 8.0, 16.0, 14.0, 22.0, 28.0, 41.0, 61.0, 80.0, 108.0, 145.0, 273.0, 463.0, 1103.0, 4896.0, 136009.0, 3822693.0, 206292.0, 16110.0, 4225.0, 864.0, 274.0, 169.0, 109.0, 78.0, 48.0, 33.0, 31.0, 27.0, 14.0, 13.0, 9.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.009918212890625, -0.009529948234558105, -0.009141683578491211, -0.008753418922424316, -0.008365154266357422, -0.007976889610290527, -0.007588624954223633, -0.007200360298156738, -0.006812095642089844, -0.006423830986022949, -0.006035566329956055, -0.00564730167388916, -0.005259037017822266, -0.004870772361755371, -0.0044825077056884766, -0.004094243049621582, -0.0037059783935546875, -0.003317713737487793, -0.0029294490814208984, -0.002541184425354004, -0.0021529197692871094, -0.0017646551132202148, -0.0013763904571533203, -0.0009881258010864258, -0.0005998611450195312, -0.00021159648895263672, 0.0001766681671142578, 0.0005649328231811523, 0.0009531974792480469, 0.0013414621353149414, 0.001729726791381836, 0.0021179914474487305, 0.002506256103515625, 0.0028945207595825195, 0.003282785415649414, 0.0036710500717163086, 0.004059314727783203, 0.004447579383850098, 0.004835844039916992, 0.005224108695983887, 0.005612373352050781, 0.006000638008117676, 0.00638890266418457, 0.006777167320251465, 0.007165431976318359, 0.007553696632385254, 0.007941961288452148, 0.008330225944519043, 0.008718490600585938, 0.009106755256652832, 0.009495019912719727, 0.009883284568786621, 0.010271549224853516, 0.01065981388092041, 0.011048078536987305, 0.0114363431930542, 0.011824607849121094, 0.012212872505187988, 0.012601137161254883, 0.012989401817321777, 0.013377666473388672, 0.013765931129455566, 0.014154195785522461, 0.014542460441589355, 0.01493072509765625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 9.0, 21.0, 23.0, 32.0, 59.0, 84.0, 77.0, 76.0, 117.0, 119.0, 108.0, 81.0, 50.0, 48.0, 21.0, 20.0, 9.0, 15.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01348876953125, -0.013163566589355469, -0.012838363647460938, -0.012513160705566406, -0.012187957763671875, -0.011862754821777344, -0.011537551879882812, -0.011212348937988281, -0.01088714599609375, -0.010561943054199219, -0.010236740112304688, -0.009911537170410156, -0.009586334228515625, -0.009261131286621094, -0.008935928344726562, -0.008610725402832031, -0.0082855224609375, -0.007960319519042969, -0.0076351165771484375, -0.007309913635253906, -0.006984710693359375, -0.006659507751464844, -0.0063343048095703125, -0.006009101867675781, -0.00568389892578125, -0.005358695983886719, -0.0050334930419921875, -0.004708290100097656, -0.004383087158203125, -0.004057884216308594, -0.0037326812744140625, -0.0034074783325195312, -0.003082275390625, -0.0027570724487304688, -0.0024318695068359375, -0.0021066665649414062, -0.001781463623046875, -0.0014562606811523438, -0.0011310577392578125, -0.0008058547973632812, -0.00048065185546875, -0.00015544891357421875, 0.0001697540283203125, 0.0004949569702148438, 0.000820159912109375, 0.0011453628540039062, 0.0014705657958984375, 0.0017957687377929688, 0.0021209716796875, 0.0024461746215820312, 0.0027713775634765625, 0.0030965805053710938, 0.003421783447265625, 0.0037469863891601562, 0.0040721893310546875, 0.004397392272949219, 0.00472259521484375, 0.005047798156738281, 0.0053730010986328125, 0.005698204040527344, 0.006023406982421875, 0.006348609924316406, 0.0066738128662109375, 0.006999015808105469, 0.00732421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 11.0, 18.0, 23.0, 55.0, 120.0, 286.0, 662.0, 2324.0, 26873.0, 4118606.0, 41274.0, 2788.0, 687.0, 298.0, 122.0, 56.0, 32.0, 13.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0165252685546875, -0.015965938568115234, -0.015406608581542969, -0.014847278594970703, -0.014287948608398438, -0.013728618621826172, -0.013169288635253906, -0.01260995864868164, -0.012050628662109375, -0.01149129867553711, -0.010931968688964844, -0.010372638702392578, -0.009813308715820312, -0.009253978729248047, -0.008694648742675781, -0.008135318756103516, -0.00757598876953125, -0.007016658782958984, -0.006457328796386719, -0.005897998809814453, -0.0053386688232421875, -0.004779338836669922, -0.004220008850097656, -0.0036606788635253906, -0.003101348876953125, -0.0025420188903808594, -0.0019826889038085938, -0.0014233589172363281, -0.0008640289306640625, -0.0003046989440917969, 0.00025463104248046875, 0.0008139610290527344, 0.001373291015625, 0.0019326210021972656, 0.0024919509887695312, 0.003051280975341797, 0.0036106109619140625, 0.004169940948486328, 0.004729270935058594, 0.005288600921630859, 0.005847930908203125, 0.006407260894775391, 0.006966590881347656, 0.007525920867919922, 0.008085250854492188, 0.008644580841064453, 0.009203910827636719, 0.009763240814208984, 0.01032257080078125, 0.010881900787353516, 0.011441230773925781, 0.012000560760498047, 0.012559890747070312, 0.013119220733642578, 0.013678550720214844, 0.01423788070678711, 0.014797210693359375, 0.01535654067993164, 0.015915870666503906, 0.016475200653076172, 0.017034530639648438, 0.017593860626220703, 0.01815319061279297, 0.018712520599365234, 0.0192718505859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 9.0, 15.0, 48.0, 82.0, 286.0, 765.0, 1414.0, 902.0, 344.0, 108.0, 37.0, 20.0, 14.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0175323486328125, -0.017090201377868652, -0.016648054122924805, -0.016205906867980957, -0.01576375961303711, -0.015321612358093262, -0.014879465103149414, -0.014437317848205566, -0.013995170593261719, -0.013553023338317871, -0.013110876083374023, -0.012668728828430176, -0.012226581573486328, -0.01178443431854248, -0.011342287063598633, -0.010900139808654785, -0.010457992553710938, -0.01001584529876709, -0.009573698043823242, -0.009131550788879395, -0.008689403533935547, -0.0082472562789917, -0.0078051090240478516, -0.007362961769104004, -0.006920814514160156, -0.006478667259216309, -0.006036520004272461, -0.005594372749328613, -0.005152225494384766, -0.004710078239440918, -0.00426793098449707, -0.0038257837295532227, -0.003383636474609375, -0.0029414892196655273, -0.0024993419647216797, -0.002057194709777832, -0.0016150474548339844, -0.0011729001998901367, -0.0007307529449462891, -0.0002886056900024414, 0.00015354156494140625, 0.0005956888198852539, 0.0010378360748291016, 0.0014799833297729492, 0.0019221305847167969, 0.0023642778396606445, 0.002806425094604492, 0.00324857234954834, 0.0036907196044921875, 0.004132866859436035, 0.004575014114379883, 0.0050171613693237305, 0.005459308624267578, 0.005901455879211426, 0.0063436031341552734, 0.006785750389099121, 0.007227897644042969, 0.007670044898986816, 0.008112192153930664, 0.008554339408874512, 0.00899648666381836, 0.009438633918762207, 0.009880781173706055, 0.010322928428649902, 0.01076507568359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 11.0, 22.0, 46.0, 105.0, 202.0, 228.0, 196.0, 89.0, 41.0, 30.0, 11.0, 7.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020223934203386307, -0.01802668906748295, -0.01582944393157959, -0.01363220065832138, -0.011434955522418022, -0.009237710386514664, -0.00704046618193388, -0.004843221977353096, -0.0026459768414497375, -0.0004487321712076664, 0.0017485124990344048, 0.003945757169276476, 0.006143001839518547, 0.008340246975421906, 0.01053749118000269, 0.012734735384583473, 0.014931980520486832, 0.01712922565639019, 0.01932647079229355, 0.021523714065551758, 0.023720959201455116, 0.025918204337358475, 0.028115447610616684, 0.030312692746520042, 0.0325099378824234, 0.03470718115568161, 0.03690442815423012, 0.03910167142748833, 0.041298918426036835, 0.043496161699295044, 0.04569340497255325, 0.04789064824581146, 0.05008789151906967, 0.05228513479232788, 0.05448238179087639, 0.0566796250641346, 0.058876872062683105, 0.061074115335941315, 0.06327135860919952, 0.06546860188245773, 0.06766584515571594, 0.06986308842897415, 0.07206033170223236, 0.07425758242607117, 0.07645482569932938, 0.07865206897258759, 0.0808493122458458, 0.083046555519104, 0.08524380624294281, 0.08744104951620102, 0.08963829278945923, 0.09183554351329803, 0.09403278678655624, 0.09623003005981445, 0.09842727333307266, 0.10062451660633087, 0.10282176733016968, 0.10501901060342789, 0.1072162538766861, 0.1094135046005249, 0.11161074787378311, 0.11380799114704132, 0.11600523442029953, 0.11820247769355774, 0.12039972096681595]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 12.0, 23.0, 29.0, 22.0, 29.0, 51.0, 54.0, 64.0, 65.0, 77.0, 74.0, 56.0, 69.0, 62.0, 57.0, 44.0, 48.0, 52.0, 36.0, 24.0, 15.0, 10.0, 10.0, 9.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028397321701049805, -0.026718582957983017, -0.02503984607756138, -0.02336110919713974, -0.021682370454072952, -0.020003631711006165, -0.018324894830584526, -0.016646157950162888, -0.0149674192070961, -0.013288681395351887, -0.011609943583607674, -0.00993120577186346, -0.008252467960119247, -0.006573730148375034, -0.004894992336630821, -0.003216254524886608, -0.001537516713142395, 0.00014122109860181808, 0.0018199589103460312, 0.0034986967220902443, 0.005177434533834457, 0.0068561723455786705, 0.008534910157322884, 0.010213647969067097, 0.01189238578081131, 0.013571123592555523, 0.015249861404299736, 0.016928598284721375, 0.018607337027788162, 0.02028607577085495, 0.02196481265127659, 0.023643549531698227, 0.025322288274765015, 0.027001027017831802, 0.02867976389825344, 0.03035850077867508, 0.03203723952174187, 0.033715978264808655, 0.035394713282585144, 0.03707345202565193, 0.03875219076871872, 0.04043092951178551, 0.042109668254852295, 0.043788403272628784, 0.04546714201569557, 0.04714588075876236, 0.04882461577653885, 0.05050335451960564, 0.052182093262672424, 0.05386083200573921, 0.055539570748806, 0.05721830576658249, 0.05889704450964928, 0.060575783252716064, 0.062254518270492554, 0.06393326073884964, 0.06561199575662613, 0.06729073077440262, 0.0689694732427597, 0.0706482082605362, 0.07232694327831268, 0.07400568574666977, 0.07568442076444626, 0.07736316323280334, 0.07904189825057983]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 4.0, 10.0, 9.0, 8.0, 22.0, 21.0, 28.0, 43.0, 55.0, 70.0, 119.0, 213.0, 332.0, 549.0, 1178.0, 2519.0, 6428.0, 22793.0, 122508.0, 613123.0, 226210.0, 36545.0, 9304.0, 3260.0, 1417.0, 696.0, 381.0, 247.0, 143.0, 81.0, 62.0, 46.0, 33.0, 18.0, 20.0, 15.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01110076904296875, -0.010770916938781738, -0.010441064834594727, -0.010111212730407715, -0.009781360626220703, -0.009451508522033691, -0.00912165641784668, -0.008791804313659668, -0.008461952209472656, -0.008132100105285645, -0.007802248001098633, -0.007472395896911621, -0.007142543792724609, -0.006812691688537598, -0.006482839584350586, -0.006152987480163574, -0.0058231353759765625, -0.005493283271789551, -0.005163431167602539, -0.004833579063415527, -0.004503726959228516, -0.004173874855041504, -0.003844022750854492, -0.0035141706466674805, -0.0031843185424804688, -0.002854466438293457, -0.0025246143341064453, -0.0021947622299194336, -0.0018649101257324219, -0.0015350580215454102, -0.0012052059173583984, -0.0008753538131713867, -0.000545501708984375, -0.00021564960479736328, 0.00011420249938964844, 0.00044405460357666016, 0.0007739067077636719, 0.0011037588119506836, 0.0014336109161376953, 0.001763463020324707, 0.0020933151245117188, 0.0024231672286987305, 0.002753019332885742, 0.003082871437072754, 0.0034127235412597656, 0.0037425756454467773, 0.004072427749633789, 0.004402279853820801, 0.0047321319580078125, 0.005061984062194824, 0.005391836166381836, 0.005721688270568848, 0.006051540374755859, 0.006381392478942871, 0.006711244583129883, 0.0070410966873168945, 0.007370948791503906, 0.007700800895690918, 0.00803065299987793, 0.008360505104064941, 0.008690357208251953, 0.009020209312438965, 0.009350061416625977, 0.009679913520812988, 0.010009765625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 7.0, 5.0, 3.0, 9.0, 25.0, 22.0, 38.0, 47.0, 61.0, 83.0, 91.0, 107.0, 95.0, 105.0, 87.0, 65.0, 53.0, 33.0, 25.0, 14.0, 10.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01336669921875, -0.013054251670837402, -0.012741804122924805, -0.012429356575012207, -0.01211690902709961, -0.011804461479187012, -0.011492013931274414, -0.011179566383361816, -0.010867118835449219, -0.010554671287536621, -0.010242223739624023, -0.009929776191711426, -0.009617328643798828, -0.00930488109588623, -0.008992433547973633, -0.008679986000061035, -0.008367538452148438, -0.00805509090423584, -0.007742643356323242, -0.0074301958084106445, -0.007117748260498047, -0.006805300712585449, -0.0064928531646728516, -0.006180405616760254, -0.005867958068847656, -0.005555510520935059, -0.005243062973022461, -0.004930615425109863, -0.004618167877197266, -0.004305720329284668, -0.00399327278137207, -0.0036808252334594727, -0.003368377685546875, -0.0030559301376342773, -0.0027434825897216797, -0.002431035041809082, -0.0021185874938964844, -0.0018061399459838867, -0.001493692398071289, -0.0011812448501586914, -0.0008687973022460938, -0.0005563497543334961, -0.00024390220642089844, 6.854534149169922e-05, 0.0003809928894042969, 0.0006934404373168945, 0.0010058879852294922, 0.0013183355331420898, 0.0016307830810546875, 0.0019432306289672852, 0.002255678176879883, 0.0025681257247924805, 0.002880573272705078, 0.0031930208206176758, 0.0035054683685302734, 0.003817915916442871, 0.004130363464355469, 0.004442811012268066, 0.004755258560180664, 0.005067706108093262, 0.005380153656005859, 0.005692601203918457, 0.006005048751831055, 0.006317496299743652, 0.00662994384765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 6.0, 1.0, 1.0, 3.0, 4.0, 5.0, 16.0, 7.0, 8.0, 25.0, 20.0, 33.0, 39.0, 48.0, 68.0, 86.0, 121.0, 162.0, 214.0, 293.0, 444.0, 686.0, 1111.0, 2243.0, 6471.0, 32556.0, 293981.0, 651060.0, 44769.0, 7993.0, 2524.0, 1189.0, 727.0, 494.0, 281.0, 243.0, 161.0, 116.0, 81.0, 67.0, 53.0, 42.0, 27.0, 23.0, 13.0, 15.0, 9.0, 12.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0113525390625, -0.0110093355178833, -0.010666131973266602, -0.010322928428649902, -0.009979724884033203, -0.009636521339416504, -0.009293317794799805, -0.008950114250183105, -0.008606910705566406, -0.008263707160949707, -0.007920503616333008, -0.007577300071716309, -0.007234096527099609, -0.00689089298248291, -0.006547689437866211, -0.006204485893249512, -0.0058612823486328125, -0.005518078804016113, -0.005174875259399414, -0.004831671714782715, -0.004488468170166016, -0.004145264625549316, -0.003802061080932617, -0.003458857536315918, -0.0031156539916992188, -0.0027724504470825195, -0.0024292469024658203, -0.002086043357849121, -0.0017428398132324219, -0.0013996362686157227, -0.0010564327239990234, -0.0007132291793823242, -0.000370025634765625, -2.682209014892578e-05, 0.00031638145446777344, 0.0006595849990844727, 0.0010027885437011719, 0.001345992088317871, 0.0016891956329345703, 0.0020323991775512695, 0.0023756027221679688, 0.002718806266784668, 0.003062009811401367, 0.0034052133560180664, 0.0037484169006347656, 0.004091620445251465, 0.004434823989868164, 0.004778027534484863, 0.0051212310791015625, 0.005464434623718262, 0.005807638168334961, 0.00615084171295166, 0.006494045257568359, 0.006837248802185059, 0.007180452346801758, 0.007523655891418457, 0.007866859436035156, 0.008210062980651855, 0.008553266525268555, 0.008896470069885254, 0.009239673614501953, 0.009582877159118652, 0.009926080703735352, 0.01026928424835205, 0.01061248779296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 9.0, 10.0, 12.0, 11.0, 17.0, 20.0, 20.0, 27.0, 29.0, 37.0, 42.0, 40.0, 35.0, 48.0, 56.0, 55.0, 69.0, 52.0, 55.0, 44.0, 41.0, 47.0, 32.0, 35.0, 25.0, 20.0, 18.0, 17.0, 16.0, 9.0, 8.0, 10.0, 4.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0225067138671875, -0.021872758865356445, -0.02123880386352539, -0.020604848861694336, -0.01997089385986328, -0.019336938858032227, -0.018702983856201172, -0.018069028854370117, -0.017435073852539062, -0.016801118850708008, -0.016167163848876953, -0.015533208847045898, -0.014899253845214844, -0.014265298843383789, -0.013631343841552734, -0.01299738883972168, -0.012363433837890625, -0.01172947883605957, -0.011095523834228516, -0.010461568832397461, -0.009827613830566406, -0.009193658828735352, -0.008559703826904297, -0.007925748825073242, -0.0072917938232421875, -0.006657838821411133, -0.006023883819580078, -0.0053899288177490234, -0.004755973815917969, -0.004122018814086914, -0.0034880638122558594, -0.0028541088104248047, -0.00222015380859375, -0.0015861988067626953, -0.0009522438049316406, -0.00031828880310058594, 0.00031566619873046875, 0.0009496212005615234, 0.0015835762023925781, 0.002217531204223633, 0.0028514862060546875, 0.003485441207885742, 0.004119396209716797, 0.0047533512115478516, 0.005387306213378906, 0.006021261215209961, 0.006655216217041016, 0.00728917121887207, 0.007923126220703125, 0.00855708122253418, 0.009191036224365234, 0.009824991226196289, 0.010458946228027344, 0.011092901229858398, 0.011726856231689453, 0.012360811233520508, 0.012994766235351562, 0.013628721237182617, 0.014262676239013672, 0.014896631240844727, 0.015530586242675781, 0.016164541244506836, 0.01679849624633789, 0.017432451248168945, 0.01806640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 5.0, 12.0, 18.0, 36.0, 44.0, 66.0, 124.0, 265.0, 606.0, 1752.0, 5946.0, 34833.0, 721317.0, 254603.0, 22207.0, 4441.0, 1266.0, 500.0, 219.0, 100.0, 70.0, 28.0, 23.0, 15.0, 7.0, 10.0, 4.0, 1.0, 6.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0025081634521484375, -0.002431899309158325, -0.002355635166168213, -0.0022793710231781006, -0.0022031068801879883, -0.002126842737197876, -0.0020505785942077637, -0.0019743144512176514, -0.001898050308227539, -0.0018217861652374268, -0.0017455220222473145, -0.0016692578792572021, -0.0015929937362670898, -0.0015167295932769775, -0.0014404654502868652, -0.001364201307296753, -0.0012879371643066406, -0.0012116730213165283, -0.001135408878326416, -0.0010591447353363037, -0.0009828805923461914, -0.0009066164493560791, -0.0008303523063659668, -0.0007540881633758545, -0.0006778240203857422, -0.0006015598773956299, -0.0005252957344055176, -0.0004490315914154053, -0.00037276744842529297, -0.00029650330543518066, -0.00022023916244506836, -0.00014397501945495605, -6.771087646484375e-05, 8.553266525268555e-06, 8.481740951538086e-05, 0.00016108155250549316, 0.00023734569549560547, 0.0003136098384857178, 0.0003898739814758301, 0.0004661381244659424, 0.0005424022674560547, 0.000618666410446167, 0.0006949305534362793, 0.0007711946964263916, 0.0008474588394165039, 0.0009237229824066162, 0.0009999871253967285, 0.0010762512683868408, 0.0011525154113769531, 0.0012287795543670654, 0.0013050436973571777, 0.00138130784034729, 0.0014575719833374023, 0.0015338361263275146, 0.001610100269317627, 0.0016863644123077393, 0.0017626285552978516, 0.0018388926982879639, 0.0019151568412780762, 0.0019914209842681885, 0.0020676851272583008, 0.002143949270248413, 0.0022202134132385254, 0.0022964775562286377, 0.00237274169921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 2.0, 4.0, 18.0, 5.0, 8.0, 20.0, 18.0, 16.0, 31.0, 30.0, 27.0, 66.0, 44.0, 41.0, 41.0, 49.0, 43.0, 40.0, 42.0, 40.0, 61.0, 49.0, 38.0, 45.0, 35.0, 32.0, 21.0, 20.0, 16.0, 26.0, 9.0, 11.0, 5.0, 5.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.231929779052734e-06, -4.106201231479645e-06, -3.980472683906555e-06, -3.8547441363334656e-06, -3.729015588760376e-06, -3.6032870411872864e-06, -3.4775584936141968e-06, -3.351829946041107e-06, -3.2261013984680176e-06, -3.100372850894928e-06, -2.9746443033218384e-06, -2.8489157557487488e-06, -2.723187208175659e-06, -2.5974586606025696e-06, -2.47173011302948e-06, -2.3460015654563904e-06, -2.2202730178833008e-06, -2.094544470310211e-06, -1.9688159227371216e-06, -1.843087375164032e-06, -1.7173588275909424e-06, -1.5916302800178528e-06, -1.4659017324447632e-06, -1.3401731848716736e-06, -1.214444637298584e-06, -1.0887160897254944e-06, -9.629875421524048e-07, -8.372589945793152e-07, -7.115304470062256e-07, -5.85801899433136e-07, -4.600733518600464e-07, -3.343448042869568e-07, -2.086162567138672e-07, -8.288770914077759e-08, 4.284083843231201e-08, 1.685693860054016e-07, 2.942979335784912e-07, 4.200264811515808e-07, 5.457550287246704e-07, 6.7148357629776e-07, 7.972121238708496e-07, 9.229406714439392e-07, 1.0486692190170288e-06, 1.1743977665901184e-06, 1.300126314163208e-06, 1.4258548617362976e-06, 1.5515834093093872e-06, 1.6773119568824768e-06, 1.8030405044555664e-06, 1.928769052028656e-06, 2.0544975996017456e-06, 2.180226147174835e-06, 2.305954694747925e-06, 2.4316832423210144e-06, 2.557411789894104e-06, 2.6831403374671936e-06, 2.808868885040283e-06, 2.934597432613373e-06, 3.0603259801864624e-06, 3.186054527759552e-06, 3.3117830753326416e-06, 3.437511622905731e-06, 3.563240170478821e-06, 3.6889687180519104e-06, 3.814697265625e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 18.0, 18.0, 42.0, 56.0, 89.0, 166.0, 322.0, 780.0, 2726.0, 17428.0, 403319.0, 601445.0, 17870.0, 2823.0, 768.0, 320.0, 164.0, 73.0, 46.0, 30.0, 14.0, 13.0, 5.0, 11.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0037517547607421875, -0.003660261631011963, -0.0035687685012817383, -0.0034772753715515137, -0.003385782241821289, -0.0032942891120910645, -0.00320279598236084, -0.0031113028526306152, -0.0030198097229003906, -0.002928316593170166, -0.0028368234634399414, -0.002745330333709717, -0.002653837203979492, -0.0025623440742492676, -0.002470850944519043, -0.0023793578147888184, -0.0022878646850585938, -0.002196371555328369, -0.0021048784255981445, -0.00201338529586792, -0.0019218921661376953, -0.0018303990364074707, -0.001738905906677246, -0.0016474127769470215, -0.0015559196472167969, -0.0014644265174865723, -0.0013729333877563477, -0.001281440258026123, -0.0011899471282958984, -0.0010984539985656738, -0.0010069608688354492, -0.0009154677391052246, -0.000823974609375, -0.0007324814796447754, -0.0006409883499145508, -0.0005494952201843262, -0.00045800209045410156, -0.00036650896072387695, -0.00027501583099365234, -0.00018352270126342773, -9.202957153320312e-05, -5.364418029785156e-07, 9.09566879272461e-05, 0.0001824498176574707, 0.0002739429473876953, 0.0003654360771179199, 0.00045692920684814453, 0.0005484223365783691, 0.0006399154663085938, 0.0007314085960388184, 0.000822901725769043, 0.0009143948554992676, 0.0010058879852294922, 0.0010973811149597168, 0.0011888742446899414, 0.001280367374420166, 0.0013718605041503906, 0.0014633536338806152, 0.0015548467636108398, 0.0016463398933410645, 0.001737833023071289, 0.0018293261528015137, 0.0019208192825317383, 0.002012312412261963, 0.0021038055419921875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 3.0, 8.0, 6.0, 4.0, 9.0, 11.0, 19.0, 19.0, 30.0, 31.0, 33.0, 62.0, 91.0, 99.0, 88.0, 93.0, 59.0, 73.0, 56.0, 57.0, 28.0, 33.0, 27.0, 10.0, 10.0, 10.0, 6.0, 3.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023193359375, -0.0022507905960083008, -0.0021822452545166016, -0.0021136999130249023, -0.002045154571533203, -0.001976609230041504, -0.0019080638885498047, -0.0018395185470581055, -0.0017709732055664062, -0.001702427864074707, -0.0016338825225830078, -0.0015653371810913086, -0.0014967918395996094, -0.0014282464981079102, -0.001359701156616211, -0.0012911558151245117, -0.0012226104736328125, -0.0011540651321411133, -0.001085519790649414, -0.0010169744491577148, -0.0009484291076660156, -0.0008798837661743164, -0.0008113384246826172, -0.000742793083190918, -0.0006742477416992188, -0.0006057024002075195, -0.0005371570587158203, -0.0004686117172241211, -0.0004000663757324219, -0.00033152103424072266, -0.00026297569274902344, -0.00019443035125732422, -0.000125885009765625, -5.733966827392578e-05, 1.1205673217773438e-05, 7.975101470947266e-05, 0.00014829635620117188, 0.0002168416976928711, 0.0002853870391845703, 0.00035393238067626953, 0.00042247772216796875, 0.000491023063659668, 0.0005595684051513672, 0.0006281137466430664, 0.0006966590881347656, 0.0007652044296264648, 0.0008337497711181641, 0.0009022951126098633, 0.0009708404541015625, 0.0010393857955932617, 0.001107931137084961, 0.0011764764785766602, 0.0012450218200683594, 0.0013135671615600586, 0.0013821125030517578, 0.001450657844543457, 0.0015192031860351562, 0.0015877485275268555, 0.0016562938690185547, 0.001724839210510254, 0.0017933845520019531, 0.0018619298934936523, 0.0019304752349853516, 0.0019990205764770508, 0.00206756591796875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 18.0, 43.0, 136.0, 483.0, 207.0, 72.0, 22.0, 10.0, 8.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09916044026613235, -0.09544247388839722, -0.09172450751066208, -0.08800654113292694, -0.0842885747551918, -0.08057060837745667, -0.07685264199972153, -0.07313467562198639, -0.06941670924425125, -0.06569874286651611, -0.061980776488780975, -0.05826281011104584, -0.0545448437333107, -0.05082687735557556, -0.047108910977840424, -0.043390944600105286, -0.03967297822237015, -0.03595501184463501, -0.03223704546689987, -0.028519079089164734, -0.024801112711429596, -0.021083146333694458, -0.01736517995595932, -0.013647213578224182, -0.009929247200489044, -0.006211280822753906, -0.0024933144450187683, 0.0012246519327163696, 0.004942618310451508, 0.008660584688186646, 0.012378551065921783, 0.01609651744365692, 0.019814491271972656, 0.023532457649707794, 0.027250424027442932, 0.03096839040517807, 0.03468635678291321, 0.038404323160648346, 0.042122289538383484, 0.04584025591611862, 0.04955822229385376, 0.0532761886715889, 0.056994155049324036, 0.060712121427059174, 0.06443008780479431, 0.06814805418252945, 0.07186602056026459, 0.07558398693799973, 0.07930195331573486, 0.08301991969347, 0.08673788607120514, 0.09045585244894028, 0.09417381882667542, 0.09789178520441055, 0.10160975158214569, 0.10532771795988083, 0.10904568433761597, 0.1127636507153511, 0.11648161709308624, 0.12019958347082138, 0.12391754984855652, 0.12763550877571106, 0.1313534826040268, 0.13507145643234253, 0.13878941535949707]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 8.0, 6.0, 12.0, 24.0, 23.0, 16.0, 19.0, 21.0, 15.0, 17.0, 33.0, 22.0, 44.0, 37.0, 52.0, 119.0, 149.0, 77.0, 39.0, 31.0, 36.0, 33.0, 22.0, 28.0, 18.0, 18.0, 16.0, 13.0, 11.0, 13.0, 7.0, 3.0, 3.0, 4.0, 0.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08641815185546875, -0.0839606523513794, -0.08150315284729004, -0.07904564589262009, -0.07658814638853073, -0.07413064688444138, -0.07167313992977142, -0.06921564042568207, -0.06675814092159271, -0.06430064141750336, -0.0618431381881237, -0.05938563495874405, -0.056928135454654694, -0.05447063595056534, -0.052013132721185684, -0.04955562949180603, -0.047098129987716675, -0.04464063048362732, -0.042183127254247665, -0.03972562402486801, -0.037268124520778656, -0.0348106250166893, -0.03235312178730965, -0.029895620420575142, -0.027438119053840637, -0.024980617687106133, -0.022523116320371628, -0.020065614953637123, -0.01760811358690262, -0.015150612220168114, -0.012693110853433609, -0.010235609486699104, -0.0077781081199646, -0.005320606753230095, -0.00286310538649559, -0.0004056040197610855, 0.002051897346973419, 0.004509398713707924, 0.006966900080442429, 0.009424401447176933, 0.011881902813911438, 0.014339404180645943, 0.016796905547380447, 0.019254406914114952, 0.021711908280849457, 0.02416940964758396, 0.026626911014318466, 0.02908441238105297, 0.031541913747787476, 0.03399941325187683, 0.036456916481256485, 0.03891441971063614, 0.041371919214725494, 0.04382941871881485, 0.046286921948194504, 0.04874442517757416, 0.05120192468166351, 0.05365942418575287, 0.05611692741513252, 0.058574430644512177, 0.06103193014860153, 0.06348942965269089, 0.06594693660736084, 0.0684044361114502, 0.07086193561553955]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 7.0, 4.0, 9.0, 16.0, 23.0, 15.0, 39.0, 62.0, 65.0, 139.0, 223.0, 466.0, 970.0, 2946.0, 24973.0, 558921.0, 3241795.0, 322980.0, 27303.0, 8778.0, 3238.0, 877.0, 225.0, 78.0, 53.0, 26.0, 13.0, 12.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0101776123046875, -0.009853839874267578, -0.009530067443847656, -0.009206295013427734, -0.008882522583007812, -0.00855875015258789, -0.008234977722167969, -0.007911205291748047, -0.007587432861328125, -0.007263660430908203, -0.006939888000488281, -0.006616115570068359, -0.0062923431396484375, -0.005968570709228516, -0.005644798278808594, -0.005321025848388672, -0.00499725341796875, -0.004673480987548828, -0.004349708557128906, -0.004025936126708984, -0.0037021636962890625, -0.0033783912658691406, -0.0030546188354492188, -0.002730846405029297, -0.002407073974609375, -0.002083301544189453, -0.0017595291137695312, -0.0014357566833496094, -0.0011119842529296875, -0.0007882118225097656, -0.00046443939208984375, -0.00014066696166992188, 0.00018310546875, 0.0005068778991699219, 0.0008306503295898438, 0.0011544227600097656, 0.0014781951904296875, 0.0018019676208496094, 0.0021257400512695312, 0.002449512481689453, 0.002773284912109375, 0.003097057342529297, 0.0034208297729492188, 0.0037446022033691406, 0.0040683746337890625, 0.004392147064208984, 0.004715919494628906, 0.005039691925048828, 0.00536346435546875, 0.005687236785888672, 0.006011009216308594, 0.006334781646728516, 0.0066585540771484375, 0.006982326507568359, 0.007306098937988281, 0.007629871368408203, 0.007953643798828125, 0.008277416229248047, 0.008601188659667969, 0.00892496109008789, 0.009248733520507812, 0.009572505950927734, 0.009896278381347656, 0.010220050811767578, 0.0105438232421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 7.0, 10.0, 19.0, 24.0, 38.0, 49.0, 62.0, 97.0, 92.0, 104.0, 102.0, 89.0, 82.0, 64.0, 44.0, 40.0, 23.0, 20.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.01329803466796875, -0.012986183166503906, -0.012674331665039062, -0.012362480163574219, -0.012050628662109375, -0.011738777160644531, -0.011426925659179688, -0.011115074157714844, -0.01080322265625, -0.010491371154785156, -0.010179519653320312, -0.009867668151855469, -0.009555816650390625, -0.009243965148925781, -0.008932113647460938, -0.008620262145996094, -0.00830841064453125, -0.007996559143066406, -0.0076847076416015625, -0.007372856140136719, -0.007061004638671875, -0.006749153137207031, -0.0064373016357421875, -0.006125450134277344, -0.0058135986328125, -0.005501747131347656, -0.0051898956298828125, -0.004878044128417969, -0.004566192626953125, -0.004254341125488281, -0.0039424896240234375, -0.0036306381225585938, -0.00331878662109375, -0.0030069351196289062, -0.0026950836181640625, -0.0023832321166992188, -0.002071380615234375, -0.0017595291137695312, -0.0014476776123046875, -0.0011358261108398438, -0.000823974609375, -0.0005121231079101562, -0.0002002716064453125, 0.00011157989501953125, 0.000423431396484375, 0.0007352828979492188, 0.0010471343994140625, 0.0013589859008789062, 0.00167083740234375, 0.0019826889038085938, 0.0022945404052734375, 0.0026063919067382812, 0.002918243408203125, 0.0032300949096679688, 0.0035419464111328125, 0.0038537979125976562, 0.0041656494140625, 0.004477500915527344, 0.0047893524169921875, 0.005101203918457031, 0.005413055419921875, 0.005724906921386719, 0.0060367584228515625, 0.006348609924316406, 0.00666046142578125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 9.0, 16.0, 32.0, 52.0, 137.0, 323.0, 1527.0, 35306.0, 4150528.0, 5040.0, 833.0, 246.0, 108.0, 44.0, 28.0, 14.0, 10.0, 9.0, 3.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048370361328125, -0.04665994644165039, -0.04494953155517578, -0.04323911666870117, -0.04152870178222656, -0.03981828689575195, -0.038107872009277344, -0.036397457122802734, -0.034687042236328125, -0.032976627349853516, -0.031266212463378906, -0.029555797576904297, -0.027845382690429688, -0.026134967803955078, -0.02442455291748047, -0.02271413803100586, -0.02100372314453125, -0.01929330825805664, -0.01758289337158203, -0.015872478485107422, -0.014162063598632812, -0.012451648712158203, -0.010741233825683594, -0.009030818939208984, -0.007320404052734375, -0.005609989166259766, -0.0038995742797851562, -0.002189159393310547, -0.0004787445068359375, 0.0012316703796386719, 0.0029420852661132812, 0.004652500152587891, 0.0063629150390625, 0.00807332992553711, 0.009783744812011719, 0.011494159698486328, 0.013204574584960938, 0.014914989471435547, 0.016625404357910156, 0.018335819244384766, 0.020046234130859375, 0.021756649017333984, 0.023467063903808594, 0.025177478790283203, 0.026887893676757812, 0.028598308563232422, 0.03030872344970703, 0.03201913833618164, 0.03372955322265625, 0.03543996810913086, 0.03715038299560547, 0.03886079788208008, 0.04057121276855469, 0.0422816276550293, 0.043992042541503906, 0.045702457427978516, 0.047412872314453125, 0.049123287200927734, 0.050833702087402344, 0.05254411697387695, 0.05425453186035156, 0.05596494674682617, 0.05767536163330078, 0.05938577651977539, 0.06109619140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 10.0, 15.0, 26.0, 18.0, 44.0, 91.0, 132.0, 304.0, 696.0, 1196.0, 778.0, 380.0, 140.0, 98.0, 54.0, 23.0, 19.0, 12.0, 9.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0173797607421875, -0.016646146774291992, -0.015912532806396484, -0.015178918838500977, -0.014445304870605469, -0.013711690902709961, -0.012978076934814453, -0.012244462966918945, -0.011510848999023438, -0.01077723503112793, -0.010043621063232422, -0.009310007095336914, -0.008576393127441406, -0.007842779159545898, -0.007109165191650391, -0.006375551223754883, -0.005641937255859375, -0.004908323287963867, -0.004174709320068359, -0.0034410953521728516, -0.0027074813842773438, -0.001973867416381836, -0.0012402534484863281, -0.0005066394805908203, 0.0002269744873046875, 0.0009605884552001953, 0.0016942024230957031, 0.002427816390991211, 0.0031614303588867188, 0.0038950443267822266, 0.004628658294677734, 0.005362272262573242, 0.00609588623046875, 0.006829500198364258, 0.007563114166259766, 0.008296728134155273, 0.009030342102050781, 0.009763956069946289, 0.010497570037841797, 0.011231184005737305, 0.011964797973632812, 0.01269841194152832, 0.013432025909423828, 0.014165639877319336, 0.014899253845214844, 0.01563286781311035, 0.01636648178100586, 0.017100095748901367, 0.017833709716796875, 0.018567323684692383, 0.01930093765258789, 0.0200345516204834, 0.020768165588378906, 0.021501779556274414, 0.022235393524169922, 0.02296900749206543, 0.023702621459960938, 0.024436235427856445, 0.025169849395751953, 0.02590346336364746, 0.02663707733154297, 0.027370691299438477, 0.028104305267333984, 0.028837919235229492, 0.029571533203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 21.0, 37.0, 131.0, 244.0, 310.0, 140.0, 47.0, 23.0, 14.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16548380255699158, -0.15911884605884552, -0.15275390446186066, -0.1463889479637146, -0.14002400636672974, -0.13365904986858368, -0.12729410827159882, -0.12092915177345276, -0.1145642101764679, -0.10819926112890244, -0.10183431208133698, -0.09546936303377151, -0.08910441398620605, -0.08273945748806, -0.07637451589107513, -0.07000955939292908, -0.06364461034536362, -0.05727966129779816, -0.0509147122502327, -0.044549763202667236, -0.038184814155101776, -0.03181986138224602, -0.025454912334680557, -0.019089963287115097, -0.012725014239549637, -0.006360064726322889, 4.884786903858185e-06, 0.006369834765791893, 0.012734783813357353, 0.019099734723567963, 0.025464683771133423, 0.03182963281869888, 0.03819458186626434, 0.0445595309138298, 0.050924479961395264, 0.057289429008960724, 0.06365437805652618, 0.07001933455467224, 0.0763842761516571, 0.08274923264980316, 0.08911417424678802, 0.09547912329435349, 0.10184407234191895, 0.1082090213894844, 0.11457397043704987, 0.12093892693519592, 0.1273038685321808, 0.13366882503032684, 0.1400337815284729, 0.14639873802661896, 0.15276367962360382, 0.15912863612174988, 0.16549357771873474, 0.1718585342168808, 0.17822347581386566, 0.18458843231201172, 0.19095337390899658, 0.19731833040714264, 0.2036832720041275, 0.21004822850227356, 0.21641317009925842, 0.22277812659740448, 0.22914306819438934, 0.2355080246925354, 0.24187296628952026]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 13.0, 12.0, 26.0, 48.0, 68.0, 69.0, 94.0, 127.0, 126.0, 115.0, 109.0, 78.0, 42.0, 25.0, 21.0, 7.0, 11.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21889573335647583, -0.2122393101453781, -0.2055828869342804, -0.19892646372318268, -0.19227004051208496, -0.18561361730098724, -0.17895719408988953, -0.17230075597763062, -0.1656443476676941, -0.15898792445659637, -0.15233150124549866, -0.14567507803440094, -0.13901865482330322, -0.1323622316122055, -0.1257058084011078, -0.11904937773942947, -0.11239294707775116, -0.10573652386665344, -0.09908010065555573, -0.09242367744445801, -0.08576725423336029, -0.07911083102226257, -0.07245440036058426, -0.06579797714948654, -0.059141553938388824, -0.05248513072729111, -0.04582870751619339, -0.039172280579805374, -0.03251585736870766, -0.02585943415760994, -0.019203007221221924, -0.012546584010124207, -0.005890160799026489, 0.0007662633433938026, 0.0074226874858140945, 0.014079112559556961, 0.02073553577065468, 0.027391958981752396, 0.03404838591814041, 0.04070480912923813, 0.047361232340335846, 0.05401765555143356, 0.06067407876253128, 0.0673305094242096, 0.07398693263530731, 0.08064335584640503, 0.08729977905750275, 0.09395620226860046, 0.10061262547969818, 0.1072690486907959, 0.11392547190189362, 0.12058189511299133, 0.12723831832408905, 0.13389474153518677, 0.14055117964744568, 0.1472075879573822, 0.1538640260696411, 0.16052044928073883, 0.16717687249183655, 0.17383329570293427, 0.18048971891403198, 0.1871461421251297, 0.19380256533622742, 0.20045900344848633, 0.20711541175842285]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 4.0, 9.0, 19.0, 27.0, 27.0, 48.0, 60.0, 131.0, 214.0, 356.0, 862.0, 2308.0, 8853.0, 66350.0, 824586.0, 125977.0, 13428.0, 3154.0, 1083.0, 465.0, 239.0, 120.0, 76.0, 38.0, 26.0, 19.0, 15.0, 9.0, 9.0, 11.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.018341064453125, -0.0177609920501709, -0.017180919647216797, -0.016600847244262695, -0.016020774841308594, -0.015440702438354492, -0.01486063003540039, -0.014280557632446289, -0.013700485229492188, -0.013120412826538086, -0.012540340423583984, -0.011960268020629883, -0.011380195617675781, -0.01080012321472168, -0.010220050811767578, -0.009639978408813477, -0.009059906005859375, -0.008479833602905273, -0.007899761199951172, -0.00731968879699707, -0.006739616394042969, -0.006159543991088867, -0.005579471588134766, -0.004999399185180664, -0.0044193267822265625, -0.003839254379272461, -0.0032591819763183594, -0.002679109573364258, -0.0020990371704101562, -0.0015189647674560547, -0.0009388923645019531, -0.00035881996154785156, 0.00022125244140625, 0.0008013248443603516, 0.0013813972473144531, 0.0019614696502685547, 0.0025415420532226562, 0.003121614456176758, 0.0037016868591308594, 0.004281759262084961, 0.0048618316650390625, 0.005441904067993164, 0.006021976470947266, 0.006602048873901367, 0.007182121276855469, 0.00776219367980957, 0.008342266082763672, 0.008922338485717773, 0.009502410888671875, 0.010082483291625977, 0.010662555694580078, 0.01124262809753418, 0.011822700500488281, 0.012402772903442383, 0.012982845306396484, 0.013562917709350586, 0.014142990112304688, 0.014723062515258789, 0.01530313491821289, 0.015883207321166992, 0.016463279724121094, 0.017043352127075195, 0.017623424530029297, 0.0182034969329834, 0.0187835693359375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 3.0, 13.0, 23.0, 37.0, 57.0, 87.0, 105.0, 160.0, 133.0, 121.0, 108.0, 61.0, 41.0, 18.0, 15.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01947021484375, -0.018929243087768555, -0.01838827133178711, -0.017847299575805664, -0.01730632781982422, -0.016765356063842773, -0.016224384307861328, -0.015683412551879883, -0.015142440795898438, -0.014601469039916992, -0.014060497283935547, -0.013519525527954102, -0.012978553771972656, -0.012437582015991211, -0.011896610260009766, -0.01135563850402832, -0.010814666748046875, -0.01027369499206543, -0.009732723236083984, -0.009191751480102539, -0.008650779724121094, -0.008109807968139648, -0.007568836212158203, -0.007027864456176758, -0.0064868927001953125, -0.005945920944213867, -0.005404949188232422, -0.0048639774322509766, -0.004323005676269531, -0.003782033920288086, -0.0032410621643066406, -0.0027000904083251953, -0.00215911865234375, -0.0016181468963623047, -0.0010771751403808594, -0.0005362033843994141, 4.76837158203125e-06, 0.0005457401275634766, 0.0010867118835449219, 0.0016276836395263672, 0.0021686553955078125, 0.002709627151489258, 0.003250598907470703, 0.0037915706634521484, 0.004332542419433594, 0.004873514175415039, 0.005414485931396484, 0.00595545768737793, 0.006496429443359375, 0.00703740119934082, 0.007578372955322266, 0.008119344711303711, 0.008660316467285156, 0.009201288223266602, 0.009742259979248047, 0.010283231735229492, 0.010824203491210938, 0.011365175247192383, 0.011906147003173828, 0.012447118759155273, 0.012988090515136719, 0.013529062271118164, 0.01407003402709961, 0.014611005783081055, 0.0151519775390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 5.0, 4.0, 7.0, 16.0, 16.0, 14.0, 18.0, 29.0, 53.0, 51.0, 77.0, 130.0, 209.0, 345.0, 651.0, 1517.0, 4904.0, 33604.0, 906061.0, 88262.0, 8497.0, 2148.0, 761.0, 424.0, 250.0, 152.0, 93.0, 61.0, 43.0, 33.0, 24.0, 22.0, 18.0, 15.0, 6.0, 8.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0], "bins": [-0.0198516845703125, -0.019338369369506836, -0.018825054168701172, -0.018311738967895508, -0.017798423767089844, -0.01728510856628418, -0.016771793365478516, -0.01625847816467285, -0.015745162963867188, -0.015231847763061523, -0.01471853256225586, -0.014205217361450195, -0.013691902160644531, -0.013178586959838867, -0.012665271759033203, -0.012151956558227539, -0.011638641357421875, -0.011125326156616211, -0.010612010955810547, -0.010098695755004883, -0.009585380554199219, -0.009072065353393555, -0.00855875015258789, -0.008045434951782227, -0.0075321197509765625, -0.0070188045501708984, -0.006505489349365234, -0.00599217414855957, -0.005478858947753906, -0.004965543746948242, -0.004452228546142578, -0.003938913345336914, -0.00342559814453125, -0.002912282943725586, -0.002398967742919922, -0.0018856525421142578, -0.0013723373413085938, -0.0008590221405029297, -0.0003457069396972656, 0.00016760826110839844, 0.0006809234619140625, 0.0011942386627197266, 0.0017075538635253906, 0.0022208690643310547, 0.0027341842651367188, 0.003247499465942383, 0.003760814666748047, 0.004274129867553711, 0.004787445068359375, 0.005300760269165039, 0.005814075469970703, 0.006327390670776367, 0.006840705871582031, 0.007354021072387695, 0.00786733627319336, 0.008380651473999023, 0.008893966674804688, 0.009407281875610352, 0.009920597076416016, 0.01043391227722168, 0.010947227478027344, 0.011460542678833008, 0.011973857879638672, 0.012487173080444336, 0.01300048828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 8.0, 6.0, 13.0, 9.0, 14.0, 14.0, 14.0, 15.0, 18.0, 13.0, 29.0, 33.0, 42.0, 50.0, 62.0, 79.0, 87.0, 81.0, 76.0, 57.0, 39.0, 30.0, 31.0, 24.0, 10.0, 16.0, 30.0, 14.0, 6.0, 13.0, 9.0, 9.0, 8.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.02880859375, -0.027929306030273438, -0.027050018310546875, -0.026170730590820312, -0.02529144287109375, -0.024412155151367188, -0.023532867431640625, -0.022653579711914062, -0.0217742919921875, -0.020895004272460938, -0.020015716552734375, -0.019136428833007812, -0.01825714111328125, -0.017377853393554688, -0.016498565673828125, -0.015619277954101562, -0.014739990234375, -0.013860702514648438, -0.012981414794921875, -0.012102127075195312, -0.01122283935546875, -0.010343551635742188, -0.009464263916015625, -0.008584976196289062, -0.0077056884765625, -0.0068264007568359375, -0.005947113037109375, -0.0050678253173828125, -0.00418853759765625, -0.0033092498779296875, -0.002429962158203125, -0.0015506744384765625, -0.00067138671875, 0.0002079010009765625, 0.001087188720703125, 0.0019664764404296875, 0.00284576416015625, 0.0037250518798828125, 0.004604339599609375, 0.0054836273193359375, 0.0063629150390625, 0.0072422027587890625, 0.008121490478515625, 0.009000778198242188, 0.00988006591796875, 0.010759353637695312, 0.011638641357421875, 0.012517929077148438, 0.013397216796875, 0.014276504516601562, 0.015155792236328125, 0.016035079956054688, 0.01691436767578125, 0.017793655395507812, 0.018672943115234375, 0.019552230834960938, 0.0204315185546875, 0.021310806274414062, 0.022190093994140625, 0.023069381713867188, 0.02394866943359375, 0.024827957153320312, 0.025707244873046875, 0.026586532592773438, 0.0274658203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 11.0, 9.0, 7.0, 15.0, 18.0, 16.0, 30.0, 54.0, 81.0, 124.0, 206.0, 423.0, 1018.0, 3329.0, 17148.0, 863052.0, 148223.0, 10623.0, 2405.0, 847.0, 401.0, 170.0, 97.0, 60.0, 46.0, 40.0, 18.0, 16.0, 17.0, 15.0, 6.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0037555694580078125, -0.0036413371562957764, -0.0035271048545837402, -0.003412872552871704, -0.003298640251159668, -0.003184407949447632, -0.0030701756477355957, -0.0029559433460235596, -0.0028417110443115234, -0.0027274787425994873, -0.002613246440887451, -0.002499014139175415, -0.002384781837463379, -0.0022705495357513428, -0.0021563172340393066, -0.0020420849323272705, -0.0019278526306152344, -0.0018136203289031982, -0.0016993880271911621, -0.001585155725479126, -0.0014709234237670898, -0.0013566911220550537, -0.0012424588203430176, -0.0011282265186309814, -0.0010139942169189453, -0.0008997619152069092, -0.000785529613494873, -0.0006712973117828369, -0.0005570650100708008, -0.00044283270835876465, -0.0003286004066467285, -0.00021436810493469238, -0.00010013580322265625, 1.4096498489379883e-05, 0.00012832880020141602, 0.00024256110191345215, 0.0003567934036254883, 0.0004710257053375244, 0.0005852580070495605, 0.0006994903087615967, 0.0008137226104736328, 0.0009279549121856689, 0.001042187213897705, 0.0011564195156097412, 0.0012706518173217773, 0.0013848841190338135, 0.0014991164207458496, 0.0016133487224578857, 0.0017275810241699219, 0.001841813325881958, 0.001956045627593994, 0.0020702779293060303, 0.0021845102310180664, 0.0022987425327301025, 0.0024129748344421387, 0.002527207136154175, 0.002641439437866211, 0.002755671739578247, 0.002869904041290283, 0.0029841363430023193, 0.0030983686447143555, 0.0032126009464263916, 0.0033268332481384277, 0.003441065549850464, 0.0035552978515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 3.0, 9.0, 11.0, 7.0, 12.0, 14.0, 5.0, 14.0, 12.0, 16.0, 32.0, 24.0, 31.0, 41.0, 47.0, 30.0, 59.0, 36.0, 54.0, 68.0, 44.0, 64.0, 64.0, 45.0, 38.0, 38.0, 29.0, 25.0, 13.0, 15.0, 16.0, 13.0, 8.0, 4.0, 7.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 4.0], "bins": [-5.185604095458984e-06, -5.027279257774353e-06, -4.868954420089722e-06, -4.71062958240509e-06, -4.552304744720459e-06, -4.393979907035828e-06, -4.235655069351196e-06, -4.077330231666565e-06, -3.919005393981934e-06, -3.7606805562973022e-06, -3.602355718612671e-06, -3.4440308809280396e-06, -3.285706043243408e-06, -3.127381205558777e-06, -2.9690563678741455e-06, -2.810731530189514e-06, -2.652406692504883e-06, -2.4940818548202515e-06, -2.33575701713562e-06, -2.1774321794509888e-06, -2.0191073417663574e-06, -1.860782504081726e-06, -1.7024576663970947e-06, -1.5441328287124634e-06, -1.385807991027832e-06, -1.2274831533432007e-06, -1.0691583156585693e-06, -9.10833477973938e-07, -7.525086402893066e-07, -5.941838026046753e-07, -4.3585896492004395e-07, -2.775341272354126e-07, -1.1920928955078125e-07, 3.91155481338501e-08, 1.9744038581848145e-07, 3.557652235031128e-07, 5.140900611877441e-07, 6.724148988723755e-07, 8.307397365570068e-07, 9.890645742416382e-07, 1.1473894119262695e-06, 1.3057142496109009e-06, 1.4640390872955322e-06, 1.6223639249801636e-06, 1.780688762664795e-06, 1.9390136003494263e-06, 2.0973384380340576e-06, 2.255663275718689e-06, 2.4139881134033203e-06, 2.5723129510879517e-06, 2.730637788772583e-06, 2.8889626264572144e-06, 3.0472874641418457e-06, 3.205612301826477e-06, 3.3639371395111084e-06, 3.5222619771957397e-06, 3.680586814880371e-06, 3.8389116525650024e-06, 3.997236490249634e-06, 4.155561327934265e-06, 4.3138861656188965e-06, 4.472211003303528e-06, 4.630535840988159e-06, 4.7888606786727905e-06, 4.947185516357422e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 13.0, 18.0, 11.0, 16.0, 44.0, 49.0, 85.0, 135.0, 267.0, 553.0, 1182.0, 3234.0, 11418.0, 62674.0, 889102.0, 62708.0, 11388.0, 3327.0, 1175.0, 535.0, 261.0, 129.0, 75.0, 56.0, 32.0, 14.0, 20.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0017881393432617188, -0.0017347633838653564, -0.0016813874244689941, -0.0016280114650726318, -0.0015746355056762695, -0.0015212595462799072, -0.001467883586883545, -0.0014145076274871826, -0.0013611316680908203, -0.001307755708694458, -0.0012543797492980957, -0.0012010037899017334, -0.001147627830505371, -0.0010942518711090088, -0.0010408759117126465, -0.0009874999523162842, -0.0009341239929199219, -0.0008807480335235596, -0.0008273720741271973, -0.000773996114730835, -0.0007206201553344727, -0.0006672441959381104, -0.000613868236541748, -0.0005604922771453857, -0.0005071163177490234, -0.00045374035835266113, -0.00040036439895629883, -0.0003469884395599365, -0.0002936124801635742, -0.00024023652076721191, -0.0001868605613708496, -0.0001334846019744873, -8.0108642578125e-05, -2.6732683181762695e-05, 2.664327621459961e-05, 8.001923561096191e-05, 0.00013339519500732422, 0.00018677115440368652, 0.00024014711380004883, 0.00029352307319641113, 0.00034689903259277344, 0.00040027499198913574, 0.00045365095138549805, 0.0005070269107818604, 0.0005604028701782227, 0.000613778829574585, 0.0006671547889709473, 0.0007205307483673096, 0.0007739067077636719, 0.0008272826671600342, 0.0008806586265563965, 0.0009340345859527588, 0.000987410545349121, 0.0010407865047454834, 0.0010941624641418457, 0.001147538423538208, 0.0012009143829345703, 0.0012542903423309326, 0.001307666301727295, 0.0013610422611236572, 0.0014144182205200195, 0.0014677941799163818, 0.0015211701393127441, 0.0015745460987091064, 0.0016279220581054688]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 7.0, 6.0, 5.0, 7.0, 21.0, 27.0, 45.0, 61.0, 109.0, 102.0, 141.0, 121.0, 90.0, 75.0, 48.0, 35.0, 23.0, 15.0, 10.0, 6.0, 7.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030498504638671875, -0.0029566287994384766, -0.0028634071350097656, -0.0027701854705810547, -0.0026769638061523438, -0.002583742141723633, -0.002490520477294922, -0.002397298812866211, -0.0023040771484375, -0.002210855484008789, -0.002117633819580078, -0.002024412155151367, -0.0019311904907226562, -0.0018379688262939453, -0.0017447471618652344, -0.0016515254974365234, -0.0015583038330078125, -0.0014650821685791016, -0.0013718605041503906, -0.0012786388397216797, -0.0011854171752929688, -0.0010921955108642578, -0.0009989738464355469, -0.0009057521820068359, -0.000812530517578125, -0.0007193088531494141, -0.0006260871887207031, -0.0005328655242919922, -0.00043964385986328125, -0.0003464221954345703, -0.0002532005310058594, -0.00015997886657714844, -6.67572021484375e-05, 2.6464462280273438e-05, 0.00011968612670898438, 0.0002129077911376953, 0.00030612945556640625, 0.0003993511199951172, 0.0004925727844238281, 0.0005857944488525391, 0.00067901611328125, 0.0007722377777099609, 0.0008654594421386719, 0.0009586811065673828, 0.0010519027709960938, 0.0011451244354248047, 0.0012383460998535156, 0.0013315677642822266, 0.0014247894287109375, 0.0015180110931396484, 0.0016112327575683594, 0.0017044544219970703, 0.0017976760864257812, 0.0018908977508544922, 0.001984119415283203, 0.002077341079711914, 0.002170562744140625, 0.002263784408569336, 0.002357006072998047, 0.002450227737426758, 0.0025434494018554688, 0.0026366710662841797, 0.0027298927307128906, 0.0028231143951416016, 0.0029163360595703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 12.0, 35.0, 107.0, 657.0, 147.0, 27.0, 12.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.440475195646286, -0.43241697549819946, -0.4243587553501129, -0.41630053520202637, -0.4082423150539398, -0.40018409490585327, -0.3921258747577667, -0.3840676546096802, -0.376009464263916, -0.36795124411582947, -0.3598930239677429, -0.35183480381965637, -0.3437765836715698, -0.3357183635234833, -0.32766014337539673, -0.31960195302963257, -0.31154370307922363, -0.3034854829311371, -0.29542726278305054, -0.287369042634964, -0.27931082248687744, -0.2712526023387909, -0.26319438219070435, -0.2551361918449402, -0.24707795679569244, -0.2390197366476059, -0.23096151649951935, -0.2229032963514328, -0.21484509110450745, -0.2067868709564209, -0.19872865080833435, -0.1906704306602478, -0.18261224031448364, -0.1745540201663971, -0.16649580001831055, -0.158437579870224, -0.15037935972213745, -0.1423211395740509, -0.13426293432712555, -0.126204714179039, -0.11814649403095245, -0.1100882738828659, -0.10203005373477936, -0.09397184103727341, -0.08591362088918686, -0.07785540074110031, -0.06979718804359436, -0.06173896789550781, -0.053680747747421265, -0.04562252759933472, -0.03756431117653847, -0.02950609289109707, -0.02144787460565567, -0.013389654457569122, -0.005331438034772873, 0.0027267783880233765, 0.010784998536109924, 0.018843216821551323, 0.02690143510699272, 0.03495965152978897, 0.04301787167787552, 0.05107609182596207, 0.059134308248758316, 0.06719252467155457, 0.07525074481964111]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 13.0, 10.0, 11.0, 9.0, 9.0, 14.0, 16.0, 20.0, 23.0, 19.0, 35.0, 30.0, 36.0, 40.0, 268.0, 186.0, 38.0, 27.0, 22.0, 24.0, 20.0, 12.0, 21.0, 9.0, 13.0, 14.0, 7.0, 9.0, 12.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08677631616592407, -0.08413365483283997, -0.08149100095033646, -0.07884833961725235, -0.07620568573474884, -0.07356302440166473, -0.07092036306858063, -0.06827770173549652, -0.06563504785299301, -0.0629923865199089, -0.060349732637405396, -0.05770707130432129, -0.05506441369652748, -0.05242175608873367, -0.04977909475564957, -0.04713643714785576, -0.04449377954006195, -0.04185112193226814, -0.039208464324474335, -0.03656580299139023, -0.03392314538359642, -0.03128048777580261, -0.028637828305363655, -0.025995168834924698, -0.02335251122713089, -0.020709853619337082, -0.018067194148898125, -0.015424535609781742, -0.01278187707066536, -0.010139218531548977, -0.007496559992432594, -0.004853900521993637, -0.002211242914199829, 0.0004314156249165535, 0.003074074164032936, 0.005716732703149319, 0.008359391242265701, 0.011002049781382084, 0.013644708320498466, 0.016287367790937424, 0.01893002539873123, 0.02157268300652504, 0.024215342476963997, 0.026858001947402954, 0.029500659555196762, 0.03214331716299057, 0.034785978496074677, 0.037428636103868484, 0.04007129371166229, 0.0427139513194561, 0.04535660892724991, 0.047999270260334015, 0.05064192786812782, 0.05328458547592163, 0.05592724680900574, 0.058569904416799545, 0.06121256202459335, 0.06385522335767746, 0.06649787724018097, 0.06914053857326508, 0.07178319990634918, 0.07442585378885269, 0.0770685151219368, 0.07971116900444031, 0.08235383033752441]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 11.0, 13.0, 30.0, 31.0, 31.0, 49.0, 42.0, 85.0, 329.0, 90.0, 62.0, 47.0, 39.0, 34.0, 25.0, 15.0, 10.0, 14.0, 12.0, 2.0, 0.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0113983154296875, -0.011130332946777344, -0.010862350463867188, -0.010594367980957031, -0.010326385498046875, -0.010058403015136719, -0.009790420532226562, -0.009522438049316406, -0.00925445556640625, -0.008986473083496094, -0.008718490600585938, -0.008450508117675781, -0.008182525634765625, -0.007914543151855469, -0.0076465606689453125, -0.007378578186035156, -0.007110595703125, -0.006842613220214844, -0.0065746307373046875, -0.006306648254394531, -0.006038665771484375, -0.005770683288574219, -0.0055027008056640625, -0.005234718322753906, -0.00496673583984375, -0.004698753356933594, -0.0044307708740234375, -0.004162788391113281, -0.003894805908203125, -0.0036268234252929688, -0.0033588409423828125, -0.0030908584594726562, -0.0028228759765625, -0.0025548934936523438, -0.0022869110107421875, -0.0020189285278320312, -0.001750946044921875, -0.0014829635620117188, -0.0012149810791015625, -0.0009469985961914062, -0.00067901611328125, -0.00041103363037109375, -0.0001430511474609375, 0.00012493133544921875, 0.000392913818359375, 0.0006608963012695312, 0.0009288787841796875, 0.0011968612670898438, 0.00146484375, 0.0017328262329101562, 0.0020008087158203125, 0.0022687911987304688, 0.002536773681640625, 0.0028047561645507812, 0.0030727386474609375, 0.0033407211303710938, 0.00360870361328125, 0.0038766860961914062, 0.0041446685791015625, 0.004412651062011719, 0.004680633544921875, 0.004948616027832031, 0.0052165985107421875, 0.005484580993652344, 0.0057525634765625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 4.0, 11.0, 3.0, 4.0, 16.0, 32.0, 42.0, 44.0, 102.0, 260.0, 1433.0, 8195138.0, 189680.0, 1267.0, 296.0, 105.0, 58.0, 29.0, 10.0, 6.0, 17.0, 2.0, 6.0, 11.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-0.07916759699583054, -0.07643561065196991, -0.07370362430810928, -0.07097163796424866, -0.06823964416980743, -0.06550765782594681, -0.06277567148208618, -0.060043685138225555, -0.05731169879436493, -0.0545797124505043, -0.05184772610664368, -0.04911573603749275, -0.046383749693632126, -0.0436517633497715, -0.040919773280620575, -0.03818778693675995, -0.03545580059289932, -0.032723814249038696, -0.02999182604253292, -0.027259837836027145, -0.02452785149216652, -0.021795865148305893, -0.019063876941800117, -0.016331888735294342, -0.013599902391433716, -0.010867915116250515, -0.008135927841067314, -0.005403940565884113, -0.0026719532907009125, 6.003398448228836e-05, 0.002792021259665489, 0.005524009466171265, 0.008255995810031891, 0.010987983085215092, 0.013719970360398293, 0.016451958566904068, 0.019183944910764694, 0.02191593125462532, 0.024647919461131096, 0.02737990766763687, 0.030111894011497498, 0.032843880355358124, 0.03557586669921875, 0.038307856768369675, 0.0410398431122303, 0.04377182945609093, 0.04650381952524185, 0.04923580586910248, 0.051967792212963104, 0.05469977855682373, 0.05743176490068436, 0.06016375496983528, 0.0628957450389862, 0.06562773138284683, 0.06835971772670746, 0.07109170407056808, 0.07382369041442871, 0.07655567675828934, 0.07928766310214996, 0.08201964944601059, 0.08475163578987122, 0.08748362958431244, 0.09021561592817307, 0.09294760227203369, 0.09567958861589432]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 1.0, 5.0, 3.0, 6.0, 5.0, 9.0, 5.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03842676803469658, -0.037440795451402664, -0.03645482659339905, -0.03546885401010513, -0.03448288142681122, -0.0334969088435173, -0.03251093998551369, -0.03152496740221977, -0.030538994818925858, -0.029553024098277092, -0.028567051514983177, -0.02758108079433441, -0.026595108211040497, -0.02560913749039173, -0.024623166769742966, -0.02363719418644905, -0.022651223465800285, -0.02166525274515152, -0.020679280161857605, -0.01969330944120884, -0.018707336857914925, -0.01772136613726616, -0.016735393553972244, -0.01574942283332348, -0.014763451181352139, -0.013777479529380798, -0.012791507877409458, -0.011805536225438118, -0.010819565504789352, -0.009833592921495438, -0.008847622200846672, -0.007861650548875332, -0.006875680759549141, -0.005889709107577801, -0.004903737455606461, -0.003917766269296408, -0.0029317946173250675, -0.0019458229653537273, -0.0009598517790436745, 2.611987292766571e-05, 0.0010120915248990059, 0.001998063176870346, 0.0029840345960110426, 0.003970006015151739, 0.004955977667123079, 0.0059419493190944195, 0.006927920505404472, 0.007913892157375813, 0.008899863809347153, 0.009885835461318493, 0.010871807113289833, 0.011857777833938599, 0.012843750417232513, 0.013829721137881279, 0.01481569278985262, 0.01580166444182396, 0.016787637025117874, 0.01777360774576664, 0.018759580329060555, 0.01974555104970932, 0.020731523633003235, 0.021717494353652, 0.022703465074300766, 0.02368943765759468, 0.024675408378243446]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 4.0, 19.0, 24.0, 26.0, 42.0, 80.0, 125.0, 216.0, 495.0, 1068.0, 2772.0, 9847.0, 43836.0, 224445.0, 192400.0, 36581.0, 8206.0, 2366.0, 827.0, 364.0, 194.0, 106.0, 71.0, 53.0, 27.0, 21.0, 18.0, 9.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042938232421875, -0.04174327850341797, -0.04054832458496094, -0.039353370666503906, -0.038158416748046875, -0.036963462829589844, -0.03576850891113281, -0.03457355499267578, -0.03337860107421875, -0.03218364715576172, -0.030988693237304688, -0.029793739318847656, -0.028598785400390625, -0.027403831481933594, -0.026208877563476562, -0.02501392364501953, -0.0238189697265625, -0.02262401580810547, -0.021429061889648438, -0.020234107971191406, -0.019039154052734375, -0.017844200134277344, -0.016649246215820312, -0.015454292297363281, -0.01425933837890625, -0.013064384460449219, -0.011869430541992188, -0.010674476623535156, -0.009479522705078125, -0.008284568786621094, -0.0070896148681640625, -0.005894660949707031, -0.00469970703125, -0.0035047531127929688, -0.0023097991943359375, -0.0011148452758789062, 8.0108642578125e-05, 0.0012750625610351562, 0.0024700164794921875, 0.0036649703979492188, 0.00485992431640625, 0.006054878234863281, 0.0072498321533203125, 0.008444786071777344, 0.009639739990234375, 0.010834693908691406, 0.012029647827148438, 0.013224601745605469, 0.0144195556640625, 0.015614509582519531, 0.016809463500976562, 0.018004417419433594, 0.019199371337890625, 0.020394325256347656, 0.021589279174804688, 0.02278423309326172, 0.02397918701171875, 0.02517414093017578, 0.026369094848632812, 0.027564048767089844, 0.028759002685546875, 0.029953956604003906, 0.031148910522460938, 0.03234386444091797, 0.033538818359375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 9.0, 34.0, 48.0, 65.0, 97.0, 145.0, 176.0, 148.0, 116.0, 74.0, 36.0, 27.0, 11.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0199737548828125, -0.01942455768585205, -0.0188753604888916, -0.018326163291931152, -0.017776966094970703, -0.017227768898010254, -0.016678571701049805, -0.016129374504089355, -0.015580177307128906, -0.015030980110168457, -0.014481782913208008, -0.013932585716247559, -0.01338338851928711, -0.01283419132232666, -0.012284994125366211, -0.011735796928405762, -0.011186599731445312, -0.010637402534484863, -0.010088205337524414, -0.009539008140563965, -0.008989810943603516, -0.008440613746643066, -0.007891416549682617, -0.007342219352722168, -0.006793022155761719, -0.0062438249588012695, -0.00569462776184082, -0.005145430564880371, -0.004596233367919922, -0.004047036170959473, -0.0034978389739990234, -0.0029486417770385742, -0.002399444580078125, -0.0018502473831176758, -0.0013010501861572266, -0.0007518529891967773, -0.00020265579223632812, 0.0003465414047241211, 0.0008957386016845703, 0.0014449357986450195, 0.0019941329956054688, 0.002543330192565918, 0.003092527389526367, 0.0036417245864868164, 0.004190921783447266, 0.004740118980407715, 0.005289316177368164, 0.005838513374328613, 0.0063877105712890625, 0.006936907768249512, 0.007486104965209961, 0.00803530216217041, 0.00858449935913086, 0.009133696556091309, 0.009682893753051758, 0.010232090950012207, 0.010781288146972656, 0.011330485343933105, 0.011879682540893555, 0.012428879737854004, 0.012978076934814453, 0.013527274131774902, 0.014076471328735352, 0.0146256685256958, 0.01517486572265625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 6.0, 6.0, 17.0, 19.0, 61.0, 195.0, 127.0, 28.0, 14.0, 9.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10789994150400162, -0.10525205731391907, -0.10260417312383652, -0.09995628893375397, -0.09730840474367142, -0.09466052055358887, -0.09201264381408691, -0.08936475217342377, -0.08671687543392181, -0.08406899124383926, -0.08142110705375671, -0.07877322286367416, -0.07612533867359161, -0.07347745448350906, -0.07082957029342651, -0.06818169355392456, -0.06553380191326141, -0.06288591772317886, -0.060238033533096313, -0.05759014934301376, -0.05494226515293121, -0.05229438096284866, -0.04964650049805641, -0.04699861630797386, -0.04435073211789131, -0.04170284792780876, -0.03905496373772621, -0.03640708327293396, -0.03375919908285141, -0.03111131303012371, -0.02846343070268631, -0.02581554651260376, -0.02316766232252121, -0.02051977813243866, -0.01787189394235611, -0.015224011614918709, -0.012576127424836159, -0.009928243234753609, -0.007280360907316208, -0.004632476717233658, -0.001984592527151108, 0.000663291197270155, 0.0033111749216914177, 0.005959058180451393, 0.008606942370533943, 0.011254826560616493, 0.013902708888053894, 0.016550593078136444, 0.019198477268218994, 0.021846361458301544, 0.024494245648384094, 0.027142127975821495, 0.029790012165904045, 0.032437898218631744, 0.035085778683423996, 0.037733662873506546, 0.040381547063589096, 0.043029431253671646, 0.045677315443754196, 0.04832519590854645, 0.050973080098629, 0.05362096428871155, 0.0562688484787941, 0.05891673266887665, 0.0615646168589592]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 2.0, 1.0, 9.0, 7.0, 8.0, 7.0, 22.0, 42.0, 93.0, 100.0, 90.0, 45.0, 14.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06165480613708496, -0.059876758605241776, -0.05809871107339859, -0.0563206672668457, -0.05454261973500252, -0.05276457220315933, -0.050986528396606445, -0.04920848086476326, -0.047430433332920074, -0.04565238580107689, -0.043874338269233704, -0.04209629446268082, -0.04031824693083763, -0.038540199398994446, -0.03676215559244156, -0.03498410806059837, -0.03320606052875519, -0.031428012996912, -0.029649967327713966, -0.02787192165851593, -0.026093874126672745, -0.02431582659482956, -0.022537780925631523, -0.020759735256433487, -0.0189816877245903, -0.017203640192747116, -0.01542559452354908, -0.013647547923028469, -0.011869501322507858, -0.010091454721987247, -0.008313408121466637, -0.006535361520946026, -0.004757314920425415, -0.0029792683199048042, -0.0012012217193841934, 0.0005768248811364174, 0.002354871481657028, 0.004132918082177639, 0.00591096468269825, 0.007689011283218861, 0.009467057883739471, 0.011245104484260082, 0.013023151084780693, 0.014801197685301304, 0.016579244285821915, 0.0183572918176651, 0.020135337486863136, 0.021913383156061172, 0.023691430687904358, 0.025469478219747543, 0.02724752388894558, 0.029025569558143616, 0.0308036170899868, 0.03258166462182999, 0.034359708428382874, 0.03613775596022606, 0.037915803492069244, 0.03969385102391243, 0.041471898555755615, 0.0432499423623085, 0.04502798989415169, 0.04680603742599487, 0.04858408123254776, 0.050362128764390945, 0.05214017629623413]}, "eval/loss": 4.670431137084961, "eval/wer": 1.9589646965489884, "eval/runtime": 781.1725, "eval/samples_per_second": 3.382, "eval/steps_per_second": 0.283} \ No newline at end of file +{"train/loss": 5.1519, "train/learning_rate": 1.741654571843251e-06, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 6725, "_timestamp": 1646242620, "_step": 1191, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 39.0, 666.0, 303.0, 7.0, 1.0, 0.0, 1.0], "bins": [-403.2832946777344, -396.4258117675781, -389.5683288574219, -382.7108459472656, -375.8533630371094, -368.9958801269531, -362.138427734375, -355.28094482421875, -348.4234619140625, -341.56597900390625, -334.70849609375, -327.85101318359375, -320.9935302734375, -314.13604736328125, -307.278564453125, -300.42108154296875, -293.5635986328125, -286.70611572265625, -279.8486328125, -272.99114990234375, -266.1336669921875, -259.27618408203125, -252.41871643066406, -245.5612335205078, -238.70376586914062, -231.84628295898438, -224.98880004882812, -218.13131713867188, -211.2738494873047, -204.41636657714844, -197.5588836669922, -190.70140075683594, -183.84393310546875, -176.9864501953125, -170.12896728515625, -163.271484375, -156.4140167236328, -149.55653381347656, -142.6990509033203, -135.84156799316406, -128.9840850830078, -122.12660217285156, -115.26912689208984, -108.4116439819336, -101.55416107177734, -94.69668579101562, -87.83920288085938, -80.98171997070312, -74.12423706054688, -67.26675415039062, -60.40927505493164, -53.551795959472656, -46.694313049316406, -39.83683395385742, -32.97935485839844, -26.121871948242188, -19.264392852783203, -12.406911849975586, -5.549431800842285, 1.3080482482910156, 8.165529251098633, 15.02301025390625, 21.880489349365234, 28.737972259521484, 35.59545135498047]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 2.0, 4.0, 10.0, 8.0, 12.0, 10.0, 11.0, 23.0, 12.0, 16.0, 20.0, 30.0, 24.0, 30.0, 35.0, 37.0, 35.0, 57.0, 39.0, 42.0, 42.0, 43.0, 40.0, 36.0, 42.0, 36.0, 30.0, 32.0, 24.0, 31.0, 28.0, 17.0, 24.0, 21.0, 15.0, 14.0, 14.0, 13.0, 6.0, 5.0, 4.0, 8.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-56.051300048828125, -54.218135833740234, -52.384971618652344, -50.55180740356445, -48.71864318847656, -46.88547897338867, -45.05231475830078, -43.21915054321289, -41.385986328125, -39.55282211303711, -37.71965789794922, -35.88649368286133, -34.05332946777344, -32.22016525268555, -30.387001037597656, -28.553836822509766, -26.720674514770508, -24.887510299682617, -23.054346084594727, -21.221181869506836, -19.388017654418945, -17.554855346679688, -15.72169017791748, -13.88852596282959, -12.0553617477417, -10.222197532653809, -8.389033317565918, -6.5558695793151855, -4.722705364227295, -2.8895416259765625, -1.0563774108886719, 0.7767868041992188, 2.6099510192871094, 4.443115234375, 6.276279449462891, 8.109443664550781, 9.942607879638672, 11.775771141052246, 13.608935356140137, 15.442099571228027, 17.275264739990234, 19.108428955078125, 20.941593170166016, 22.774757385253906, 24.607921600341797, 26.441085815429688, 28.274250030517578, 30.10741424560547, 31.940576553344727, 33.773738861083984, 35.606903076171875, 37.440067291259766, 39.273231506347656, 41.10639572143555, 42.93955993652344, 44.77272415161133, 46.60588836669922, 48.43905258178711, 50.272216796875, 52.10538101196289, 53.93854522705078, 55.77170944213867, 57.60487365722656, 59.43803787231445, 61.271202087402344]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 15.0, 13.0, 14.0, 33.0, 29.0, 41.0, 51.0, 70.0, 70.0, 74.0, 85.0, 77.0, 74.0, 68.0, 60.0, 59.0, 45.0, 45.0, 27.0, 15.0, 14.0, 7.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.728515625, -3.641937255859375, -3.55535888671875, -3.468780517578125, -3.3822021484375, -3.295623779296875, -3.20904541015625, -3.122467041015625, -3.035888671875, -2.949310302734375, -2.86273193359375, -2.776153564453125, -2.6895751953125, -2.602996826171875, -2.51641845703125, -2.429840087890625, -2.34326171875, -2.256683349609375, -2.17010498046875, -2.083526611328125, -1.9969482421875, -1.910369873046875, -1.82379150390625, -1.737213134765625, -1.650634765625, -1.564056396484375, -1.47747802734375, -1.390899658203125, -1.3043212890625, -1.217742919921875, -1.13116455078125, -1.044586181640625, -0.9580078125, -0.871429443359375, -0.78485107421875, -0.698272705078125, -0.6116943359375, -0.525115966796875, -0.43853759765625, -0.351959228515625, -0.265380859375, -0.178802490234375, -0.09222412109375, -0.005645751953125, 0.0809326171875, 0.167510986328125, 0.25408935546875, 0.340667724609375, 0.42724609375, 0.513824462890625, 0.60040283203125, 0.686981201171875, 0.7735595703125, 0.860137939453125, 0.94671630859375, 1.033294677734375, 1.119873046875, 1.206451416015625, 1.29302978515625, 1.379608154296875, 1.4661865234375, 1.552764892578125, 1.63934326171875, 1.725921630859375, 1.8125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 0.0, 10.0, 11.0, 23.0, 29.0, 64.0, 77.0, 120.0, 228.0, 450.0, 833.0, 2069.0, 6217.0, 47833.0, 3781207.0, 334939.0, 14092.0, 3323.0, 1314.0, 631.0, 346.0, 189.0, 111.0, 59.0, 35.0, 33.0, 18.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-24.46875, -23.882568359375, -23.29638671875, -22.710205078125, -22.1240234375, -21.537841796875, -20.95166015625, -20.365478515625, -19.779296875, -19.193115234375, -18.60693359375, -18.020751953125, -17.4345703125, -16.848388671875, -16.26220703125, -15.676025390625, -15.08984375, -14.503662109375, -13.91748046875, -13.331298828125, -12.7451171875, -12.158935546875, -11.57275390625, -10.986572265625, -10.400390625, -9.814208984375, -9.22802734375, -8.641845703125, -8.0556640625, -7.469482421875, -6.88330078125, -6.297119140625, -5.7109375, -5.124755859375, -4.53857421875, -3.952392578125, -3.3662109375, -2.780029296875, -2.19384765625, -1.607666015625, -1.021484375, -0.435302734375, 0.15087890625, 0.737060546875, 1.3232421875, 1.909423828125, 2.49560546875, 3.081787109375, 3.66796875, 4.254150390625, 4.84033203125, 5.426513671875, 6.0126953125, 6.598876953125, 7.18505859375, 7.771240234375, 8.357421875, 8.943603515625, 9.52978515625, 10.115966796875, 10.7021484375, 11.288330078125, 11.87451171875, 12.460693359375, 13.046875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 12.0, 23.0, 34.0, 64.0, 139.0, 237.0, 451.0, 822.0, 948.0, 613.0, 318.0, 179.0, 94.0, 63.0, 28.0, 21.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.90625, -17.5263671875, -17.146484375, -16.7666015625, -16.38671875, -16.0068359375, -15.626953125, -15.2470703125, -14.8671875, -14.4873046875, -14.107421875, -13.7275390625, -13.34765625, -12.9677734375, -12.587890625, -12.2080078125, -11.828125, -11.4482421875, -11.068359375, -10.6884765625, -10.30859375, -9.9287109375, -9.548828125, -9.1689453125, -8.7890625, -8.4091796875, -8.029296875, -7.6494140625, -7.26953125, -6.8896484375, -6.509765625, -6.1298828125, -5.75, -5.3701171875, -4.990234375, -4.6103515625, -4.23046875, -3.8505859375, -3.470703125, -3.0908203125, -2.7109375, -2.3310546875, -1.951171875, -1.5712890625, -1.19140625, -0.8115234375, -0.431640625, -0.0517578125, 0.328125, 0.7080078125, 1.087890625, 1.4677734375, 1.84765625, 2.2275390625, 2.607421875, 2.9873046875, 3.3671875, 3.7470703125, 4.126953125, 4.5068359375, 4.88671875, 5.2666015625, 5.646484375, 6.0263671875, 6.40625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 8.0, 9.0, 10.0, 27.0, 50.0, 123.0, 263.0, 691.0, 3128.0, 691723.0, 3491822.0, 4969.0, 883.0, 330.0, 129.0, 62.0, 27.0, 12.0, 8.0, 10.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.28125, -44.79248046875, -43.3037109375, -41.81494140625, -40.326171875, -38.83740234375, -37.3486328125, -35.85986328125, -34.37109375, -32.88232421875, -31.3935546875, -29.90478515625, -28.416015625, -26.92724609375, -25.4384765625, -23.94970703125, -22.4609375, -20.97216796875, -19.4833984375, -17.99462890625, -16.505859375, -15.01708984375, -13.5283203125, -12.03955078125, -10.55078125, -9.06201171875, -7.5732421875, -6.08447265625, -4.595703125, -3.10693359375, -1.6181640625, -0.12939453125, 1.359375, 2.84814453125, 4.3369140625, 5.82568359375, 7.314453125, 8.80322265625, 10.2919921875, 11.78076171875, 13.26953125, 14.75830078125, 16.2470703125, 17.73583984375, 19.224609375, 20.71337890625, 22.2021484375, 23.69091796875, 25.1796875, 26.66845703125, 28.1572265625, 29.64599609375, 31.134765625, 32.62353515625, 34.1123046875, 35.60107421875, 37.08984375, 38.57861328125, 40.0673828125, 41.55615234375, 43.044921875, 44.53369140625, 46.0224609375, 47.51123046875, 49.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 67.0, 329.0, 452.0, 125.0, 25.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-148.87753295898438, -146.17604064941406, -143.47454833984375, -140.77305603027344, -138.07156372070312, -135.3700714111328, -132.6685791015625, -129.9670867919922, -127.26558685302734, -124.56409454345703, -121.86260223388672, -119.1611099243164, -116.4596176147461, -113.75811767578125, -111.05662536621094, -108.35513305664062, -105.65364074707031, -102.9521484375, -100.25065612792969, -97.54916381835938, -94.84767150878906, -92.14617919921875, -89.44468688964844, -86.7431869506836, -84.04170227050781, -81.3402099609375, -78.63871765136719, -75.93722534179688, -73.23573303222656, -70.53424072265625, -67.83274841308594, -65.1312484741211, -62.42975616455078, -59.72826385498047, -57.026771545410156, -54.325279235839844, -51.623783111572266, -48.92229080200195, -46.22079849243164, -43.51930236816406, -40.81781005859375, -38.11631774902344, -35.414825439453125, -32.71333312988281, -30.011837005615234, -27.310344696044922, -24.60885238647461, -21.907358169555664, -19.20586585998535, -16.50437355041504, -13.802879333496094, -11.101387023925781, -8.399893760681152, -5.698400497436523, -2.996908187866211, -0.2954139709472656, 2.406078338623047, 5.107571601867676, 7.8090643882751465, 10.510557174682617, 13.212050437927246, 15.913543701171875, 18.615036010742188, 21.316530227661133, 24.018022537231445]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 8.0, 12.0, 7.0, 6.0, 13.0, 15.0, 12.0, 24.0, 22.0, 26.0, 29.0, 29.0, 27.0, 36.0, 46.0, 44.0, 44.0, 49.0, 51.0, 54.0, 36.0, 35.0, 48.0, 35.0, 30.0, 32.0, 35.0, 40.0, 24.0, 18.0, 22.0, 11.0, 18.0, 13.0, 15.0, 5.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-29.539199829101562, -28.756149291992188, -27.973098754882812, -27.190048217773438, -26.406997680664062, -25.623945236206055, -24.84089469909668, -24.057844161987305, -23.27479362487793, -22.491743087768555, -21.70869255065918, -20.925642013549805, -20.142589569091797, -19.359539031982422, -18.576488494873047, -17.793437957763672, -17.010387420654297, -16.227336883544922, -15.444286346435547, -14.661234855651855, -13.87818431854248, -13.095133781433105, -12.312082290649414, -11.529031753540039, -10.745981216430664, -9.962930679321289, -9.179880142211914, -8.396828651428223, -7.613778114318848, -6.830727577209473, -6.0476765632629395, -5.264625549316406, -4.481575012207031, -3.698524236679077, -2.915473461151123, -2.132422685623169, -1.3493719100952148, -0.5663211345672607, 0.21672964096069336, 0.9997806549072266, 1.7828311920166016, 2.5658819675445557, 3.3489327430725098, 4.131983757019043, 4.915034294128418, 5.698084831237793, 6.481135845184326, 7.264186859130859, 8.047237396240234, 8.83028793334961, 9.613338470458984, 10.396389961242676, 11.17944049835205, 11.962491035461426, 12.745542526245117, 13.528593063354492, 14.311643600463867, 15.094694137573242, 15.877744674682617, 16.660795211791992, 17.44384765625, 18.226898193359375, 19.00994873046875, 19.792999267578125, 20.5760498046875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 4.0, 18.0, 14.0, 25.0, 21.0, 20.0, 31.0, 48.0, 49.0, 40.0, 65.0, 68.0, 56.0, 69.0, 63.0, 62.0, 65.0, 53.0, 43.0, 38.0, 40.0, 28.0, 22.0, 10.0, 17.0, 6.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-3.1328125, -3.0621490478515625, -2.991485595703125, -2.9208221435546875, -2.85015869140625, -2.7794952392578125, -2.708831787109375, -2.6381683349609375, -2.5675048828125, -2.4968414306640625, -2.426177978515625, -2.3555145263671875, -2.28485107421875, -2.2141876220703125, -2.143524169921875, -2.0728607177734375, -2.002197265625, -1.9315338134765625, -1.860870361328125, -1.7902069091796875, -1.71954345703125, -1.6488800048828125, -1.578216552734375, -1.5075531005859375, -1.4368896484375, -1.3662261962890625, -1.295562744140625, -1.2248992919921875, -1.15423583984375, -1.0835723876953125, -1.012908935546875, -0.9422454833984375, -0.87158203125, -0.8009185791015625, -0.730255126953125, -0.6595916748046875, -0.58892822265625, -0.5182647705078125, -0.447601318359375, -0.3769378662109375, -0.3062744140625, -0.2356109619140625, -0.164947509765625, -0.0942840576171875, -0.02362060546875, 0.0470428466796875, 0.117706298828125, 0.1883697509765625, 0.259033203125, 0.3296966552734375, 0.400360107421875, 0.4710235595703125, 0.54168701171875, 0.6123504638671875, 0.683013916015625, 0.7536773681640625, 0.8243408203125, 0.8950042724609375, 0.965667724609375, 1.0363311767578125, 1.10699462890625, 1.1776580810546875, 1.248321533203125, 1.3189849853515625, 1.3896484375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 8.0, 5.0, 8.0, 11.0, 9.0, 11.0, 25.0, 35.0, 64.0, 97.0, 178.0, 414.0, 866.0, 1655.0, 3606.0, 7591.0, 16643.0, 38682.0, 103024.0, 415424.0, 311612.0, 87079.0, 33793.0, 14710.0, 6696.0, 3208.0, 1515.0, 746.0, 369.0, 179.0, 80.0, 60.0, 41.0, 23.0, 11.0, 8.0, 10.0, 13.0, 6.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0218048095703125, -0.02114248275756836, -0.02048015594482422, -0.019817829132080078, -0.019155502319335938, -0.018493175506591797, -0.017830848693847656, -0.017168521881103516, -0.016506195068359375, -0.015843868255615234, -0.015181541442871094, -0.014519214630126953, -0.013856887817382812, -0.013194561004638672, -0.012532234191894531, -0.01186990737915039, -0.01120758056640625, -0.01054525375366211, -0.009882926940917969, -0.009220600128173828, -0.008558273315429688, -0.007895946502685547, -0.007233619689941406, -0.006571292877197266, -0.005908966064453125, -0.005246639251708984, -0.004584312438964844, -0.003921985626220703, -0.0032596588134765625, -0.002597332000732422, -0.0019350051879882812, -0.0012726783752441406, -0.0006103515625, 5.1975250244140625e-05, 0.0007143020629882812, 0.0013766288757324219, 0.0020389556884765625, 0.002701282501220703, 0.0033636093139648438, 0.004025936126708984, 0.004688262939453125, 0.005350589752197266, 0.006012916564941406, 0.006675243377685547, 0.0073375701904296875, 0.007999897003173828, 0.008662223815917969, 0.00932455062866211, 0.00998687744140625, 0.01064920425415039, 0.011311531066894531, 0.011973857879638672, 0.012636184692382812, 0.013298511505126953, 0.013960838317871094, 0.014623165130615234, 0.015285491943359375, 0.015947818756103516, 0.016610145568847656, 0.017272472381591797, 0.017934799194335938, 0.018597126007080078, 0.01925945281982422, 0.01992177963256836, 0.0205841064453125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 0.0, 3.0, 5.0, 4.0, 6.0, 2.0, 13.0, 15.0, 11.0, 20.0, 17.0, 14.0, 23.0, 20.0, 18.0, 30.0, 27.0, 31.0, 32.0, 51.0, 49.0, 46.0, 45.0, 1061.0, 42.0, 41.0, 41.0, 35.0, 42.0, 32.0, 36.0, 32.0, 28.0, 22.0, 16.0, 25.0, 18.0, 13.0, 9.0, 16.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.97998046875, -0.9477157592773438, -0.9154510498046875, -0.8831863403320312, -0.850921630859375, -0.8186569213867188, -0.7863922119140625, -0.7541275024414062, -0.72186279296875, -0.6895980834960938, -0.6573333740234375, -0.6250686645507812, -0.592803955078125, -0.5605392456054688, -0.5282745361328125, -0.49600982666015625, -0.4637451171875, -0.43148040771484375, -0.3992156982421875, -0.36695098876953125, -0.334686279296875, -0.30242156982421875, -0.2701568603515625, -0.23789215087890625, -0.20562744140625, -0.17336273193359375, -0.1410980224609375, -0.10883331298828125, -0.076568603515625, -0.04430389404296875, -0.0120391845703125, 0.02022552490234375, 0.052490234375, 0.08475494384765625, 0.1170196533203125, 0.14928436279296875, 0.181549072265625, 0.21381378173828125, 0.2460784912109375, 0.27834320068359375, 0.31060791015625, 0.34287261962890625, 0.3751373291015625, 0.40740203857421875, 0.439666748046875, 0.47193145751953125, 0.5041961669921875, 0.5364608764648438, 0.5687255859375, 0.6009902954101562, 0.6332550048828125, 0.6655197143554688, 0.697784423828125, 0.7300491333007812, 0.7623138427734375, 0.7945785522460938, 0.82684326171875, 0.8591079711914062, 0.8913726806640625, 0.9236373901367188, 0.955902099609375, 0.9881668090820312, 1.0204315185546875, 1.0526962280273438, 1.0849609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 11.0, 28.0, 25.0, 39.0, 62.0, 109.0, 153.0, 231.0, 326.0, 383.0, 684.0, 969.0, 1480.0, 2228.0, 3402.0, 5230.0, 8127.0, 12528.0, 20118.0, 32612.0, 54585.0, 100946.0, 231085.0, 1334619.0, 122295.0, 63595.0, 37380.0, 23019.0, 14390.0, 9155.0, 5922.0, 3817.0, 2544.0, 1692.0, 1116.0, 682.0, 471.0, 355.0, 230.0, 133.0, 108.0, 74.0, 47.0, 40.0, 20.0, 26.0, 9.0, 9.0, 7.0, 5.0, 0.0, 3.0, 5.0], "bins": [-0.006641387939453125, -0.00644683837890625, -0.006252288818359375, -0.0060577392578125, -0.005863189697265625, -0.00566864013671875, -0.005474090576171875, -0.005279541015625, -0.005084991455078125, -0.00489044189453125, -0.004695892333984375, -0.0045013427734375, -0.004306793212890625, -0.00411224365234375, -0.003917694091796875, -0.00372314453125, -0.003528594970703125, -0.00333404541015625, -0.003139495849609375, -0.0029449462890625, -0.002750396728515625, -0.00255584716796875, -0.002361297607421875, -0.002166748046875, -0.001972198486328125, -0.00177764892578125, -0.001583099365234375, -0.0013885498046875, -0.001194000244140625, -0.00099945068359375, -0.000804901123046875, -0.0006103515625, -0.000415802001953125, -0.00022125244140625, -2.6702880859375e-05, 0.0001678466796875, 0.000362396240234375, 0.00055694580078125, 0.000751495361328125, 0.000946044921875, 0.001140594482421875, 0.00133514404296875, 0.001529693603515625, 0.0017242431640625, 0.001918792724609375, 0.00211334228515625, 0.002307891845703125, 0.00250244140625, 0.002696990966796875, 0.00289154052734375, 0.003086090087890625, 0.0032806396484375, 0.003475189208984375, 0.00366973876953125, 0.003864288330078125, 0.004058837890625, 0.004253387451171875, 0.00444793701171875, 0.004642486572265625, 0.0048370361328125, 0.005031585693359375, 0.00522613525390625, 0.005420684814453125, 0.005615234375, 0.005809783935546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1005.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 3.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 2222.0, 0.0, 1043919.0, 2264.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 3.0, 0.0, 2.0, 10.0], "bins": [-1.0728836059570312e-06, -1.039355993270874e-06, -1.0058283805847168e-06, -9.723007678985596e-07, -9.387731552124023e-07, -9.052455425262451e-07, -8.717179298400879e-07, -8.381903171539307e-07, -8.046627044677734e-07, -7.711350917816162e-07, -7.37607479095459e-07, -7.040798664093018e-07, -6.705522537231445e-07, -6.370246410369873e-07, -6.034970283508301e-07, -5.699694156646729e-07, -5.364418029785156e-07, -5.029141902923584e-07, -4.6938657760620117e-07, -4.3585896492004395e-07, -4.023313522338867e-07, -3.688037395477295e-07, -3.3527612686157227e-07, -3.0174851417541504e-07, -2.682209014892578e-07, -2.3469328880310059e-07, -2.0116567611694336e-07, -1.6763806343078613e-07, -1.341104507446289e-07, -1.0058283805847168e-07, -6.705522537231445e-08, -3.3527612686157227e-08, 0.0, 3.3527612686157227e-08, 6.705522537231445e-08, 1.0058283805847168e-07, 1.341104507446289e-07, 1.6763806343078613e-07, 2.0116567611694336e-07, 2.3469328880310059e-07, 2.682209014892578e-07, 3.0174851417541504e-07, 3.3527612686157227e-07, 3.688037395477295e-07, 4.023313522338867e-07, 4.3585896492004395e-07, 4.6938657760620117e-07, 5.029141902923584e-07, 5.364418029785156e-07, 5.699694156646729e-07, 6.034970283508301e-07, 6.370246410369873e-07, 6.705522537231445e-07, 7.040798664093018e-07, 7.37607479095459e-07, 7.711350917816162e-07, 8.046627044677734e-07, 8.381903171539307e-07, 8.717179298400879e-07, 9.052455425262451e-07, 9.387731552124023e-07, 9.723007678985596e-07, 1.0058283805847168e-06, 1.039355993270874e-06, 1.0728836059570312e-06]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 4.0, 18.0, 14.0, 25.0, 21.0, 20.0, 31.0, 48.0, 49.0, 40.0, 65.0, 68.0, 56.0, 69.0, 63.0, 62.0, 65.0, 53.0, 43.0, 38.0, 40.0, 28.0, 22.0, 10.0, 17.0, 6.0, 10.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-3.1328125, -3.0621490478515625, -2.991485595703125, -2.9208221435546875, -2.85015869140625, -2.7794952392578125, -2.708831787109375, -2.6381683349609375, -2.5675048828125, -2.4968414306640625, -2.426177978515625, -2.3555145263671875, -2.28485107421875, -2.2141876220703125, -2.143524169921875, -2.0728607177734375, -2.002197265625, -1.9315338134765625, -1.860870361328125, -1.7902069091796875, -1.71954345703125, -1.6488800048828125, -1.578216552734375, -1.5075531005859375, -1.4368896484375, -1.3662261962890625, -1.295562744140625, -1.2248992919921875, -1.15423583984375, -1.0835723876953125, -1.012908935546875, -0.9422454833984375, -0.87158203125, -0.8009185791015625, -0.730255126953125, -0.6595916748046875, -0.58892822265625, -0.5182647705078125, -0.447601318359375, -0.3769378662109375, -0.3062744140625, -0.2356109619140625, -0.164947509765625, -0.0942840576171875, -0.02362060546875, 0.0470428466796875, 0.117706298828125, 0.1883697509765625, 0.259033203125, 0.3296966552734375, 0.400360107421875, 0.4710235595703125, 0.54168701171875, 0.6123504638671875, 0.683013916015625, 0.7536773681640625, 0.8243408203125, 0.8950042724609375, 0.965667724609375, 1.0363311767578125, 1.10699462890625, 1.1776580810546875, 1.248321533203125, 1.3189849853515625, 1.3896484375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 6.0, 7.0, 13.0, 14.0, 19.0, 30.0, 55.0, 75.0, 110.0, 193.0, 329.0, 510.0, 819.0, 1398.0, 2368.0, 4388.0, 8947.0, 22532.0, 128773.0, 746617.0, 93907.0, 19680.0, 8056.0, 4058.0, 2233.0, 1332.0, 792.0, 437.0, 307.0, 182.0, 127.0, 70.0, 48.0, 34.0, 27.0, 16.0, 11.0, 5.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-9.8984375, -9.62677001953125, -9.3551025390625, -9.08343505859375, -8.811767578125, -8.54010009765625, -8.2684326171875, -7.99676513671875, -7.72509765625, -7.45343017578125, -7.1817626953125, -6.91009521484375, -6.638427734375, -6.36676025390625, -6.0950927734375, -5.82342529296875, -5.5517578125, -5.28009033203125, -5.0084228515625, -4.73675537109375, -4.465087890625, -4.19342041015625, -3.9217529296875, -3.65008544921875, -3.37841796875, -3.10675048828125, -2.8350830078125, -2.56341552734375, -2.291748046875, -2.02008056640625, -1.7484130859375, -1.47674560546875, -1.205078125, -0.93341064453125, -0.6617431640625, -0.39007568359375, -0.118408203125, 0.15325927734375, 0.4249267578125, 0.69659423828125, 0.96826171875, 1.23992919921875, 1.5115966796875, 1.78326416015625, 2.054931640625, 2.32659912109375, 2.5982666015625, 2.86993408203125, 3.1416015625, 3.41326904296875, 3.6849365234375, 3.95660400390625, 4.228271484375, 4.49993896484375, 4.7716064453125, 5.04327392578125, 5.31494140625, 5.58660888671875, 5.8582763671875, 6.12994384765625, 6.401611328125, 6.67327880859375, 6.9449462890625, 7.21661376953125, 7.48828125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 5.0, 1.0, 7.0, 17.0, 11.0, 12.0, 17.0, 24.0, 26.0, 19.0, 29.0, 25.0, 28.0, 36.0, 30.0, 45.0, 43.0, 73.0, 134.0, 1474.0, 376.0, 144.0, 58.0, 58.0, 52.0, 40.0, 42.0, 29.0, 31.0, 19.0, 19.0, 18.0, 20.0, 20.0, 16.0, 8.0, 8.0, 7.0, 12.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.70703125, -4.5640869140625, -4.421142578125, -4.2781982421875, -4.13525390625, -3.9923095703125, -3.849365234375, -3.7064208984375, -3.5634765625, -3.4205322265625, -3.277587890625, -3.1346435546875, -2.99169921875, -2.8487548828125, -2.705810546875, -2.5628662109375, -2.419921875, -2.2769775390625, -2.134033203125, -1.9910888671875, -1.84814453125, -1.7052001953125, -1.562255859375, -1.4193115234375, -1.2763671875, -1.1334228515625, -0.990478515625, -0.8475341796875, -0.70458984375, -0.5616455078125, -0.418701171875, -0.2757568359375, -0.1328125, 0.0101318359375, 0.153076171875, 0.2960205078125, 0.43896484375, 0.5819091796875, 0.724853515625, 0.8677978515625, 1.0107421875, 1.1536865234375, 1.296630859375, 1.4395751953125, 1.58251953125, 1.7254638671875, 1.868408203125, 2.0113525390625, 2.154296875, 2.2972412109375, 2.440185546875, 2.5831298828125, 2.72607421875, 2.8690185546875, 3.011962890625, 3.1549072265625, 3.2978515625, 3.4407958984375, 3.583740234375, 3.7266845703125, 3.86962890625, 4.0125732421875, 4.155517578125, 4.2984619140625, 4.44140625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 12.0, 7.0, 8.0, 7.0, 10.0, 18.0, 16.0, 12.0, 19.0, 21.0, 22.0, 24.0, 42.0, 45.0, 65.0, 107.0, 213.0, 723.0, 9179.0, 3094224.0, 39200.0, 965.0, 284.0, 113.0, 73.0, 54.0, 28.0, 25.0, 22.0, 23.0, 25.0, 23.0, 20.0, 16.0, 8.0, 14.0, 11.0, 5.0, 2.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.734375, -19.068359375, -18.40234375, -17.736328125, -17.0703125, -16.404296875, -15.73828125, -15.072265625, -14.40625, -13.740234375, -13.07421875, -12.408203125, -11.7421875, -11.076171875, -10.41015625, -9.744140625, -9.078125, -8.412109375, -7.74609375, -7.080078125, -6.4140625, -5.748046875, -5.08203125, -4.416015625, -3.75, -3.083984375, -2.41796875, -1.751953125, -1.0859375, -0.419921875, 0.24609375, 0.912109375, 1.578125, 2.244140625, 2.91015625, 3.576171875, 4.2421875, 4.908203125, 5.57421875, 6.240234375, 6.90625, 7.572265625, 8.23828125, 8.904296875, 9.5703125, 10.236328125, 10.90234375, 11.568359375, 12.234375, 12.900390625, 13.56640625, 14.232421875, 14.8984375, 15.564453125, 16.23046875, 16.896484375, 17.5625, 18.228515625, 18.89453125, 19.560546875, 20.2265625, 20.892578125, 21.55859375, 22.224609375, 22.890625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 197.0, 784.0, 33.0, 1.0, 1.0, 0.0, 1.0], "bins": [-141.17442321777344, -138.7506103515625, -136.3267822265625, -133.90296936035156, -131.47914123535156, -129.05532836914062, -126.63150024414062, -124.20768737792969, -121.78385925292969, -119.36003875732422, -116.93621826171875, -114.51239776611328, -112.08857727050781, -109.66475677490234, -107.24093627929688, -104.81712341308594, -102.39330291748047, -99.969482421875, -97.54566192626953, -95.12184143066406, -92.6980209350586, -90.27420043945312, -87.85037994384766, -85.42655944824219, -83.00274658203125, -80.57892608642578, -78.15510559082031, -75.73128509521484, -73.30746459960938, -70.8836441040039, -68.45982360839844, -66.0360107421875, -63.612186431884766, -61.1883659362793, -58.76454544067383, -56.34072494506836, -53.916908264160156, -51.49308776855469, -49.06926727294922, -46.64544677734375, -44.22162628173828, -41.79780578613281, -39.373985290527344, -36.950164794921875, -34.526344299316406, -32.10252380371094, -29.678707122802734, -27.254886627197266, -24.831066131591797, -22.407245635986328, -19.98342514038086, -17.559606552124023, -15.135786056518555, -12.711965560913086, -10.288146018981934, -7.864326477050781, -5.440506935119629, -3.0166869163513184, -0.5928668975830078, 1.8309531211853027, 4.254773139953613, 6.678593635559082, 9.102413177490234, 11.526232719421387, 13.950053215026855]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 9.0, 3.0, 5.0, 7.0, 17.0, 15.0, 32.0, 19.0, 26.0, 19.0, 23.0, 30.0, 35.0, 31.0, 32.0, 36.0, 44.0, 34.0, 47.0, 35.0, 42.0, 42.0, 45.0, 36.0, 27.0, 32.0, 35.0, 31.0, 31.0, 22.0, 22.0, 24.0, 20.0, 16.0, 15.0, 9.0, 10.0, 12.0, 7.0, 8.0, 5.0, 1.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.92745590209961, -16.432964324951172, -15.938474655151367, -15.443984031677246, -14.949493408203125, -14.455002784729004, -13.960512161254883, -13.466020584106445, -12.97153091430664, -12.47704029083252, -11.982549667358398, -11.488059043884277, -10.993568420410156, -10.499077796936035, -10.004587173461914, -9.510095596313477, -9.015604972839355, -8.521114349365234, -8.026623725891113, -7.532133102416992, -7.037642478942871, -6.54315185546875, -6.048660755157471, -5.55417013168335, -5.0596795082092285, -4.565188884735107, -4.070698261260986, -3.576207399368286, -3.081716775894165, -2.587226152420044, -2.0927352905273438, -1.5982446670532227, -1.1037540435791016, -0.6092633605003357, -0.11477267742156982, 0.3797180652618408, 0.8742086887359619, 1.368699312210083, 1.8631901741027832, 2.3576807975769043, 2.8521714210510254, 3.3466620445251465, 3.8411526679992676, 4.335643768310547, 4.830134391784668, 5.324625015258789, 5.81911563873291, 6.313606262207031, 6.808096885681152, 7.302587509155273, 7.7970781326293945, 8.291568756103516, 8.786059379577637, 9.280550003051758, 9.775041580200195, 10.26953125, 10.764022827148438, 11.258513450622559, 11.75300407409668, 12.2474946975708, 12.741985321044922, 13.236475944519043, 13.730966567993164, 14.225458145141602, 14.719947814941406]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 14.0, 12.0, 24.0, 18.0, 22.0, 15.0, 42.0, 42.0, 48.0, 58.0, 61.0, 57.0, 55.0, 70.0, 70.0, 68.0, 52.0, 51.0, 37.0, 44.0, 35.0, 22.0, 20.0, 16.0, 11.0, 12.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-3.15234375, -3.080780029296875, -3.00921630859375, -2.937652587890625, -2.8660888671875, -2.794525146484375, -2.72296142578125, -2.651397705078125, -2.579833984375, -2.508270263671875, -2.43670654296875, -2.365142822265625, -2.2935791015625, -2.222015380859375, -2.15045166015625, -2.078887939453125, -2.00732421875, -1.935760498046875, -1.86419677734375, -1.792633056640625, -1.7210693359375, -1.649505615234375, -1.57794189453125, -1.506378173828125, -1.434814453125, -1.363250732421875, -1.29168701171875, -1.220123291015625, -1.1485595703125, -1.076995849609375, -1.00543212890625, -0.933868408203125, -0.8623046875, -0.790740966796875, -0.71917724609375, -0.647613525390625, -0.5760498046875, -0.504486083984375, -0.43292236328125, -0.361358642578125, -0.289794921875, -0.218231201171875, -0.14666748046875, -0.075103759765625, -0.0035400390625, 0.068023681640625, 0.13958740234375, 0.211151123046875, 0.28271484375, 0.354278564453125, 0.42584228515625, 0.497406005859375, 0.5689697265625, 0.640533447265625, 0.71209716796875, 0.783660888671875, 0.855224609375, 0.926788330078125, 0.99835205078125, 1.069915771484375, 1.1414794921875, 1.213043212890625, 1.28460693359375, 1.356170654296875, 1.427734375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 8.0, 5.0, 17.0, 17.0, 38.0, 31.0, 61.0, 92.0, 162.0, 315.0, 552.0, 1474.0, 7353.0, 115096.0, 3709689.0, 341748.0, 13941.0, 2092.0, 704.0, 353.0, 197.0, 120.0, 78.0, 40.0, 25.0, 33.0, 18.0, 8.0, 3.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0], "bins": [-20.015625, -19.5570068359375, -19.098388671875, -18.6397705078125, -18.18115234375, -17.7225341796875, -17.263916015625, -16.8052978515625, -16.3466796875, -15.8880615234375, -15.429443359375, -14.9708251953125, -14.51220703125, -14.0535888671875, -13.594970703125, -13.1363525390625, -12.677734375, -12.2191162109375, -11.760498046875, -11.3018798828125, -10.84326171875, -10.3846435546875, -9.926025390625, -9.4674072265625, -9.0087890625, -8.5501708984375, -8.091552734375, -7.6329345703125, -7.17431640625, -6.7156982421875, -6.257080078125, -5.7984619140625, -5.33984375, -4.8812255859375, -4.422607421875, -3.9639892578125, -3.50537109375, -3.0467529296875, -2.588134765625, -2.1295166015625, -1.6708984375, -1.2122802734375, -0.753662109375, -0.2950439453125, 0.16357421875, 0.6221923828125, 1.080810546875, 1.5394287109375, 1.998046875, 2.4566650390625, 2.915283203125, 3.3739013671875, 3.83251953125, 4.2911376953125, 4.749755859375, 5.2083740234375, 5.6669921875, 6.1256103515625, 6.584228515625, 7.0428466796875, 7.50146484375, 7.9600830078125, 8.418701171875, 8.8773193359375, 9.3359375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 6.0, 16.0, 29.0, 21.0, 57.0, 75.0, 160.0, 235.0, 375.0, 573.0, 760.0, 631.0, 420.0, 290.0, 179.0, 104.0, 63.0, 30.0, 12.0, 15.0, 1.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.494384765625, -8.20751953125, -7.920654296875, -7.6337890625, -7.346923828125, -7.06005859375, -6.773193359375, -6.486328125, -6.199462890625, -5.91259765625, -5.625732421875, -5.3388671875, -5.052001953125, -4.76513671875, -4.478271484375, -4.19140625, -3.904541015625, -3.61767578125, -3.330810546875, -3.0439453125, -2.757080078125, -2.47021484375, -2.183349609375, -1.896484375, -1.609619140625, -1.32275390625, -1.035888671875, -0.7490234375, -0.462158203125, -0.17529296875, 0.111572265625, 0.3984375, 0.685302734375, 0.97216796875, 1.259033203125, 1.5458984375, 1.832763671875, 2.11962890625, 2.406494140625, 2.693359375, 2.980224609375, 3.26708984375, 3.553955078125, 3.8408203125, 4.127685546875, 4.41455078125, 4.701416015625, 4.98828125, 5.275146484375, 5.56201171875, 5.848876953125, 6.1357421875, 6.422607421875, 6.70947265625, 6.996337890625, 7.283203125, 7.570068359375, 7.85693359375, 8.143798828125, 8.4306640625, 8.717529296875, 9.00439453125, 9.291259765625, 9.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 9.0, 13.0, 12.0, 29.0, 29.0, 38.0, 68.0, 93.0, 150.0, 276.0, 541.0, 1037.0, 2743.0, 14790.0, 260557.0, 3580244.0, 311548.0, 16687.0, 2978.0, 1072.0, 569.0, 291.0, 188.0, 102.0, 85.0, 44.0, 28.0, 22.0, 18.0, 9.0, 7.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.421875, -15.84619140625, -15.2705078125, -14.69482421875, -14.119140625, -13.54345703125, -12.9677734375, -12.39208984375, -11.81640625, -11.24072265625, -10.6650390625, -10.08935546875, -9.513671875, -8.93798828125, -8.3623046875, -7.78662109375, -7.2109375, -6.63525390625, -6.0595703125, -5.48388671875, -4.908203125, -4.33251953125, -3.7568359375, -3.18115234375, -2.60546875, -2.02978515625, -1.4541015625, -0.87841796875, -0.302734375, 0.27294921875, 0.8486328125, 1.42431640625, 2.0, 2.57568359375, 3.1513671875, 3.72705078125, 4.302734375, 4.87841796875, 5.4541015625, 6.02978515625, 6.60546875, 7.18115234375, 7.7568359375, 8.33251953125, 8.908203125, 9.48388671875, 10.0595703125, 10.63525390625, 11.2109375, 11.78662109375, 12.3623046875, 12.93798828125, 13.513671875, 14.08935546875, 14.6650390625, 15.24072265625, 15.81640625, 16.39208984375, 16.9677734375, 17.54345703125, 18.119140625, 18.69482421875, 19.2705078125, 19.84619140625, 20.421875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 10.0, 32.0, 162.0, 313.0, 323.0, 133.0, 34.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.589736938476562, -16.253463745117188, -13.91718864440918, -11.580914497375488, -9.244640350341797, -6.9083662033081055, -4.572092056274414, -2.2358169555664062, 0.10045623779296875, 2.43673038482666, 4.773004531860352, 7.109278678894043, 9.445552825927734, 11.781826972961426, 14.118101119995117, 16.454376220703125, 18.7906494140625, 21.126922607421875, 23.463197708129883, 25.79947280883789, 28.135746002197266, 30.47201919555664, 32.80829620361328, 35.144569396972656, 37.48084259033203, 39.817115783691406, 42.15338897705078, 44.48966598510742, 46.8259391784668, 49.16221237182617, 51.49848937988281, 53.83476257324219, 56.17103576660156, 58.50730895996094, 60.84358215332031, 63.17985916137695, 65.51612854003906, 67.85240936279297, 70.18868255615234, 72.52495574951172, 74.8612289428711, 77.19750213623047, 79.53377532958984, 81.87004852294922, 84.20632934570312, 86.5426025390625, 88.87887573242188, 91.21514892578125, 93.55142211914062, 95.8876953125, 98.22396850585938, 100.56024169921875, 102.89651489257812, 105.23279571533203, 107.5690689086914, 109.90534210205078, 112.24161529541016, 114.57788848876953, 116.9141616821289, 119.25043487548828, 121.58671569824219, 123.92298889160156, 126.25926208496094, 128.5955352783203, 130.9318084716797]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 8.0, 9.0, 6.0, 10.0, 17.0, 10.0, 26.0, 10.0, 20.0, 21.0, 22.0, 35.0, 26.0, 34.0, 32.0, 34.0, 33.0, 54.0, 39.0, 34.0, 37.0, 34.0, 40.0, 36.0, 40.0, 35.0, 36.0, 28.0, 33.0, 24.0, 21.0, 18.0, 17.0, 15.0, 17.0, 16.0, 11.0, 8.0, 14.0, 6.0, 9.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 3.0], "bins": [-20.789962768554688, -20.206619262695312, -19.623275756835938, -19.03993034362793, -18.456586837768555, -17.87324333190918, -17.289897918701172, -16.706554412841797, -16.123210906982422, -15.539867401123047, -14.956522941589355, -14.373178482055664, -13.789834976196289, -13.206491470336914, -12.623147010803223, -12.039802551269531, -11.456459045410156, -10.873115539550781, -10.28977108001709, -9.706426620483398, -9.123083114624023, -8.539739608764648, -7.956395149230957, -7.373051166534424, -6.789707183837891, -6.206363201141357, -5.623019218444824, -5.039675235748291, -4.456331253051758, -3.8729872703552246, -3.2896432876586914, -2.706299304962158, -2.122955322265625, -1.5396113395690918, -0.9562673568725586, -0.3729233741760254, 0.2104206085205078, 0.793764591217041, 1.3771085739135742, 1.9604525566101074, 2.5437965393066406, 3.127140522003174, 3.710484504699707, 4.29382848739624, 4.877172470092773, 5.460516452789307, 6.04386043548584, 6.627204418182373, 7.210548400878906, 7.7938923835754395, 8.377236366271973, 8.960580825805664, 9.543924331665039, 10.127267837524414, 10.710612297058105, 11.293956756591797, 11.877300262451172, 12.460643768310547, 13.043988227844238, 13.62733268737793, 14.210676193237305, 14.79401969909668, 15.377364158630371, 15.960708618164062, 16.544052124023438]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 10.0, 12.0, 12.0, 16.0, 25.0, 25.0, 38.0, 35.0, 37.0, 43.0, 43.0, 69.0, 64.0, 67.0, 59.0, 62.0, 67.0, 55.0, 39.0, 42.0, 41.0, 29.0, 24.0, 16.0, 20.0, 13.0, 8.0, 5.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-3.064453125, -2.99285888671875, -2.9212646484375, -2.84967041015625, -2.778076171875, -2.70648193359375, -2.6348876953125, -2.56329345703125, -2.49169921875, -2.42010498046875, -2.3485107421875, -2.27691650390625, -2.205322265625, -2.13372802734375, -2.0621337890625, -1.99053955078125, -1.9189453125, -1.84735107421875, -1.7757568359375, -1.70416259765625, -1.632568359375, -1.56097412109375, -1.4893798828125, -1.41778564453125, -1.34619140625, -1.27459716796875, -1.2030029296875, -1.13140869140625, -1.059814453125, -0.98822021484375, -0.9166259765625, -0.84503173828125, -0.7734375, -0.70184326171875, -0.6302490234375, -0.55865478515625, -0.487060546875, -0.41546630859375, -0.3438720703125, -0.27227783203125, -0.20068359375, -0.12908935546875, -0.0574951171875, 0.01409912109375, 0.085693359375, 0.15728759765625, 0.2288818359375, 0.30047607421875, 0.3720703125, 0.44366455078125, 0.5152587890625, 0.58685302734375, 0.658447265625, 0.73004150390625, 0.8016357421875, 0.87322998046875, 0.94482421875, 1.01641845703125, 1.0880126953125, 1.15960693359375, 1.231201171875, 1.30279541015625, 1.3743896484375, 1.44598388671875, 1.517578125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 12.0, 14.0, 18.0, 29.0, 48.0, 85.0, 144.0, 277.0, 450.0, 980.0, 1990.0, 4413.0, 10226.0, 24121.0, 61967.0, 190593.0, 522948.0, 144393.0, 50174.0, 19938.0, 8507.0, 3760.0, 1698.0, 797.0, 428.0, 220.0, 123.0, 67.0, 48.0, 18.0, 16.0, 15.0, 4.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.023162841796875, -0.02250838279724121, -0.021853923797607422, -0.021199464797973633, -0.020545005798339844, -0.019890546798706055, -0.019236087799072266, -0.018581628799438477, -0.017927169799804688, -0.0172727108001709, -0.01661825180053711, -0.01596379280090332, -0.015309333801269531, -0.014654874801635742, -0.014000415802001953, -0.013345956802368164, -0.012691497802734375, -0.012037038803100586, -0.011382579803466797, -0.010728120803833008, -0.010073661804199219, -0.00941920280456543, -0.00876474380493164, -0.008110284805297852, -0.0074558258056640625, -0.0068013668060302734, -0.006146907806396484, -0.005492448806762695, -0.004837989807128906, -0.004183530807495117, -0.003529071807861328, -0.002874612808227539, -0.00222015380859375, -0.001565694808959961, -0.0009112358093261719, -0.0002567768096923828, 0.00039768218994140625, 0.0010521411895751953, 0.0017066001892089844, 0.0023610591888427734, 0.0030155181884765625, 0.0036699771881103516, 0.004324436187744141, 0.00497889518737793, 0.005633354187011719, 0.006287813186645508, 0.006942272186279297, 0.007596731185913086, 0.008251190185546875, 0.008905649185180664, 0.009560108184814453, 0.010214567184448242, 0.010869026184082031, 0.01152348518371582, 0.01217794418334961, 0.012832403182983398, 0.013486862182617188, 0.014141321182250977, 0.014795780181884766, 0.015450239181518555, 0.016104698181152344, 0.016759157180786133, 0.017413616180419922, 0.01806807518005371, 0.0187225341796875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 4.0, 10.0, 7.0, 13.0, 8.0, 21.0, 25.0, 12.0, 17.0, 25.0, 30.0, 31.0, 34.0, 33.0, 27.0, 28.0, 49.0, 41.0, 49.0, 1061.0, 48.0, 42.0, 33.0, 41.0, 25.0, 33.0, 34.0, 31.0, 32.0, 30.0, 30.0, 15.0, 20.0, 11.0, 13.0, 15.0, 5.0, 7.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-1.1044921875, -1.0704803466796875, -1.036468505859375, -1.0024566650390625, -0.96844482421875, -0.9344329833984375, -0.900421142578125, -0.8664093017578125, -0.8323974609375, -0.7983856201171875, -0.764373779296875, -0.7303619384765625, -0.69635009765625, -0.6623382568359375, -0.628326416015625, -0.5943145751953125, -0.560302734375, -0.5262908935546875, -0.492279052734375, -0.4582672119140625, -0.42425537109375, -0.3902435302734375, -0.356231689453125, -0.3222198486328125, -0.2882080078125, -0.2541961669921875, -0.220184326171875, -0.1861724853515625, -0.15216064453125, -0.1181488037109375, -0.084136962890625, -0.0501251220703125, -0.01611328125, 0.0178985595703125, 0.051910400390625, 0.0859222412109375, 0.11993408203125, 0.1539459228515625, 0.187957763671875, 0.2219696044921875, 0.2559814453125, 0.2899932861328125, 0.324005126953125, 0.3580169677734375, 0.39202880859375, 0.4260406494140625, 0.460052490234375, 0.4940643310546875, 0.528076171875, 0.5620880126953125, 0.596099853515625, 0.6301116943359375, 0.66412353515625, 0.6981353759765625, 0.732147216796875, 0.7661590576171875, 0.8001708984375, 0.8341827392578125, 0.868194580078125, 0.9022064208984375, 0.93621826171875, 0.9702301025390625, 1.004241943359375, 1.0382537841796875, 1.072265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 0.0, 1.0, 7.0, 5.0, 6.0, 19.0, 35.0, 42.0, 58.0, 71.0, 142.0, 201.0, 291.0, 394.0, 648.0, 994.0, 1505.0, 2182.0, 3416.0, 5195.0, 8100.0, 13052.0, 20452.0, 32921.0, 54282.0, 92404.0, 202912.0, 1345625.0, 129312.0, 69463.0, 42111.0, 25838.0, 16266.0, 10303.0, 6585.0, 4212.0, 2731.0, 1811.0, 1121.0, 802.0, 558.0, 358.0, 219.0, 125.0, 117.0, 93.0, 51.0, 37.0, 25.0, 9.0, 8.0, 14.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006343841552734375, -0.0061408281326293945, -0.005937814712524414, -0.005734801292419434, -0.005531787872314453, -0.005328774452209473, -0.005125761032104492, -0.004922747611999512, -0.004719734191894531, -0.004516720771789551, -0.00431370735168457, -0.00411069393157959, -0.003907680511474609, -0.003704667091369629, -0.0035016536712646484, -0.003298640251159668, -0.0030956268310546875, -0.002892613410949707, -0.0026895999908447266, -0.002486586570739746, -0.0022835731506347656, -0.002080559730529785, -0.0018775463104248047, -0.0016745328903198242, -0.0014715194702148438, -0.0012685060501098633, -0.0010654926300048828, -0.0008624792098999023, -0.0006594657897949219, -0.0004564523696899414, -0.00025343894958496094, -5.042552947998047e-05, 0.000152587890625, 0.00035560131072998047, 0.0005586147308349609, 0.0007616281509399414, 0.0009646415710449219, 0.0011676549911499023, 0.0013706684112548828, 0.0015736818313598633, 0.0017766952514648438, 0.0019797086715698242, 0.0021827220916748047, 0.002385735511779785, 0.0025887489318847656, 0.002791762351989746, 0.0029947757720947266, 0.003197789192199707, 0.0034008026123046875, 0.003603816032409668, 0.0038068294525146484, 0.004009842872619629, 0.004212856292724609, 0.00441586971282959, 0.00461888313293457, 0.004821896553039551, 0.005024909973144531, 0.005227923393249512, 0.005430936813354492, 0.005633950233459473, 0.005836963653564453, 0.006039977073669434, 0.006242990493774414, 0.0064460039138793945, 0.006649017333984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 990.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 0.0, 13.0, 0.0, 29.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 486.0, 0.0, 7355.0, 0.0, 1032694.0, 0.0, 7334.0, 0.0, 505.0, 0.0, 45.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 28.0, 0.0, 10.0, 0.0, 6.0, 4.0], "bins": [-9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 10.0, 12.0, 12.0, 16.0, 25.0, 25.0, 38.0, 35.0, 37.0, 43.0, 43.0, 69.0, 64.0, 67.0, 59.0, 62.0, 67.0, 55.0, 39.0, 42.0, 41.0, 29.0, 24.0, 16.0, 20.0, 13.0, 8.0, 5.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-3.064453125, -2.99285888671875, -2.9212646484375, -2.84967041015625, -2.778076171875, -2.70648193359375, -2.6348876953125, -2.56329345703125, -2.49169921875, -2.42010498046875, -2.3485107421875, -2.27691650390625, -2.205322265625, -2.13372802734375, -2.0621337890625, -1.99053955078125, -1.9189453125, -1.84735107421875, -1.7757568359375, -1.70416259765625, -1.632568359375, -1.56097412109375, -1.4893798828125, -1.41778564453125, -1.34619140625, -1.27459716796875, -1.2030029296875, -1.13140869140625, -1.059814453125, -0.98822021484375, -0.9166259765625, -0.84503173828125, -0.7734375, -0.70184326171875, -0.6302490234375, -0.55865478515625, -0.487060546875, -0.41546630859375, -0.3438720703125, -0.27227783203125, -0.20068359375, -0.12908935546875, -0.0574951171875, 0.01409912109375, 0.085693359375, 0.15728759765625, 0.2288818359375, 0.30047607421875, 0.3720703125, 0.44366455078125, 0.5152587890625, 0.58685302734375, 0.658447265625, 0.73004150390625, 0.8016357421875, 0.87322998046875, 0.94482421875, 1.01641845703125, 1.0880126953125, 1.15960693359375, 1.231201171875, 1.30279541015625, 1.3743896484375, 1.44598388671875, 1.517578125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 8.0, 8.0, 15.0, 24.0, 41.0, 57.0, 93.0, 157.0, 272.0, 451.0, 959.0, 1876.0, 4531.0, 14526.0, 58368.0, 308742.0, 528354.0, 96148.0, 22376.0, 6573.0, 2444.0, 1158.0, 540.0, 328.0, 217.0, 117.0, 63.0, 41.0, 31.0, 14.0, 10.0, 9.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.59765625, -2.5295867919921875, -2.461517333984375, -2.3934478759765625, -2.32537841796875, -2.2573089599609375, -2.189239501953125, -2.1211700439453125, -2.0531005859375, -1.9850311279296875, -1.916961669921875, -1.8488922119140625, -1.78082275390625, -1.7127532958984375, -1.644683837890625, -1.5766143798828125, -1.508544921875, -1.4404754638671875, -1.372406005859375, -1.3043365478515625, -1.23626708984375, -1.1681976318359375, -1.100128173828125, -1.0320587158203125, -0.9639892578125, -0.8959197998046875, -0.827850341796875, -0.7597808837890625, -0.69171142578125, -0.6236419677734375, -0.555572509765625, -0.4875030517578125, -0.41943359375, -0.3513641357421875, -0.283294677734375, -0.2152252197265625, -0.14715576171875, -0.0790863037109375, -0.011016845703125, 0.0570526123046875, 0.1251220703125, 0.1931915283203125, 0.261260986328125, 0.3293304443359375, 0.39739990234375, 0.4654693603515625, 0.533538818359375, 0.6016082763671875, 0.669677734375, 0.7377471923828125, 0.805816650390625, 0.8738861083984375, 0.94195556640625, 1.0100250244140625, 1.078094482421875, 1.1461639404296875, 1.2142333984375, 1.2823028564453125, 1.350372314453125, 1.4184417724609375, 1.48651123046875, 1.5545806884765625, 1.622650146484375, 1.6907196044921875, 1.7587890625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 7.0, 7.0, 10.0, 9.0, 13.0, 21.0, 19.0, 17.0, 25.0, 22.0, 23.0, 29.0, 35.0, 33.0, 32.0, 51.0, 57.0, 89.0, 371.0, 1608.0, 103.0, 44.0, 46.0, 47.0, 39.0, 41.0, 40.0, 25.0, 38.0, 20.0, 32.0, 9.0, 13.0, 20.0, 12.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.9150390625, -4.740234375, -4.5654296875, -4.390625, -4.2158203125, -4.041015625, -3.8662109375, -3.69140625, -3.5166015625, -3.341796875, -3.1669921875, -2.9921875, -2.8173828125, -2.642578125, -2.4677734375, -2.29296875, -2.1181640625, -1.943359375, -1.7685546875, -1.59375, -1.4189453125, -1.244140625, -1.0693359375, -0.89453125, -0.7197265625, -0.544921875, -0.3701171875, -0.1953125, -0.0205078125, 0.154296875, 0.3291015625, 0.50390625, 0.6787109375, 0.853515625, 1.0283203125, 1.203125, 1.3779296875, 1.552734375, 1.7275390625, 1.90234375, 2.0771484375, 2.251953125, 2.4267578125, 2.6015625, 2.7763671875, 2.951171875, 3.1259765625, 3.30078125, 3.4755859375, 3.650390625, 3.8251953125, 4.0, 4.1748046875, 4.349609375, 4.5244140625, 4.69921875, 4.8740234375, 5.048828125, 5.2236328125, 5.3984375, 5.5732421875, 5.748046875, 5.9228515625, 6.09765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 6.0, 4.0, 9.0, 8.0, 12.0, 21.0, 10.0, 11.0, 19.0, 20.0, 27.0, 37.0, 39.0, 39.0, 79.0, 72.0, 136.0, 224.0, 537.0, 1478.0, 14793.0, 3044403.0, 79553.0, 2659.0, 671.0, 280.0, 129.0, 91.0, 73.0, 48.0, 38.0, 23.0, 25.0, 20.0, 15.0, 21.0, 13.0, 21.0, 10.0, 6.0, 9.0, 5.0, 5.0, 8.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.546875, -11.2138671875, -10.880859375, -10.5478515625, -10.21484375, -9.8818359375, -9.548828125, -9.2158203125, -8.8828125, -8.5498046875, -8.216796875, -7.8837890625, -7.55078125, -7.2177734375, -6.884765625, -6.5517578125, -6.21875, -5.8857421875, -5.552734375, -5.2197265625, -4.88671875, -4.5537109375, -4.220703125, -3.8876953125, -3.5546875, -3.2216796875, -2.888671875, -2.5556640625, -2.22265625, -1.8896484375, -1.556640625, -1.2236328125, -0.890625, -0.5576171875, -0.224609375, 0.1083984375, 0.44140625, 0.7744140625, 1.107421875, 1.4404296875, 1.7734375, 2.1064453125, 2.439453125, 2.7724609375, 3.10546875, 3.4384765625, 3.771484375, 4.1044921875, 4.4375, 4.7705078125, 5.103515625, 5.4365234375, 5.76953125, 6.1025390625, 6.435546875, 6.7685546875, 7.1015625, 7.4345703125, 7.767578125, 8.1005859375, 8.43359375, 8.7666015625, 9.099609375, 9.4326171875, 9.765625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 19.0, 375.0, 598.0, 23.0, 0.0, 0.0, 2.0], "bins": [-67.957275390625, -66.80784606933594, -65.65841674804688, -64.50898742675781, -63.35955810546875, -62.21012878417969, -61.060699462890625, -59.91127014160156, -58.7618408203125, -57.61241149902344, -56.462982177734375, -55.31355285644531, -54.16412353515625, -53.01469421386719, -51.865264892578125, -50.71583557128906, -49.56640625, -48.41697692871094, -47.267547607421875, -46.11811828613281, -44.96868896484375, -43.81925964355469, -42.669830322265625, -41.52040100097656, -40.370967864990234, -39.22153854370117, -38.07210922241211, -36.92267990112305, -35.773250579833984, -34.62382125854492, -33.47439193725586, -32.3249626159668, -31.175533294677734, -30.026103973388672, -28.87667465209961, -27.727245330810547, -26.577816009521484, -25.428386688232422, -24.27895736694336, -23.129528045654297, -21.980098724365234, -20.830669403076172, -19.68124008178711, -18.531810760498047, -17.382381439208984, -16.232952117919922, -15.083521842956543, -13.93409252166748, -12.784662246704102, -11.635232925415039, -10.485803604125977, -9.336374282836914, -8.186944961547852, -7.037515163421631, -5.88808536529541, -4.738656044006348, -3.589226722717285, -2.4397974014282227, -1.290367841720581, -0.14093828201293945, 1.008491039276123, 2.1579203605651855, 3.3073501586914062, 4.456779479980469, 5.606208801269531]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 8.0, 10.0, 6.0, 8.0, 13.0, 25.0, 20.0, 23.0, 18.0, 21.0, 32.0, 34.0, 33.0, 37.0, 40.0, 44.0, 44.0, 39.0, 41.0, 35.0, 36.0, 43.0, 39.0, 41.0, 40.0, 33.0, 40.0, 38.0, 25.0, 21.0, 21.0, 17.0, 16.0, 15.0, 13.0, 10.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.0784969329834, -19.500879287719727, -18.923263549804688, -18.345645904541016, -17.768030166625977, -17.190412521362305, -16.612796783447266, -16.035179138183594, -15.457562446594238, -14.879945755004883, -14.302329063415527, -13.724712371826172, -13.1470947265625, -12.569478988647461, -11.991861343383789, -11.414244651794434, -10.836627960205078, -10.259011268615723, -9.681394577026367, -9.103777885437012, -8.526161193847656, -7.948544025421143, -7.370926856994629, -6.793310165405273, -6.215693473815918, -5.6380767822265625, -5.060460090637207, -4.482842922210693, -3.905226230621338, -3.3276095390319824, -2.749992609024048, -2.1723756790161133, -1.594757080078125, -1.01714026927948, -0.43952345848083496, 0.13809335231781006, 0.7157101631164551, 1.2933268547058105, 1.8709437847137451, 2.4485607147216797, 3.026177406311035, 3.6037940979003906, 4.181410789489746, 4.75902795791626, 5.336644649505615, 5.914261341094971, 6.491878509521484, 7.06949520111084, 7.647111892700195, 8.22472858428955, 8.802345275878906, 9.379961967468262, 9.957578659057617, 10.535196304321289, 11.112812995910645, 11.6904296875, 12.268046379089355, 12.845663070678711, 13.423279762268066, 14.000896453857422, 14.578514099121094, 15.156129837036133, 15.733747482299805, 16.311363220214844, 16.888980865478516]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 4.0, 10.0, 7.0, 16.0, 13.0, 17.0, 31.0, 30.0, 31.0, 41.0, 28.0, 46.0, 53.0, 65.0, 68.0, 54.0, 64.0, 70.0, 63.0, 48.0, 37.0, 47.0, 36.0, 25.0, 25.0, 14.0, 19.0, 13.0, 4.0, 8.0, 9.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.08203125, -3.0094451904296875, -2.936859130859375, -2.8642730712890625, -2.79168701171875, -2.7191009521484375, -2.646514892578125, -2.5739288330078125, -2.5013427734375, -2.4287567138671875, -2.356170654296875, -2.2835845947265625, -2.21099853515625, -2.1384124755859375, -2.065826416015625, -1.9932403564453125, -1.920654296875, -1.8480682373046875, -1.775482177734375, -1.7028961181640625, -1.63031005859375, -1.5577239990234375, -1.485137939453125, -1.4125518798828125, -1.3399658203125, -1.2673797607421875, -1.194793701171875, -1.1222076416015625, -1.04962158203125, -0.9770355224609375, -0.904449462890625, -0.8318634033203125, -0.75927734375, -0.6866912841796875, -0.614105224609375, -0.5415191650390625, -0.46893310546875, -0.3963470458984375, -0.323760986328125, -0.2511749267578125, -0.1785888671875, -0.1060028076171875, -0.033416748046875, 0.0391693115234375, 0.11175537109375, 0.1843414306640625, 0.256927490234375, 0.3295135498046875, 0.402099609375, 0.4746856689453125, 0.547271728515625, 0.6198577880859375, 0.69244384765625, 0.7650299072265625, 0.837615966796875, 0.9102020263671875, 0.9827880859375, 1.0553741455078125, 1.127960205078125, 1.2005462646484375, 1.27313232421875, 1.3457183837890625, 1.418304443359375, 1.4908905029296875, 1.5634765625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 10.0, 15.0, 25.0, 29.0, 27.0, 42.0, 60.0, 82.0, 174.0, 237.0, 595.0, 1720.0, 9327.0, 87901.0, 2223289.0, 1786588.0, 73295.0, 8084.0, 1585.0, 544.0, 219.0, 140.0, 88.0, 62.0, 37.0, 32.0, 18.0, 16.0, 10.0, 8.0, 4.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-12.921875, -12.6064453125, -12.291015625, -11.9755859375, -11.66015625, -11.3447265625, -11.029296875, -10.7138671875, -10.3984375, -10.0830078125, -9.767578125, -9.4521484375, -9.13671875, -8.8212890625, -8.505859375, -8.1904296875, -7.875, -7.5595703125, -7.244140625, -6.9287109375, -6.61328125, -6.2978515625, -5.982421875, -5.6669921875, -5.3515625, -5.0361328125, -4.720703125, -4.4052734375, -4.08984375, -3.7744140625, -3.458984375, -3.1435546875, -2.828125, -2.5126953125, -2.197265625, -1.8818359375, -1.56640625, -1.2509765625, -0.935546875, -0.6201171875, -0.3046875, 0.0107421875, 0.326171875, 0.6416015625, 0.95703125, 1.2724609375, 1.587890625, 1.9033203125, 2.21875, 2.5341796875, 2.849609375, 3.1650390625, 3.48046875, 3.7958984375, 4.111328125, 4.4267578125, 4.7421875, 5.0576171875, 5.373046875, 5.6884765625, 6.00390625, 6.3193359375, 6.634765625, 6.9501953125, 7.265625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 11.0, 9.0, 19.0, 36.0, 77.0, 132.0, 248.0, 413.0, 608.0, 821.0, 647.0, 451.0, 262.0, 142.0, 83.0, 47.0, 28.0, 19.0, 11.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.75360107421875, -6.4407958984375, -6.12799072265625, -5.815185546875, -5.50238037109375, -5.1895751953125, -4.87677001953125, -4.56396484375, -4.25115966796875, -3.9383544921875, -3.62554931640625, -3.312744140625, -2.99993896484375, -2.6871337890625, -2.37432861328125, -2.0615234375, -1.74871826171875, -1.4359130859375, -1.12310791015625, -0.810302734375, -0.49749755859375, -0.1846923828125, 0.12811279296875, 0.44091796875, 0.75372314453125, 1.0665283203125, 1.37933349609375, 1.692138671875, 2.00494384765625, 2.3177490234375, 2.63055419921875, 2.943359375, 3.25616455078125, 3.5689697265625, 3.88177490234375, 4.194580078125, 4.50738525390625, 4.8201904296875, 5.13299560546875, 5.44580078125, 5.75860595703125, 6.0714111328125, 6.38421630859375, 6.697021484375, 7.00982666015625, 7.3226318359375, 7.63543701171875, 7.9482421875, 8.26104736328125, 8.5738525390625, 8.88665771484375, 9.199462890625, 9.51226806640625, 9.8250732421875, 10.13787841796875, 10.45068359375, 10.76348876953125, 11.0762939453125, 11.38909912109375, 11.701904296875, 12.01470947265625, 12.3275146484375, 12.64031982421875, 12.953125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 10.0, 11.0, 11.0, 21.0, 11.0, 28.0, 43.0, 50.0, 81.0, 134.0, 193.0, 362.0, 588.0, 1349.0, 4062.0, 19563.0, 185063.0, 2816702.0, 1078819.0, 72457.0, 9911.0, 2530.0, 969.0, 488.0, 275.0, 180.0, 108.0, 59.0, 68.0, 41.0, 31.0, 13.0, 15.0, 15.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.875, -14.421630859375, -13.96826171875, -13.514892578125, -13.0615234375, -12.608154296875, -12.15478515625, -11.701416015625, -11.248046875, -10.794677734375, -10.34130859375, -9.887939453125, -9.4345703125, -8.981201171875, -8.52783203125, -8.074462890625, -7.62109375, -7.167724609375, -6.71435546875, -6.260986328125, -5.8076171875, -5.354248046875, -4.90087890625, -4.447509765625, -3.994140625, -3.540771484375, -3.08740234375, -2.634033203125, -2.1806640625, -1.727294921875, -1.27392578125, -0.820556640625, -0.3671875, 0.086181640625, 0.53955078125, 0.992919921875, 1.4462890625, 1.899658203125, 2.35302734375, 2.806396484375, 3.259765625, 3.713134765625, 4.16650390625, 4.619873046875, 5.0732421875, 5.526611328125, 5.97998046875, 6.433349609375, 6.88671875, 7.340087890625, 7.79345703125, 8.246826171875, 8.7001953125, 9.153564453125, 9.60693359375, 10.060302734375, 10.513671875, 10.967041015625, 11.42041015625, 11.873779296875, 12.3271484375, 12.780517578125, 13.23388671875, 13.687255859375, 14.140625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 17.0, 81.0, 200.0, 310.0, 253.0, 111.0, 35.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-97.1061782836914, -94.59596252441406, -92.08575439453125, -89.5755386352539, -87.06532287597656, -84.55510711669922, -82.04489135742188, -79.53468322753906, -77.02446746826172, -74.51425170898438, -72.00404357910156, -69.49382781982422, -66.98361206054688, -64.47339630126953, -61.96318435668945, -59.452972412109375, -56.94275665283203, -54.43254089355469, -51.92232894897461, -49.41211700439453, -46.90190124511719, -44.391685485839844, -41.881473541259766, -39.37126159667969, -36.861045837402344, -34.350830078125, -31.840618133544922, -29.33040428161621, -26.8201904296875, -24.30997657775879, -21.799762725830078, -19.289548873901367, -16.77933120727539, -14.26911735534668, -11.758903503417969, -9.248689651489258, -6.738475799560547, -4.228261947631836, -1.718048095703125, 0.7921657562255859, 3.302379608154297, 5.812593460083008, 8.322807312011719, 10.83302116394043, 13.34323501586914, 15.853448867797852, 18.363662719726562, 20.873876571655273, 23.384090423583984, 25.894304275512695, 28.404518127441406, 30.914731979370117, 33.42494583129883, 35.935157775878906, 38.44537353515625, 40.955589294433594, 43.46580123901367, 45.97601318359375, 48.486228942871094, 50.99644470214844, 53.506656646728516, 56.016868591308594, 58.52708435058594, 61.03730010986328, 63.54751205444336]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 9.0, 12.0, 13.0, 13.0, 16.0, 22.0, 28.0, 24.0, 21.0, 28.0, 16.0, 40.0, 33.0, 36.0, 36.0, 31.0, 32.0, 45.0, 25.0, 37.0, 32.0, 51.0, 32.0, 34.0, 23.0, 28.0, 26.0, 27.0, 21.0, 33.0, 16.0, 23.0, 15.0, 20.0, 19.0, 10.0, 15.0, 10.0, 5.0, 6.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-18.29857635498047, -17.76156234741211, -17.22454833984375, -16.687536239624023, -16.150522232055664, -15.613508224487305, -15.076494216918945, -14.539480209350586, -14.002467155456543, -13.465453147888184, -12.92844009399414, -12.391426086425781, -11.854412078857422, -11.317399024963379, -10.78038501739502, -10.243371963500977, -9.706357955932617, -9.169343948364258, -8.632330894470215, -8.095316886901855, -7.558303356170654, -7.021289825439453, -6.484275817871094, -5.947262287139893, -5.410248756408691, -4.87323522567749, -4.336221694946289, -3.7992076873779297, -3.2621941566467285, -2.7251806259155273, -2.188166856765747, -1.6511530876159668, -1.1141395568847656, -0.5771259069442749, -0.04011225700378418, 0.49690139293670654, 1.0339150428771973, 1.5709285736083984, 2.1079423427581787, 2.644956111907959, 3.18196964263916, 3.7189831733703613, 4.2559967041015625, 4.793010711669922, 5.330024242401123, 5.867037773132324, 6.404051780700684, 6.941065311431885, 7.478078842163086, 8.015092849731445, 8.552105903625488, 9.089119911193848, 9.62613296508789, 10.16314697265625, 10.70016098022461, 11.237174987792969, 11.774188041687012, 12.311202049255371, 12.848215103149414, 13.385229110717773, 13.922243118286133, 14.459256172180176, 14.996270179748535, 15.533283233642578, 16.070297241210938]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 9.0, 6.0, 15.0, 9.0, 16.0, 10.0, 20.0, 19.0, 33.0, 49.0, 50.0, 35.0, 59.0, 54.0, 62.0, 57.0, 49.0, 60.0, 59.0, 68.0, 55.0, 40.0, 35.0, 29.0, 28.0, 20.0, 11.0, 18.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.890625, -2.8162078857421875, -2.741790771484375, -2.6673736572265625, -2.59295654296875, -2.5185394287109375, -2.444122314453125, -2.3697052001953125, -2.2952880859375, -2.2208709716796875, -2.146453857421875, -2.0720367431640625, -1.99761962890625, -1.9232025146484375, -1.848785400390625, -1.7743682861328125, -1.699951171875, -1.6255340576171875, -1.551116943359375, -1.4766998291015625, -1.40228271484375, -1.3278656005859375, -1.253448486328125, -1.1790313720703125, -1.1046142578125, -1.0301971435546875, -0.955780029296875, -0.8813629150390625, -0.80694580078125, -0.7325286865234375, -0.658111572265625, -0.5836944580078125, -0.50927734375, -0.4348602294921875, -0.360443115234375, -0.2860260009765625, -0.21160888671875, -0.1371917724609375, -0.062774658203125, 0.0116424560546875, 0.0860595703125, 0.1604766845703125, 0.234893798828125, 0.3093109130859375, 0.38372802734375, 0.4581451416015625, 0.532562255859375, 0.6069793701171875, 0.681396484375, 0.7558135986328125, 0.830230712890625, 0.9046478271484375, 0.97906494140625, 1.0534820556640625, 1.127899169921875, 1.2023162841796875, 1.2767333984375, 1.3511505126953125, 1.425567626953125, 1.4999847412109375, 1.57440185546875, 1.6488189697265625, 1.723236083984375, 1.7976531982421875, 1.8720703125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 5.0, 10.0, 10.0, 17.0, 14.0, 25.0, 53.0, 62.0, 123.0, 166.0, 323.0, 577.0, 1039.0, 2000.0, 3708.0, 7463.0, 14951.0, 32214.0, 74631.0, 207590.0, 455021.0, 143040.0, 56522.0, 24714.0, 11887.0, 5880.0, 2974.0, 1568.0, 863.0, 452.0, 254.0, 154.0, 89.0, 51.0, 41.0, 21.0, 19.0, 7.0, 4.0, 0.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0191802978515625, -0.01862168312072754, -0.018063068389892578, -0.017504453659057617, -0.016945838928222656, -0.016387224197387695, -0.015828609466552734, -0.015269994735717773, -0.014711380004882812, -0.014152765274047852, -0.01359415054321289, -0.01303553581237793, -0.012476921081542969, -0.011918306350708008, -0.011359691619873047, -0.010801076889038086, -0.010242462158203125, -0.009683847427368164, -0.009125232696533203, -0.008566617965698242, -0.008008003234863281, -0.00744938850402832, -0.006890773773193359, -0.0063321590423583984, -0.0057735443115234375, -0.0052149295806884766, -0.004656314849853516, -0.004097700119018555, -0.0035390853881835938, -0.002980470657348633, -0.002421855926513672, -0.001863241195678711, -0.00130462646484375, -0.0007460117340087891, -0.00018739700317382812, 0.0003712177276611328, 0.0009298324584960938, 0.0014884471893310547, 0.0020470619201660156, 0.0026056766510009766, 0.0031642913818359375, 0.0037229061126708984, 0.004281520843505859, 0.00484013557434082, 0.005398750305175781, 0.005957365036010742, 0.006515979766845703, 0.007074594497680664, 0.007633209228515625, 0.008191823959350586, 0.008750438690185547, 0.009309053421020508, 0.009867668151855469, 0.01042628288269043, 0.01098489761352539, 0.011543512344360352, 0.012102127075195312, 0.012660741806030273, 0.013219356536865234, 0.013777971267700195, 0.014336585998535156, 0.014895200729370117, 0.015453815460205078, 0.01601243019104004, 0.016571044921875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 8.0, 12.0, 8.0, 16.0, 17.0, 17.0, 13.0, 29.0, 31.0, 35.0, 22.0, 36.0, 32.0, 49.0, 35.0, 48.0, 37.0, 1074.0, 40.0, 40.0, 24.0, 29.0, 36.0, 43.0, 35.0, 30.0, 25.0, 32.0, 25.0, 33.0, 15.0, 16.0, 11.0, 16.0, 18.0, 13.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0726318359375, -1.036865234375, -1.0010986328125, -0.96533203125, -0.9295654296875, -0.893798828125, -0.8580322265625, -0.822265625, -0.7864990234375, -0.750732421875, -0.7149658203125, -0.67919921875, -0.6434326171875, -0.607666015625, -0.5718994140625, -0.5361328125, -0.5003662109375, -0.464599609375, -0.4288330078125, -0.39306640625, -0.3572998046875, -0.321533203125, -0.2857666015625, -0.25, -0.2142333984375, -0.178466796875, -0.1427001953125, -0.10693359375, -0.0711669921875, -0.035400390625, 0.0003662109375, 0.0361328125, 0.0718994140625, 0.107666015625, 0.1434326171875, 0.17919921875, 0.2149658203125, 0.250732421875, 0.2864990234375, 0.322265625, 0.3580322265625, 0.393798828125, 0.4295654296875, 0.46533203125, 0.5010986328125, 0.536865234375, 0.5726318359375, 0.6083984375, 0.6441650390625, 0.679931640625, 0.7156982421875, 0.75146484375, 0.7872314453125, 0.822998046875, 0.8587646484375, 0.89453125, 0.9302978515625, 0.966064453125, 1.0018310546875, 1.03759765625, 1.0733642578125, 1.109130859375, 1.1448974609375, 1.1806640625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 11.0, 6.0, 17.0, 43.0, 56.0, 77.0, 119.0, 161.0, 277.0, 436.0, 619.0, 920.0, 1553.0, 2396.0, 3613.0, 5795.0, 9418.0, 14640.0, 23853.0, 38674.0, 64669.0, 112999.0, 1301692.0, 243799.0, 109072.0, 62191.0, 37528.0, 23214.0, 14306.0, 9020.0, 5639.0, 3678.0, 2279.0, 1493.0, 1033.0, 623.0, 366.0, 260.0, 194.0, 142.0, 70.0, 59.0, 30.0, 29.0, 25.0, 11.0, 14.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.006916046142578125, -0.006706297397613525, -0.006496548652648926, -0.006286799907684326, -0.0060770511627197266, -0.005867302417755127, -0.005657553672790527, -0.005447804927825928, -0.005238056182861328, -0.0050283074378967285, -0.004818558692932129, -0.004608809947967529, -0.00439906120300293, -0.00418931245803833, -0.0039795637130737305, -0.003769814968109131, -0.0035600662231445312, -0.0033503174781799316, -0.003140568733215332, -0.0029308199882507324, -0.002721071243286133, -0.002511322498321533, -0.0023015737533569336, -0.002091825008392334, -0.0018820762634277344, -0.0016723275184631348, -0.0014625787734985352, -0.0012528300285339355, -0.001043081283569336, -0.0008333325386047363, -0.0006235837936401367, -0.0004138350486755371, -0.0002040863037109375, 5.662441253662109e-06, 0.00021541118621826172, 0.00042515993118286133, 0.0006349086761474609, 0.0008446574211120605, 0.0010544061660766602, 0.0012641549110412598, 0.0014739036560058594, 0.001683652400970459, 0.0018934011459350586, 0.002103149890899658, 0.002312898635864258, 0.0025226473808288574, 0.002732396125793457, 0.0029421448707580566, 0.0031518936157226562, 0.003361642360687256, 0.0035713911056518555, 0.003781139850616455, 0.003990888595581055, 0.004200637340545654, 0.004410386085510254, 0.0046201348304748535, 0.004829883575439453, 0.005039632320404053, 0.005249381065368652, 0.005459129810333252, 0.0056688785552978516, 0.005878627300262451, 0.006088376045227051, 0.00629812479019165, 0.00650787353515625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 998.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [18.0, 0.0, 8.0, 0.0, 0.0, 11.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 52.0, 0.0, 755.0, 0.0, 0.0, 5962.0, 0.0, 0.0, 1034942.0, 0.0, 5984.0, 0.0, 0.0, 715.0, 0.0, 0.0, 59.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 10.0, 0.0, 16.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 9.0, 6.0, 15.0, 9.0, 16.0, 10.0, 20.0, 19.0, 33.0, 49.0, 50.0, 35.0, 59.0, 54.0, 62.0, 57.0, 49.0, 60.0, 59.0, 68.0, 55.0, 40.0, 35.0, 29.0, 28.0, 20.0, 11.0, 18.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.890625, -2.8162078857421875, -2.741790771484375, -2.6673736572265625, -2.59295654296875, -2.5185394287109375, -2.444122314453125, -2.3697052001953125, -2.2952880859375, -2.2208709716796875, -2.146453857421875, -2.0720367431640625, -1.99761962890625, -1.9232025146484375, -1.848785400390625, -1.7743682861328125, -1.699951171875, -1.6255340576171875, -1.551116943359375, -1.4766998291015625, -1.40228271484375, -1.3278656005859375, -1.253448486328125, -1.1790313720703125, -1.1046142578125, -1.0301971435546875, -0.955780029296875, -0.8813629150390625, -0.80694580078125, -0.7325286865234375, -0.658111572265625, -0.5836944580078125, -0.50927734375, -0.4348602294921875, -0.360443115234375, -0.2860260009765625, -0.21160888671875, -0.1371917724609375, -0.062774658203125, 0.0116424560546875, 0.0860595703125, 0.1604766845703125, 0.234893798828125, 0.3093109130859375, 0.38372802734375, 0.4581451416015625, 0.532562255859375, 0.6069793701171875, 0.681396484375, 0.7558135986328125, 0.830230712890625, 0.9046478271484375, 0.97906494140625, 1.0534820556640625, 1.127899169921875, 1.2023162841796875, 1.2767333984375, 1.3511505126953125, 1.425567626953125, 1.4999847412109375, 1.57440185546875, 1.6488189697265625, 1.723236083984375, 1.7976531982421875, 1.8720703125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 16.0, 10.0, 28.0, 36.0, 100.0, 177.0, 346.0, 775.0, 1841.0, 4521.0, 11392.0, 30568.0, 105352.0, 713714.0, 124879.0, 33631.0, 12617.0, 4897.0, 1970.0, 868.0, 400.0, 178.0, 88.0, 72.0, 25.0, 11.0, 8.0, 8.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.85546875, -2.761993408203125, -2.66851806640625, -2.575042724609375, -2.4815673828125, -2.388092041015625, -2.29461669921875, -2.201141357421875, -2.107666015625, -2.014190673828125, -1.92071533203125, -1.827239990234375, -1.7337646484375, -1.640289306640625, -1.54681396484375, -1.453338623046875, -1.35986328125, -1.266387939453125, -1.17291259765625, -1.079437255859375, -0.9859619140625, -0.892486572265625, -0.79901123046875, -0.705535888671875, -0.612060546875, -0.518585205078125, -0.42510986328125, -0.331634521484375, -0.2381591796875, -0.144683837890625, -0.05120849609375, 0.042266845703125, 0.1357421875, 0.229217529296875, 0.32269287109375, 0.416168212890625, 0.5096435546875, 0.603118896484375, 0.69659423828125, 0.790069580078125, 0.883544921875, 0.977020263671875, 1.07049560546875, 1.163970947265625, 1.2574462890625, 1.350921630859375, 1.44439697265625, 1.537872314453125, 1.63134765625, 1.724822998046875, 1.81829833984375, 1.911773681640625, 2.0052490234375, 2.098724365234375, 2.19219970703125, 2.285675048828125, 2.379150390625, 2.472625732421875, 2.56610107421875, 2.659576416015625, 2.7530517578125, 2.846527099609375, 2.94000244140625, 3.033477783203125, 3.126953125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 4.0, 9.0, 14.0, 15.0, 17.0, 13.0, 19.0, 21.0, 20.0, 19.0, 27.0, 38.0, 34.0, 33.0, 41.0, 53.0, 74.0, 110.0, 1700.0, 242.0, 102.0, 40.0, 33.0, 32.0, 43.0, 37.0, 38.0, 24.0, 26.0, 22.0, 26.0, 10.0, 15.0, 10.0, 15.0, 7.0, 9.0, 5.0, 5.0, 5.0, 2.0, 7.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.625, -5.44256591796875, -5.2601318359375, -5.07769775390625, -4.895263671875, -4.71282958984375, -4.5303955078125, -4.34796142578125, -4.16552734375, -3.98309326171875, -3.8006591796875, -3.61822509765625, -3.435791015625, -3.25335693359375, -3.0709228515625, -2.88848876953125, -2.7060546875, -2.52362060546875, -2.3411865234375, -2.15875244140625, -1.976318359375, -1.79388427734375, -1.6114501953125, -1.42901611328125, -1.24658203125, -1.06414794921875, -0.8817138671875, -0.69927978515625, -0.516845703125, -0.33441162109375, -0.1519775390625, 0.03045654296875, 0.212890625, 0.39532470703125, 0.5777587890625, 0.76019287109375, 0.942626953125, 1.12506103515625, 1.3074951171875, 1.48992919921875, 1.67236328125, 1.85479736328125, 2.0372314453125, 2.21966552734375, 2.402099609375, 2.58453369140625, 2.7669677734375, 2.94940185546875, 3.1318359375, 3.31427001953125, 3.4967041015625, 3.67913818359375, 3.861572265625, 4.04400634765625, 4.2264404296875, 4.40887451171875, 4.59130859375, 4.77374267578125, 4.9561767578125, 5.13861083984375, 5.321044921875, 5.50347900390625, 5.6859130859375, 5.86834716796875, 6.05078125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 9.0, 7.0, 7.0, 12.0, 13.0, 19.0, 14.0, 21.0, 35.0, 29.0, 39.0, 72.0, 96.0, 138.0, 239.0, 466.0, 1604.0, 11384.0, 415481.0, 2689898.0, 22125.0, 2522.0, 599.0, 297.0, 143.0, 103.0, 68.0, 58.0, 29.0, 26.0, 19.0, 24.0, 14.0, 16.0, 15.0, 10.0, 10.0, 6.0, 4.0, 4.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.1875, -9.8800048828125, -9.572509765625, -9.2650146484375, -8.95751953125, -8.6500244140625, -8.342529296875, -8.0350341796875, -7.7275390625, -7.4200439453125, -7.112548828125, -6.8050537109375, -6.49755859375, -6.1900634765625, -5.882568359375, -5.5750732421875, -5.267578125, -4.9600830078125, -4.652587890625, -4.3450927734375, -4.03759765625, -3.7301025390625, -3.422607421875, -3.1151123046875, -2.8076171875, -2.5001220703125, -2.192626953125, -1.8851318359375, -1.57763671875, -1.2701416015625, -0.962646484375, -0.6551513671875, -0.34765625, -0.0401611328125, 0.267333984375, 0.5748291015625, 0.88232421875, 1.1898193359375, 1.497314453125, 1.8048095703125, 2.1123046875, 2.4197998046875, 2.727294921875, 3.0347900390625, 3.34228515625, 3.6497802734375, 3.957275390625, 4.2647705078125, 4.572265625, 4.8797607421875, 5.187255859375, 5.4947509765625, 5.80224609375, 6.1097412109375, 6.417236328125, 6.7247314453125, 7.0322265625, 7.3397216796875, 7.647216796875, 7.9547119140625, 8.26220703125, 8.5697021484375, 8.877197265625, 9.1846923828125, 9.4921875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 24.0, 83.0, 151.0, 265.0, 219.0, 160.0, 79.0, 22.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9689764976501465, -4.418506622314453, -3.868037223815918, -3.3175673484802246, -2.7670977115631104, -2.216628074645996, -1.6661581993103027, -1.1156885623931885, -0.5652189254760742, -0.014749228954315186, 0.5357204675674438, 1.0861902236938477, 1.636659860610962, 2.187129497528076, 2.7375993728637695, 3.288069009780884, 3.838538646697998, 4.389008522033691, 4.939477920532227, 5.48994779586792, 6.040417671203613, 6.590887069702148, 7.141356945037842, 7.691826820373535, 8.24229621887207, 8.792765617370605, 9.343235969543457, 9.893705368041992, 10.444174766540527, 10.994644165039062, 11.545114517211914, 12.09558391571045, 12.646055221557617, 13.196524620056152, 13.746994972229004, 14.297464370727539, 14.847933769226074, 15.39840316772461, 15.948873519897461, 16.499343872070312, 17.04981231689453, 17.600282669067383, 18.1507511138916, 18.701221466064453, 19.251691818237305, 19.802160263061523, 20.352630615234375, 20.903100967407227, 21.453571319580078, 22.00404167175293, 22.55451011657715, 23.10498046875, 23.65545082092285, 24.20591926574707, 24.756389617919922, 25.306859970092773, 25.857328414916992, 26.407798767089844, 26.958267211914062, 27.508737564086914, 28.059207916259766, 28.609676361083984, 29.160146713256836, 29.710617065429688, 30.261085510253906]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 1.0, 4.0, 5.0, 11.0, 7.0, 14.0, 25.0, 19.0, 16.0, 18.0, 22.0, 28.0, 44.0, 32.0, 36.0, 37.0, 36.0, 51.0, 33.0, 39.0, 43.0, 36.0, 44.0, 36.0, 45.0, 40.0, 26.0, 26.0, 28.0, 33.0, 26.0, 16.0, 19.0, 13.0, 24.0, 15.0, 14.0, 7.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.887758255004883, -18.264698028564453, -17.641637802124023, -17.018577575683594, -16.395517349243164, -15.772457122802734, -15.149397850036621, -14.526337623596191, -13.903277397155762, -13.280217170715332, -12.657156944274902, -12.034096717834473, -11.41103744506836, -10.78797721862793, -10.1649169921875, -9.54185676574707, -8.91879653930664, -8.295736312866211, -7.672676086425781, -7.04961633682251, -6.42655611038208, -5.80349588394165, -5.180436134338379, -4.557375907897949, -3.9343156814575195, -3.31125545501709, -2.6881954669952393, -2.0651354789733887, -1.442075252532959, -0.8190150260925293, -0.1959550380706787, 0.4271049499511719, 1.0501651763916016, 1.6732252836227417, 2.296285390853882, 2.9193453788757324, 3.542405605316162, 4.165465831756592, 4.788525581359863, 5.411585807800293, 6.034646034240723, 6.657706260681152, 7.280766487121582, 7.9038262367248535, 8.526885986328125, 9.149946212768555, 9.773006439208984, 10.396066665649414, 11.019126892089844, 11.642187118530273, 12.265247344970703, 12.888307571411133, 13.511367797851562, 14.134428024291992, 14.757487297058105, 15.380547523498535, 16.00360870361328, 16.62666893005371, 17.24972915649414, 17.87278938293457, 18.495849609375, 19.11890983581543, 19.74197006225586, 20.365028381347656, 20.988088607788086]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 13.0, 10.0, 17.0, 10.0, 13.0, 20.0, 31.0, 37.0, 55.0, 37.0, 56.0, 56.0, 51.0, 68.0, 43.0, 49.0, 67.0, 66.0, 52.0, 51.0, 38.0, 33.0, 26.0, 24.0, 16.0, 15.0, 13.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.875, -2.7997589111328125, -2.724517822265625, -2.6492767333984375, -2.57403564453125, -2.4987945556640625, -2.423553466796875, -2.3483123779296875, -2.2730712890625, -2.1978302001953125, -2.122589111328125, -2.0473480224609375, -1.97210693359375, -1.8968658447265625, -1.821624755859375, -1.7463836669921875, -1.671142578125, -1.5959014892578125, -1.520660400390625, -1.4454193115234375, -1.37017822265625, -1.2949371337890625, -1.219696044921875, -1.1444549560546875, -1.0692138671875, -0.9939727783203125, -0.918731689453125, -0.8434906005859375, -0.76824951171875, -0.6930084228515625, -0.617767333984375, -0.5425262451171875, -0.46728515625, -0.3920440673828125, -0.316802978515625, -0.2415618896484375, -0.16632080078125, -0.0910797119140625, -0.015838623046875, 0.0594024658203125, 0.1346435546875, 0.2098846435546875, 0.285125732421875, 0.3603668212890625, 0.43560791015625, 0.5108489990234375, 0.586090087890625, 0.6613311767578125, 0.736572265625, 0.8118133544921875, 0.887054443359375, 0.9622955322265625, 1.03753662109375, 1.1127777099609375, 1.188018798828125, 1.2632598876953125, 1.3385009765625, 1.4137420654296875, 1.488983154296875, 1.5642242431640625, 1.63946533203125, 1.7147064208984375, 1.789947509765625, 1.8651885986328125, 1.9404296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 10.0, 19.0, 16.0, 15.0, 20.0, 20.0, 26.0, 40.0, 46.0, 74.0, 105.0, 252.0, 576.0, 1598.0, 7556.0, 51914.0, 676609.0, 3194326.0, 230616.0, 24316.0, 4151.0, 1070.0, 376.0, 150.0, 93.0, 86.0, 45.0, 32.0, 29.0, 26.0, 10.0, 16.0, 8.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0078125, -9.7161865234375, -9.424560546875, -9.1329345703125, -8.84130859375, -8.5496826171875, -8.258056640625, -7.9664306640625, -7.6748046875, -7.3831787109375, -7.091552734375, -6.7999267578125, -6.50830078125, -6.2166748046875, -5.925048828125, -5.6334228515625, -5.341796875, -5.0501708984375, -4.758544921875, -4.4669189453125, -4.17529296875, -3.8836669921875, -3.592041015625, -3.3004150390625, -3.0087890625, -2.7171630859375, -2.425537109375, -2.1339111328125, -1.84228515625, -1.5506591796875, -1.259033203125, -0.9674072265625, -0.67578125, -0.3841552734375, -0.092529296875, 0.1990966796875, 0.49072265625, 0.7823486328125, 1.073974609375, 1.3656005859375, 1.6572265625, 1.9488525390625, 2.240478515625, 2.5321044921875, 2.82373046875, 3.1153564453125, 3.406982421875, 3.6986083984375, 3.990234375, 4.2818603515625, 4.573486328125, 4.8651123046875, 5.15673828125, 5.4483642578125, 5.739990234375, 6.0316162109375, 6.3232421875, 6.6148681640625, 6.906494140625, 7.1981201171875, 7.48974609375, 7.7813720703125, 8.072998046875, 8.3646240234375, 8.65625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 8.0, 16.0, 32.0, 55.0, 103.0, 163.0, 292.0, 510.0, 844.0, 840.0, 520.0, 317.0, 171.0, 96.0, 49.0, 24.0, 10.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.375, -16.03363037109375, -15.6922607421875, -15.35089111328125, -15.009521484375, -14.66815185546875, -14.3267822265625, -13.98541259765625, -13.64404296875, -13.30267333984375, -12.9613037109375, -12.61993408203125, -12.278564453125, -11.93719482421875, -11.5958251953125, -11.25445556640625, -10.9130859375, -10.57171630859375, -10.2303466796875, -9.88897705078125, -9.547607421875, -9.20623779296875, -8.8648681640625, -8.52349853515625, -8.18212890625, -7.84075927734375, -7.4993896484375, -7.15802001953125, -6.816650390625, -6.47528076171875, -6.1339111328125, -5.79254150390625, -5.451171875, -5.10980224609375, -4.7684326171875, -4.42706298828125, -4.085693359375, -3.74432373046875, -3.4029541015625, -3.06158447265625, -2.72021484375, -2.37884521484375, -2.0374755859375, -1.69610595703125, -1.354736328125, -1.01336669921875, -0.6719970703125, -0.33062744140625, 0.0107421875, 0.35211181640625, 0.6934814453125, 1.03485107421875, 1.376220703125, 1.71759033203125, 2.0589599609375, 2.40032958984375, 2.74169921875, 3.08306884765625, 3.4244384765625, 3.76580810546875, 4.107177734375, 4.44854736328125, 4.7899169921875, 5.13128662109375, 5.47265625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 13.0, 12.0, 11.0, 25.0, 31.0, 58.0, 112.0, 146.0, 365.0, 880.0, 3783.0, 57427.0, 3360730.0, 751169.0, 16427.0, 1913.0, 551.0, 230.0, 141.0, 86.0, 32.0, 38.0, 35.0, 20.0, 13.0, 8.0, 6.0, 1.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.563232421875, -15.76708984375, -14.970947265625, -14.1748046875, -13.378662109375, -12.58251953125, -11.786376953125, -10.990234375, -10.194091796875, -9.39794921875, -8.601806640625, -7.8056640625, -7.009521484375, -6.21337890625, -5.417236328125, -4.62109375, -3.824951171875, -3.02880859375, -2.232666015625, -1.4365234375, -0.640380859375, 0.15576171875, 0.951904296875, 1.748046875, 2.544189453125, 3.34033203125, 4.136474609375, 4.9326171875, 5.728759765625, 6.52490234375, 7.321044921875, 8.1171875, 8.913330078125, 9.70947265625, 10.505615234375, 11.3017578125, 12.097900390625, 12.89404296875, 13.690185546875, 14.486328125, 15.282470703125, 16.07861328125, 16.874755859375, 17.6708984375, 18.467041015625, 19.26318359375, 20.059326171875, 20.85546875, 21.651611328125, 22.44775390625, 23.243896484375, 24.0400390625, 24.836181640625, 25.63232421875, 26.428466796875, 27.224609375, 28.020751953125, 28.81689453125, 29.613037109375, 30.4091796875, 31.205322265625, 32.00146484375, 32.797607421875, 33.59375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 17.0, 25.0, 43.0, 61.0, 104.0, 152.0, 153.0, 141.0, 121.0, 83.0, 56.0, 22.0, 12.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.122764587402344, -60.66960525512695, -59.21644592285156, -57.763282775878906, -56.310123443603516, -54.856964111328125, -53.403804779052734, -51.950645446777344, -50.49748611450195, -49.04432678222656, -47.59116744995117, -46.13800811767578, -44.684844970703125, -43.231685638427734, -41.778526306152344, -40.32536697387695, -38.87220764160156, -37.41904830932617, -35.96588897705078, -34.512725830078125, -33.059566497802734, -31.606407165527344, -30.153247833251953, -28.700088500976562, -27.246925354003906, -25.793766021728516, -24.340604782104492, -22.8874454498291, -21.43428611755371, -19.981124877929688, -18.527965545654297, -17.074806213378906, -15.621644973754883, -14.168484687805176, -12.715325355529785, -11.262165069580078, -9.809005737304688, -8.35584545135498, -6.902685165405273, -5.449525833129883, -3.996365547180176, -2.543205738067627, -1.090045690536499, 0.3631143569946289, 1.8162741661071777, 3.2694339752197266, 4.722594261169434, 6.175753593444824, 7.628913879394531, 9.082074165344238, 10.535233497619629, 11.988393783569336, 13.441553115844727, 14.894713401794434, 16.34787368774414, 17.80103302001953, 19.254192352294922, 20.707351684570312, 22.160512924194336, 23.613672256469727, 25.066831588745117, 26.51999282836914, 27.97315216064453, 29.426311492919922, 30.879472732543945]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 4.0, 8.0, 9.0, 13.0, 10.0, 13.0, 11.0, 15.0, 21.0, 23.0, 24.0, 18.0, 44.0, 32.0, 35.0, 42.0, 39.0, 42.0, 43.0, 39.0, 51.0, 41.0, 51.0, 44.0, 44.0, 27.0, 42.0, 37.0, 26.0, 24.0, 30.0, 22.0, 18.0, 15.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.445066452026367, -20.74574089050293, -20.046417236328125, -19.347091674804688, -18.64776611328125, -17.948440551757812, -17.249114990234375, -16.54979133605957, -15.850465774536133, -15.151140213012695, -14.451815605163574, -13.752490997314453, -13.053165435791016, -12.353839874267578, -11.654515266418457, -10.955190658569336, -10.255865097045898, -9.556539535522461, -8.85721492767334, -8.157890319824219, -7.458564758300781, -6.759239673614502, -6.059914588928223, -5.360589504241943, -4.661264419555664, -3.9619393348693848, -3.2626142501831055, -2.563289165496826, -1.8639640808105469, -1.1646389961242676, -0.4653139114379883, 0.23401117324829102, 0.9333343505859375, 1.6326594352722168, 2.331984519958496, 3.0313096046447754, 3.7306346893310547, 4.429959774017334, 5.129284858703613, 5.828609943389893, 6.527935028076172, 7.227260112762451, 7.9265851974487305, 8.625909805297852, 9.325235366821289, 10.024560928344727, 10.723885536193848, 11.423210144042969, 12.122535705566406, 12.821861267089844, 13.521185874938965, 14.220510482788086, 14.919836044311523, 15.619161605834961, 16.318485260009766, 17.017810821533203, 17.71713638305664, 18.416461944580078, 19.115787506103516, 19.81511116027832, 20.514436721801758, 21.213762283325195, 21.9130859375, 22.612411499023438, 23.311737060546875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 9.0, 9.0, 16.0, 7.0, 14.0, 11.0, 18.0, 16.0, 32.0, 41.0, 38.0, 41.0, 46.0, 45.0, 55.0, 47.0, 56.0, 54.0, 55.0, 52.0, 51.0, 62.0, 31.0, 31.0, 35.0, 26.0, 22.0, 24.0, 12.0, 11.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.71875, -2.64459228515625, -2.5704345703125, -2.49627685546875, -2.422119140625, -2.34796142578125, -2.2738037109375, -2.19964599609375, -2.12548828125, -2.05133056640625, -1.9771728515625, -1.90301513671875, -1.828857421875, -1.75469970703125, -1.6805419921875, -1.60638427734375, -1.5322265625, -1.45806884765625, -1.3839111328125, -1.30975341796875, -1.235595703125, -1.16143798828125, -1.0872802734375, -1.01312255859375, -0.93896484375, -0.86480712890625, -0.7906494140625, -0.71649169921875, -0.642333984375, -0.56817626953125, -0.4940185546875, -0.41986083984375, -0.345703125, -0.27154541015625, -0.1973876953125, -0.12322998046875, -0.049072265625, 0.02508544921875, 0.0992431640625, 0.17340087890625, 0.24755859375, 0.32171630859375, 0.3958740234375, 0.47003173828125, 0.544189453125, 0.61834716796875, 0.6925048828125, 0.76666259765625, 0.8408203125, 0.91497802734375, 0.9891357421875, 1.06329345703125, 1.137451171875, 1.21160888671875, 1.2857666015625, 1.35992431640625, 1.43408203125, 1.50823974609375, 1.5823974609375, 1.65655517578125, 1.730712890625, 1.80487060546875, 1.8790283203125, 1.95318603515625, 2.02734375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 3.0, 14.0, 18.0, 27.0, 38.0, 53.0, 101.0, 151.0, 239.0, 395.0, 606.0, 997.0, 1559.0, 2846.0, 4639.0, 8287.0, 14334.0, 25620.0, 49873.0, 103556.0, 307771.0, 311669.0, 105086.0, 49890.0, 26517.0, 14373.0, 8109.0, 4662.0, 2787.0, 1647.0, 1029.0, 641.0, 379.0, 240.0, 139.0, 68.0, 57.0, 42.0, 25.0, 15.0, 14.0, 12.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0162353515625, -0.01575791835784912, -0.015280485153198242, -0.014803051948547363, -0.014325618743896484, -0.013848185539245605, -0.013370752334594727, -0.012893319129943848, -0.012415885925292969, -0.01193845272064209, -0.011461019515991211, -0.010983586311340332, -0.010506153106689453, -0.010028719902038574, -0.009551286697387695, -0.009073853492736816, -0.008596420288085938, -0.008118987083435059, -0.00764155387878418, -0.007164120674133301, -0.006686687469482422, -0.006209254264831543, -0.005731821060180664, -0.005254387855529785, -0.004776954650878906, -0.004299521446228027, -0.0038220882415771484, -0.0033446550369262695, -0.0028672218322753906, -0.0023897886276245117, -0.0019123554229736328, -0.001434922218322754, -0.000957489013671875, -0.0004800558090209961, -2.6226043701171875e-06, 0.0004748106002807617, 0.0009522438049316406, 0.0014296770095825195, 0.0019071102142333984, 0.0023845434188842773, 0.0028619766235351562, 0.003339409828186035, 0.003816843032836914, 0.004294276237487793, 0.004771709442138672, 0.005249142646789551, 0.00572657585144043, 0.006204009056091309, 0.0066814422607421875, 0.007158875465393066, 0.007636308670043945, 0.008113741874694824, 0.008591175079345703, 0.009068608283996582, 0.009546041488647461, 0.01002347469329834, 0.010500907897949219, 0.010978341102600098, 0.011455774307250977, 0.011933207511901855, 0.012410640716552734, 0.012888073921203613, 0.013365507125854492, 0.013842940330505371, 0.01432037353515625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 6.0, 5.0, 6.0, 5.0, 9.0, 13.0, 11.0, 15.0, 12.0, 13.0, 15.0, 17.0, 20.0, 26.0, 31.0, 41.0, 39.0, 46.0, 34.0, 44.0, 49.0, 1063.0, 45.0, 31.0, 34.0, 40.0, 42.0, 39.0, 38.0, 26.0, 33.0, 28.0, 18.0, 22.0, 21.0, 22.0, 11.0, 13.0, 6.0, 6.0, 6.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.1953125, -1.1561279296875, -1.116943359375, -1.0777587890625, -1.03857421875, -0.9993896484375, -0.960205078125, -0.9210205078125, -0.8818359375, -0.8426513671875, -0.803466796875, -0.7642822265625, -0.72509765625, -0.6859130859375, -0.646728515625, -0.6075439453125, -0.568359375, -0.5291748046875, -0.489990234375, -0.4508056640625, -0.41162109375, -0.3724365234375, -0.333251953125, -0.2940673828125, -0.2548828125, -0.2156982421875, -0.176513671875, -0.1373291015625, -0.09814453125, -0.0589599609375, -0.019775390625, 0.0194091796875, 0.05859375, 0.0977783203125, 0.136962890625, 0.1761474609375, 0.21533203125, 0.2545166015625, 0.293701171875, 0.3328857421875, 0.3720703125, 0.4112548828125, 0.450439453125, 0.4896240234375, 0.52880859375, 0.5679931640625, 0.607177734375, 0.6463623046875, 0.685546875, 0.7247314453125, 0.763916015625, 0.8031005859375, 0.84228515625, 0.8814697265625, 0.920654296875, 0.9598388671875, 0.9990234375, 1.0382080078125, 1.077392578125, 1.1165771484375, 1.15576171875, 1.1949462890625, 1.234130859375, 1.2733154296875, 1.3125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 7.0, 21.0, 17.0, 40.0, 74.0, 76.0, 111.0, 167.0, 271.0, 447.0, 559.0, 810.0, 1207.0, 1854.0, 2759.0, 4100.0, 6238.0, 9679.0, 15103.0, 23859.0, 39471.0, 67743.0, 127778.0, 1339385.0, 214543.0, 97302.0, 54112.0, 32442.0, 19700.0, 12684.0, 8306.0, 5345.0, 3605.0, 2449.0, 1552.0, 1084.0, 757.0, 466.0, 328.0, 231.0, 129.0, 95.0, 68.0, 45.0, 34.0, 25.0, 20.0, 11.0, 6.0, 5.0, 3.0, 1.0, 5.0, 2.0], "bins": [-0.00792694091796875, -0.007692456245422363, -0.0074579715728759766, -0.00722348690032959, -0.006989002227783203, -0.006754517555236816, -0.00652003288269043, -0.006285548210144043, -0.006051063537597656, -0.0058165788650512695, -0.005582094192504883, -0.005347609519958496, -0.005113124847412109, -0.004878640174865723, -0.004644155502319336, -0.004409670829772949, -0.0041751861572265625, -0.003940701484680176, -0.003706216812133789, -0.0034717321395874023, -0.0032372474670410156, -0.003002762794494629, -0.002768278121948242, -0.0025337934494018555, -0.0022993087768554688, -0.002064824104309082, -0.0018303394317626953, -0.0015958547592163086, -0.0013613700866699219, -0.0011268854141235352, -0.0008924007415771484, -0.0006579160690307617, -0.000423431396484375, -0.00018894672393798828, 4.553794860839844e-05, 0.00028002262115478516, 0.0005145072937011719, 0.0007489919662475586, 0.0009834766387939453, 0.001217961311340332, 0.0014524459838867188, 0.0016869306564331055, 0.0019214153289794922, 0.002155900001525879, 0.0023903846740722656, 0.0026248693466186523, 0.002859354019165039, 0.0030938386917114258, 0.0033283233642578125, 0.0035628080368041992, 0.003797292709350586, 0.004031777381896973, 0.004266262054443359, 0.004500746726989746, 0.004735231399536133, 0.0049697160720825195, 0.005204200744628906, 0.005438685417175293, 0.00567317008972168, 0.005907654762268066, 0.006142139434814453, 0.00637662410736084, 0.0066111087799072266, 0.006845593452453613, 0.007080078125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1000.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [9.0, 0.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 20.0, 0.0, 0.0, 61.0, 0.0, 960.0, 0.0, 0.0, 5984.0, 0.0, 0.0, 1034427.0, 0.0, 6024.0, 0.0, 0.0, 944.0, 0.0, 0.0, 55.0, 0.0, 17.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 5.0, 0.0, 4.0], "bins": [-7.152557373046875e-07, -6.92903995513916e-07, -6.705522537231445e-07, -6.48200511932373e-07, -6.258487701416016e-07, -6.034970283508301e-07, -5.811452865600586e-07, -5.587935447692871e-07, -5.364418029785156e-07, -5.140900611877441e-07, -4.917383193969727e-07, -4.6938657760620117e-07, -4.470348358154297e-07, -4.246830940246582e-07, -4.023313522338867e-07, -3.7997961044311523e-07, -3.5762786865234375e-07, -3.3527612686157227e-07, -3.129243850708008e-07, -2.905726432800293e-07, -2.682209014892578e-07, -2.4586915969848633e-07, -2.2351741790771484e-07, -2.0116567611694336e-07, -1.7881393432617188e-07, -1.564621925354004e-07, -1.341104507446289e-07, -1.1175870895385742e-07, -8.940696716308594e-08, -6.705522537231445e-08, -4.470348358154297e-08, -2.2351741790771484e-08, 0.0, 2.2351741790771484e-08, 4.470348358154297e-08, 6.705522537231445e-08, 8.940696716308594e-08, 1.1175870895385742e-07, 1.341104507446289e-07, 1.564621925354004e-07, 1.7881393432617188e-07, 2.0116567611694336e-07, 2.2351741790771484e-07, 2.4586915969848633e-07, 2.682209014892578e-07, 2.905726432800293e-07, 3.129243850708008e-07, 3.3527612686157227e-07, 3.5762786865234375e-07, 3.7997961044311523e-07, 4.023313522338867e-07, 4.246830940246582e-07, 4.470348358154297e-07, 4.6938657760620117e-07, 4.917383193969727e-07, 5.140900611877441e-07, 5.364418029785156e-07, 5.587935447692871e-07, 5.811452865600586e-07, 6.034970283508301e-07, 6.258487701416016e-07, 6.48200511932373e-07, 6.705522537231445e-07, 6.92903995513916e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 9.0, 9.0, 16.0, 7.0, 14.0, 11.0, 18.0, 16.0, 32.0, 41.0, 38.0, 41.0, 46.0, 45.0, 55.0, 47.0, 56.0, 54.0, 55.0, 52.0, 51.0, 62.0, 31.0, 31.0, 35.0, 26.0, 22.0, 24.0, 12.0, 11.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.71875, -2.64459228515625, -2.5704345703125, -2.49627685546875, -2.422119140625, -2.34796142578125, -2.2738037109375, -2.19964599609375, -2.12548828125, -2.05133056640625, -1.9771728515625, -1.90301513671875, -1.828857421875, -1.75469970703125, -1.6805419921875, -1.60638427734375, -1.5322265625, -1.45806884765625, -1.3839111328125, -1.30975341796875, -1.235595703125, -1.16143798828125, -1.0872802734375, -1.01312255859375, -0.93896484375, -0.86480712890625, -0.7906494140625, -0.71649169921875, -0.642333984375, -0.56817626953125, -0.4940185546875, -0.41986083984375, -0.345703125, -0.27154541015625, -0.1973876953125, -0.12322998046875, -0.049072265625, 0.02508544921875, 0.0992431640625, 0.17340087890625, 0.24755859375, 0.32171630859375, 0.3958740234375, 0.47003173828125, 0.544189453125, 0.61834716796875, 0.6925048828125, 0.76666259765625, 0.8408203125, 0.91497802734375, 0.9891357421875, 1.06329345703125, 1.137451171875, 1.21160888671875, 1.2857666015625, 1.35992431640625, 1.43408203125, 1.50823974609375, 1.5823974609375, 1.65655517578125, 1.730712890625, 1.80487060546875, 1.8790283203125, 1.95318603515625, 2.02734375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 10.0, 8.0, 23.0, 19.0, 36.0, 60.0, 60.0, 115.0, 161.0, 254.0, 363.0, 587.0, 950.0, 1584.0, 2423.0, 4055.0, 6975.0, 12453.0, 24466.0, 57204.0, 192700.0, 506814.0, 141809.0, 47304.0, 21099.0, 11187.0, 6102.0, 3666.0, 2216.0, 1381.0, 893.0, 550.0, 344.0, 239.0, 156.0, 108.0, 57.0, 41.0, 29.0, 23.0, 12.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.568359375, -1.5252685546875, -1.482177734375, -1.4390869140625, -1.39599609375, -1.3529052734375, -1.309814453125, -1.2667236328125, -1.2236328125, -1.1805419921875, -1.137451171875, -1.0943603515625, -1.05126953125, -1.0081787109375, -0.965087890625, -0.9219970703125, -0.87890625, -0.8358154296875, -0.792724609375, -0.7496337890625, -0.70654296875, -0.6634521484375, -0.620361328125, -0.5772705078125, -0.5341796875, -0.4910888671875, -0.447998046875, -0.4049072265625, -0.36181640625, -0.3187255859375, -0.275634765625, -0.2325439453125, -0.189453125, -0.1463623046875, -0.103271484375, -0.0601806640625, -0.01708984375, 0.0260009765625, 0.069091796875, 0.1121826171875, 0.1552734375, 0.1983642578125, 0.241455078125, 0.2845458984375, 0.32763671875, 0.3707275390625, 0.413818359375, 0.4569091796875, 0.5, 0.5430908203125, 0.586181640625, 0.6292724609375, 0.67236328125, 0.7154541015625, 0.758544921875, 0.8016357421875, 0.8447265625, 0.8878173828125, 0.930908203125, 0.9739990234375, 1.01708984375, 1.0601806640625, 1.103271484375, 1.1463623046875, 1.189453125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 9.0, 10.0, 13.0, 14.0, 19.0, 30.0, 26.0, 40.0, 42.0, 52.0, 44.0, 63.0, 93.0, 317.0, 1706.0, 97.0, 72.0, 65.0, 55.0, 51.0, 39.0, 32.0, 22.0, 20.0, 21.0, 23.0, 9.0, 11.0, 13.0, 9.0, 7.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9453125, -7.6815185546875, -7.417724609375, -7.1539306640625, -6.89013671875, -6.6263427734375, -6.362548828125, -6.0987548828125, -5.8349609375, -5.5711669921875, -5.307373046875, -5.0435791015625, -4.77978515625, -4.5159912109375, -4.252197265625, -3.9884033203125, -3.724609375, -3.4608154296875, -3.197021484375, -2.9332275390625, -2.66943359375, -2.4056396484375, -2.141845703125, -1.8780517578125, -1.6142578125, -1.3504638671875, -1.086669921875, -0.8228759765625, -0.55908203125, -0.2952880859375, -0.031494140625, 0.2322998046875, 0.49609375, 0.7598876953125, 1.023681640625, 1.2874755859375, 1.55126953125, 1.8150634765625, 2.078857421875, 2.3426513671875, 2.6064453125, 2.8702392578125, 3.134033203125, 3.3978271484375, 3.66162109375, 3.9254150390625, 4.189208984375, 4.4530029296875, 4.716796875, 4.9805908203125, 5.244384765625, 5.5081787109375, 5.77197265625, 6.0357666015625, 6.299560546875, 6.5633544921875, 6.8271484375, 7.0909423828125, 7.354736328125, 7.6185302734375, 7.88232421875, 8.1461181640625, 8.409912109375, 8.6737060546875, 8.9375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 16.0, 9.0, 10.0, 15.0, 19.0, 22.0, 28.0, 47.0, 67.0, 92.0, 147.0, 247.0, 405.0, 981.0, 3352.0, 23011.0, 2669611.0, 429122.0, 14348.0, 2339.0, 807.0, 350.0, 232.0, 119.0, 80.0, 51.0, 42.0, 30.0, 17.0, 17.0, 10.0, 11.0, 8.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.25, -10.9180908203125, -10.586181640625, -10.2542724609375, -9.92236328125, -9.5904541015625, -9.258544921875, -8.9266357421875, -8.5947265625, -8.2628173828125, -7.930908203125, -7.5989990234375, -7.26708984375, -6.9351806640625, -6.603271484375, -6.2713623046875, -5.939453125, -5.6075439453125, -5.275634765625, -4.9437255859375, -4.61181640625, -4.2799072265625, -3.947998046875, -3.6160888671875, -3.2841796875, -2.9522705078125, -2.620361328125, -2.2884521484375, -1.95654296875, -1.6246337890625, -1.292724609375, -0.9608154296875, -0.62890625, -0.2969970703125, 0.034912109375, 0.3668212890625, 0.69873046875, 1.0306396484375, 1.362548828125, 1.6944580078125, 2.0263671875, 2.3582763671875, 2.690185546875, 3.0220947265625, 3.35400390625, 3.6859130859375, 4.017822265625, 4.3497314453125, 4.681640625, 5.0135498046875, 5.345458984375, 5.6773681640625, 6.00927734375, 6.3411865234375, 6.673095703125, 7.0050048828125, 7.3369140625, 7.6688232421875, 8.000732421875, 8.3326416015625, 8.66455078125, 8.9964599609375, 9.328369140625, 9.6602783203125, 9.9921875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 734.0, 282.0, 1.0], "bins": [-292.466796875, -287.7378845214844, -283.0090026855469, -278.28009033203125, -273.55120849609375, -268.8222961425781, -264.0933837890625, -259.364501953125, -254.63558959960938, -249.9066925048828, -245.17779541015625, -240.44888305664062, -235.71998596191406, -230.9910888671875, -226.26219177246094, -221.53329467773438, -216.8043975830078, -212.07550048828125, -207.3466033935547, -202.61769104003906, -197.8887939453125, -193.15989685058594, -188.43099975585938, -183.7021026611328, -178.97320556640625, -174.2443084716797, -169.51541137695312, -164.7864990234375, -160.05760192871094, -155.32870483398438, -150.5998077392578, -145.87091064453125, -141.14199829101562, -136.41310119628906, -131.6842041015625, -126.9552993774414, -122.22639465332031, -117.49749755859375, -112.76860046386719, -108.03970336914062, -103.31079864501953, -98.58190155029297, -93.85299682617188, -89.12409973144531, -84.39520263671875, -79.66629791259766, -74.9374008178711, -70.20849609375, -65.47959899902344, -60.75069808959961, -56.02179718017578, -51.29290008544922, -46.56399917602539, -41.83509826660156, -37.106201171875, -32.37730026245117, -27.648401260375977, -22.91950225830078, -18.190601348876953, -13.461701393127441, -8.73280143737793, -4.003900527954102, 0.7249984741210938, 5.453897476196289, 10.182798385620117]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 8.0, 1.0, 3.0, 7.0, 8.0, 10.0, 16.0, 14.0, 18.0, 22.0, 18.0, 22.0, 22.0, 21.0, 20.0, 22.0, 38.0, 36.0, 24.0, 42.0, 30.0, 37.0, 29.0, 46.0, 29.0, 32.0, 42.0, 43.0, 38.0, 34.0, 27.0, 27.0, 20.0, 28.0, 24.0, 26.0, 23.0, 14.0, 13.0, 15.0, 10.0, 8.0, 8.0, 5.0, 7.0, 6.0, 6.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0], "bins": [-21.769140243530273, -21.129335403442383, -20.489532470703125, -19.849727630615234, -19.209924697875977, -18.570119857788086, -17.930316925048828, -17.290512084960938, -16.650707244873047, -16.010902404785156, -15.371099472045898, -14.731295585632324, -14.09149169921875, -13.45168685913086, -12.811882972717285, -12.172079086303711, -11.532276153564453, -10.892472267150879, -10.252668380737305, -9.61286449432373, -8.973060607910156, -8.333255767822266, -7.693451881408691, -7.053647994995117, -6.413844108581543, -5.774040222167969, -5.1342363357543945, -4.494431972503662, -3.854628086090088, -3.2148241996765137, -2.5750200748443604, -1.935215950012207, -1.2954120635986328, -0.655608057975769, -0.015804052352905273, 0.6239999532699585, 1.2638039588928223, 1.9036078453063965, 2.54341197013855, 3.183216094970703, 3.8230199813842773, 4.462823867797852, 5.102627754211426, 5.742432117462158, 6.382236003875732, 7.022039890289307, 7.661844253540039, 8.301648139953613, 8.941452026367188, 9.581255912780762, 10.221059799194336, 10.86086368560791, 11.500667572021484, 12.140472412109375, 12.78027629852295, 13.420080184936523, 14.059884071350098, 14.699687957763672, 15.339491844177246, 15.97929573059082, 16.61910057067871, 17.25890350341797, 17.89870834350586, 18.53851318359375, 19.178316116333008]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 9.0, 8.0, 10.0, 12.0, 9.0, 8.0, 8.0, 16.0, 24.0, 24.0, 29.0, 39.0, 52.0, 44.0, 42.0, 50.0, 48.0, 46.0, 65.0, 56.0, 54.0, 48.0, 48.0, 49.0, 44.0, 33.0, 20.0, 25.0, 15.0, 22.0, 14.0, 11.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.787109375, -2.711669921875, -2.63623046875, -2.560791015625, -2.4853515625, -2.409912109375, -2.33447265625, -2.259033203125, -2.18359375, -2.108154296875, -2.03271484375, -1.957275390625, -1.8818359375, -1.806396484375, -1.73095703125, -1.655517578125, -1.580078125, -1.504638671875, -1.42919921875, -1.353759765625, -1.2783203125, -1.202880859375, -1.12744140625, -1.052001953125, -0.9765625, -0.901123046875, -0.82568359375, -0.750244140625, -0.6748046875, -0.599365234375, -0.52392578125, -0.448486328125, -0.373046875, -0.297607421875, -0.22216796875, -0.146728515625, -0.0712890625, 0.004150390625, 0.07958984375, 0.155029296875, 0.23046875, 0.305908203125, 0.38134765625, 0.456787109375, 0.5322265625, 0.607666015625, 0.68310546875, 0.758544921875, 0.833984375, 0.909423828125, 0.98486328125, 1.060302734375, 1.1357421875, 1.211181640625, 1.28662109375, 1.362060546875, 1.4375, 1.512939453125, 1.58837890625, 1.663818359375, 1.7392578125, 1.814697265625, 1.89013671875, 1.965576171875, 2.041015625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 17.0, 12.0, 13.0, 20.0, 22.0, 35.0, 66.0, 127.0, 210.0, 486.0, 1144.0, 3100.0, 9495.0, 34004.0, 150617.0, 1156212.0, 2426968.0, 324908.0, 62266.0, 16302.0, 4927.0, 1816.0, 709.0, 357.0, 171.0, 99.0, 47.0, 35.0, 26.0, 19.0, 13.0, 10.0, 3.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.87109375, -6.68646240234375, -6.5018310546875, -6.31719970703125, -6.132568359375, -5.94793701171875, -5.7633056640625, -5.57867431640625, -5.39404296875, -5.20941162109375, -5.0247802734375, -4.84014892578125, -4.655517578125, -4.47088623046875, -4.2862548828125, -4.10162353515625, -3.9169921875, -3.73236083984375, -3.5477294921875, -3.36309814453125, -3.178466796875, -2.99383544921875, -2.8092041015625, -2.62457275390625, -2.43994140625, -2.25531005859375, -2.0706787109375, -1.88604736328125, -1.701416015625, -1.51678466796875, -1.3321533203125, -1.14752197265625, -0.962890625, -0.77825927734375, -0.5936279296875, -0.40899658203125, -0.224365234375, -0.03973388671875, 0.1448974609375, 0.32952880859375, 0.51416015625, 0.69879150390625, 0.8834228515625, 1.06805419921875, 1.252685546875, 1.43731689453125, 1.6219482421875, 1.80657958984375, 1.9912109375, 2.17584228515625, 2.3604736328125, 2.54510498046875, 2.729736328125, 2.91436767578125, 3.0989990234375, 3.28363037109375, 3.46826171875, 3.65289306640625, 3.8375244140625, 4.02215576171875, 4.206787109375, 4.39141845703125, 4.5760498046875, 4.76068115234375, 4.9453125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 5.0, 16.0, 21.0, 20.0, 25.0, 44.0, 69.0, 96.0, 132.0, 211.0, 343.0, 473.0, 563.0, 572.0, 432.0, 335.0, 224.0, 148.0, 94.0, 78.0, 54.0, 38.0, 20.0, 19.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1875, -8.9576416015625, -8.727783203125, -8.4979248046875, -8.26806640625, -8.0382080078125, -7.808349609375, -7.5784912109375, -7.3486328125, -7.1187744140625, -6.888916015625, -6.6590576171875, -6.42919921875, -6.1993408203125, -5.969482421875, -5.7396240234375, -5.509765625, -5.2799072265625, -5.050048828125, -4.8201904296875, -4.59033203125, -4.3604736328125, -4.130615234375, -3.9007568359375, -3.6708984375, -3.4410400390625, -3.211181640625, -2.9813232421875, -2.75146484375, -2.5216064453125, -2.291748046875, -2.0618896484375, -1.83203125, -1.6021728515625, -1.372314453125, -1.1424560546875, -0.91259765625, -0.6827392578125, -0.452880859375, -0.2230224609375, 0.0068359375, 0.2366943359375, 0.466552734375, 0.6964111328125, 0.92626953125, 1.1561279296875, 1.385986328125, 1.6158447265625, 1.845703125, 2.0755615234375, 2.305419921875, 2.5352783203125, 2.76513671875, 2.9949951171875, 3.224853515625, 3.4547119140625, 3.6845703125, 3.9144287109375, 4.144287109375, 4.3741455078125, 4.60400390625, 4.8338623046875, 5.063720703125, 5.2935791015625, 5.5234375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 17.0, 30.0, 38.0, 69.0, 113.0, 226.0, 363.0, 844.0, 2212.0, 8960.0, 62659.0, 813458.0, 3031703.0, 241598.0, 24755.0, 4599.0, 1402.0, 592.0, 274.0, 135.0, 92.0, 56.0, 32.0, 24.0, 10.0, 10.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.5859375, -13.1219482421875, -12.657958984375, -12.1939697265625, -11.72998046875, -11.2659912109375, -10.802001953125, -10.3380126953125, -9.8740234375, -9.4100341796875, -8.946044921875, -8.4820556640625, -8.01806640625, -7.5540771484375, -7.090087890625, -6.6260986328125, -6.162109375, -5.6981201171875, -5.234130859375, -4.7701416015625, -4.30615234375, -3.8421630859375, -3.378173828125, -2.9141845703125, -2.4501953125, -1.9862060546875, -1.522216796875, -1.0582275390625, -0.59423828125, -0.1302490234375, 0.333740234375, 0.7977294921875, 1.26171875, 1.7257080078125, 2.189697265625, 2.6536865234375, 3.11767578125, 3.5816650390625, 4.045654296875, 4.5096435546875, 4.9736328125, 5.4376220703125, 5.901611328125, 6.3656005859375, 6.82958984375, 7.2935791015625, 7.757568359375, 8.2215576171875, 8.685546875, 9.1495361328125, 9.613525390625, 10.0775146484375, 10.54150390625, 11.0054931640625, 11.469482421875, 11.9334716796875, 12.3974609375, 12.8614501953125, 13.325439453125, 13.7894287109375, 14.25341796875, 14.7174072265625, 15.181396484375, 15.6453857421875, 16.109375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 8.0, 16.0, 22.0, 51.0, 76.0, 88.0, 120.0, 135.0, 148.0, 122.0, 69.0, 63.0, 38.0, 21.0, 12.0, 8.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.174633026123047, -26.935260772705078, -25.69588851928711, -24.45651626586914, -23.217144012451172, -21.977771759033203, -20.738399505615234, -19.499027252197266, -18.259654998779297, -17.020282745361328, -15.78091049194336, -14.54153823852539, -13.302165985107422, -12.062793731689453, -10.823421478271484, -9.584049224853516, -8.344676971435547, -7.105304718017578, -5.865932464599609, -4.626560211181641, -3.387187957763672, -2.147815704345703, -0.9084434509277344, 0.3309288024902344, 1.5703010559082031, 2.809673309326172, 4.049045562744141, 5.288417816162109, 6.527790069580078, 7.767162322998047, 9.006534576416016, 10.245906829833984, 11.485282897949219, 12.724655151367188, 13.964027404785156, 15.203399658203125, 16.442771911621094, 17.682144165039062, 18.92151641845703, 20.160888671875, 21.40026092529297, 22.639633178710938, 23.879005432128906, 25.118377685546875, 26.357749938964844, 27.597122192382812, 28.83649444580078, 30.07586669921875, 31.31523895263672, 32.55461120605469, 33.793983459472656, 35.033355712890625, 36.272727966308594, 37.51210021972656, 38.75147247314453, 39.9908447265625, 41.23021697998047, 42.46958923339844, 43.708961486816406, 44.948333740234375, 46.187705993652344, 47.42707824707031, 48.66645050048828, 49.90582275390625, 51.14519500732422]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 7.0, 6.0, 9.0, 10.0, 16.0, 15.0, 10.0, 18.0, 18.0, 22.0, 32.0, 30.0, 40.0, 29.0, 39.0, 47.0, 41.0, 36.0, 31.0, 52.0, 47.0, 50.0, 51.0, 43.0, 34.0, 40.0, 28.0, 20.0, 27.0, 27.0, 19.0, 18.0, 21.0, 12.0, 13.0, 8.0, 8.0, 11.0, 7.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.300743103027344, -20.645584106445312, -19.99042320251465, -19.335264205932617, -18.680103302001953, -18.024944305419922, -17.36978530883789, -16.71462631225586, -16.059465408325195, -15.404305458068848, -14.7491455078125, -14.093986511230469, -13.438826560974121, -12.783666610717773, -12.128507614135742, -11.473347663879395, -10.818187713623047, -10.1630277633667, -9.507867813110352, -8.85270881652832, -8.197548866271973, -7.542388916015625, -6.8872294425964355, -6.232069969177246, -5.576910018920898, -4.921750068664551, -4.266590595245361, -3.6114308834075928, -2.956271171569824, -2.3011114597320557, -1.645951747894287, -0.9907922744750977, -0.33563232421875, 0.31952738761901855, 0.9746870994567871, 1.6298468112945557, 2.285006523132324, 2.9401662349700928, 3.5953259468078613, 4.250485420227051, 4.905645370483398, 5.560805320739746, 6.2159647941589355, 6.871124267578125, 7.526284217834473, 8.18144416809082, 8.836603164672852, 9.4917631149292, 10.146923065185547, 10.802083015441895, 11.457242965698242, 12.112401962280273, 12.767561912536621, 13.422721862792969, 14.077880859375, 14.733040809631348, 15.388200759887695, 16.043359756469727, 16.69852066040039, 17.353679656982422, 18.008838653564453, 18.663999557495117, 19.31915855407715, 19.974319458007812, 20.629478454589844]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 6.0, 14.0, 11.0, 10.0, 7.0, 17.0, 19.0, 21.0, 22.0, 32.0, 39.0, 42.0, 47.0, 38.0, 43.0, 52.0, 56.0, 54.0, 56.0, 46.0, 38.0, 50.0, 40.0, 45.0, 32.0, 35.0, 22.0, 19.0, 20.0, 16.0, 12.0, 14.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.5557861328125, -2.480712890625, -2.4056396484375, -2.33056640625, -2.2554931640625, -2.180419921875, -2.1053466796875, -2.0302734375, -1.9552001953125, -1.880126953125, -1.8050537109375, -1.72998046875, -1.6549072265625, -1.579833984375, -1.5047607421875, -1.4296875, -1.3546142578125, -1.279541015625, -1.2044677734375, -1.12939453125, -1.0543212890625, -0.979248046875, -0.9041748046875, -0.8291015625, -0.7540283203125, -0.678955078125, -0.6038818359375, -0.52880859375, -0.4537353515625, -0.378662109375, -0.3035888671875, -0.228515625, -0.1534423828125, -0.078369140625, -0.0032958984375, 0.07177734375, 0.1468505859375, 0.221923828125, 0.2969970703125, 0.3720703125, 0.4471435546875, 0.522216796875, 0.5972900390625, 0.67236328125, 0.7474365234375, 0.822509765625, 0.8975830078125, 0.97265625, 1.0477294921875, 1.122802734375, 1.1978759765625, 1.27294921875, 1.3480224609375, 1.423095703125, 1.4981689453125, 1.5732421875, 1.6483154296875, 1.723388671875, 1.7984619140625, 1.87353515625, 1.9486083984375, 2.023681640625, 2.0987548828125, 2.173828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 8.0, 14.0, 18.0, 23.0, 28.0, 65.0, 79.0, 123.0, 213.0, 349.0, 516.0, 825.0, 1340.0, 1955.0, 3110.0, 4808.0, 7814.0, 12557.0, 20268.0, 34231.0, 59463.0, 112473.0, 320617.0, 243186.0, 94681.0, 51462.0, 30040.0, 17862.0, 11138.0, 7071.0, 4385.0, 2882.0, 1790.0, 1129.0, 733.0, 473.0, 304.0, 181.0, 112.0, 77.0, 47.0, 23.0, 29.0, 17.0, 8.0, 6.0, 2.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.01385498046875, -0.013433575630187988, -0.013012170791625977, -0.012590765953063965, -0.012169361114501953, -0.011747956275939941, -0.01132655143737793, -0.010905146598815918, -0.010483741760253906, -0.010062336921691895, -0.009640932083129883, -0.009219527244567871, -0.00879812240600586, -0.008376717567443848, -0.007955312728881836, -0.007533907890319824, -0.0071125030517578125, -0.006691098213195801, -0.006269693374633789, -0.005848288536071777, -0.005426883697509766, -0.005005478858947754, -0.004584074020385742, -0.0041626691818237305, -0.0037412643432617188, -0.003319859504699707, -0.0028984546661376953, -0.0024770498275756836, -0.002055644989013672, -0.0016342401504516602, -0.0012128353118896484, -0.0007914304733276367, -0.000370025634765625, 5.137920379638672e-05, 0.00047278404235839844, 0.0008941888809204102, 0.0013155937194824219, 0.0017369985580444336, 0.0021584033966064453, 0.002579808235168457, 0.0030012130737304688, 0.0034226179122924805, 0.003844022750854492, 0.004265427589416504, 0.004686832427978516, 0.005108237266540527, 0.005529642105102539, 0.005951046943664551, 0.0063724517822265625, 0.006793856620788574, 0.007215261459350586, 0.007636666297912598, 0.00805807113647461, 0.008479475975036621, 0.008900880813598633, 0.009322285652160645, 0.009743690490722656, 0.010165095329284668, 0.01058650016784668, 0.011007905006408691, 0.011429309844970703, 0.011850714683532715, 0.012272119522094727, 0.012693524360656738, 0.01311492919921875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 11.0, 16.0, 12.0, 12.0, 27.0, 21.0, 29.0, 30.0, 34.0, 40.0, 38.0, 36.0, 38.0, 45.0, 42.0, 1078.0, 38.0, 46.0, 50.0, 40.0, 32.0, 50.0, 44.0, 21.0, 26.0, 22.0, 27.0, 24.0, 20.0, 16.0, 8.0, 8.0, 9.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-1.740234375, -1.6942138671875, -1.648193359375, -1.6021728515625, -1.55615234375, -1.5101318359375, -1.464111328125, -1.4180908203125, -1.3720703125, -1.3260498046875, -1.280029296875, -1.2340087890625, -1.18798828125, -1.1419677734375, -1.095947265625, -1.0499267578125, -1.00390625, -0.9578857421875, -0.911865234375, -0.8658447265625, -0.81982421875, -0.7738037109375, -0.727783203125, -0.6817626953125, -0.6357421875, -0.5897216796875, -0.543701171875, -0.4976806640625, -0.45166015625, -0.4056396484375, -0.359619140625, -0.3135986328125, -0.267578125, -0.2215576171875, -0.175537109375, -0.1295166015625, -0.08349609375, -0.0374755859375, 0.008544921875, 0.0545654296875, 0.1005859375, 0.1466064453125, 0.192626953125, 0.2386474609375, 0.28466796875, 0.3306884765625, 0.376708984375, 0.4227294921875, 0.46875, 0.5147705078125, 0.560791015625, 0.6068115234375, 0.65283203125, 0.6988525390625, 0.744873046875, 0.7908935546875, 0.8369140625, 0.8829345703125, 0.928955078125, 0.9749755859375, 1.02099609375, 1.0670166015625, 1.113037109375, 1.1590576171875, 1.205078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 13.0, 5.0, 8.0, 21.0, 34.0, 54.0, 69.0, 117.0, 220.0, 349.0, 589.0, 972.0, 1752.0, 2759.0, 5069.0, 8621.0, 15150.0, 27375.0, 50093.0, 95903.0, 227885.0, 1382660.0, 131264.0, 65419.0, 35183.0, 19437.0, 10828.0, 6288.0, 3648.0, 2097.0, 1246.0, 758.0, 471.0, 278.0, 174.0, 128.0, 82.0, 38.0, 22.0, 13.0, 14.0, 15.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00922393798828125, -0.0089186429977417, -0.008613348007202148, -0.008308053016662598, -0.008002758026123047, -0.007697463035583496, -0.007392168045043945, -0.0070868730545043945, -0.006781578063964844, -0.006476283073425293, -0.006170988082885742, -0.005865693092346191, -0.005560398101806641, -0.00525510311126709, -0.004949808120727539, -0.004644513130187988, -0.0043392181396484375, -0.004033923149108887, -0.003728628158569336, -0.003423333168029785, -0.0031180381774902344, -0.0028127431869506836, -0.002507448196411133, -0.002202153205871582, -0.0018968582153320312, -0.0015915632247924805, -0.0012862682342529297, -0.000980973243713379, -0.0006756782531738281, -0.00037038326263427734, -6.508827209472656e-05, 0.00024020671844482422, 0.000545501708984375, 0.0008507966995239258, 0.0011560916900634766, 0.0014613866806030273, 0.0017666816711425781, 0.002071976661682129, 0.0023772716522216797, 0.0026825666427612305, 0.0029878616333007812, 0.003293156623840332, 0.003598451614379883, 0.0039037466049194336, 0.004209041595458984, 0.004514336585998535, 0.004819631576538086, 0.005124926567077637, 0.0054302215576171875, 0.005735516548156738, 0.006040811538696289, 0.00634610652923584, 0.006651401519775391, 0.006956696510314941, 0.007261991500854492, 0.007567286491394043, 0.007872581481933594, 0.008177876472473145, 0.008483171463012695, 0.008788466453552246, 0.009093761444091797, 0.009399056434631348, 0.009704351425170898, 0.01000964641571045, 0.01031494140625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 979.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 7.0, 20.0, 1.0, 0.0, 4.0, 2.0, 5.0, 0.0, 13.0, 40.0, 55.0, 0.0, 313.0, 2397.0, 10804.0, 0.0, 1021150.0, 10988.0, 2288.0, 0.0, 315.0, 72.0, 37.0, 0.0, 24.0, 4.0, 3.0, 0.0, 3.0, 0.0, 11.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 6.0, 14.0, 11.0, 10.0, 7.0, 17.0, 19.0, 21.0, 22.0, 32.0, 39.0, 42.0, 47.0, 38.0, 43.0, 52.0, 56.0, 54.0, 56.0, 46.0, 38.0, 50.0, 40.0, 45.0, 32.0, 35.0, 22.0, 19.0, 20.0, 16.0, 12.0, 14.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.5557861328125, -2.480712890625, -2.4056396484375, -2.33056640625, -2.2554931640625, -2.180419921875, -2.1053466796875, -2.0302734375, -1.9552001953125, -1.880126953125, -1.8050537109375, -1.72998046875, -1.6549072265625, -1.579833984375, -1.5047607421875, -1.4296875, -1.3546142578125, -1.279541015625, -1.2044677734375, -1.12939453125, -1.0543212890625, -0.979248046875, -0.9041748046875, -0.8291015625, -0.7540283203125, -0.678955078125, -0.6038818359375, -0.52880859375, -0.4537353515625, -0.378662109375, -0.3035888671875, -0.228515625, -0.1534423828125, -0.078369140625, -0.0032958984375, 0.07177734375, 0.1468505859375, 0.221923828125, 0.2969970703125, 0.3720703125, 0.4471435546875, 0.522216796875, 0.5972900390625, 0.67236328125, 0.7474365234375, 0.822509765625, 0.8975830078125, 0.97265625, 1.0477294921875, 1.122802734375, 1.1978759765625, 1.27294921875, 1.3480224609375, 1.423095703125, 1.4981689453125, 1.5732421875, 1.6483154296875, 1.723388671875, 1.7984619140625, 1.87353515625, 1.9486083984375, 2.023681640625, 2.0987548828125, 2.173828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 9.0, 7.0, 13.0, 15.0, 22.0, 27.0, 51.0, 77.0, 85.0, 107.0, 181.0, 272.0, 379.0, 552.0, 844.0, 1183.0, 1778.0, 2760.0, 4125.0, 6688.0, 10928.0, 19352.0, 35285.0, 72605.0, 188407.0, 406711.0, 155979.0, 63079.0, 31560.0, 17650.0, 10146.0, 6196.0, 3836.0, 2480.0, 1725.0, 1072.0, 728.0, 461.0, 369.0, 204.0, 176.0, 132.0, 80.0, 54.0, 53.0, 36.0, 17.0, 20.0, 9.0, 12.0, 6.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.4365234375, -1.3907928466796875, -1.345062255859375, -1.2993316650390625, -1.25360107421875, -1.2078704833984375, -1.162139892578125, -1.1164093017578125, -1.0706787109375, -1.0249481201171875, -0.979217529296875, -0.9334869384765625, -0.88775634765625, -0.8420257568359375, -0.796295166015625, -0.7505645751953125, -0.704833984375, -0.6591033935546875, -0.613372802734375, -0.5676422119140625, -0.52191162109375, -0.4761810302734375, -0.430450439453125, -0.3847198486328125, -0.3389892578125, -0.2932586669921875, -0.247528076171875, -0.2017974853515625, -0.15606689453125, -0.1103363037109375, -0.064605712890625, -0.0188751220703125, 0.02685546875, 0.0725860595703125, 0.118316650390625, 0.1640472412109375, 0.20977783203125, 0.2555084228515625, 0.301239013671875, 0.3469696044921875, 0.3927001953125, 0.4384307861328125, 0.484161376953125, 0.5298919677734375, 0.57562255859375, 0.6213531494140625, 0.667083740234375, 0.7128143310546875, 0.758544921875, 0.8042755126953125, 0.850006103515625, 0.8957366943359375, 0.94146728515625, 0.9871978759765625, 1.032928466796875, 1.0786590576171875, 1.1243896484375, 1.1701202392578125, 1.215850830078125, 1.2615814208984375, 1.30731201171875, 1.3530426025390625, 1.398773193359375, 1.4445037841796875, 1.490234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 10.0, 10.0, 9.0, 13.0, 9.0, 17.0, 16.0, 25.0, 25.0, 42.0, 25.0, 31.0, 35.0, 46.0, 62.0, 75.0, 75.0, 245.0, 1613.0, 147.0, 90.0, 54.0, 47.0, 39.0, 42.0, 34.0, 25.0, 26.0, 29.0, 17.0, 20.0, 17.0, 17.0, 11.0, 9.0, 9.0, 7.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-7.8671875, -7.6383056640625, -7.409423828125, -7.1805419921875, -6.95166015625, -6.7227783203125, -6.493896484375, -6.2650146484375, -6.0361328125, -5.8072509765625, -5.578369140625, -5.3494873046875, -5.12060546875, -4.8917236328125, -4.662841796875, -4.4339599609375, -4.205078125, -3.9761962890625, -3.747314453125, -3.5184326171875, -3.28955078125, -3.0606689453125, -2.831787109375, -2.6029052734375, -2.3740234375, -2.1451416015625, -1.916259765625, -1.6873779296875, -1.45849609375, -1.2296142578125, -1.000732421875, -0.7718505859375, -0.54296875, -0.3140869140625, -0.085205078125, 0.1436767578125, 0.37255859375, 0.6014404296875, 0.830322265625, 1.0592041015625, 1.2880859375, 1.5169677734375, 1.745849609375, 1.9747314453125, 2.20361328125, 2.4324951171875, 2.661376953125, 2.8902587890625, 3.119140625, 3.3480224609375, 3.576904296875, 3.8057861328125, 4.03466796875, 4.2635498046875, 4.492431640625, 4.7213134765625, 4.9501953125, 5.1790771484375, 5.407958984375, 5.6368408203125, 5.86572265625, 6.0946044921875, 6.323486328125, 6.5523681640625, 6.78125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 11.0, 12.0, 9.0, 19.0, 11.0, 20.0, 22.0, 34.0, 37.0, 54.0, 69.0, 127.0, 167.0, 320.0, 607.0, 1645.0, 8426.0, 102324.0, 2909526.0, 110297.0, 8679.0, 1686.0, 623.0, 361.0, 186.0, 106.0, 68.0, 49.0, 49.0, 31.0, 23.0, 15.0, 15.0, 11.0, 11.0, 9.0, 11.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.3125, -9.9852294921875, -9.657958984375, -9.3306884765625, -9.00341796875, -8.6761474609375, -8.348876953125, -8.0216064453125, -7.6943359375, -7.3670654296875, -7.039794921875, -6.7125244140625, -6.38525390625, -6.0579833984375, -5.730712890625, -5.4034423828125, -5.076171875, -4.7489013671875, -4.421630859375, -4.0943603515625, -3.76708984375, -3.4398193359375, -3.112548828125, -2.7852783203125, -2.4580078125, -2.1307373046875, -1.803466796875, -1.4761962890625, -1.14892578125, -0.8216552734375, -0.494384765625, -0.1671142578125, 0.16015625, 0.4874267578125, 0.814697265625, 1.1419677734375, 1.46923828125, 1.7965087890625, 2.123779296875, 2.4510498046875, 2.7783203125, 3.1055908203125, 3.432861328125, 3.7601318359375, 4.08740234375, 4.4146728515625, 4.741943359375, 5.0692138671875, 5.396484375, 5.7237548828125, 6.051025390625, 6.3782958984375, 6.70556640625, 7.0328369140625, 7.360107421875, 7.6873779296875, 8.0146484375, 8.3419189453125, 8.669189453125, 8.9964599609375, 9.32373046875, 9.6510009765625, 9.978271484375, 10.3055419921875, 10.6328125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [104.0, 905.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9601569175720215, -1.7863740921020508, 3.38740873336792, 8.56119155883789, 13.734973907470703, 18.908756256103516, 24.08254051208496, 29.256322860717773, 34.43010711669922, 39.60388946533203, 44.777671813964844, 49.951454162597656, 55.12523651123047, 60.29901885986328, 65.47280883789062, 70.64659118652344, 75.82036590576172, 80.99414825439453, 86.16793060302734, 91.34171295166016, 96.51549530029297, 101.68927764892578, 106.86306762695312, 112.03684997558594, 117.21063232421875, 122.38441467285156, 127.55819702148438, 132.7319793701172, 137.90576171875, 143.0795440673828, 148.25332641601562, 153.42710876464844, 158.6009063720703, 163.77468872070312, 168.94847106933594, 174.12225341796875, 179.29603576660156, 184.46981811523438, 189.6436004638672, 194.8173828125, 199.9911651611328, 205.16494750976562, 210.33872985839844, 215.51251220703125, 220.68629455566406, 225.86007690429688, 231.0338592529297, 236.2076416015625, 241.38143920898438, 246.5552215576172, 251.72900390625, 256.9028015136719, 262.0765686035156, 267.2503662109375, 272.42413330078125, 277.5979309082031, 282.7716979980469, 287.94549560546875, 293.1192626953125, 298.2930603027344, 303.4668273925781, 308.640625, 313.81439208984375, 318.9881896972656, 324.1619567871094]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 14.0, 11.0, 20.0, 11.0, 23.0, 24.0, 19.0, 30.0, 32.0, 37.0, 37.0, 45.0, 35.0, 45.0, 28.0, 51.0, 45.0, 43.0, 43.0, 37.0, 36.0, 35.0, 48.0, 38.0, 30.0, 26.0, 37.0, 18.0, 16.0, 8.0, 14.0, 11.0, 11.0, 6.0, 5.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.54470443725586, -29.739673614501953, -28.934642791748047, -28.12961196899414, -27.324583053588867, -26.51955223083496, -25.714521408081055, -24.90949058532715, -24.104461669921875, -23.29943084716797, -22.494400024414062, -21.689369201660156, -20.884340286254883, -20.079309463500977, -19.27427864074707, -18.469247817993164, -17.664216995239258, -16.85918617248535, -16.054155349731445, -15.249125480651855, -14.444095611572266, -13.63906478881836, -12.834033966064453, -12.029003143310547, -11.223973274230957, -10.41894245147705, -9.613912582397461, -8.808881759643555, -8.003850936889648, -7.198821067810059, -6.393790245056152, -5.588759899139404, -4.783731460571289, -3.978701114654541, -3.173670530319214, -2.3686399459838867, -1.5636096000671387, -0.7585792541503906, 0.046451568603515625, 0.8514819145202637, 1.6565122604370117, 2.4615426063537598, 3.266573190689087, 4.071603775024414, 4.876634120941162, 5.68166446685791, 6.486695289611816, 7.2917256355285645, 8.096755981445312, 8.901786804199219, 9.706816673278809, 10.511847496032715, 11.316877365112305, 12.121908187866211, 12.926939010620117, 13.731969833374023, 14.536999702453613, 15.34203052520752, 16.14706039428711, 16.952091217041016, 17.757122039794922, 18.562152862548828, 19.367183685302734, 20.172212600708008, 20.977243423461914]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 1.0, 10.0, 14.0, 13.0, 12.0, 9.0, 18.0, 26.0, 22.0, 31.0, 26.0, 46.0, 53.0, 47.0, 46.0, 36.0, 56.0, 51.0, 64.0, 36.0, 46.0, 48.0, 39.0, 52.0, 37.0, 32.0, 26.0, 15.0, 13.0, 23.0, 15.0, 9.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.569000244140625, -2.49151611328125, -2.414031982421875, -2.3365478515625, -2.259063720703125, -2.18157958984375, -2.104095458984375, -2.026611328125, -1.949127197265625, -1.87164306640625, -1.794158935546875, -1.7166748046875, -1.639190673828125, -1.56170654296875, -1.484222412109375, -1.40673828125, -1.329254150390625, -1.25177001953125, -1.174285888671875, -1.0968017578125, -1.019317626953125, -0.94183349609375, -0.864349365234375, -0.786865234375, -0.709381103515625, -0.63189697265625, -0.554412841796875, -0.4769287109375, -0.399444580078125, -0.32196044921875, -0.244476318359375, -0.1669921875, -0.089508056640625, -0.01202392578125, 0.065460205078125, 0.1429443359375, 0.220428466796875, 0.29791259765625, 0.375396728515625, 0.452880859375, 0.530364990234375, 0.60784912109375, 0.685333251953125, 0.7628173828125, 0.840301513671875, 0.91778564453125, 0.995269775390625, 1.07275390625, 1.150238037109375, 1.22772216796875, 1.305206298828125, 1.3826904296875, 1.460174560546875, 1.53765869140625, 1.615142822265625, 1.692626953125, 1.770111083984375, 1.84759521484375, 1.925079345703125, 2.0025634765625, 2.080047607421875, 2.15753173828125, 2.235015869140625, 2.3125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 9.0, 11.0, 19.0, 16.0, 24.0, 23.0, 37.0, 78.0, 119.0, 228.0, 552.0, 1451.0, 4559.0, 16578.0, 70848.0, 463659.0, 2806713.0, 705475.0, 93968.0, 21088.0, 5619.0, 1841.0, 644.0, 296.0, 121.0, 77.0, 50.0, 41.0, 23.0, 14.0, 20.0, 13.0, 8.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.44140625, -7.2322998046875, -7.023193359375, -6.8140869140625, -6.60498046875, -6.3958740234375, -6.186767578125, -5.9776611328125, -5.7685546875, -5.5594482421875, -5.350341796875, -5.1412353515625, -4.93212890625, -4.7230224609375, -4.513916015625, -4.3048095703125, -4.095703125, -3.8865966796875, -3.677490234375, -3.4683837890625, -3.25927734375, -3.0501708984375, -2.841064453125, -2.6319580078125, -2.4228515625, -2.2137451171875, -2.004638671875, -1.7955322265625, -1.58642578125, -1.3773193359375, -1.168212890625, -0.9591064453125, -0.75, -0.5408935546875, -0.331787109375, -0.1226806640625, 0.08642578125, 0.2955322265625, 0.504638671875, 0.7137451171875, 0.9228515625, 1.1319580078125, 1.341064453125, 1.5501708984375, 1.75927734375, 1.9683837890625, 2.177490234375, 2.3865966796875, 2.595703125, 2.8048095703125, 3.013916015625, 3.2230224609375, 3.43212890625, 3.6412353515625, 3.850341796875, 4.0594482421875, 4.2685546875, 4.4776611328125, 4.686767578125, 4.8958740234375, 5.10498046875, 5.3140869140625, 5.523193359375, 5.7322998046875, 5.94140625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 10.0, 7.0, 21.0, 23.0, 64.0, 85.0, 157.0, 323.0, 562.0, 812.0, 760.0, 525.0, 333.0, 175.0, 93.0, 67.0, 28.0, 12.0, 10.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.4044189453125, -11.058837890625, -10.7132568359375, -10.36767578125, -10.0220947265625, -9.676513671875, -9.3309326171875, -8.9853515625, -8.6397705078125, -8.294189453125, -7.9486083984375, -7.60302734375, -7.2574462890625, -6.911865234375, -6.5662841796875, -6.220703125, -5.8751220703125, -5.529541015625, -5.1839599609375, -4.83837890625, -4.4927978515625, -4.147216796875, -3.8016357421875, -3.4560546875, -3.1104736328125, -2.764892578125, -2.4193115234375, -2.07373046875, -1.7281494140625, -1.382568359375, -1.0369873046875, -0.69140625, -0.3458251953125, -0.000244140625, 0.3453369140625, 0.69091796875, 1.0364990234375, 1.382080078125, 1.7276611328125, 2.0732421875, 2.4188232421875, 2.764404296875, 3.1099853515625, 3.45556640625, 3.8011474609375, 4.146728515625, 4.4923095703125, 4.837890625, 5.1834716796875, 5.529052734375, 5.8746337890625, 6.22021484375, 6.5657958984375, 6.911376953125, 7.2569580078125, 7.6025390625, 7.9481201171875, 8.293701171875, 8.6392822265625, 8.98486328125, 9.3304443359375, 9.676025390625, 10.0216064453125, 10.3671875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 12.0, 25.0, 27.0, 50.0, 86.0, 129.0, 218.0, 364.0, 592.0, 1297.0, 4021.0, 22211.0, 254842.0, 3208463.0, 647882.0, 44151.0, 6320.0, 1728.0, 792.0, 426.0, 244.0, 138.0, 98.0, 63.0, 34.0, 25.0, 20.0, 8.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.515625, -15.0255126953125, -14.535400390625, -14.0452880859375, -13.55517578125, -13.0650634765625, -12.574951171875, -12.0848388671875, -11.5947265625, -11.1046142578125, -10.614501953125, -10.1243896484375, -9.63427734375, -9.1441650390625, -8.654052734375, -8.1639404296875, -7.673828125, -7.1837158203125, -6.693603515625, -6.2034912109375, -5.71337890625, -5.2232666015625, -4.733154296875, -4.2430419921875, -3.7529296875, -3.2628173828125, -2.772705078125, -2.2825927734375, -1.79248046875, -1.3023681640625, -0.812255859375, -0.3221435546875, 0.16796875, 0.6580810546875, 1.148193359375, 1.6383056640625, 2.12841796875, 2.6185302734375, 3.108642578125, 3.5987548828125, 4.0888671875, 4.5789794921875, 5.069091796875, 5.5592041015625, 6.04931640625, 6.5394287109375, 7.029541015625, 7.5196533203125, 8.009765625, 8.4998779296875, 8.989990234375, 9.4801025390625, 9.97021484375, 10.4603271484375, 10.950439453125, 11.4405517578125, 11.9306640625, 12.4207763671875, 12.910888671875, 13.4010009765625, 13.89111328125, 14.3812255859375, 14.871337890625, 15.3614501953125, 15.8515625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 10.0, 30.0, 60.0, 86.0, 164.0, 177.0, 179.0, 136.0, 92.0, 43.0, 24.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.16366958618164, -41.268028259277344, -39.37238693237305, -37.47674560546875, -35.58110809326172, -33.68546676635742, -31.789825439453125, -29.894184112548828, -27.998544692993164, -26.102903366088867, -24.207263946533203, -22.311622619628906, -20.41598129272461, -18.520341873168945, -16.62470054626465, -14.729060173034668, -12.833419799804688, -10.937779426574707, -9.042139053344727, -7.14649772644043, -5.250857353210449, -3.3552169799804688, -1.4595756530761719, 0.4360647201538086, 2.331705093383789, 4.2273454666137695, 6.122986316680908, 8.018627166748047, 9.914267539978027, 11.809907913208008, 13.705549240112305, 15.601189613342285, 17.496826171875, 19.392467498779297, 21.28810691833496, 23.183748245239258, 25.079387664794922, 26.97502899169922, 28.870670318603516, 30.766311645507812, 32.661949157714844, 34.55759048461914, 36.45323181152344, 38.34886932373047, 40.244510650634766, 42.14015197753906, 44.03579330444336, 45.931434631347656, 47.82707595825195, 49.72271728515625, 51.61835861206055, 53.513999938964844, 55.409637451171875, 57.30527877807617, 59.20092010498047, 61.096561431884766, 62.99220275878906, 64.8878402709961, 66.78348541259766, 68.67912292480469, 70.57476806640625, 72.47040557861328, 74.36604309082031, 76.26168823242188, 78.1573257446289]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 8.0, 10.0, 11.0, 8.0, 8.0, 16.0, 15.0, 12.0, 15.0, 26.0, 22.0, 25.0, 35.0, 27.0, 28.0, 37.0, 36.0, 30.0, 37.0, 40.0, 43.0, 33.0, 32.0, 41.0, 37.0, 42.0, 31.0, 33.0, 28.0, 31.0, 33.0, 22.0, 20.0, 15.0, 24.0, 18.0, 6.0, 8.0, 15.0, 9.0, 7.0, 4.0, 3.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-20.6429443359375, -20.021011352539062, -19.399080276489258, -18.77714729309082, -18.155216217041016, -17.533283233642578, -16.91135025024414, -16.289417266845703, -15.667486190795898, -15.045554161071777, -14.423622131347656, -13.801689147949219, -13.179757118225098, -12.557825088500977, -11.935892105102539, -11.313960075378418, -10.692028045654297, -10.070096015930176, -9.448163986206055, -8.826231002807617, -8.204298973083496, -7.582366943359375, -6.960434436798096, -6.338501930236816, -5.716569900512695, -5.094637870788574, -4.472705364227295, -3.8507730960845947, -3.2288408279418945, -2.6069085597991943, -1.9849762916564941, -1.3630437850952148, -0.7411117553710938, -0.11917948722839355, 0.5027527809143066, 1.1246850490570068, 1.746617317199707, 2.3685495853424072, 2.9904818534851074, 3.6124143600463867, 4.234346389770508, 4.856278419494629, 5.478210926055908, 6.1001434326171875, 6.722075462341309, 7.34400749206543, 7.965939998626709, 8.587872505187988, 9.20980453491211, 9.83173656463623, 10.453668594360352, 11.075601577758789, 11.69753360748291, 12.319465637207031, 12.941398620605469, 13.56333065032959, 14.185262680053711, 14.807194709777832, 15.429126739501953, 16.05105972290039, 16.672992706298828, 17.294923782348633, 17.91685676574707, 18.538787841796875, 19.160720825195312]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 10.0, 8.0, 7.0, 11.0, 12.0, 16.0, 18.0, 19.0, 10.0, 31.0, 30.0, 24.0, 27.0, 44.0, 39.0, 48.0, 38.0, 21.0, 42.0, 42.0, 54.0, 49.0, 44.0, 37.0, 44.0, 35.0, 31.0, 42.0, 30.0, 24.0, 20.0, 15.0, 20.0, 13.0, 10.0, 6.0, 6.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.150390625, -2.081634521484375, -2.01287841796875, -1.944122314453125, -1.8753662109375, -1.806610107421875, -1.73785400390625, -1.669097900390625, -1.600341796875, -1.531585693359375, -1.46282958984375, -1.394073486328125, -1.3253173828125, -1.256561279296875, -1.18780517578125, -1.119049072265625, -1.05029296875, -0.981536865234375, -0.91278076171875, -0.844024658203125, -0.7752685546875, -0.706512451171875, -0.63775634765625, -0.569000244140625, -0.500244140625, -0.431488037109375, -0.36273193359375, -0.293975830078125, -0.2252197265625, -0.156463623046875, -0.08770751953125, -0.018951416015625, 0.0498046875, 0.118560791015625, 0.18731689453125, 0.256072998046875, 0.3248291015625, 0.393585205078125, 0.46234130859375, 0.531097412109375, 0.599853515625, 0.668609619140625, 0.73736572265625, 0.806121826171875, 0.8748779296875, 0.943634033203125, 1.01239013671875, 1.081146240234375, 1.14990234375, 1.218658447265625, 1.28741455078125, 1.356170654296875, 1.4249267578125, 1.493682861328125, 1.56243896484375, 1.631195068359375, 1.699951171875, 1.768707275390625, 1.83746337890625, 1.906219482421875, 1.9749755859375, 2.043731689453125, 2.11248779296875, 2.181243896484375, 2.25]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 11.0, 6.0, 17.0, 29.0, 30.0, 53.0, 89.0, 131.0, 176.0, 272.0, 434.0, 639.0, 892.0, 1519.0, 2163.0, 3397.0, 5334.0, 8162.0, 13161.0, 21160.0, 35024.0, 60665.0, 114177.0, 287264.0, 249123.0, 103140.0, 55213.0, 32581.0, 19742.0, 12276.0, 7662.0, 4870.0, 3100.0, 2091.0, 1320.0, 832.0, 609.0, 404.0, 250.0, 184.0, 118.0, 84.0, 47.0, 35.0, 21.0, 20.0, 15.0, 7.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.01360321044921875, -0.013190031051635742, -0.012776851654052734, -0.012363672256469727, -0.011950492858886719, -0.011537313461303711, -0.011124134063720703, -0.010710954666137695, -0.010297775268554688, -0.00988459587097168, -0.009471416473388672, -0.009058237075805664, -0.008645057678222656, -0.008231878280639648, -0.00781869888305664, -0.007405519485473633, -0.006992340087890625, -0.006579160690307617, -0.006165981292724609, -0.0057528018951416016, -0.005339622497558594, -0.004926443099975586, -0.004513263702392578, -0.00410008430480957, -0.0036869049072265625, -0.0032737255096435547, -0.002860546112060547, -0.002447366714477539, -0.0020341873168945312, -0.0016210079193115234, -0.0012078285217285156, -0.0007946491241455078, -0.0003814697265625, 3.170967102050781e-05, 0.0004448890686035156, 0.0008580684661865234, 0.0012712478637695312, 0.001684427261352539, 0.002097606658935547, 0.0025107860565185547, 0.0029239654541015625, 0.0033371448516845703, 0.003750324249267578, 0.004163503646850586, 0.004576683044433594, 0.0049898624420166016, 0.005403041839599609, 0.005816221237182617, 0.006229400634765625, 0.006642580032348633, 0.007055759429931641, 0.0074689388275146484, 0.007882118225097656, 0.008295297622680664, 0.008708477020263672, 0.00912165641784668, 0.009534835815429688, 0.009948015213012695, 0.010361194610595703, 0.010774374008178711, 0.011187553405761719, 0.011600732803344727, 0.012013912200927734, 0.012427091598510742, 0.01284027099609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 10.0, 12.0, 9.0, 19.0, 13.0, 12.0, 30.0, 31.0, 26.0, 38.0, 44.0, 33.0, 46.0, 52.0, 52.0, 52.0, 1068.0, 46.0, 53.0, 42.0, 43.0, 27.0, 36.0, 35.0, 40.0, 28.0, 21.0, 19.0, 17.0, 19.0, 10.0, 9.0, 11.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.77734375, -1.727081298828125, -1.67681884765625, -1.626556396484375, -1.5762939453125, -1.526031494140625, -1.47576904296875, -1.425506591796875, -1.375244140625, -1.324981689453125, -1.27471923828125, -1.224456787109375, -1.1741943359375, -1.123931884765625, -1.07366943359375, -1.023406982421875, -0.97314453125, -0.922882080078125, -0.87261962890625, -0.822357177734375, -0.7720947265625, -0.721832275390625, -0.67156982421875, -0.621307373046875, -0.571044921875, -0.520782470703125, -0.47052001953125, -0.420257568359375, -0.3699951171875, -0.319732666015625, -0.26947021484375, -0.219207763671875, -0.1689453125, -0.118682861328125, -0.06842041015625, -0.018157958984375, 0.0321044921875, 0.082366943359375, 0.13262939453125, 0.182891845703125, 0.233154296875, 0.283416748046875, 0.33367919921875, 0.383941650390625, 0.4342041015625, 0.484466552734375, 0.53472900390625, 0.584991455078125, 0.63525390625, 0.685516357421875, 0.73577880859375, 0.786041259765625, 0.8363037109375, 0.886566162109375, 0.93682861328125, 0.987091064453125, 1.037353515625, 1.087615966796875, 1.13787841796875, 1.188140869140625, 1.2384033203125, 1.288665771484375, 1.33892822265625, 1.389190673828125, 1.439453125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 16.0, 12.0, 14.0, 27.0, 53.0, 85.0, 93.0, 164.0, 262.0, 428.0, 677.0, 1084.0, 1773.0, 2976.0, 4931.0, 8603.0, 14747.0, 26485.0, 47523.0, 90889.0, 219700.0, 1392243.0, 136007.0, 65163.0, 35399.0, 19828.0, 11322.0, 6542.0, 3903.0, 2375.0, 1383.0, 881.0, 532.0, 341.0, 220.0, 153.0, 103.0, 62.0, 44.0, 31.0, 16.0, 17.0, 4.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00954437255859375, -0.009228944778442383, -0.008913516998291016, -0.008598089218139648, -0.008282661437988281, -0.007967233657836914, -0.007651805877685547, -0.00733637809753418, -0.0070209503173828125, -0.006705522537231445, -0.006390094757080078, -0.006074666976928711, -0.005759239196777344, -0.0054438114166259766, -0.005128383636474609, -0.004812955856323242, -0.004497528076171875, -0.004182100296020508, -0.0038666725158691406, -0.0035512447357177734, -0.0032358169555664062, -0.002920389175415039, -0.002604961395263672, -0.0022895336151123047, -0.0019741058349609375, -0.0016586780548095703, -0.0013432502746582031, -0.001027822494506836, -0.0007123947143554688, -0.00039696693420410156, -8.153915405273438e-05, 0.0002338886260986328, 0.00054931640625, 0.0008647441864013672, 0.0011801719665527344, 0.0014955997467041016, 0.0018110275268554688, 0.002126455307006836, 0.002441883087158203, 0.0027573108673095703, 0.0030727386474609375, 0.0033881664276123047, 0.003703594207763672, 0.004019021987915039, 0.004334449768066406, 0.0046498775482177734, 0.004965305328369141, 0.005280733108520508, 0.005596160888671875, 0.005911588668823242, 0.006227016448974609, 0.0065424442291259766, 0.006857872009277344, 0.007173299789428711, 0.007488727569580078, 0.007804155349731445, 0.008119583129882812, 0.00843501091003418, 0.008750438690185547, 0.009065866470336914, 0.009381294250488281, 0.009696722030639648, 0.010012149810791016, 0.010327577590942383, 0.01064300537109375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 973.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 19.0, 1.0, 0.0, 10.0, 1.0, 11.0, 0.0, 2.0, 38.0, 55.0, 0.0, 331.0, 2405.0, 11960.0, 0.0, 1018940.0, 11984.0, 2299.0, 0.0, 360.0, 61.0, 38.0, 0.0, 7.0, 4.0, 4.0, 0.0, 5.0, 5.0, 15.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 10.0, 8.0, 7.0, 11.0, 12.0, 16.0, 18.0, 19.0, 10.0, 31.0, 30.0, 24.0, 27.0, 44.0, 39.0, 48.0, 38.0, 21.0, 42.0, 42.0, 54.0, 49.0, 44.0, 37.0, 44.0, 35.0, 31.0, 42.0, 30.0, 24.0, 20.0, 15.0, 20.0, 13.0, 10.0, 6.0, 6.0, 7.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.150390625, -2.081634521484375, -2.01287841796875, -1.944122314453125, -1.8753662109375, -1.806610107421875, -1.73785400390625, -1.669097900390625, -1.600341796875, -1.531585693359375, -1.46282958984375, -1.394073486328125, -1.3253173828125, -1.256561279296875, -1.18780517578125, -1.119049072265625, -1.05029296875, -0.981536865234375, -0.91278076171875, -0.844024658203125, -0.7752685546875, -0.706512451171875, -0.63775634765625, -0.569000244140625, -0.500244140625, -0.431488037109375, -0.36273193359375, -0.293975830078125, -0.2252197265625, -0.156463623046875, -0.08770751953125, -0.018951416015625, 0.0498046875, 0.118560791015625, 0.18731689453125, 0.256072998046875, 0.3248291015625, 0.393585205078125, 0.46234130859375, 0.531097412109375, 0.599853515625, 0.668609619140625, 0.73736572265625, 0.806121826171875, 0.8748779296875, 0.943634033203125, 1.01239013671875, 1.081146240234375, 1.14990234375, 1.218658447265625, 1.28741455078125, 1.356170654296875, 1.4249267578125, 1.493682861328125, 1.56243896484375, 1.631195068359375, 1.699951171875, 1.768707275390625, 1.83746337890625, 1.906219482421875, 1.9749755859375, 2.043731689453125, 2.11248779296875, 2.181243896484375, 2.25]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 5.0, 2.0, 8.0, 11.0, 19.0, 22.0, 28.0, 36.0, 52.0, 77.0, 137.0, 198.0, 309.0, 460.0, 776.0, 1189.0, 1900.0, 2964.0, 4951.0, 8050.0, 13456.0, 22749.0, 40406.0, 93820.0, 431212.0, 270642.0, 70898.0, 34187.0, 19676.0, 11696.0, 7033.0, 4289.0, 2631.0, 1732.0, 1056.0, 627.0, 396.0, 288.0, 173.0, 123.0, 87.0, 52.0, 32.0, 27.0, 21.0, 12.0, 11.0, 8.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.068359375, -2.0013427734375, -1.934326171875, -1.8673095703125, -1.80029296875, -1.7332763671875, -1.666259765625, -1.5992431640625, -1.5322265625, -1.4652099609375, -1.398193359375, -1.3311767578125, -1.26416015625, -1.1971435546875, -1.130126953125, -1.0631103515625, -0.99609375, -0.9290771484375, -0.862060546875, -0.7950439453125, -0.72802734375, -0.6610107421875, -0.593994140625, -0.5269775390625, -0.4599609375, -0.3929443359375, -0.325927734375, -0.2589111328125, -0.19189453125, -0.1248779296875, -0.057861328125, 0.0091552734375, 0.076171875, 0.1431884765625, 0.210205078125, 0.2772216796875, 0.34423828125, 0.4112548828125, 0.478271484375, 0.5452880859375, 0.6123046875, 0.6793212890625, 0.746337890625, 0.8133544921875, 0.88037109375, 0.9473876953125, 1.014404296875, 1.0814208984375, 1.1484375, 1.2154541015625, 1.282470703125, 1.3494873046875, 1.41650390625, 1.4835205078125, 1.550537109375, 1.6175537109375, 1.6845703125, 1.7515869140625, 1.818603515625, 1.8856201171875, 1.95263671875, 2.0196533203125, 2.086669921875, 2.1536865234375, 2.220703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 4.0, 5.0, 6.0, 7.0, 14.0, 13.0, 21.0, 19.0, 22.0, 24.0, 30.0, 32.0, 38.0, 39.0, 61.0, 45.0, 77.0, 116.0, 334.0, 1529.0, 141.0, 80.0, 50.0, 43.0, 41.0, 37.0, 36.0, 26.0, 18.0, 21.0, 25.0, 18.0, 13.0, 12.0, 7.0, 8.0, 8.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7578125, -7.5159912109375, -7.274169921875, -7.0323486328125, -6.79052734375, -6.5487060546875, -6.306884765625, -6.0650634765625, -5.8232421875, -5.5814208984375, -5.339599609375, -5.0977783203125, -4.85595703125, -4.6141357421875, -4.372314453125, -4.1304931640625, -3.888671875, -3.6468505859375, -3.405029296875, -3.1632080078125, -2.92138671875, -2.6795654296875, -2.437744140625, -2.1959228515625, -1.9541015625, -1.7122802734375, -1.470458984375, -1.2286376953125, -0.98681640625, -0.7449951171875, -0.503173828125, -0.2613525390625, -0.01953125, 0.2222900390625, 0.464111328125, 0.7059326171875, 0.94775390625, 1.1895751953125, 1.431396484375, 1.6732177734375, 1.9150390625, 2.1568603515625, 2.398681640625, 2.6405029296875, 2.88232421875, 3.1241455078125, 3.365966796875, 3.6077880859375, 3.849609375, 4.0914306640625, 4.333251953125, 4.5750732421875, 4.81689453125, 5.0587158203125, 5.300537109375, 5.5423583984375, 5.7841796875, 6.0260009765625, 6.267822265625, 6.5096435546875, 6.75146484375, 6.9932861328125, 7.235107421875, 7.4769287109375, 7.71875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 8.0, 6.0, 7.0, 5.0, 14.0, 16.0, 19.0, 27.0, 26.0, 38.0, 52.0, 59.0, 91.0, 150.0, 204.0, 321.0, 1000.0, 3881.0, 32593.0, 2440153.0, 641860.0, 20605.0, 2784.0, 776.0, 345.0, 186.0, 124.0, 82.0, 64.0, 53.0, 39.0, 11.0, 27.0, 23.0, 12.0, 11.0, 4.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.96875, -11.60498046875, -11.2412109375, -10.87744140625, -10.513671875, -10.14990234375, -9.7861328125, -9.42236328125, -9.05859375, -8.69482421875, -8.3310546875, -7.96728515625, -7.603515625, -7.23974609375, -6.8759765625, -6.51220703125, -6.1484375, -5.78466796875, -5.4208984375, -5.05712890625, -4.693359375, -4.32958984375, -3.9658203125, -3.60205078125, -3.23828125, -2.87451171875, -2.5107421875, -2.14697265625, -1.783203125, -1.41943359375, -1.0556640625, -0.69189453125, -0.328125, 0.03564453125, 0.3994140625, 0.76318359375, 1.126953125, 1.49072265625, 1.8544921875, 2.21826171875, 2.58203125, 2.94580078125, 3.3095703125, 3.67333984375, 4.037109375, 4.40087890625, 4.7646484375, 5.12841796875, 5.4921875, 5.85595703125, 6.2197265625, 6.58349609375, 6.947265625, 7.31103515625, 7.6748046875, 8.03857421875, 8.40234375, 8.76611328125, 9.1298828125, 9.49365234375, 9.857421875, 10.22119140625, 10.5849609375, 10.94873046875, 11.3125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 248.0, 686.0, 76.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.660686492919922, -23.813861846923828, -20.967037200927734, -18.12021255493164, -15.27338695526123, -12.426562309265137, -9.579736709594727, -6.732912063598633, -3.886087417602539, -1.0392625331878662, 1.8075623512268066, 4.654387474060059, 7.501212120056152, 10.348036766052246, 13.194862365722656, 16.04168701171875, 18.888511657714844, 21.735336303710938, 24.58216094970703, 27.428985595703125, 30.27581024169922, 33.12263488769531, 35.969459533691406, 38.8162841796875, 41.663108825683594, 44.50993347167969, 47.35675811767578, 50.203582763671875, 53.05040740966797, 55.89723205566406, 58.744056701660156, 61.59088134765625, 64.43770599365234, 67.28453063964844, 70.13135528564453, 72.97817993164062, 75.82500457763672, 78.67182922363281, 81.5186538696289, 84.365478515625, 87.2123031616211, 90.05912780761719, 92.90595245361328, 95.75277709960938, 98.59960174560547, 101.44642639160156, 104.29325103759766, 107.14007568359375, 109.98690795898438, 112.83373260498047, 115.68055725097656, 118.52738189697266, 121.37420654296875, 124.22103118896484, 127.06785583496094, 129.91468811035156, 132.76150512695312, 135.60833740234375, 138.4551544189453, 141.30198669433594, 144.1488037109375, 146.99563598632812, 149.8424530029297, 152.6892852783203, 155.53610229492188]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 5.0, 7.0, 11.0, 7.0, 7.0, 22.0, 19.0, 21.0, 23.0, 25.0, 26.0, 22.0, 29.0, 43.0, 40.0, 37.0, 36.0, 39.0, 36.0, 44.0, 48.0, 38.0, 31.0, 43.0, 37.0, 35.0, 39.0, 30.0, 28.0, 20.0, 24.0, 20.0, 20.0, 13.0, 14.0, 12.0, 9.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.083560943603516, -23.362991333007812, -22.64242172241211, -21.921852111816406, -21.201282501220703, -20.480712890625, -19.760143280029297, -19.03957176208496, -18.319002151489258, -17.598432540893555, -16.87786293029785, -16.15729331970215, -15.436722755432129, -14.716153144836426, -13.995583534240723, -13.275012969970703, -12.554444313049316, -11.833874702453613, -11.11330509185791, -10.39273452758789, -9.672164916992188, -8.951595306396484, -8.231025695800781, -7.51045560836792, -6.789885997772217, -6.069316387176514, -5.348746299743652, -4.628176689147949, -3.907606840133667, -3.1870369911193848, -2.4664673805236816, -1.7458972930908203, -1.0253276824951172, -0.30475789308547974, 0.4158118963241577, 1.1363816261291504, 1.8569514751434326, 2.577521324157715, 3.298090934753418, 4.018661022186279, 4.739230632781982, 5.4598002433776855, 6.180370330810547, 6.90093994140625, 7.621509552001953, 8.342079162597656, 9.06264877319336, 9.783219337463379, 10.503788948059082, 11.224358558654785, 11.944928169250488, 12.665498733520508, 13.386068344116211, 14.106637954711914, 14.827207565307617, 15.54777717590332, 16.268346786499023, 16.988916397094727, 17.70948600769043, 18.430055618286133, 19.150625228881836, 19.871196746826172, 20.591766357421875, 21.312335968017578, 22.03290557861328]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 3.0, 6.0, 4.0, 13.0, 3.0, 8.0, 12.0, 18.0, 17.0, 17.0, 21.0, 25.0, 33.0, 30.0, 33.0, 35.0, 34.0, 45.0, 42.0, 30.0, 37.0, 42.0, 57.0, 47.0, 45.0, 36.0, 41.0, 43.0, 33.0, 32.0, 30.0, 18.0, 25.0, 19.0, 17.0, 11.0, 10.0, 8.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.283203125, -2.212066650390625, -2.14093017578125, -2.069793701171875, -1.9986572265625, -1.927520751953125, -1.85638427734375, -1.785247802734375, -1.714111328125, -1.642974853515625, -1.57183837890625, -1.500701904296875, -1.4295654296875, -1.358428955078125, -1.28729248046875, -1.216156005859375, -1.14501953125, -1.073883056640625, -1.00274658203125, -0.931610107421875, -0.8604736328125, -0.789337158203125, -0.71820068359375, -0.647064208984375, -0.575927734375, -0.504791259765625, -0.43365478515625, -0.362518310546875, -0.2913818359375, -0.220245361328125, -0.14910888671875, -0.077972412109375, -0.0068359375, 0.064300537109375, 0.13543701171875, 0.206573486328125, 0.2777099609375, 0.348846435546875, 0.41998291015625, 0.491119384765625, 0.562255859375, 0.633392333984375, 0.70452880859375, 0.775665283203125, 0.8468017578125, 0.917938232421875, 0.98907470703125, 1.060211181640625, 1.13134765625, 1.202484130859375, 1.27362060546875, 1.344757080078125, 1.4158935546875, 1.487030029296875, 1.55816650390625, 1.629302978515625, 1.700439453125, 1.771575927734375, 1.84271240234375, 1.913848876953125, 1.9849853515625, 2.056121826171875, 2.12725830078125, 2.198394775390625, 2.26953125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 9.0, 10.0, 20.0, 25.0, 51.0, 58.0, 95.0, 133.0, 223.0, 349.0, 530.0, 916.0, 1589.0, 2732.0, 5107.0, 9536.0, 18982.0, 39965.0, 90610.0, 237036.0, 766115.0, 1652928.0, 900227.0, 277134.0, 101578.0, 44403.0, 20862.0, 10279.0, 5528.0, 3022.0, 1629.0, 952.0, 582.0, 364.0, 230.0, 167.0, 88.0, 74.0, 44.0, 29.0, 22.0, 13.0, 11.0, 9.0, 7.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.3673095703125, -3.263916015625, -3.1605224609375, -3.05712890625, -2.9537353515625, -2.850341796875, -2.7469482421875, -2.6435546875, -2.5401611328125, -2.436767578125, -2.3333740234375, -2.22998046875, -2.1265869140625, -2.023193359375, -1.9197998046875, -1.81640625, -1.7130126953125, -1.609619140625, -1.5062255859375, -1.40283203125, -1.2994384765625, -1.196044921875, -1.0926513671875, -0.9892578125, -0.8858642578125, -0.782470703125, -0.6790771484375, -0.57568359375, -0.4722900390625, -0.368896484375, -0.2655029296875, -0.162109375, -0.0587158203125, 0.044677734375, 0.1480712890625, 0.25146484375, 0.3548583984375, 0.458251953125, 0.5616455078125, 0.6650390625, 0.7684326171875, 0.871826171875, 0.9752197265625, 1.07861328125, 1.1820068359375, 1.285400390625, 1.3887939453125, 1.4921875, 1.5955810546875, 1.698974609375, 1.8023681640625, 1.90576171875, 2.0091552734375, 2.112548828125, 2.2159423828125, 2.3193359375, 2.4227294921875, 2.526123046875, 2.6295166015625, 2.73291015625, 2.8363037109375, 2.939697265625, 3.0430908203125, 3.146484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 9.0, 12.0, 13.0, 16.0, 13.0, 19.0, 40.0, 44.0, 72.0, 82.0, 95.0, 141.0, 219.0, 283.0, 327.0, 401.0, 439.0, 431.0, 329.0, 256.0, 216.0, 162.0, 112.0, 103.0, 73.0, 49.0, 30.0, 20.0, 16.0, 13.0, 10.0, 5.0, 5.0, 0.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.12890625, -6.9437255859375, -6.758544921875, -6.5733642578125, -6.38818359375, -6.2030029296875, -6.017822265625, -5.8326416015625, -5.6474609375, -5.4622802734375, -5.277099609375, -5.0919189453125, -4.90673828125, -4.7215576171875, -4.536376953125, -4.3511962890625, -4.166015625, -3.9808349609375, -3.795654296875, -3.6104736328125, -3.42529296875, -3.2401123046875, -3.054931640625, -2.8697509765625, -2.6845703125, -2.4993896484375, -2.314208984375, -2.1290283203125, -1.94384765625, -1.7586669921875, -1.573486328125, -1.3883056640625, -1.203125, -1.0179443359375, -0.832763671875, -0.6475830078125, -0.46240234375, -0.2772216796875, -0.092041015625, 0.0931396484375, 0.2783203125, 0.4635009765625, 0.648681640625, 0.8338623046875, 1.01904296875, 1.2042236328125, 1.389404296875, 1.5745849609375, 1.759765625, 1.9449462890625, 2.130126953125, 2.3153076171875, 2.50048828125, 2.6856689453125, 2.870849609375, 3.0560302734375, 3.2412109375, 3.4263916015625, 3.611572265625, 3.7967529296875, 3.98193359375, 4.1671142578125, 4.352294921875, 4.5374755859375, 4.72265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 20.0, 33.0, 33.0, 50.0, 80.0, 124.0, 234.0, 368.0, 691.0, 1566.0, 4511.0, 16015.0, 76422.0, 503492.0, 2668388.0, 780589.0, 110327.0, 21601.0, 5801.0, 1995.0, 814.0, 428.0, 251.0, 139.0, 92.0, 62.0, 44.0, 26.0, 19.0, 14.0, 7.0, 11.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.0103759765625, -7.684814453125, -7.3592529296875, -7.03369140625, -6.7081298828125, -6.382568359375, -6.0570068359375, -5.7314453125, -5.4058837890625, -5.080322265625, -4.7547607421875, -4.42919921875, -4.1036376953125, -3.778076171875, -3.4525146484375, -3.126953125, -2.8013916015625, -2.475830078125, -2.1502685546875, -1.82470703125, -1.4991455078125, -1.173583984375, -0.8480224609375, -0.5224609375, -0.1968994140625, 0.128662109375, 0.4542236328125, 0.77978515625, 1.1053466796875, 1.430908203125, 1.7564697265625, 2.08203125, 2.4075927734375, 2.733154296875, 3.0587158203125, 3.38427734375, 3.7098388671875, 4.035400390625, 4.3609619140625, 4.6865234375, 5.0120849609375, 5.337646484375, 5.6632080078125, 5.98876953125, 6.3143310546875, 6.639892578125, 6.9654541015625, 7.291015625, 7.6165771484375, 7.942138671875, 8.2677001953125, 8.59326171875, 8.9188232421875, 9.244384765625, 9.5699462890625, 9.8955078125, 10.2210693359375, 10.546630859375, 10.8721923828125, 11.19775390625, 11.5233154296875, 11.848876953125, 12.1744384765625, 12.5]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 9.0, 24.0, 37.0, 75.0, 111.0, 144.0, 173.0, 141.0, 122.0, 79.0, 58.0, 24.0, 10.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.887874603271484, -43.20592498779297, -41.52397537231445, -39.84202575683594, -38.16007995605469, -36.478126525878906, -34.796180725097656, -33.11423110961914, -31.432281494140625, -29.75033187866211, -28.068382263183594, -26.38643455505371, -24.704484939575195, -23.02253532409668, -21.340587615966797, -19.65863800048828, -17.976688385009766, -16.29473876953125, -14.61279010772705, -12.930841445922852, -11.248891830444336, -9.56694221496582, -7.884993553161621, -6.203044891357422, -4.521095275878906, -2.839146137237549, -1.1571969985961914, 0.524752140045166, 2.2067012786865234, 3.888650894165039, 5.570599555969238, 7.2525482177734375, 8.934494018554688, 10.616443634033203, 12.298392295837402, 13.980340957641602, 15.662290573120117, 17.344240188598633, 19.026187896728516, 20.70813751220703, 22.390087127685547, 24.072036743164062, 25.753986358642578, 27.43593406677246, 29.117883682250977, 30.799833297729492, 32.481781005859375, 34.16373062133789, 35.845680236816406, 37.52762985229492, 39.20957946777344, 40.89152908325195, 42.57347869873047, 44.25542449951172, 45.937374114990234, 47.61932373046875, 49.301273345947266, 50.98322296142578, 52.6651725769043, 54.34712219238281, 56.02906799316406, 57.711021423339844, 59.392967224121094, 61.07491683959961, 62.756866455078125]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 3.0, 9.0, 4.0, 8.0, 7.0, 9.0, 14.0, 11.0, 16.0, 23.0, 22.0, 27.0, 32.0, 30.0, 24.0, 31.0, 46.0, 36.0, 52.0, 35.0, 54.0, 38.0, 45.0, 41.0, 42.0, 33.0, 33.0, 26.0, 33.0, 29.0, 20.0, 21.0, 23.0, 24.0, 23.0, 17.0, 14.0, 10.0, 7.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.47724151611328, -19.817333221435547, -19.15742301940918, -18.497514724731445, -17.837604522705078, -17.177696228027344, -16.517786026000977, -15.857877731323242, -15.197968482971191, -14.53805923461914, -13.87814998626709, -13.218240737915039, -12.558332443237305, -11.898422241210938, -11.238513946533203, -10.578604698181152, -9.918695449829102, -9.25878620147705, -8.598876953125, -7.938968181610107, -7.279058933258057, -6.619149684906006, -5.959240913391113, -5.2993316650390625, -4.639422416687012, -3.979513168334961, -3.3196041584014893, -2.6596951484680176, -1.9997859001159668, -1.339876651763916, -0.6799676418304443, -0.020058631896972656, 0.6398506164550781, 1.2997597455978394, 1.9596688747406006, 2.6195778846740723, 3.279487133026123, 3.939396381378174, 4.599305152893066, 5.259214401245117, 5.919123649597168, 6.579032897949219, 7.2389421463012695, 7.898850917816162, 8.558759689331055, 9.218669891357422, 9.878578186035156, 10.538487434387207, 11.198396682739258, 11.858305931091309, 12.51821517944336, 13.17812442779541, 13.838033676147461, 14.497941970825195, 15.157851219177246, 15.817760467529297, 16.47766876220703, 17.137577056884766, 17.797487258911133, 18.457395553588867, 19.117305755615234, 19.77721405029297, 20.437124252319336, 21.09703254699707, 21.756942749023438]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 7.0, 3.0, 6.0, 4.0, 11.0, 7.0, 16.0, 17.0, 15.0, 13.0, 16.0, 36.0, 30.0, 39.0, 28.0, 28.0, 34.0, 42.0, 39.0, 55.0, 38.0, 40.0, 50.0, 34.0, 45.0, 33.0, 39.0, 37.0, 19.0, 26.0, 32.0, 23.0, 20.0, 32.0, 18.0, 12.0, 11.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0078125, -1.939056396484375, -1.87030029296875, -1.801544189453125, -1.7327880859375, -1.664031982421875, -1.59527587890625, -1.526519775390625, -1.457763671875, -1.389007568359375, -1.32025146484375, -1.251495361328125, -1.1827392578125, -1.113983154296875, -1.04522705078125, -0.976470947265625, -0.90771484375, -0.838958740234375, -0.77020263671875, -0.701446533203125, -0.6326904296875, -0.563934326171875, -0.49517822265625, -0.426422119140625, -0.357666015625, -0.288909912109375, -0.22015380859375, -0.151397705078125, -0.0826416015625, -0.013885498046875, 0.05487060546875, 0.123626708984375, 0.1923828125, 0.261138916015625, 0.32989501953125, 0.398651123046875, 0.4674072265625, 0.536163330078125, 0.60491943359375, 0.673675537109375, 0.742431640625, 0.811187744140625, 0.87994384765625, 0.948699951171875, 1.0174560546875, 1.086212158203125, 1.15496826171875, 1.223724365234375, 1.29248046875, 1.361236572265625, 1.42999267578125, 1.498748779296875, 1.5675048828125, 1.636260986328125, 1.70501708984375, 1.773773193359375, 1.842529296875, 1.911285400390625, 1.98004150390625, 2.048797607421875, 2.1175537109375, 2.186309814453125, 2.25506591796875, 2.323822021484375, 2.392578125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 3.0, 14.0, 23.0, 26.0, 35.0, 74.0, 102.0, 169.0, 252.0, 375.0, 540.0, 780.0, 1087.0, 1770.0, 2730.0, 4116.0, 6308.0, 10217.0, 16300.0, 26546.0, 44655.0, 78352.0, 164455.0, 350468.0, 152501.0, 74824.0, 42920.0, 25356.0, 15864.0, 9933.0, 6132.0, 3985.0, 2572.0, 1700.0, 1046.0, 736.0, 492.0, 399.0, 243.0, 166.0, 106.0, 61.0, 31.0, 34.0, 19.0, 15.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.013885498046875, -0.01348257064819336, -0.013079643249511719, -0.012676715850830078, -0.012273788452148438, -0.011870861053466797, -0.011467933654785156, -0.011065006256103516, -0.010662078857421875, -0.010259151458740234, -0.009856224060058594, -0.009453296661376953, -0.009050369262695312, -0.008647441864013672, -0.008244514465332031, -0.00784158706665039, -0.00743865966796875, -0.007035732269287109, -0.006632804870605469, -0.006229877471923828, -0.0058269500732421875, -0.005424022674560547, -0.005021095275878906, -0.004618167877197266, -0.004215240478515625, -0.0038123130798339844, -0.0034093856811523438, -0.003006458282470703, -0.0026035308837890625, -0.002200603485107422, -0.0017976760864257812, -0.0013947486877441406, -0.0009918212890625, -0.0005888938903808594, -0.00018596649169921875, 0.00021696090698242188, 0.0006198883056640625, 0.0010228157043457031, 0.0014257431030273438, 0.0018286705017089844, 0.002231597900390625, 0.0026345252990722656, 0.0030374526977539062, 0.003440380096435547, 0.0038433074951171875, 0.004246234893798828, 0.004649162292480469, 0.005052089691162109, 0.00545501708984375, 0.005857944488525391, 0.006260871887207031, 0.006663799285888672, 0.0070667266845703125, 0.007469654083251953, 0.007872581481933594, 0.008275508880615234, 0.008678436279296875, 0.009081363677978516, 0.009484291076660156, 0.009887218475341797, 0.010290145874023438, 0.010693073272705078, 0.011096000671386719, 0.01149892807006836, 0.01190185546875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 4.0, 5.0, 10.0, 11.0, 12.0, 15.0, 12.0, 22.0, 20.0, 22.0, 23.0, 29.0, 24.0, 31.0, 37.0, 35.0, 38.0, 30.0, 35.0, 49.0, 1077.0, 42.0, 39.0, 31.0, 32.0, 39.0, 28.0, 26.0, 19.0, 42.0, 37.0, 26.0, 24.0, 15.0, 11.0, 10.0, 13.0, 13.0, 8.0, 9.0, 8.0, 4.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.341796875, -1.29779052734375, -1.2537841796875, -1.20977783203125, -1.165771484375, -1.12176513671875, -1.0777587890625, -1.03375244140625, -0.98974609375, -0.94573974609375, -0.9017333984375, -0.85772705078125, -0.813720703125, -0.76971435546875, -0.7257080078125, -0.68170166015625, -0.6376953125, -0.59368896484375, -0.5496826171875, -0.50567626953125, -0.461669921875, -0.41766357421875, -0.3736572265625, -0.32965087890625, -0.28564453125, -0.24163818359375, -0.1976318359375, -0.15362548828125, -0.109619140625, -0.06561279296875, -0.0216064453125, 0.02239990234375, 0.06640625, 0.11041259765625, 0.1544189453125, 0.19842529296875, 0.242431640625, 0.28643798828125, 0.3304443359375, 0.37445068359375, 0.41845703125, 0.46246337890625, 0.5064697265625, 0.55047607421875, 0.594482421875, 0.63848876953125, 0.6824951171875, 0.72650146484375, 0.7705078125, 0.81451416015625, 0.8585205078125, 0.90252685546875, 0.946533203125, 0.99053955078125, 1.0345458984375, 1.07855224609375, 1.12255859375, 1.16656494140625, 1.2105712890625, 1.25457763671875, 1.298583984375, 1.34259033203125, 1.3865966796875, 1.43060302734375, 1.474609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 6.0, 3.0, 17.0, 26.0, 28.0, 56.0, 75.0, 107.0, 174.0, 282.0, 409.0, 565.0, 1001.0, 1426.0, 2142.0, 3343.0, 5138.0, 7950.0, 12644.0, 19920.0, 31359.0, 50583.0, 85013.0, 170741.0, 1352403.0, 148008.0, 76716.0, 46739.0, 28977.0, 18179.0, 11692.0, 7619.0, 4697.0, 3112.0, 2041.0, 1295.0, 913.0, 555.0, 401.0, 247.0, 179.0, 118.0, 77.0, 49.0, 25.0, 35.0, 22.0, 5.0, 11.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00872802734375, -0.008466839790344238, -0.008205652236938477, -0.007944464683532715, -0.007683277130126953, -0.007422089576721191, -0.00716090202331543, -0.006899714469909668, -0.006638526916503906, -0.0063773393630981445, -0.006116151809692383, -0.005854964256286621, -0.005593776702880859, -0.005332589149475098, -0.005071401596069336, -0.004810214042663574, -0.0045490264892578125, -0.004287838935852051, -0.004026651382446289, -0.0037654638290405273, -0.0035042762756347656, -0.003243088722229004, -0.002981901168823242, -0.0027207136154174805, -0.0024595260620117188, -0.002198338508605957, -0.0019371509552001953, -0.0016759634017944336, -0.0014147758483886719, -0.0011535882949829102, -0.0008924007415771484, -0.0006312131881713867, -0.000370025634765625, -0.00010883808135986328, 0.00015234947204589844, 0.00041353702545166016, 0.0006747245788574219, 0.0009359121322631836, 0.0011970996856689453, 0.001458287239074707, 0.0017194747924804688, 0.0019806623458862305, 0.002241849899291992, 0.002503037452697754, 0.0027642250061035156, 0.0030254125595092773, 0.003286600112915039, 0.0035477876663208008, 0.0038089752197265625, 0.004070162773132324, 0.004331350326538086, 0.004592537879943848, 0.004853725433349609, 0.005114912986755371, 0.005376100540161133, 0.0056372880935668945, 0.005898475646972656, 0.006159663200378418, 0.00642085075378418, 0.006682038307189941, 0.006943225860595703, 0.007204413414001465, 0.0074656009674072266, 0.007726788520812988, 0.00798797607421875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 968.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 17.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 0.0, 46.0, 52.0, 0.0, 256.0, 2449.0, 0.0, 13420.0, 0.0, 1015763.0, 13756.0, 0.0, 2366.0, 274.0, 0.0, 63.0, 30.0, 0.0, 13.0, 0.0, 7.0, 2.0, 0.0, 0.0, 5.0, 0.0, 11.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0728836059570312e-06, -1.0346993803977966e-06, -9.96515154838562e-07, -9.583309292793274e-07, -9.201467037200928e-07, -8.819624781608582e-07, -8.437782526016235e-07, -8.055940270423889e-07, -7.674098014831543e-07, -7.292255759239197e-07, -6.910413503646851e-07, -6.528571248054504e-07, -6.146728992462158e-07, -5.764886736869812e-07, -5.383044481277466e-07, -5.00120222568512e-07, -4.6193599700927734e-07, -4.237517714500427e-07, -3.855675458908081e-07, -3.473833203315735e-07, -3.0919909477233887e-07, -2.7101486921310425e-07, -2.3283064365386963e-07, -1.94646418094635e-07, -1.564621925354004e-07, -1.1827796697616577e-07, -8.009374141693115e-08, -4.190951585769653e-08, -3.725290298461914e-09, 3.4458935260772705e-08, 7.264316082000732e-08, 1.1082738637924194e-07, 1.4901161193847656e-07, 1.8719583749771118e-07, 2.253800630569458e-07, 2.635642886161804e-07, 3.0174851417541504e-07, 3.3993273973464966e-07, 3.781169652938843e-07, 4.163011908531189e-07, 4.544854164123535e-07, 4.926696419715881e-07, 5.308538675308228e-07, 5.690380930900574e-07, 6.07222318649292e-07, 6.454065442085266e-07, 6.835907697677612e-07, 7.217749953269958e-07, 7.599592208862305e-07, 7.981434464454651e-07, 8.363276720046997e-07, 8.745118975639343e-07, 9.126961231231689e-07, 9.508803486824036e-07, 9.890645742416382e-07, 1.0272487998008728e-06, 1.0654330253601074e-06, 1.103617250919342e-06, 1.1418014764785767e-06, 1.1799857020378113e-06, 1.218169927597046e-06, 1.2563541531562805e-06, 1.2945383787155151e-06, 1.3327226042747498e-06, 1.3709068298339844e-06]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 4.0, 7.0, 3.0, 6.0, 4.0, 11.0, 7.0, 16.0, 17.0, 15.0, 13.0, 16.0, 36.0, 30.0, 39.0, 28.0, 28.0, 34.0, 42.0, 39.0, 55.0, 38.0, 40.0, 50.0, 34.0, 45.0, 33.0, 39.0, 37.0, 19.0, 26.0, 32.0, 23.0, 20.0, 32.0, 18.0, 12.0, 11.0, 12.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0078125, -1.939056396484375, -1.87030029296875, -1.801544189453125, -1.7327880859375, -1.664031982421875, -1.59527587890625, -1.526519775390625, -1.457763671875, -1.389007568359375, -1.32025146484375, -1.251495361328125, -1.1827392578125, -1.113983154296875, -1.04522705078125, -0.976470947265625, -0.90771484375, -0.838958740234375, -0.77020263671875, -0.701446533203125, -0.6326904296875, -0.563934326171875, -0.49517822265625, -0.426422119140625, -0.357666015625, -0.288909912109375, -0.22015380859375, -0.151397705078125, -0.0826416015625, -0.013885498046875, 0.05487060546875, 0.123626708984375, 0.1923828125, 0.261138916015625, 0.32989501953125, 0.398651123046875, 0.4674072265625, 0.536163330078125, 0.60491943359375, 0.673675537109375, 0.742431640625, 0.811187744140625, 0.87994384765625, 0.948699951171875, 1.0174560546875, 1.086212158203125, 1.15496826171875, 1.223724365234375, 1.29248046875, 1.361236572265625, 1.42999267578125, 1.498748779296875, 1.5675048828125, 1.636260986328125, 1.70501708984375, 1.773773193359375, 1.842529296875, 1.911285400390625, 1.98004150390625, 2.048797607421875, 2.1175537109375, 2.186309814453125, 2.25506591796875, 2.323822021484375, 2.392578125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 7.0, 1.0, 10.0, 13.0, 16.0, 26.0, 39.0, 45.0, 73.0, 75.0, 132.0, 183.0, 257.0, 334.0, 515.0, 732.0, 974.0, 1458.0, 2066.0, 2930.0, 4293.0, 6124.0, 9236.0, 14218.0, 23583.0, 49575.0, 144409.0, 479019.0, 177936.0, 57383.0, 26492.0, 15290.0, 9802.0, 6509.0, 4459.0, 3121.0, 2158.0, 1416.0, 1018.0, 733.0, 553.0, 396.0, 265.0, 213.0, 137.0, 111.0, 81.0, 51.0, 32.0, 15.0, 22.0, 14.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.0078125, -1.9461822509765625, -1.884552001953125, -1.8229217529296875, -1.76129150390625, -1.6996612548828125, -1.638031005859375, -1.5764007568359375, -1.5147705078125, -1.4531402587890625, -1.391510009765625, -1.3298797607421875, -1.26824951171875, -1.2066192626953125, -1.144989013671875, -1.0833587646484375, -1.021728515625, -0.9600982666015625, -0.898468017578125, -0.8368377685546875, -0.77520751953125, -0.7135772705078125, -0.651947021484375, -0.5903167724609375, -0.5286865234375, -0.4670562744140625, -0.405426025390625, -0.3437957763671875, -0.28216552734375, -0.2205352783203125, -0.158905029296875, -0.0972747802734375, -0.03564453125, 0.0259857177734375, 0.087615966796875, 0.1492462158203125, 0.21087646484375, 0.2725067138671875, 0.334136962890625, 0.3957672119140625, 0.4573974609375, 0.5190277099609375, 0.580657958984375, 0.6422882080078125, 0.70391845703125, 0.7655487060546875, 0.827178955078125, 0.8888092041015625, 0.950439453125, 1.0120697021484375, 1.073699951171875, 1.1353302001953125, 1.19696044921875, 1.2585906982421875, 1.320220947265625, 1.3818511962890625, 1.4434814453125, 1.5051116943359375, 1.566741943359375, 1.6283721923828125, 1.69000244140625, 1.7516326904296875, 1.813262939453125, 1.8748931884765625, 1.9365234375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 8.0, 6.0, 13.0, 16.0, 14.0, 16.0, 31.0, 18.0, 36.0, 31.0, 32.0, 44.0, 48.0, 77.0, 75.0, 142.0, 1680.0, 243.0, 93.0, 60.0, 48.0, 47.0, 38.0, 31.0, 39.0, 29.0, 19.0, 21.0, 16.0, 17.0, 14.0, 4.0, 7.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25, -7.9720458984375, -7.694091796875, -7.4161376953125, -7.13818359375, -6.8602294921875, -6.582275390625, -6.3043212890625, -6.0263671875, -5.7484130859375, -5.470458984375, -5.1925048828125, -4.91455078125, -4.6365966796875, -4.358642578125, -4.0806884765625, -3.802734375, -3.5247802734375, -3.246826171875, -2.9688720703125, -2.69091796875, -2.4129638671875, -2.135009765625, -1.8570556640625, -1.5791015625, -1.3011474609375, -1.023193359375, -0.7452392578125, -0.46728515625, -0.1893310546875, 0.088623046875, 0.3665771484375, 0.64453125, 0.9224853515625, 1.200439453125, 1.4783935546875, 1.75634765625, 2.0343017578125, 2.312255859375, 2.5902099609375, 2.8681640625, 3.1461181640625, 3.424072265625, 3.7020263671875, 3.97998046875, 4.2579345703125, 4.535888671875, 4.8138427734375, 5.091796875, 5.3697509765625, 5.647705078125, 5.9256591796875, 6.20361328125, 6.4815673828125, 6.759521484375, 7.0374755859375, 7.3154296875, 7.5933837890625, 7.871337890625, 8.1492919921875, 8.42724609375, 8.7052001953125, 8.983154296875, 9.2611083984375, 9.5390625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 9.0, 7.0, 16.0, 21.0, 18.0, 27.0, 21.0, 39.0, 60.0, 67.0, 114.0, 162.0, 222.0, 400.0, 1986.0, 29673.0, 3009534.0, 97732.0, 4067.0, 610.0, 258.0, 181.0, 109.0, 88.0, 72.0, 50.0, 27.0, 29.0, 25.0, 16.0, 19.0, 8.0, 3.0, 8.0, 11.0, 2.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.8125, -17.2984619140625, -16.784423828125, -16.2703857421875, -15.75634765625, -15.2423095703125, -14.728271484375, -14.2142333984375, -13.7001953125, -13.1861572265625, -12.672119140625, -12.1580810546875, -11.64404296875, -11.1300048828125, -10.615966796875, -10.1019287109375, -9.587890625, -9.0738525390625, -8.559814453125, -8.0457763671875, -7.53173828125, -7.0177001953125, -6.503662109375, -5.9896240234375, -5.4755859375, -4.9615478515625, -4.447509765625, -3.9334716796875, -3.41943359375, -2.9053955078125, -2.391357421875, -1.8773193359375, -1.36328125, -0.8492431640625, -0.335205078125, 0.1788330078125, 0.69287109375, 1.2069091796875, 1.720947265625, 2.2349853515625, 2.7490234375, 3.2630615234375, 3.777099609375, 4.2911376953125, 4.80517578125, 5.3192138671875, 5.833251953125, 6.3472900390625, 6.861328125, 7.3753662109375, 7.889404296875, 8.4034423828125, 8.91748046875, 9.4315185546875, 9.945556640625, 10.4595947265625, 10.9736328125, 11.4876708984375, 12.001708984375, 12.5157470703125, 13.02978515625, 13.5438232421875, 14.057861328125, 14.5718994140625, 15.0859375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 169.0, 677.0, 163.0], "bins": [-141.75186157226562, -139.48297119140625, -137.21408081054688, -134.94520568847656, -132.6763153076172, -130.4074249267578, -128.13853454589844, -125.8696517944336, -123.60076141357422, -121.33187103271484, -119.06298828125, -116.79409790039062, -114.52521514892578, -112.2563247680664, -109.98744201660156, -107.71855163574219, -105.44966125488281, -103.18077087402344, -100.9118881225586, -98.64299774169922, -96.37411499023438, -94.105224609375, -91.83633422851562, -89.56745147705078, -87.29856872558594, -85.02967834472656, -82.76079559326172, -80.49190521240234, -78.2230224609375, -75.95413208007812, -73.68524169921875, -71.4163589477539, -69.14747619628906, -66.87858581542969, -64.60970306396484, -62.34081268310547, -60.07192611694336, -57.80303955078125, -55.53415298461914, -53.26526641845703, -50.996376037597656, -48.72748947143555, -46.45860290527344, -44.18971252441406, -41.92082595825195, -39.651939392089844, -37.383052825927734, -35.114166259765625, -32.84527587890625, -30.57638931274414, -28.3075008392334, -26.03861427307129, -23.769725799560547, -21.500839233398438, -19.231952667236328, -16.96306610107422, -14.694177627563477, -12.42529010772705, -10.156402587890625, -7.887516021728516, -5.61862850189209, -3.349740982055664, -1.0808544158935547, 1.188033103942871, 3.4569203853607178]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 12.0, 18.0, 12.0, 20.0, 20.0, 18.0, 24.0, 26.0, 36.0, 30.0, 46.0, 46.0, 37.0, 34.0, 57.0, 59.0, 43.0, 35.0, 35.0, 41.0, 41.0, 31.0, 35.0, 25.0, 32.0, 26.0, 23.0, 20.0, 24.0, 17.0, 10.0, 12.0, 13.0, 6.0, 2.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.954151153564453, -18.2750301361084, -17.595909118652344, -16.91678810119629, -16.237667083740234, -15.55854606628418, -14.879426002502441, -14.200304985046387, -13.521183967590332, -12.842062950134277, -12.162941932678223, -11.483821868896484, -10.80470085144043, -10.125579833984375, -9.44645881652832, -8.767337799072266, -8.088216781616211, -7.409095764160156, -6.729974746704102, -6.050854206085205, -5.37173318862915, -4.692612171173096, -4.013491630554199, -3.3343706130981445, -2.65524959564209, -1.9761286973953247, -1.2970077991485596, -0.617887020111084, 0.0612339973449707, 0.7403550148010254, 1.4194755554199219, 2.0985965728759766, 2.777719497680664, 3.4568405151367188, 4.135961532592773, 4.81508207321167, 5.494203090667725, 6.173324108123779, 6.852444648742676, 7.5315656661987305, 8.210686683654785, 8.88980770111084, 9.568928718566895, 10.248048782348633, 10.927169799804688, 11.606290817260742, 12.285411834716797, 12.964532852172852, 13.643653869628906, 14.322774887084961, 15.001895904541016, 15.68101692199707, 16.360137939453125, 17.03925895690918, 17.718379974365234, 18.397499084472656, 19.076622009277344, 19.7557430267334, 20.434864044189453, 21.113985061645508, 21.793106079101562, 22.472227096557617, 23.151348114013672, 23.830467224121094, 24.50958824157715]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 6.0, 12.0, 7.0, 13.0, 20.0, 15.0, 22.0, 17.0, 23.0, 32.0, 34.0, 41.0, 27.0, 38.0, 43.0, 36.0, 34.0, 40.0, 52.0, 47.0, 39.0, 36.0, 43.0, 27.0, 32.0, 29.0, 24.0, 23.0, 38.0, 27.0, 16.0, 14.0, 19.0, 12.0, 17.0, 4.0, 4.0, 1.0, 4.0, 6.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1015625, -2.031890869140625, -1.96221923828125, -1.892547607421875, -1.8228759765625, -1.753204345703125, -1.68353271484375, -1.613861083984375, -1.544189453125, -1.474517822265625, -1.40484619140625, -1.335174560546875, -1.2655029296875, -1.195831298828125, -1.12615966796875, -1.056488037109375, -0.98681640625, -0.917144775390625, -0.84747314453125, -0.777801513671875, -0.7081298828125, -0.638458251953125, -0.56878662109375, -0.499114990234375, -0.429443359375, -0.359771728515625, -0.29010009765625, -0.220428466796875, -0.1507568359375, -0.081085205078125, -0.01141357421875, 0.058258056640625, 0.1279296875, 0.197601318359375, 0.26727294921875, 0.336944580078125, 0.4066162109375, 0.476287841796875, 0.54595947265625, 0.615631103515625, 0.685302734375, 0.754974365234375, 0.82464599609375, 0.894317626953125, 0.9639892578125, 1.033660888671875, 1.10333251953125, 1.173004150390625, 1.24267578125, 1.312347412109375, 1.38201904296875, 1.451690673828125, 1.5213623046875, 1.591033935546875, 1.66070556640625, 1.730377197265625, 1.800048828125, 1.869720458984375, 1.93939208984375, 2.009063720703125, 2.0787353515625, 2.148406982421875, 2.21807861328125, 2.287750244140625, 2.357421875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 6.0, 5.0, 4.0, 6.0, 6.0, 10.0, 12.0, 11.0, 13.0, 18.0, 27.0, 26.0, 47.0, 57.0, 79.0, 125.0, 208.0, 376.0, 916.0, 2376.0, 8033.0, 35723.0, 243525.0, 2494000.0, 1262897.0, 116641.0, 20618.0, 5201.0, 1707.0, 686.0, 331.0, 178.0, 104.0, 80.0, 50.0, 39.0, 27.0, 23.0, 28.0, 16.0, 9.0, 3.0, 4.0, 5.0, 6.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 0.0, 1.0, 2.0], "bins": [-7.7734375, -7.5291748046875, -7.284912109375, -7.0406494140625, -6.79638671875, -6.5521240234375, -6.307861328125, -6.0635986328125, -5.8193359375, -5.5750732421875, -5.330810546875, -5.0865478515625, -4.84228515625, -4.5980224609375, -4.353759765625, -4.1094970703125, -3.865234375, -3.6209716796875, -3.376708984375, -3.1324462890625, -2.88818359375, -2.6439208984375, -2.399658203125, -2.1553955078125, -1.9111328125, -1.6668701171875, -1.422607421875, -1.1783447265625, -0.93408203125, -0.6898193359375, -0.445556640625, -0.2012939453125, 0.04296875, 0.2872314453125, 0.531494140625, 0.7757568359375, 1.02001953125, 1.2642822265625, 1.508544921875, 1.7528076171875, 1.9970703125, 2.2413330078125, 2.485595703125, 2.7298583984375, 2.97412109375, 3.2183837890625, 3.462646484375, 3.7069091796875, 3.951171875, 4.1954345703125, 4.439697265625, 4.6839599609375, 4.92822265625, 5.1724853515625, 5.416748046875, 5.6610107421875, 5.9052734375, 6.1495361328125, 6.393798828125, 6.6380615234375, 6.88232421875, 7.1265869140625, 7.370849609375, 7.6151123046875, 7.859375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 4.0, 11.0, 18.0, 22.0, 33.0, 33.0, 50.0, 65.0, 90.0, 129.0, 171.0, 193.0, 264.0, 333.0, 449.0, 440.0, 383.0, 310.0, 261.0, 196.0, 157.0, 129.0, 90.0, 67.0, 47.0, 23.0, 28.0, 14.0, 12.0, 14.0, 6.0, 11.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.64453125, -6.46661376953125, -6.2886962890625, -6.11077880859375, -5.932861328125, -5.75494384765625, -5.5770263671875, -5.39910888671875, -5.22119140625, -5.04327392578125, -4.8653564453125, -4.68743896484375, -4.509521484375, -4.33160400390625, -4.1536865234375, -3.97576904296875, -3.7978515625, -3.61993408203125, -3.4420166015625, -3.26409912109375, -3.086181640625, -2.90826416015625, -2.7303466796875, -2.55242919921875, -2.37451171875, -2.19659423828125, -2.0186767578125, -1.84075927734375, -1.662841796875, -1.48492431640625, -1.3070068359375, -1.12908935546875, -0.951171875, -0.77325439453125, -0.5953369140625, -0.41741943359375, -0.239501953125, -0.06158447265625, 0.1163330078125, 0.29425048828125, 0.47216796875, 0.65008544921875, 0.8280029296875, 1.00592041015625, 1.183837890625, 1.36175537109375, 1.5396728515625, 1.71759033203125, 1.8955078125, 2.07342529296875, 2.2513427734375, 2.42926025390625, 2.607177734375, 2.78509521484375, 2.9630126953125, 3.14093017578125, 3.31884765625, 3.49676513671875, 3.6746826171875, 3.85260009765625, 4.030517578125, 4.20843505859375, 4.3863525390625, 4.56427001953125, 4.7421875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 1.0, 4.0, 6.0, 8.0, 20.0, 23.0, 35.0, 44.0, 57.0, 77.0, 111.0, 193.0, 282.0, 535.0, 1139.0, 4270.0, 31896.0, 426599.0, 3224666.0, 463204.0, 33963.0, 4647.0, 1139.0, 495.0, 267.0, 185.0, 114.0, 88.0, 58.0, 39.0, 35.0, 23.0, 14.0, 7.0, 9.0, 9.0, 4.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.1768798828125, -10.720947265625, -10.2650146484375, -9.80908203125, -9.3531494140625, -8.897216796875, -8.4412841796875, -7.9853515625, -7.5294189453125, -7.073486328125, -6.6175537109375, -6.16162109375, -5.7056884765625, -5.249755859375, -4.7938232421875, -4.337890625, -3.8819580078125, -3.426025390625, -2.9700927734375, -2.51416015625, -2.0582275390625, -1.602294921875, -1.1463623046875, -0.6904296875, -0.2344970703125, 0.221435546875, 0.6773681640625, 1.13330078125, 1.5892333984375, 2.045166015625, 2.5010986328125, 2.95703125, 3.4129638671875, 3.868896484375, 4.3248291015625, 4.78076171875, 5.2366943359375, 5.692626953125, 6.1485595703125, 6.6044921875, 7.0604248046875, 7.516357421875, 7.9722900390625, 8.42822265625, 8.8841552734375, 9.340087890625, 9.7960205078125, 10.251953125, 10.7078857421875, 11.163818359375, 11.6197509765625, 12.07568359375, 12.5316162109375, 12.987548828125, 13.4434814453125, 13.8994140625, 14.3553466796875, 14.811279296875, 15.2672119140625, 15.72314453125, 16.1790771484375, 16.635009765625, 17.0909423828125, 17.546875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [4.0, 4.0, 15.0, 31.0, 57.0, 68.0, 132.0, 166.0, 149.0, 144.0, 112.0, 80.0, 34.0, 15.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.939248085021973, -12.229952812194824, -10.520657539367676, -8.811361312866211, -7.102066516876221, -5.392770767211914, -3.6834754943847656, -1.9741802215576172, -0.26488494873046875, 1.4444104433059692, 3.1537058353424072, 4.863001346588135, 6.572296619415283, 8.28159236907959, 9.990887641906738, 11.700182914733887, 13.409478187561035, 15.118773460388184, 16.82806968688965, 18.537364959716797, 20.246660232543945, 21.955955505371094, 23.665250778198242, 25.37454605102539, 27.08384132385254, 28.793136596679688, 30.502431869506836, 32.211727142333984, 33.921024322509766, 35.63031768798828, 37.33961486816406, 39.04890823364258, 40.75820541381836, 42.46750259399414, 44.176795959472656, 45.88609313964844, 47.59538650512695, 49.304683685302734, 51.01397705078125, 52.72327423095703, 54.43256759643555, 56.14186477661133, 57.851158142089844, 59.560455322265625, 61.26974868774414, 62.97904586791992, 64.68833923339844, 66.39763641357422, 68.10693359375, 69.81623077392578, 71.52552795410156, 73.23481750488281, 74.9441146850586, 76.65341186523438, 78.36270904541016, 80.0719985961914, 81.78129577636719, 83.49059295654297, 85.19989013671875, 86.9091796875, 88.61847686767578, 90.32777404785156, 92.03707122802734, 93.7463607788086, 95.45565795898438]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 6.0, 3.0, 11.0, 9.0, 9.0, 16.0, 15.0, 20.0, 14.0, 23.0, 22.0, 22.0, 32.0, 25.0, 30.0, 43.0, 35.0, 42.0, 41.0, 52.0, 39.0, 41.0, 35.0, 39.0, 40.0, 43.0, 43.0, 37.0, 33.0, 24.0, 32.0, 18.0, 20.0, 12.0, 12.0, 9.0, 7.0, 13.0, 6.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.55908966064453, -16.9721622467041, -16.38523292541504, -15.79830551147461, -15.211377143859863, -14.624448776245117, -14.037521362304688, -13.450592994689941, -12.863664627075195, -12.27673625946045, -11.689807891845703, -11.102880477905273, -10.515952110290527, -9.929023742675781, -9.342096328735352, -8.755167961120605, -8.16823959350586, -7.581311225891113, -6.994383335113525, -6.4074554443359375, -5.820527076721191, -5.233598709106445, -4.646670818328857, -4.0597429275512695, -3.4728145599365234, -2.8858864307403564, -2.2989583015441895, -1.7120301723480225, -1.1251020431518555, -0.5381739139556885, 0.048754215240478516, 0.6356821060180664, 1.2226104736328125, 1.8095386028289795, 2.3964667320251465, 2.9833948612213135, 3.5703229904174805, 4.157251358032227, 4.7441792488098145, 5.331107139587402, 5.918035507202148, 6.5049638748168945, 7.091891765594482, 7.67881965637207, 8.265748023986816, 8.852676391601562, 9.439603805541992, 10.026532173156738, 10.613460540771484, 11.20038890838623, 11.787317276000977, 12.374244689941406, 12.961173057556152, 13.548101425170898, 14.135028839111328, 14.721957206726074, 15.30888557434082, 15.895813941955566, 16.482742309570312, 17.069669723510742, 17.656597137451172, 18.243526458740234, 18.830453872680664, 19.417381286621094, 20.004310607910156]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 3.0, 6.0, 8.0, 5.0, 13.0, 16.0, 12.0, 13.0, 18.0, 26.0, 17.0, 24.0, 37.0, 36.0, 28.0, 36.0, 42.0, 46.0, 44.0, 33.0, 46.0, 36.0, 30.0, 54.0, 34.0, 26.0, 29.0, 27.0, 27.0, 31.0, 30.0, 31.0, 27.0, 19.0, 17.0, 14.0, 10.0, 5.0, 9.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.12890625, -2.0594482421875, -1.989990234375, -1.9205322265625, -1.85107421875, -1.7816162109375, -1.712158203125, -1.6427001953125, -1.5732421875, -1.5037841796875, -1.434326171875, -1.3648681640625, -1.29541015625, -1.2259521484375, -1.156494140625, -1.0870361328125, -1.017578125, -0.9481201171875, -0.878662109375, -0.8092041015625, -0.73974609375, -0.6702880859375, -0.600830078125, -0.5313720703125, -0.4619140625, -0.3924560546875, -0.322998046875, -0.2535400390625, -0.18408203125, -0.1146240234375, -0.045166015625, 0.0242919921875, 0.09375, 0.1632080078125, 0.232666015625, 0.3021240234375, 0.37158203125, 0.4410400390625, 0.510498046875, 0.5799560546875, 0.6494140625, 0.7188720703125, 0.788330078125, 0.8577880859375, 0.92724609375, 0.9967041015625, 1.066162109375, 1.1356201171875, 1.205078125, 1.2745361328125, 1.343994140625, 1.4134521484375, 1.48291015625, 1.5523681640625, 1.621826171875, 1.6912841796875, 1.7607421875, 1.8302001953125, 1.899658203125, 1.9691162109375, 2.03857421875, 2.1080322265625, 2.177490234375, 2.2469482421875, 2.31640625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 10.0, 15.0, 27.0, 42.0, 51.0, 74.0, 124.0, 181.0, 227.0, 331.0, 482.0, 765.0, 1035.0, 1550.0, 2337.0, 3495.0, 5298.0, 8192.0, 12959.0, 20445.0, 33734.0, 55774.0, 98218.0, 214681.0, 287990.0, 124621.0, 67647.0, 39952.0, 24766.0, 15314.0, 9692.0, 6105.0, 4094.0, 2632.0, 1801.0, 1182.0, 813.0, 569.0, 398.0, 306.0, 182.0, 133.0, 100.0, 61.0, 44.0, 32.0, 19.0, 15.0, 8.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0], "bins": [-0.01373291015625, -0.013319015502929688, -0.012905120849609375, -0.012491226196289062, -0.01207733154296875, -0.011663436889648438, -0.011249542236328125, -0.010835647583007812, -0.0104217529296875, -0.010007858276367188, -0.009593963623046875, -0.009180068969726562, -0.00876617431640625, -0.008352279663085938, -0.007938385009765625, -0.0075244903564453125, -0.007110595703125, -0.0066967010498046875, -0.006282806396484375, -0.0058689117431640625, -0.00545501708984375, -0.0050411224365234375, -0.004627227783203125, -0.0042133331298828125, -0.0037994384765625, -0.0033855438232421875, -0.002971649169921875, -0.0025577545166015625, -0.00214385986328125, -0.0017299652099609375, -0.001316070556640625, -0.0009021759033203125, -0.00048828125, -7.43865966796875e-05, 0.000339508056640625, 0.0007534027099609375, 0.00116729736328125, 0.0015811920166015625, 0.001995086669921875, 0.0024089813232421875, 0.0028228759765625, 0.0032367706298828125, 0.003650665283203125, 0.0040645599365234375, 0.00447845458984375, 0.0048923492431640625, 0.005306243896484375, 0.0057201385498046875, 0.006134033203125, 0.0065479278564453125, 0.006961822509765625, 0.0073757171630859375, 0.00778961181640625, 0.008203506469726562, 0.008617401123046875, 0.009031295776367188, 0.0094451904296875, 0.009859085083007812, 0.010272979736328125, 0.010686874389648438, 0.01110076904296875, 0.011514663696289062, 0.011928558349609375, 0.012342453002929688, 0.01275634765625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 8.0, 3.0, 9.0, 11.0, 15.0, 14.0, 17.0, 16.0, 25.0, 15.0, 28.0, 34.0, 29.0, 40.0, 35.0, 32.0, 51.0, 45.0, 32.0, 1084.0, 34.0, 56.0, 39.0, 34.0, 41.0, 41.0, 22.0, 32.0, 29.0, 24.0, 22.0, 20.0, 17.0, 18.0, 9.0, 6.0, 12.0, 10.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.7880859375, -1.734893798828125, -1.68170166015625, -1.628509521484375, -1.5753173828125, -1.522125244140625, -1.46893310546875, -1.415740966796875, -1.362548828125, -1.309356689453125, -1.25616455078125, -1.202972412109375, -1.1497802734375, -1.096588134765625, -1.04339599609375, -0.990203857421875, -0.93701171875, -0.883819580078125, -0.83062744140625, -0.777435302734375, -0.7242431640625, -0.671051025390625, -0.61785888671875, -0.564666748046875, -0.511474609375, -0.458282470703125, -0.40509033203125, -0.351898193359375, -0.2987060546875, -0.245513916015625, -0.19232177734375, -0.139129638671875, -0.0859375, -0.032745361328125, 0.02044677734375, 0.073638916015625, 0.1268310546875, 0.180023193359375, 0.23321533203125, 0.286407470703125, 0.339599609375, 0.392791748046875, 0.44598388671875, 0.499176025390625, 0.5523681640625, 0.605560302734375, 0.65875244140625, 0.711944580078125, 0.76513671875, 0.818328857421875, 0.87152099609375, 0.924713134765625, 0.9779052734375, 1.031097412109375, 1.08428955078125, 1.137481689453125, 1.190673828125, 1.243865966796875, 1.29705810546875, 1.350250244140625, 1.4034423828125, 1.456634521484375, 1.50982666015625, 1.563018798828125, 1.6162109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 21.0, 26.0, 28.0, 34.0, 65.0, 113.0, 142.0, 229.0, 376.0, 487.0, 808.0, 1187.0, 1937.0, 2783.0, 4517.0, 7065.0, 11336.0, 18259.0, 30208.0, 50222.0, 89777.0, 196904.0, 1366546.0, 137272.0, 70230.0, 40862.0, 24502.0, 15113.0, 9392.0, 5832.0, 3859.0, 2439.0, 1500.0, 1057.0, 659.0, 408.0, 290.0, 210.0, 129.0, 94.0, 68.0, 45.0, 26.0, 25.0, 17.0, 9.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0096588134765625, -0.009340047836303711, -0.009021282196044922, -0.008702516555786133, -0.008383750915527344, -0.008064985275268555, -0.007746219635009766, -0.0074274539947509766, -0.0071086883544921875, -0.0067899227142333984, -0.006471157073974609, -0.00615239143371582, -0.005833625793457031, -0.005514860153198242, -0.005196094512939453, -0.004877328872680664, -0.004558563232421875, -0.004239797592163086, -0.003921031951904297, -0.003602266311645508, -0.0032835006713867188, -0.0029647350311279297, -0.0026459693908691406, -0.0023272037506103516, -0.0020084381103515625, -0.0016896724700927734, -0.0013709068298339844, -0.0010521411895751953, -0.0007333755493164062, -0.0004146099090576172, -9.584426879882812e-05, 0.00022292137145996094, 0.00054168701171875, 0.0008604526519775391, 0.0011792182922363281, 0.0014979839324951172, 0.0018167495727539062, 0.0021355152130126953, 0.0024542808532714844, 0.0027730464935302734, 0.0030918121337890625, 0.0034105777740478516, 0.0037293434143066406, 0.00404810905456543, 0.004366874694824219, 0.004685640335083008, 0.005004405975341797, 0.005323171615600586, 0.005641937255859375, 0.005960702896118164, 0.006279468536376953, 0.006598234176635742, 0.006916999816894531, 0.00723576545715332, 0.007554531097412109, 0.007873296737670898, 0.008192062377929688, 0.008510828018188477, 0.008829593658447266, 0.009148359298706055, 0.009467124938964844, 0.009785890579223633, 0.010104656219482422, 0.010423421859741211, 0.0107421875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 956.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 38.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 31.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 37.0, 31.0, 0.0, 40.0, 0.0, 267.0, 2896.0, 0.0, 16532.0, 0.0, 1008809.0, 16601.0, 0.0, 2915.0, 0.0, 238.0, 53.0, 0.0, 43.0, 0.0, 26.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 20.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0961666703224182e-06, -1.0598450899124146e-06, -1.0235235095024109e-06, -9.872019290924072e-07, -9.508803486824036e-07, -9.145587682723999e-07, -8.782371878623962e-07, -8.419156074523926e-07, -8.055940270423889e-07, -7.692724466323853e-07, -7.329508662223816e-07, -6.966292858123779e-07, -6.603077054023743e-07, -6.239861249923706e-07, -5.876645445823669e-07, -5.513429641723633e-07, -5.150213837623596e-07, -4.78699803352356e-07, -4.423782229423523e-07, -4.0605664253234863e-07, -3.6973506212234497e-07, -3.334134817123413e-07, -2.9709190130233765e-07, -2.60770320892334e-07, -2.2444874048233032e-07, -1.8812716007232666e-07, -1.51805579662323e-07, -1.1548399925231934e-07, -7.916241884231567e-08, -4.284083843231201e-08, -6.51925802230835e-09, 2.9802322387695312e-08, 6.612390279769897e-08, 1.0244548320770264e-07, 1.387670636177063e-07, 1.7508864402770996e-07, 2.1141022443771362e-07, 2.477318048477173e-07, 2.8405338525772095e-07, 3.203749656677246e-07, 3.5669654607772827e-07, 3.9301812648773193e-07, 4.293397068977356e-07, 4.6566128730773926e-07, 5.019828677177429e-07, 5.383044481277466e-07, 5.746260285377502e-07, 6.109476089477539e-07, 6.472691893577576e-07, 6.835907697677612e-07, 7.199123501777649e-07, 7.562339305877686e-07, 7.925555109977722e-07, 8.288770914077759e-07, 8.651986718177795e-07, 9.015202522277832e-07, 9.378418326377869e-07, 9.741634130477905e-07, 1.0104849934577942e-06, 1.0468065738677979e-06, 1.0831281542778015e-06, 1.1194497346878052e-06, 1.1557713150978088e-06, 1.1920928955078125e-06]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 3.0, 6.0, 8.0, 5.0, 13.0, 16.0, 12.0, 13.0, 18.0, 26.0, 17.0, 24.0, 37.0, 36.0, 28.0, 36.0, 42.0, 46.0, 44.0, 33.0, 46.0, 36.0, 30.0, 54.0, 34.0, 26.0, 29.0, 27.0, 27.0, 31.0, 30.0, 31.0, 27.0, 19.0, 17.0, 14.0, 10.0, 5.0, 9.0, 7.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.12890625, -2.0594482421875, -1.989990234375, -1.9205322265625, -1.85107421875, -1.7816162109375, -1.712158203125, -1.6427001953125, -1.5732421875, -1.5037841796875, -1.434326171875, -1.3648681640625, -1.29541015625, -1.2259521484375, -1.156494140625, -1.0870361328125, -1.017578125, -0.9481201171875, -0.878662109375, -0.8092041015625, -0.73974609375, -0.6702880859375, -0.600830078125, -0.5313720703125, -0.4619140625, -0.3924560546875, -0.322998046875, -0.2535400390625, -0.18408203125, -0.1146240234375, -0.045166015625, 0.0242919921875, 0.09375, 0.1632080078125, 0.232666015625, 0.3021240234375, 0.37158203125, 0.4410400390625, 0.510498046875, 0.5799560546875, 0.6494140625, 0.7188720703125, 0.788330078125, 0.8577880859375, 0.92724609375, 0.9967041015625, 1.066162109375, 1.1356201171875, 1.205078125, 1.2745361328125, 1.343994140625, 1.4134521484375, 1.48291015625, 1.5523681640625, 1.621826171875, 1.6912841796875, 1.7607421875, 1.8302001953125, 1.899658203125, 1.9691162109375, 2.03857421875, 2.1080322265625, 2.177490234375, 2.2469482421875, 2.31640625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 18.0, 20.0, 12.0, 27.0, 31.0, 55.0, 87.0, 130.0, 240.0, 303.0, 494.0, 786.0, 1184.0, 1921.0, 2934.0, 4611.0, 7436.0, 11998.0, 18922.0, 30815.0, 52054.0, 143133.0, 483663.0, 150971.0, 53311.0, 30948.0, 19378.0, 12305.0, 7528.0, 4851.0, 3028.0, 1895.0, 1247.0, 817.0, 494.0, 298.0, 200.0, 149.0, 90.0, 54.0, 40.0, 31.0, 12.0, 8.0, 8.0, 5.0, 9.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.28515625, -2.21697998046875, -2.1488037109375, -2.08062744140625, -2.012451171875, -1.94427490234375, -1.8760986328125, -1.80792236328125, -1.73974609375, -1.67156982421875, -1.6033935546875, -1.53521728515625, -1.467041015625, -1.39886474609375, -1.3306884765625, -1.26251220703125, -1.1943359375, -1.12615966796875, -1.0579833984375, -0.98980712890625, -0.921630859375, -0.85345458984375, -0.7852783203125, -0.71710205078125, -0.64892578125, -0.58074951171875, -0.5125732421875, -0.44439697265625, -0.376220703125, -0.30804443359375, -0.2398681640625, -0.17169189453125, -0.103515625, -0.03533935546875, 0.0328369140625, 0.10101318359375, 0.169189453125, 0.23736572265625, 0.3055419921875, 0.37371826171875, 0.44189453125, 0.51007080078125, 0.5782470703125, 0.64642333984375, 0.714599609375, 0.78277587890625, 0.8509521484375, 0.91912841796875, 0.9873046875, 1.05548095703125, 1.1236572265625, 1.19183349609375, 1.260009765625, 1.32818603515625, 1.3963623046875, 1.46453857421875, 1.53271484375, 1.60089111328125, 1.6690673828125, 1.73724365234375, 1.805419921875, 1.87359619140625, 1.9417724609375, 2.00994873046875, 2.078125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 6.0, 8.0, 8.0, 10.0, 10.0, 12.0, 20.0, 10.0, 15.0, 21.0, 35.0, 25.0, 39.0, 37.0, 32.0, 49.0, 77.0, 136.0, 1590.0, 310.0, 105.0, 58.0, 51.0, 42.0, 46.0, 32.0, 31.0, 32.0, 33.0, 20.0, 22.0, 27.0, 19.0, 8.0, 12.0, 11.0, 11.0, 8.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0], "bins": [-8.265625, -8.0140380859375, -7.762451171875, -7.5108642578125, -7.25927734375, -7.0076904296875, -6.756103515625, -6.5045166015625, -6.2529296875, -6.0013427734375, -5.749755859375, -5.4981689453125, -5.24658203125, -4.9949951171875, -4.743408203125, -4.4918212890625, -4.240234375, -3.9886474609375, -3.737060546875, -3.4854736328125, -3.23388671875, -2.9822998046875, -2.730712890625, -2.4791259765625, -2.2275390625, -1.9759521484375, -1.724365234375, -1.4727783203125, -1.22119140625, -0.9696044921875, -0.718017578125, -0.4664306640625, -0.21484375, 0.0367431640625, 0.288330078125, 0.5399169921875, 0.79150390625, 1.0430908203125, 1.294677734375, 1.5462646484375, 1.7978515625, 2.0494384765625, 2.301025390625, 2.5526123046875, 2.80419921875, 3.0557861328125, 3.307373046875, 3.5589599609375, 3.810546875, 4.0621337890625, 4.313720703125, 4.5653076171875, 4.81689453125, 5.0684814453125, 5.320068359375, 5.5716552734375, 5.8232421875, 6.0748291015625, 6.326416015625, 6.5780029296875, 6.82958984375, 7.0811767578125, 7.332763671875, 7.5843505859375, 7.8359375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 15.0, 14.0, 12.0, 20.0, 20.0, 24.0, 31.0, 46.0, 52.0, 90.0, 84.0, 118.0, 149.0, 212.0, 375.0, 1123.0, 7061.0, 98740.0, 2927814.0, 100267.0, 7219.0, 1049.0, 367.0, 197.0, 144.0, 110.0, 78.0, 66.0, 35.0, 28.0, 20.0, 22.0, 11.0, 18.0, 14.0, 8.0, 6.0, 7.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.3359375, -12.91259765625, -12.4892578125, -12.06591796875, -11.642578125, -11.21923828125, -10.7958984375, -10.37255859375, -9.94921875, -9.52587890625, -9.1025390625, -8.67919921875, -8.255859375, -7.83251953125, -7.4091796875, -6.98583984375, -6.5625, -6.13916015625, -5.7158203125, -5.29248046875, -4.869140625, -4.44580078125, -4.0224609375, -3.59912109375, -3.17578125, -2.75244140625, -2.3291015625, -1.90576171875, -1.482421875, -1.05908203125, -0.6357421875, -0.21240234375, 0.2109375, 0.63427734375, 1.0576171875, 1.48095703125, 1.904296875, 2.32763671875, 2.7509765625, 3.17431640625, 3.59765625, 4.02099609375, 4.4443359375, 4.86767578125, 5.291015625, 5.71435546875, 6.1376953125, 6.56103515625, 6.984375, 7.40771484375, 7.8310546875, 8.25439453125, 8.677734375, 9.10107421875, 9.5244140625, 9.94775390625, 10.37109375, 10.79443359375, 11.2177734375, 11.64111328125, 12.064453125, 12.48779296875, 12.9111328125, 13.33447265625, 13.7578125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 9.0, 298.0, 656.0, 53.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.055992126464844, -13.795495986938477, -10.53499984741211, -7.274503707885742, -4.014007568359375, -0.7535114288330078, 2.5069847106933594, 5.767480850219727, 9.027976989746094, 12.288473129272461, 15.548969268798828, 18.809465408325195, 22.069961547851562, 25.33045768737793, 28.590953826904297, 31.851449966430664, 35.11194610595703, 38.37244415283203, 41.632938385009766, 44.8934326171875, 48.1539306640625, 51.4144287109375, 54.674922943115234, 57.93541717529297, 61.19591522216797, 64.45641326904297, 67.71690368652344, 70.97740173339844, 74.23789978027344, 77.49839782714844, 80.75889587402344, 84.0193862915039, 87.27987670898438, 90.54037475585938, 93.80087280273438, 97.06136322021484, 100.32186126708984, 103.58235931396484, 106.84284973144531, 110.10334777832031, 113.36384582519531, 116.62434387207031, 119.88484191894531, 123.14533233642578, 126.40583038330078, 129.66632080078125, 132.92681884765625, 136.18731689453125, 139.44781494140625, 142.70831298828125, 145.96881103515625, 149.22930908203125, 152.48980712890625, 155.7502899169922, 159.0107879638672, 162.2712860107422, 165.5317840576172, 168.7922821044922, 172.0527801513672, 175.3132781982422, 178.57376098632812, 181.83425903320312, 185.09475708007812, 188.35525512695312, 191.61575317382812]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 5.0, 14.0, 13.0, 12.0, 6.0, 20.0, 16.0, 18.0, 22.0, 25.0, 31.0, 32.0, 38.0, 26.0, 36.0, 39.0, 34.0, 36.0, 37.0, 33.0, 43.0, 27.0, 54.0, 46.0, 26.0, 29.0, 32.0, 23.0, 29.0, 25.0, 24.0, 18.0, 13.0, 17.0, 14.0, 9.0, 10.0, 8.0, 12.0, 9.0, 2.0, 8.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-20.439821243286133, -19.773361206054688, -19.106901168823242, -18.440441131591797, -17.77398109436035, -17.107521057128906, -16.441062927246094, -15.774602890014648, -15.108142852783203, -14.441682815551758, -13.775222778320312, -13.108762741088867, -12.442303657531738, -11.775843620300293, -11.109383583068848, -10.442924499511719, -9.776463508605957, -9.110003471374512, -8.443543434143066, -7.777083873748779, -7.110624313354492, -6.444164276123047, -5.777704238891602, -5.1112446784973145, -4.444784641265869, -3.778324842453003, -3.1118650436401367, -2.4454050064086914, -1.7789452075958252, -1.112485408782959, -0.44602537155151367, 0.22043418884277344, 0.8868942260742188, 1.553354024887085, 2.219813823699951, 2.8862738609313965, 3.5527336597442627, 4.219193458557129, 4.885653495788574, 5.552113056182861, 6.218573093414307, 6.885033130645752, 7.551492691040039, 8.217952728271484, 8.88441276550293, 9.550872802734375, 10.21733283996582, 10.88379192352295, 11.550251960754395, 12.21671199798584, 12.883172035217285, 13.549631118774414, 14.21609115600586, 14.882551193237305, 15.54901123046875, 16.215471267700195, 16.88193130493164, 17.548391342163086, 18.21485137939453, 18.881311416625977, 19.547771453857422, 20.214229583740234, 20.880691528320312, 21.547149658203125, 22.21360969543457]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 1.0, 2.0, 8.0, 7.0, 12.0, 12.0, 9.0, 14.0, 14.0, 20.0, 14.0, 21.0, 31.0, 40.0, 25.0, 44.0, 46.0, 35.0, 38.0, 45.0, 35.0, 39.0, 52.0, 46.0, 34.0, 29.0, 30.0, 27.0, 40.0, 22.0, 24.0, 35.0, 31.0, 25.0, 20.0, 11.0, 10.0, 8.0, 7.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.168426513671875, -2.09466552734375, -2.020904541015625, -1.9471435546875, -1.873382568359375, -1.79962158203125, -1.725860595703125, -1.652099609375, -1.578338623046875, -1.50457763671875, -1.430816650390625, -1.3570556640625, -1.283294677734375, -1.20953369140625, -1.135772705078125, -1.06201171875, -0.988250732421875, -0.91448974609375, -0.840728759765625, -0.7669677734375, -0.693206787109375, -0.61944580078125, -0.545684814453125, -0.471923828125, -0.398162841796875, -0.32440185546875, -0.250640869140625, -0.1768798828125, -0.103118896484375, -0.02935791015625, 0.044403076171875, 0.1181640625, 0.191925048828125, 0.26568603515625, 0.339447021484375, 0.4132080078125, 0.486968994140625, 0.56072998046875, 0.634490966796875, 0.708251953125, 0.782012939453125, 0.85577392578125, 0.929534912109375, 1.0032958984375, 1.077056884765625, 1.15081787109375, 1.224578857421875, 1.29833984375, 1.372100830078125, 1.44586181640625, 1.519622802734375, 1.5933837890625, 1.667144775390625, 1.74090576171875, 1.814666748046875, 1.888427734375, 1.962188720703125, 2.03594970703125, 2.109710693359375, 2.1834716796875, 2.257232666015625, 2.33099365234375, 2.404754638671875, 2.478515625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 13.0, 7.0, 10.0, 14.0, 27.0, 27.0, 28.0, 48.0, 76.0, 102.0, 145.0, 170.0, 293.0, 436.0, 640.0, 1041.0, 1895.0, 3543.0, 7088.0, 14999.0, 35893.0, 95645.0, 300903.0, 1018189.0, 1662454.0, 719415.0, 207287.0, 69938.0, 28182.0, 12243.0, 5864.0, 3076.0, 1707.0, 936.0, 622.0, 391.0, 246.0, 162.0, 136.0, 105.0, 79.0, 61.0, 33.0, 23.0, 29.0, 15.0, 15.0, 12.0, 6.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0], "bins": [-3.689453125, -3.575408935546875, -3.46136474609375, -3.347320556640625, -3.2332763671875, -3.119232177734375, -3.00518798828125, -2.891143798828125, -2.777099609375, -2.663055419921875, -2.54901123046875, -2.434967041015625, -2.3209228515625, -2.206878662109375, -2.09283447265625, -1.978790283203125, -1.86474609375, -1.750701904296875, -1.63665771484375, -1.522613525390625, -1.4085693359375, -1.294525146484375, -1.18048095703125, -1.066436767578125, -0.952392578125, -0.838348388671875, -0.72430419921875, -0.610260009765625, -0.4962158203125, -0.382171630859375, -0.26812744140625, -0.154083251953125, -0.0400390625, 0.074005126953125, 0.18804931640625, 0.302093505859375, 0.4161376953125, 0.530181884765625, 0.64422607421875, 0.758270263671875, 0.872314453125, 0.986358642578125, 1.10040283203125, 1.214447021484375, 1.3284912109375, 1.442535400390625, 1.55657958984375, 1.670623779296875, 1.78466796875, 1.898712158203125, 2.01275634765625, 2.126800537109375, 2.2408447265625, 2.354888916015625, 2.46893310546875, 2.582977294921875, 2.697021484375, 2.811065673828125, 2.92510986328125, 3.039154052734375, 3.1531982421875, 3.267242431640625, 3.38128662109375, 3.495330810546875, 3.609375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 4.0, 4.0, 10.0, 11.0, 16.0, 29.0, 34.0, 55.0, 68.0, 117.0, 138.0, 211.0, 245.0, 329.0, 402.0, 484.0, 454.0, 390.0, 278.0, 191.0, 159.0, 122.0, 93.0, 66.0, 48.0, 38.0, 19.0, 16.0, 14.0, 17.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.85546875, -7.66253662109375, -7.4696044921875, -7.27667236328125, -7.083740234375, -6.89080810546875, -6.6978759765625, -6.50494384765625, -6.31201171875, -6.11907958984375, -5.9261474609375, -5.73321533203125, -5.540283203125, -5.34735107421875, -5.1544189453125, -4.96148681640625, -4.7685546875, -4.57562255859375, -4.3826904296875, -4.18975830078125, -3.996826171875, -3.80389404296875, -3.6109619140625, -3.41802978515625, -3.22509765625, -3.03216552734375, -2.8392333984375, -2.64630126953125, -2.453369140625, -2.26043701171875, -2.0675048828125, -1.87457275390625, -1.681640625, -1.48870849609375, -1.2957763671875, -1.10284423828125, -0.909912109375, -0.71697998046875, -0.5240478515625, -0.33111572265625, -0.13818359375, 0.05474853515625, 0.2476806640625, 0.44061279296875, 0.633544921875, 0.82647705078125, 1.0194091796875, 1.21234130859375, 1.4052734375, 1.59820556640625, 1.7911376953125, 1.98406982421875, 2.177001953125, 2.36993408203125, 2.5628662109375, 2.75579833984375, 2.94873046875, 3.14166259765625, 3.3345947265625, 3.52752685546875, 3.720458984375, 3.91339111328125, 4.1063232421875, 4.29925537109375, 4.4921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 7.0, 16.0, 21.0, 24.0, 41.0, 48.0, 69.0, 101.0, 137.0, 205.0, 307.0, 596.0, 1388.0, 4978.0, 27048.0, 217859.0, 2204622.0, 1561977.0, 149146.0, 19373.0, 3782.0, 1142.0, 491.0, 282.0, 162.0, 133.0, 76.0, 53.0, 49.0, 46.0, 22.0, 20.0, 19.0, 17.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.0921630859375, -7.739013671875, -7.3858642578125, -7.03271484375, -6.6795654296875, -6.326416015625, -5.9732666015625, -5.6201171875, -5.2669677734375, -4.913818359375, -4.5606689453125, -4.20751953125, -3.8543701171875, -3.501220703125, -3.1480712890625, -2.794921875, -2.4417724609375, -2.088623046875, -1.7354736328125, -1.38232421875, -1.0291748046875, -0.676025390625, -0.3228759765625, 0.0302734375, 0.3834228515625, 0.736572265625, 1.0897216796875, 1.44287109375, 1.7960205078125, 2.149169921875, 2.5023193359375, 2.85546875, 3.2086181640625, 3.561767578125, 3.9149169921875, 4.26806640625, 4.6212158203125, 4.974365234375, 5.3275146484375, 5.6806640625, 6.0338134765625, 6.386962890625, 6.7401123046875, 7.09326171875, 7.4464111328125, 7.799560546875, 8.1527099609375, 8.505859375, 8.8590087890625, 9.212158203125, 9.5653076171875, 9.91845703125, 10.2716064453125, 10.624755859375, 10.9779052734375, 11.3310546875, 11.6842041015625, 12.037353515625, 12.3905029296875, 12.74365234375, 13.0968017578125, 13.449951171875, 13.8031005859375, 14.15625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 8.0, 15.0, 22.0, 29.0, 45.0, 65.0, 91.0, 116.0, 115.0, 117.0, 110.0, 84.0, 59.0, 47.0, 23.0, 23.0, 14.0, 12.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.782926559448242, -17.738866806030273, -16.694808959960938, -15.650749206542969, -14.606689453125, -13.562630653381348, -12.518571853637695, -11.474512100219727, -10.430453300476074, -9.386394500732422, -8.342334747314453, -7.298275947570801, -6.25421667098999, -5.21015739440918, -4.166098594665527, -3.122039318084717, -2.0779800415039062, -1.0339208841323853, 0.010138273239135742, 1.0541973114013672, 2.0982565879821777, 3.1423158645629883, 4.186374664306641, 5.230433940887451, 6.274493217468262, 7.318552494049072, 8.362611770629883, 9.406670570373535, 10.450729370117188, 11.494789123535156, 12.538847923278809, 13.582906723022461, 14.626968383789062, 15.671027183532715, 16.715085983276367, 17.759145736694336, 18.803205490112305, 19.84726333618164, 20.89132308959961, 21.935382843017578, 22.979442596435547, 24.023502349853516, 25.06756019592285, 26.11161994934082, 27.15567970275879, 28.199737548828125, 29.243797302246094, 30.287857055664062, 31.3319149017334, 32.375972747802734, 33.4200325012207, 34.46409225463867, 35.50815200805664, 36.55221176147461, 37.59626770019531, 38.64032745361328, 39.68438720703125, 40.72844696044922, 41.77250671386719, 42.816566467285156, 43.86062240600586, 44.90468215942383, 45.9487419128418, 46.992801666259766, 48.036861419677734]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 13.0, 9.0, 12.0, 11.0, 18.0, 24.0, 16.0, 27.0, 36.0, 31.0, 24.0, 31.0, 39.0, 46.0, 30.0, 38.0, 43.0, 33.0, 45.0, 37.0, 44.0, 46.0, 48.0, 32.0, 26.0, 21.0, 32.0, 36.0, 25.0, 22.0, 16.0, 15.0, 21.0, 6.0, 12.0, 9.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.000259399414062, -17.39913558959961, -16.798011779785156, -16.196887969970703, -15.595763206481934, -14.99463939666748, -14.393514633178711, -13.792390823364258, -13.191267013549805, -12.590143203735352, -11.989019393920898, -11.387894630432129, -10.786770820617676, -10.185647010803223, -9.584522247314453, -8.9833984375, -8.382274627685547, -7.781150817871094, -7.180026531219482, -6.578902244567871, -5.977778434753418, -5.376654624938965, -4.7755303382873535, -4.174406051635742, -3.573282241821289, -2.972158193588257, -2.3710341453552246, -1.7699100971221924, -1.1687860488891602, -0.5676620006561279, 0.0334620475769043, 0.6345863342285156, 1.2357101440429688, 1.836834192276001, 2.437958240509033, 3.0390822887420654, 3.6402063369750977, 4.241330146789551, 4.842454433441162, 5.443578720092773, 6.044702529907227, 6.64582633972168, 7.246950626373291, 7.848074913024902, 8.449198722839355, 9.050322532653809, 9.651447296142578, 10.252571105957031, 10.853694915771484, 11.454818725585938, 12.05594253540039, 12.65706729888916, 13.258191108703613, 13.859314918518066, 14.460439682006836, 15.061563491821289, 15.662687301635742, 16.263811111450195, 16.86493492126465, 17.4660587310791, 18.067184448242188, 18.66830825805664, 19.269432067871094, 19.870555877685547, 20.4716796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 5.0, 4.0, 7.0, 10.0, 13.0, 13.0, 18.0, 15.0, 17.0, 25.0, 22.0, 34.0, 30.0, 31.0, 32.0, 41.0, 35.0, 41.0, 56.0, 40.0, 34.0, 33.0, 41.0, 32.0, 32.0, 40.0, 54.0, 34.0, 22.0, 30.0, 25.0, 21.0, 16.0, 14.0, 10.0, 12.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.203125, -2.129730224609375, -2.05633544921875, -1.982940673828125, -1.9095458984375, -1.836151123046875, -1.76275634765625, -1.689361572265625, -1.615966796875, -1.542572021484375, -1.46917724609375, -1.395782470703125, -1.3223876953125, -1.248992919921875, -1.17559814453125, -1.102203369140625, -1.02880859375, -0.955413818359375, -0.88201904296875, -0.808624267578125, -0.7352294921875, -0.661834716796875, -0.58843994140625, -0.515045166015625, -0.441650390625, -0.368255615234375, -0.29486083984375, -0.221466064453125, -0.1480712890625, -0.074676513671875, -0.00128173828125, 0.072113037109375, 0.1455078125, 0.218902587890625, 0.29229736328125, 0.365692138671875, 0.4390869140625, 0.512481689453125, 0.58587646484375, 0.659271240234375, 0.732666015625, 0.806060791015625, 0.87945556640625, 0.952850341796875, 1.0262451171875, 1.099639892578125, 1.17303466796875, 1.246429443359375, 1.31982421875, 1.393218994140625, 1.46661376953125, 1.540008544921875, 1.6134033203125, 1.686798095703125, 1.76019287109375, 1.833587646484375, 1.906982421875, 1.980377197265625, 2.05377197265625, 2.127166748046875, 2.2005615234375, 2.273956298828125, 2.34735107421875, 2.420745849609375, 2.494140625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 8.0, 10.0, 21.0, 29.0, 32.0, 47.0, 72.0, 99.0, 145.0, 201.0, 292.0, 449.0, 642.0, 864.0, 1263.0, 1921.0, 2811.0, 4269.0, 6446.0, 9772.0, 15363.0, 25099.0, 41179.0, 71033.0, 133263.0, 299428.0, 200992.0, 93079.0, 52826.0, 31603.0, 19371.0, 12199.0, 7903.0, 5144.0, 3338.0, 2278.0, 1577.0, 1050.0, 748.0, 517.0, 351.0, 245.0, 158.0, 132.0, 86.0, 59.0, 35.0, 34.0, 33.0, 17.0, 6.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.01372528076171875, -0.013306021690368652, -0.012886762619018555, -0.012467503547668457, -0.01204824447631836, -0.011628985404968262, -0.011209726333618164, -0.010790467262268066, -0.010371208190917969, -0.009951949119567871, -0.009532690048217773, -0.009113430976867676, -0.008694171905517578, -0.00827491283416748, -0.007855653762817383, -0.007436394691467285, -0.0070171356201171875, -0.00659787654876709, -0.006178617477416992, -0.0057593584060668945, -0.005340099334716797, -0.004920840263366699, -0.0045015811920166016, -0.004082322120666504, -0.0036630630493164062, -0.0032438039779663086, -0.002824544906616211, -0.0024052858352661133, -0.0019860267639160156, -0.001566767692565918, -0.0011475086212158203, -0.0007282495498657227, -0.000308990478515625, 0.00011026859283447266, 0.0005295276641845703, 0.000948786735534668, 0.0013680458068847656, 0.0017873048782348633, 0.002206563949584961, 0.0026258230209350586, 0.0030450820922851562, 0.003464341163635254, 0.0038836002349853516, 0.004302859306335449, 0.004722118377685547, 0.0051413774490356445, 0.005560636520385742, 0.00597989559173584, 0.0063991546630859375, 0.006818413734436035, 0.007237672805786133, 0.0076569318771362305, 0.008076190948486328, 0.008495450019836426, 0.008914709091186523, 0.009333968162536621, 0.009753227233886719, 0.010172486305236816, 0.010591745376586914, 0.011011004447937012, 0.01143026351928711, 0.011849522590637207, 0.012268781661987305, 0.012688040733337402, 0.0131072998046875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 14.0, 6.0, 13.0, 24.0, 19.0, 28.0, 26.0, 37.0, 46.0, 29.0, 52.0, 43.0, 48.0, 43.0, 40.0, 1067.0, 57.0, 62.0, 49.0, 29.0, 48.0, 36.0, 42.0, 25.0, 24.0, 26.0, 23.0, 9.0, 9.0, 5.0, 7.0, 6.0, 5.0, 2.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.349609375, -2.2863922119140625, -2.223175048828125, -2.1599578857421875, -2.09674072265625, -2.0335235595703125, -1.970306396484375, -1.9070892333984375, -1.8438720703125, -1.7806549072265625, -1.717437744140625, -1.6542205810546875, -1.59100341796875, -1.5277862548828125, -1.464569091796875, -1.4013519287109375, -1.338134765625, -1.2749176025390625, -1.211700439453125, -1.1484832763671875, -1.08526611328125, -1.0220489501953125, -0.958831787109375, -0.8956146240234375, -0.8323974609375, -0.7691802978515625, -0.705963134765625, -0.6427459716796875, -0.57952880859375, -0.5163116455078125, -0.453094482421875, -0.3898773193359375, -0.32666015625, -0.2634429931640625, -0.200225830078125, -0.1370086669921875, -0.07379150390625, -0.0105743408203125, 0.052642822265625, 0.1158599853515625, 0.1790771484375, 0.2422943115234375, 0.305511474609375, 0.3687286376953125, 0.43194580078125, 0.4951629638671875, 0.558380126953125, 0.6215972900390625, 0.684814453125, 0.7480316162109375, 0.811248779296875, 0.8744659423828125, 0.93768310546875, 1.0009002685546875, 1.064117431640625, 1.1273345947265625, 1.1905517578125, 1.2537689208984375, 1.316986083984375, 1.3802032470703125, 1.44342041015625, 1.5066375732421875, 1.569854736328125, 1.6330718994140625, 1.6962890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 12.0, 5.0, 8.0, 21.0, 31.0, 48.0, 78.0, 114.0, 190.0, 288.0, 501.0, 925.0, 1386.0, 2288.0, 4101.0, 7141.0, 13017.0, 24359.0, 46570.0, 94666.0, 236920.0, 1399201.0, 132488.0, 62600.0, 31684.0, 16980.0, 8980.0, 5310.0, 2879.0, 1698.0, 1015.0, 603.0, 398.0, 227.0, 121.0, 106.0, 75.0, 31.0, 18.0, 15.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01261138916015625, -0.012193918228149414, -0.011776447296142578, -0.011358976364135742, -0.010941505432128906, -0.01052403450012207, -0.010106563568115234, -0.009689092636108398, -0.009271621704101562, -0.008854150772094727, -0.00843667984008789, -0.008019208908081055, -0.007601737976074219, -0.007184267044067383, -0.006766796112060547, -0.006349325180053711, -0.005931854248046875, -0.005514383316040039, -0.005096912384033203, -0.004679441452026367, -0.004261970520019531, -0.0038444995880126953, -0.0034270286560058594, -0.0030095577239990234, -0.0025920867919921875, -0.0021746158599853516, -0.0017571449279785156, -0.0013396739959716797, -0.0009222030639648438, -0.0005047321319580078, -8.726119995117188e-05, 0.00033020973205566406, 0.0007476806640625, 0.001165151596069336, 0.0015826225280761719, 0.002000093460083008, 0.0024175643920898438, 0.0028350353240966797, 0.0032525062561035156, 0.0036699771881103516, 0.0040874481201171875, 0.0045049190521240234, 0.004922389984130859, 0.005339860916137695, 0.005757331848144531, 0.006174802780151367, 0.006592273712158203, 0.007009744644165039, 0.007427215576171875, 0.007844686508178711, 0.008262157440185547, 0.008679628372192383, 0.009097099304199219, 0.009514570236206055, 0.00993204116821289, 0.010349512100219727, 0.010766983032226562, 0.011184453964233398, 0.011601924896240234, 0.01201939582824707, 0.012436866760253906, 0.012854337692260742, 0.013271808624267578, 0.013689279556274414, 0.01410675048828125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 31.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 966.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 20.0, 37.0, 41.0, 216.0, 2361.0, 14002.0, 1015336.0, 13776.0, 2358.0, 244.0, 49.0, 25.0, 31.0, 4.0, 6.0, 0.0, 0.0, 0.0, 6.0, 19.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9073486328125e-06, -1.8477439880371094e-06, -1.7881393432617188e-06, -1.7285346984863281e-06, -1.6689300537109375e-06, -1.6093254089355469e-06, -1.5497207641601562e-06, -1.4901161193847656e-06, -1.430511474609375e-06, -1.3709068298339844e-06, -1.3113021850585938e-06, -1.2516975402832031e-06, -1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06, 1.8477439880371094e-06, 1.9073486328125e-06]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 5.0, 4.0, 7.0, 10.0, 13.0, 13.0, 18.0, 15.0, 17.0, 25.0, 22.0, 34.0, 30.0, 31.0, 32.0, 41.0, 35.0, 41.0, 56.0, 40.0, 34.0, 33.0, 41.0, 32.0, 32.0, 40.0, 54.0, 34.0, 22.0, 30.0, 25.0, 21.0, 16.0, 14.0, 10.0, 12.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.203125, -2.129730224609375, -2.05633544921875, -1.982940673828125, -1.9095458984375, -1.836151123046875, -1.76275634765625, -1.689361572265625, -1.615966796875, -1.542572021484375, -1.46917724609375, -1.395782470703125, -1.3223876953125, -1.248992919921875, -1.17559814453125, -1.102203369140625, -1.02880859375, -0.955413818359375, -0.88201904296875, -0.808624267578125, -0.7352294921875, -0.661834716796875, -0.58843994140625, -0.515045166015625, -0.441650390625, -0.368255615234375, -0.29486083984375, -0.221466064453125, -0.1480712890625, -0.074676513671875, -0.00128173828125, 0.072113037109375, 0.1455078125, 0.218902587890625, 0.29229736328125, 0.365692138671875, 0.4390869140625, 0.512481689453125, 0.58587646484375, 0.659271240234375, 0.732666015625, 0.806060791015625, 0.87945556640625, 0.952850341796875, 1.0262451171875, 1.099639892578125, 1.17303466796875, 1.246429443359375, 1.31982421875, 1.393218994140625, 1.46661376953125, 1.540008544921875, 1.6134033203125, 1.686798095703125, 1.76019287109375, 1.833587646484375, 1.906982421875, 1.980377197265625, 2.05377197265625, 2.127166748046875, 2.2005615234375, 2.273956298828125, 2.34735107421875, 2.420745849609375, 2.494140625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 3.0, 6.0, 15.0, 15.0, 18.0, 25.0, 46.0, 74.0, 84.0, 139.0, 240.0, 352.0, 538.0, 914.0, 1537.0, 2352.0, 3868.0, 6669.0, 11958.0, 22260.0, 41288.0, 84156.0, 216426.0, 375748.0, 143304.0, 63424.0, 32331.0, 17277.0, 9651.0, 5430.0, 3156.0, 1956.0, 1185.0, 696.0, 476.0, 317.0, 206.0, 140.0, 86.0, 53.0, 40.0, 35.0, 14.0, 15.0, 8.0, 9.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0625, -1.99444580078125, -1.9263916015625, -1.85833740234375, -1.790283203125, -1.72222900390625, -1.6541748046875, -1.58612060546875, -1.51806640625, -1.45001220703125, -1.3819580078125, -1.31390380859375, -1.245849609375, -1.17779541015625, -1.1097412109375, -1.04168701171875, -0.9736328125, -0.90557861328125, -0.8375244140625, -0.76947021484375, -0.701416015625, -0.63336181640625, -0.5653076171875, -0.49725341796875, -0.42919921875, -0.36114501953125, -0.2930908203125, -0.22503662109375, -0.156982421875, -0.08892822265625, -0.0208740234375, 0.04718017578125, 0.115234375, 0.18328857421875, 0.2513427734375, 0.31939697265625, 0.387451171875, 0.45550537109375, 0.5235595703125, 0.59161376953125, 0.65966796875, 0.72772216796875, 0.7957763671875, 0.86383056640625, 0.931884765625, 0.99993896484375, 1.0679931640625, 1.13604736328125, 1.2041015625, 1.27215576171875, 1.3402099609375, 1.40826416015625, 1.476318359375, 1.54437255859375, 1.6124267578125, 1.68048095703125, 1.74853515625, 1.81658935546875, 1.8846435546875, 1.95269775390625, 2.020751953125, 2.08880615234375, 2.1568603515625, 2.22491455078125, 2.29296875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 5.0, 10.0, 7.0, 8.0, 8.0, 12.0, 13.0, 16.0, 25.0, 29.0, 29.0, 34.0, 41.0, 57.0, 66.0, 66.0, 140.0, 345.0, 1529.0, 159.0, 89.0, 71.0, 37.0, 29.0, 44.0, 36.0, 22.0, 24.0, 17.0, 23.0, 15.0, 11.0, 13.0, 8.0, 1.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2421875, -9.902587890625, -9.56298828125, -9.223388671875, -8.8837890625, -8.544189453125, -8.20458984375, -7.864990234375, -7.525390625, -7.185791015625, -6.84619140625, -6.506591796875, -6.1669921875, -5.827392578125, -5.48779296875, -5.148193359375, -4.80859375, -4.468994140625, -4.12939453125, -3.789794921875, -3.4501953125, -3.110595703125, -2.77099609375, -2.431396484375, -2.091796875, -1.752197265625, -1.41259765625, -1.072998046875, -0.7333984375, -0.393798828125, -0.05419921875, 0.285400390625, 0.625, 0.964599609375, 1.30419921875, 1.643798828125, 1.9833984375, 2.322998046875, 2.66259765625, 3.002197265625, 3.341796875, 3.681396484375, 4.02099609375, 4.360595703125, 4.7001953125, 5.039794921875, 5.37939453125, 5.718994140625, 6.05859375, 6.398193359375, 6.73779296875, 7.077392578125, 7.4169921875, 7.756591796875, 8.09619140625, 8.435791015625, 8.775390625, 9.114990234375, 9.45458984375, 9.794189453125, 10.1337890625, 10.473388671875, 10.81298828125, 11.152587890625, 11.4921875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 8.0, 8.0, 20.0, 13.0, 24.0, 31.0, 36.0, 48.0, 64.0, 90.0, 124.0, 160.0, 306.0, 732.0, 2912.0, 34336.0, 2993491.0, 106564.0, 4624.0, 1028.0, 382.0, 216.0, 133.0, 81.0, 63.0, 55.0, 38.0, 31.0, 21.0, 14.0, 9.0, 16.0, 12.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.78125, -22.141845703125, -21.50244140625, -20.863037109375, -20.2236328125, -19.584228515625, -18.94482421875, -18.305419921875, -17.666015625, -17.026611328125, -16.38720703125, -15.747802734375, -15.1083984375, -14.468994140625, -13.82958984375, -13.190185546875, -12.55078125, -11.911376953125, -11.27197265625, -10.632568359375, -9.9931640625, -9.353759765625, -8.71435546875, -8.074951171875, -7.435546875, -6.796142578125, -6.15673828125, -5.517333984375, -4.8779296875, -4.238525390625, -3.59912109375, -2.959716796875, -2.3203125, -1.680908203125, -1.04150390625, -0.402099609375, 0.2373046875, 0.876708984375, 1.51611328125, 2.155517578125, 2.794921875, 3.434326171875, 4.07373046875, 4.713134765625, 5.3525390625, 5.991943359375, 6.63134765625, 7.270751953125, 7.91015625, 8.549560546875, 9.18896484375, 9.828369140625, 10.4677734375, 11.107177734375, 11.74658203125, 12.385986328125, 13.025390625, 13.664794921875, 14.30419921875, 14.943603515625, 15.5830078125, 16.222412109375, 16.86181640625, 17.501220703125, 18.140625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 10.0, 627.0, 377.0, 4.0, 0.0, 2.0], "bins": [-321.0364990234375, -315.677001953125, -310.3175048828125, -304.9580383300781, -299.5985412597656, -294.2390441894531, -288.87957763671875, -283.52008056640625, -278.16058349609375, -272.80108642578125, -267.44158935546875, -262.0821228027344, -256.7226257324219, -251.36312866210938, -246.00364685058594, -240.6441650390625, -235.28466796875, -229.9251708984375, -224.56568908691406, -219.20620727539062, -213.84671020507812, -208.48721313476562, -203.1277313232422, -197.76824951171875, -192.40875244140625, -187.04925537109375, -181.6897735595703, -176.33029174804688, -170.97079467773438, -165.61129760742188, -160.25181579589844, -154.892333984375, -149.53282165527344, -144.17333984375, -138.8138427734375, -133.454345703125, -128.09486389160156, -122.7353744506836, -117.37588500976562, -112.01639556884766, -106.65690612792969, -101.29741668701172, -95.93792724609375, -90.57843780517578, -85.21894836425781, -79.85945892333984, -74.49996948242188, -69.1404800415039, -63.78099060058594, -58.42150115966797, -53.06201171875, -47.70252227783203, -42.34303283691406, -36.983543395996094, -31.624053955078125, -26.264564514160156, -20.905075073242188, -15.545585632324219, -10.18609619140625, -4.826606750488281, 0.5328826904296875, 5.892372131347656, 11.251861572265625, 16.611351013183594, 21.970840454101562]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 9.0, 5.0, 3.0, 4.0, 11.0, 11.0, 11.0, 15.0, 17.0, 20.0, 17.0, 32.0, 24.0, 23.0, 17.0, 30.0, 31.0, 35.0, 44.0, 48.0, 29.0, 52.0, 37.0, 30.0, 34.0, 27.0, 38.0, 29.0, 27.0, 20.0, 35.0, 32.0, 31.0, 21.0, 25.0, 23.0, 16.0, 9.0, 11.0, 17.0, 16.0, 4.0, 9.0, 6.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.73444366455078, -17.103490829467773, -16.4725399017334, -15.84158706665039, -15.210634231567383, -14.579682350158691, -13.94873046875, -13.317777633666992, -12.6868257522583, -12.05587387084961, -11.424921035766602, -10.79396915435791, -10.163017272949219, -9.532064437866211, -8.90111255645752, -8.270160675048828, -7.63920783996582, -7.008255481719971, -6.377303123474121, -5.74635124206543, -5.11539888381958, -4.4844465255737305, -3.85349440574646, -3.2225422859191895, -2.59158992767334, -1.9606376886367798, -1.3296854496002197, -0.6987332105636597, -0.06778097152709961, 0.56317138671875, 1.1941235065460205, 1.825075626373291, 2.4560279846191406, 3.0869803428649902, 3.7179324626922607, 4.348884582519531, 4.979836940765381, 5.6107892990112305, 6.241741180419922, 6.8726935386657715, 7.503645896911621, 8.134597778320312, 8.76555061340332, 9.396502494812012, 10.027454376220703, 10.658407211303711, 11.289359092712402, 11.920310974121094, 12.551263809204102, 13.182215690612793, 13.8131685256958, 14.444120407104492, 15.0750732421875, 15.706025123596191, 16.336977005004883, 16.96792984008789, 17.598880767822266, 18.229833602905273, 18.86078453063965, 19.491737365722656, 20.122690200805664, 20.753643035888672, 21.384593963623047, 22.015546798706055, 22.646499633789062]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 8.0, 11.0, 11.0, 15.0, 14.0, 13.0, 24.0, 22.0, 24.0, 33.0, 24.0, 22.0, 40.0, 41.0, 38.0, 41.0, 40.0, 47.0, 45.0, 28.0, 40.0, 27.0, 33.0, 43.0, 37.0, 40.0, 28.0, 34.0, 25.0, 25.0, 14.0, 10.0, 14.0, 13.0, 6.0, 10.0, 7.0, 10.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.326171875, -2.251739501953125, -2.17730712890625, -2.102874755859375, -2.0284423828125, -1.954010009765625, -1.87957763671875, -1.805145263671875, -1.730712890625, -1.656280517578125, -1.58184814453125, -1.507415771484375, -1.4329833984375, -1.358551025390625, -1.28411865234375, -1.209686279296875, -1.13525390625, -1.060821533203125, -0.98638916015625, -0.911956787109375, -0.8375244140625, -0.763092041015625, -0.68865966796875, -0.614227294921875, -0.539794921875, -0.465362548828125, -0.39093017578125, -0.316497802734375, -0.2420654296875, -0.167633056640625, -0.09320068359375, -0.018768310546875, 0.0556640625, 0.130096435546875, 0.20452880859375, 0.278961181640625, 0.3533935546875, 0.427825927734375, 0.50225830078125, 0.576690673828125, 0.651123046875, 0.725555419921875, 0.79998779296875, 0.874420166015625, 0.9488525390625, 1.023284912109375, 1.09771728515625, 1.172149658203125, 1.24658203125, 1.321014404296875, 1.39544677734375, 1.469879150390625, 1.5443115234375, 1.618743896484375, 1.69317626953125, 1.767608642578125, 1.842041015625, 1.916473388671875, 1.99090576171875, 2.065338134765625, 2.1397705078125, 2.214202880859375, 2.28863525390625, 2.363067626953125, 2.4375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 2.0, 7.0, 2.0, 7.0, 4.0, 6.0, 8.0, 11.0, 18.0, 14.0, 15.0, 18.0, 17.0, 29.0, 29.0, 40.0, 72.0, 169.0, 398.0, 1247.0, 4859.0, 27133.0, 239721.0, 2587714.0, 1220465.0, 94314.0, 13456.0, 2941.0, 843.0, 301.0, 121.0, 73.0, 49.0, 28.0, 31.0, 23.0, 11.0, 14.0, 12.0, 9.0, 7.0, 5.0, 8.0, 7.0, 1.0, 9.0, 7.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.34375, -8.0728759765625, -7.802001953125, -7.5311279296875, -7.26025390625, -6.9893798828125, -6.718505859375, -6.4476318359375, -6.1767578125, -5.9058837890625, -5.635009765625, -5.3641357421875, -5.09326171875, -4.8223876953125, -4.551513671875, -4.2806396484375, -4.009765625, -3.7388916015625, -3.468017578125, -3.1971435546875, -2.92626953125, -2.6553955078125, -2.384521484375, -2.1136474609375, -1.8427734375, -1.5718994140625, -1.301025390625, -1.0301513671875, -0.75927734375, -0.4884033203125, -0.217529296875, 0.0533447265625, 0.32421875, 0.5950927734375, 0.865966796875, 1.1368408203125, 1.40771484375, 1.6785888671875, 1.949462890625, 2.2203369140625, 2.4912109375, 2.7620849609375, 3.032958984375, 3.3038330078125, 3.57470703125, 3.8455810546875, 4.116455078125, 4.3873291015625, 4.658203125, 4.9290771484375, 5.199951171875, 5.4708251953125, 5.74169921875, 6.0125732421875, 6.283447265625, 6.5543212890625, 6.8251953125, 7.0960693359375, 7.366943359375, 7.6378173828125, 7.90869140625, 8.1795654296875, 8.450439453125, 8.7213134765625, 8.9921875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 9.0, 7.0, 9.0, 14.0, 20.0, 29.0, 34.0, 48.0, 54.0, 76.0, 87.0, 123.0, 140.0, 222.0, 227.0, 297.0, 357.0, 385.0, 388.0, 353.0, 282.0, 198.0, 156.0, 142.0, 96.0, 65.0, 67.0, 44.0, 36.0, 27.0, 23.0, 19.0, 7.0, 9.0, 6.0, 5.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.27349853515625, -4.1134033203125, -3.95330810546875, -3.793212890625, -3.63311767578125, -3.4730224609375, -3.31292724609375, -3.15283203125, -2.99273681640625, -2.8326416015625, -2.67254638671875, -2.512451171875, -2.35235595703125, -2.1922607421875, -2.03216552734375, -1.8720703125, -1.71197509765625, -1.5518798828125, -1.39178466796875, -1.231689453125, -1.07159423828125, -0.9114990234375, -0.75140380859375, -0.59130859375, -0.43121337890625, -0.2711181640625, -0.11102294921875, 0.049072265625, 0.20916748046875, 0.3692626953125, 0.52935791015625, 0.689453125, 0.84954833984375, 1.0096435546875, 1.16973876953125, 1.329833984375, 1.48992919921875, 1.6500244140625, 1.81011962890625, 1.97021484375, 2.13031005859375, 2.2904052734375, 2.45050048828125, 2.610595703125, 2.77069091796875, 2.9307861328125, 3.09088134765625, 3.2509765625, 3.41107177734375, 3.5711669921875, 3.73126220703125, 3.891357421875, 4.05145263671875, 4.2115478515625, 4.37164306640625, 4.53173828125, 4.69183349609375, 4.8519287109375, 5.01202392578125, 5.172119140625, 5.33221435546875, 5.4923095703125, 5.65240478515625, 5.8125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 11.0, 13.0, 10.0, 14.0, 28.0, 31.0, 43.0, 50.0, 66.0, 79.0, 104.0, 134.0, 186.0, 339.0, 688.0, 2233.0, 12044.0, 92964.0, 964973.0, 2733939.0, 341190.0, 36965.0, 5396.0, 1285.0, 492.0, 283.0, 165.0, 131.0, 85.0, 81.0, 57.0, 55.0, 36.0, 29.0, 20.0, 17.0, 11.0, 12.0, 4.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-12.421875, -12.06982421875, -11.7177734375, -11.36572265625, -11.013671875, -10.66162109375, -10.3095703125, -9.95751953125, -9.60546875, -9.25341796875, -8.9013671875, -8.54931640625, -8.197265625, -7.84521484375, -7.4931640625, -7.14111328125, -6.7890625, -6.43701171875, -6.0849609375, -5.73291015625, -5.380859375, -5.02880859375, -4.6767578125, -4.32470703125, -3.97265625, -3.62060546875, -3.2685546875, -2.91650390625, -2.564453125, -2.21240234375, -1.8603515625, -1.50830078125, -1.15625, -0.80419921875, -0.4521484375, -0.10009765625, 0.251953125, 0.60400390625, 0.9560546875, 1.30810546875, 1.66015625, 2.01220703125, 2.3642578125, 2.71630859375, 3.068359375, 3.42041015625, 3.7724609375, 4.12451171875, 4.4765625, 4.82861328125, 5.1806640625, 5.53271484375, 5.884765625, 6.23681640625, 6.5888671875, 6.94091796875, 7.29296875, 7.64501953125, 7.9970703125, 8.34912109375, 8.701171875, 9.05322265625, 9.4052734375, 9.75732421875, 10.109375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 15.0, 23.0, 26.0, 58.0, 74.0, 127.0, 104.0, 130.0, 133.0, 99.0, 79.0, 51.0, 43.0, 15.0, 11.0, 10.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.18479537963867, -31.056053161621094, -29.927310943603516, -28.798568725585938, -27.66982650756836, -26.54108428955078, -25.41234016418457, -24.283597946166992, -23.154855728149414, -22.026113510131836, -20.897371292114258, -19.76862907409668, -18.63988494873047, -17.51114273071289, -16.382400512695312, -15.253658294677734, -14.124916076660156, -12.996173858642578, -11.867431640625, -10.738688468933105, -9.609946250915527, -8.48120403289795, -7.352461338043213, -6.223718643188477, -5.094976425170898, -3.966233968734741, -2.837491512298584, -1.7087490558624268, -0.5800065994262695, 0.5487356185913086, 1.677478313446045, 2.8062210083007812, 3.9349594116210938, 5.063701629638672, 6.192444324493408, 7.3211870193481445, 8.449929237365723, 9.5786714553833, 10.707414627075195, 11.836156845092773, 12.964899063110352, 14.09364128112793, 15.222383499145508, 16.351125717163086, 17.479869842529297, 18.608612060546875, 19.737354278564453, 20.86609649658203, 21.99483871459961, 23.123580932617188, 24.252323150634766, 25.381065368652344, 26.509807586669922, 27.6385498046875, 28.76729393005371, 29.89603614807129, 31.024778366088867, 32.15352249145508, 33.282264709472656, 34.411006927490234, 35.53974914550781, 36.66849136352539, 37.79723358154297, 38.92597579956055, 40.054718017578125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 5.0, 3.0, 13.0, 12.0, 14.0, 10.0, 11.0, 19.0, 24.0, 27.0, 25.0, 36.0, 27.0, 40.0, 34.0, 33.0, 41.0, 39.0, 37.0, 30.0, 43.0, 38.0, 38.0, 35.0, 40.0, 43.0, 36.0, 30.0, 27.0, 26.0, 30.0, 16.0, 16.0, 17.0, 16.0, 13.0, 8.0, 14.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-18.091873168945312, -17.55296516418457, -17.01405906677246, -16.47515106201172, -15.93624496459961, -15.397336959838867, -14.858429908752441, -14.319522857666016, -13.78061580657959, -13.241708755493164, -12.702801704406738, -12.163894653320312, -11.62498664855957, -11.086080551147461, -10.547172546386719, -10.008265495300293, -9.469358444213867, -8.930451393127441, -8.391544342041016, -7.852636814117432, -7.313729763031006, -6.77482271194458, -6.235915184020996, -5.69700813293457, -5.1581010818481445, -4.619194030761719, -4.080286979675293, -3.541379451751709, -3.002472400665283, -2.4635653495788574, -1.9246580600738525, -1.3857507705688477, -0.8468437194824219, -0.30793654918670654, 0.2309706211090088, 0.7698777914047241, 1.3087849617004395, 1.8476920127868652, 2.38659930229187, 2.925506591796875, 3.464413642883301, 4.003320693969727, 4.542227745056152, 5.081135272979736, 5.620042324066162, 6.158949375152588, 6.697856903076172, 7.236763954162598, 7.775671005249023, 8.31457805633545, 8.853485107421875, 9.3923921585083, 9.931299209594727, 10.470207214355469, 11.009114265441895, 11.54802131652832, 12.086928367614746, 12.625835418701172, 13.164742469787598, 13.703649520874023, 14.242557525634766, 14.781463623046875, 15.320371627807617, 15.859278678894043, 16.39818572998047]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 3.0, 8.0, 6.0, 7.0, 20.0, 9.0, 13.0, 11.0, 14.0, 22.0, 32.0, 25.0, 29.0, 37.0, 32.0, 44.0, 39.0, 36.0, 35.0, 42.0, 44.0, 47.0, 23.0, 37.0, 51.0, 36.0, 34.0, 32.0, 34.0, 29.0, 27.0, 29.0, 14.0, 17.0, 9.0, 8.0, 11.0, 11.0, 3.0, 7.0, 7.0, 1.0, 6.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.259765625, -2.1829833984375, -2.106201171875, -2.0294189453125, -1.95263671875, -1.8758544921875, -1.799072265625, -1.7222900390625, -1.6455078125, -1.5687255859375, -1.491943359375, -1.4151611328125, -1.33837890625, -1.2615966796875, -1.184814453125, -1.1080322265625, -1.03125, -0.9544677734375, -0.877685546875, -0.8009033203125, -0.72412109375, -0.6473388671875, -0.570556640625, -0.4937744140625, -0.4169921875, -0.3402099609375, -0.263427734375, -0.1866455078125, -0.10986328125, -0.0330810546875, 0.043701171875, 0.1204833984375, 0.197265625, 0.2740478515625, 0.350830078125, 0.4276123046875, 0.50439453125, 0.5811767578125, 0.657958984375, 0.7347412109375, 0.8115234375, 0.8883056640625, 0.965087890625, 1.0418701171875, 1.11865234375, 1.1954345703125, 1.272216796875, 1.3489990234375, 1.42578125, 1.5025634765625, 1.579345703125, 1.6561279296875, 1.73291015625, 1.8096923828125, 1.886474609375, 1.9632568359375, 2.0400390625, 2.1168212890625, 2.193603515625, 2.2703857421875, 2.34716796875, 2.4239501953125, 2.500732421875, 2.5775146484375, 2.654296875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 10.0, 17.0, 28.0, 44.0, 70.0, 118.0, 109.0, 249.0, 318.0, 496.0, 622.0, 987.0, 1427.0, 2087.0, 2895.0, 4329.0, 6298.0, 9639.0, 14505.0, 22587.0, 35080.0, 58273.0, 102190.0, 238475.0, 267166.0, 111061.0, 61827.0, 37558.0, 23536.0, 15233.0, 10006.0, 6838.0, 4536.0, 3048.0, 2172.0, 1522.0, 977.0, 735.0, 467.0, 365.0, 209.0, 148.0, 107.0, 75.0, 40.0, 24.0, 20.0, 18.0, 2.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0133819580078125, -0.012951135635375977, -0.012520313262939453, -0.01208949089050293, -0.011658668518066406, -0.011227846145629883, -0.01079702377319336, -0.010366201400756836, -0.009935379028320312, -0.009504556655883789, -0.009073734283447266, -0.008642911911010742, -0.008212089538574219, -0.007781267166137695, -0.007350444793701172, -0.0069196224212646484, -0.006488800048828125, -0.0060579776763916016, -0.005627155303955078, -0.005196332931518555, -0.004765510559082031, -0.004334688186645508, -0.0039038658142089844, -0.003473043441772461, -0.0030422210693359375, -0.002611398696899414, -0.0021805763244628906, -0.0017497539520263672, -0.0013189315795898438, -0.0008881092071533203, -0.0004572868347167969, -2.6464462280273438e-05, 0.00040435791015625, 0.0008351802825927734, 0.0012660026550292969, 0.0016968250274658203, 0.0021276473999023438, 0.002558469772338867, 0.0029892921447753906, 0.003420114517211914, 0.0038509368896484375, 0.004281759262084961, 0.004712581634521484, 0.005143404006958008, 0.005574226379394531, 0.006005048751831055, 0.006435871124267578, 0.0068666934967041016, 0.007297515869140625, 0.0077283382415771484, 0.008159160614013672, 0.008589982986450195, 0.009020805358886719, 0.009451627731323242, 0.009882450103759766, 0.010313272476196289, 0.010744094848632812, 0.011174917221069336, 0.01160573959350586, 0.012036561965942383, 0.012467384338378906, 0.01289820671081543, 0.013329029083251953, 0.013759851455688477, 0.014190673828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 3.0, 1.0, 6.0, 10.0, 19.0, 11.0, 15.0, 22.0, 21.0, 29.0, 23.0, 21.0, 20.0, 43.0, 42.0, 39.0, 30.0, 51.0, 37.0, 1074.0, 48.0, 40.0, 40.0, 32.0, 35.0, 42.0, 33.0, 27.0, 22.0, 33.0, 25.0, 12.0, 18.0, 14.0, 16.0, 8.0, 10.0, 10.0, 7.0, 8.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6298828125, -1.5752716064453125, -1.520660400390625, -1.4660491943359375, -1.41143798828125, -1.3568267822265625, -1.302215576171875, -1.2476043701171875, -1.1929931640625, -1.1383819580078125, -1.083770751953125, -1.0291595458984375, -0.97454833984375, -0.9199371337890625, -0.865325927734375, -0.8107147216796875, -0.756103515625, -0.7014923095703125, -0.646881103515625, -0.5922698974609375, -0.53765869140625, -0.4830474853515625, -0.428436279296875, -0.3738250732421875, -0.3192138671875, -0.2646026611328125, -0.209991455078125, -0.1553802490234375, -0.10076904296875, -0.0461578369140625, 0.008453369140625, 0.0630645751953125, 0.11767578125, 0.1722869873046875, 0.226898193359375, 0.2815093994140625, 0.33612060546875, 0.3907318115234375, 0.445343017578125, 0.4999542236328125, 0.5545654296875, 0.6091766357421875, 0.663787841796875, 0.7183990478515625, 0.77301025390625, 0.8276214599609375, 0.882232666015625, 0.9368438720703125, 0.991455078125, 1.0460662841796875, 1.100677490234375, 1.1552886962890625, 1.20989990234375, 1.2645111083984375, 1.319122314453125, 1.3737335205078125, 1.4283447265625, 1.4829559326171875, 1.537567138671875, 1.5921783447265625, 1.64678955078125, 1.7014007568359375, 1.756011962890625, 1.8106231689453125, 1.865234375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 19.0, 11.0, 23.0, 37.0, 58.0, 95.0, 107.0, 170.0, 234.0, 411.0, 540.0, 815.0, 1137.0, 1874.0, 2752.0, 4167.0, 6462.0, 9792.0, 15690.0, 25251.0, 41462.0, 70228.0, 136787.0, 1358509.0, 196746.0, 89160.0, 51036.0, 30451.0, 18864.0, 11964.0, 7690.0, 4768.0, 3256.0, 2150.0, 1410.0, 951.0, 644.0, 436.0, 315.0, 217.0, 143.0, 90.0, 62.0, 37.0, 40.0, 20.0, 13.0, 13.0, 6.0, 5.0, 1.0, 3.0, 5.0, 3.0], "bins": [-0.01119232177734375, -0.010860204696655273, -0.010528087615966797, -0.01019597053527832, -0.009863853454589844, -0.009531736373901367, -0.00919961929321289, -0.008867502212524414, -0.008535385131835938, -0.008203268051147461, -0.007871150970458984, -0.007539033889770508, -0.007206916809082031, -0.006874799728393555, -0.006542682647705078, -0.0062105655670166016, -0.005878448486328125, -0.0055463314056396484, -0.005214214324951172, -0.004882097244262695, -0.004549980163574219, -0.004217863082885742, -0.0038857460021972656, -0.003553628921508789, -0.0032215118408203125, -0.002889394760131836, -0.0025572776794433594, -0.002225160598754883, -0.0018930435180664062, -0.0015609264373779297, -0.0012288093566894531, -0.0008966922760009766, -0.0005645751953125, -0.00023245811462402344, 9.965896606445312e-05, 0.0004317760467529297, 0.0007638931274414062, 0.0010960102081298828, 0.0014281272888183594, 0.001760244369506836, 0.0020923614501953125, 0.002424478530883789, 0.0027565956115722656, 0.003088712692260742, 0.0034208297729492188, 0.0037529468536376953, 0.004085063934326172, 0.0044171810150146484, 0.004749298095703125, 0.0050814151763916016, 0.005413532257080078, 0.005745649337768555, 0.006077766418457031, 0.006409883499145508, 0.006742000579833984, 0.007074117660522461, 0.0074062347412109375, 0.007738351821899414, 0.00807046890258789, 0.008402585983276367, 0.008734703063964844, 0.00906682014465332, 0.009398937225341797, 0.009731054306030273, 0.01006317138671875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 51.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 916.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 56.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [19.0, 1.0, 0.0, 6.0, 0.0, 1.0, 0.0, 29.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 28.0, 38.0, 63.0, 76.0, 0.0, 357.0, 3578.0, 25980.0, 988220.0, 26051.0, 3515.0, 342.0, 86.0, 0.0, 54.0, 41.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 0.0, 3.0, 0.0, 6.0, 0.0, 1.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1390075087547302e-06, -1.085922122001648e-06, -1.0328367352485657e-06, -9.797513484954834e-07, -9.266659617424011e-07, -8.735805749893188e-07, -8.204951882362366e-07, -7.674098014831543e-07, -7.14324414730072e-07, -6.612390279769897e-07, -6.081536412239075e-07, -5.550682544708252e-07, -5.019828677177429e-07, -4.4889748096466064e-07, -3.9581209421157837e-07, -3.427267074584961e-07, -2.896413207054138e-07, -2.3655593395233154e-07, -1.8347054719924927e-07, -1.30385160446167e-07, -7.729977369308472e-08, -2.421438694000244e-08, 2.8870999813079834e-08, 8.195638656616211e-08, 1.3504177331924438e-07, 1.8812716007232666e-07, 2.4121254682540894e-07, 2.942979335784912e-07, 3.473833203315735e-07, 4.0046870708465576e-07, 4.5355409383773804e-07, 5.066394805908203e-07, 5.597248673439026e-07, 6.128102540969849e-07, 6.658956408500671e-07, 7.189810276031494e-07, 7.720664143562317e-07, 8.25151801109314e-07, 8.782371878623962e-07, 9.313225746154785e-07, 9.844079613685608e-07, 1.037493348121643e-06, 1.0905787348747253e-06, 1.1436641216278076e-06, 1.1967495083808899e-06, 1.2498348951339722e-06, 1.3029202818870544e-06, 1.3560056686401367e-06, 1.409091055393219e-06, 1.4621764421463013e-06, 1.5152618288993835e-06, 1.5683472156524658e-06, 1.621432602405548e-06, 1.6745179891586304e-06, 1.7276033759117126e-06, 1.780688762664795e-06, 1.8337741494178772e-06, 1.8868595361709595e-06, 1.9399449229240417e-06, 1.993030309677124e-06, 2.0461156964302063e-06, 2.0992010831832886e-06, 2.152286469936371e-06, 2.205371856689453e-06]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1023.0], "bins": [-2.4395898634566038e-08, -2.4014711996755977e-08, -2.3633527135302757e-08, -2.3252340497492696e-08, -2.2871155636039475e-08, -2.2489968998229415e-08, -2.2108782360419355e-08, -2.1727597498966134e-08, -2.1346410861156073e-08, -2.0965224223346013e-08, -2.0584039361892792e-08, -2.020285272408273e-08, -1.982166786262951e-08, -1.944048122481945e-08, -1.905929636336623e-08, -1.867810972555617e-08, -1.829692308774611e-08, -1.7915736449936048e-08, -1.7534551588482827e-08, -1.7153364950672767e-08, -1.6772180089219546e-08, -1.6390993451409486e-08, -1.6009806813599425e-08, -1.5628621952146204e-08, -1.5247437090692983e-08, -1.4866251341061343e-08, -1.4485065591429702e-08, -1.4103878953619642e-08, -1.3722693203988001e-08, -1.334150745435636e-08, -1.296032170472472e-08, -1.257913595509308e-08, -1.2197949317283019e-08, -1.1816763567651378e-08, -1.1435577818019738e-08, -1.1054391180209677e-08, -1.0673205430578037e-08, -1.0292019680946396e-08, -9.910833931314755e-09, -9.529648181683115e-09, -9.148461543873054e-09, -8.767275794241414e-09, -8.386090044609773e-09, -8.004903406799713e-09, -7.623717657168072e-09, -7.242531907536431e-09, -6.861346157904791e-09, -6.48016040827315e-09, -6.0989746586415094e-09, -5.717788909009869e-09, -5.336602715289018e-09, -4.955416965657378e-09, -4.574230771936527e-09, -4.1930450223048865e-09, -3.811859272673246e-09, -3.4306733009970003e-09, -3.0494873293207547e-09, -2.668301357644509e-09, -2.2871153859682636e-09, -1.905929636336623e-09, -1.5247436646603774e-09, -1.1435576929841318e-09, -7.623719433524911e-10, -3.8118597167624557e-10, 0.0]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 3.0, 8.0, 6.0, 7.0, 20.0, 9.0, 13.0, 11.0, 14.0, 22.0, 32.0, 25.0, 29.0, 37.0, 32.0, 44.0, 39.0, 36.0, 35.0, 42.0, 44.0, 47.0, 23.0, 37.0, 51.0, 36.0, 34.0, 32.0, 34.0, 29.0, 27.0, 29.0, 14.0, 17.0, 9.0, 8.0, 11.0, 11.0, 3.0, 7.0, 7.0, 1.0, 6.0, 6.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.259765625, -2.1829833984375, -2.106201171875, -2.0294189453125, -1.95263671875, -1.8758544921875, -1.799072265625, -1.7222900390625, -1.6455078125, -1.5687255859375, -1.491943359375, -1.4151611328125, -1.33837890625, -1.2615966796875, -1.184814453125, -1.1080322265625, -1.03125, -0.9544677734375, -0.877685546875, -0.8009033203125, -0.72412109375, -0.6473388671875, -0.570556640625, -0.4937744140625, -0.4169921875, -0.3402099609375, -0.263427734375, -0.1866455078125, -0.10986328125, -0.0330810546875, 0.043701171875, 0.1204833984375, 0.197265625, 0.2740478515625, 0.350830078125, 0.4276123046875, 0.50439453125, 0.5811767578125, 0.657958984375, 0.7347412109375, 0.8115234375, 0.8883056640625, 0.965087890625, 1.0418701171875, 1.11865234375, 1.1954345703125, 1.272216796875, 1.3489990234375, 1.42578125, 1.5025634765625, 1.579345703125, 1.6561279296875, 1.73291015625, 1.8096923828125, 1.886474609375, 1.9632568359375, 2.0400390625, 2.1168212890625, 2.193603515625, 2.2703857421875, 2.34716796875, 2.4239501953125, 2.500732421875, 2.5775146484375, 2.654296875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 5.0, 8.0, 14.0, 25.0, 49.0, 63.0, 97.0, 187.0, 361.0, 562.0, 1029.0, 1795.0, 3323.0, 6017.0, 11507.0, 21801.0, 41989.0, 81398.0, 197352.0, 430352.0, 123197.0, 60115.0, 31633.0, 16352.0, 8778.0, 4704.0, 2636.0, 1363.0, 772.0, 457.0, 252.0, 166.0, 83.0, 48.0, 24.0, 21.0, 9.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.457275390625, -2.36376953125, -2.270263671875, -2.1767578125, -2.083251953125, -1.98974609375, -1.896240234375, -1.802734375, -1.709228515625, -1.61572265625, -1.522216796875, -1.4287109375, -1.335205078125, -1.24169921875, -1.148193359375, -1.0546875, -0.961181640625, -0.86767578125, -0.774169921875, -0.6806640625, -0.587158203125, -0.49365234375, -0.400146484375, -0.306640625, -0.213134765625, -0.11962890625, -0.026123046875, 0.0673828125, 0.160888671875, 0.25439453125, 0.347900390625, 0.44140625, 0.534912109375, 0.62841796875, 0.721923828125, 0.8154296875, 0.908935546875, 1.00244140625, 1.095947265625, 1.189453125, 1.282958984375, 1.37646484375, 1.469970703125, 1.5634765625, 1.656982421875, 1.75048828125, 1.843994140625, 1.9375, 2.031005859375, 2.12451171875, 2.218017578125, 2.3115234375, 2.405029296875, 2.49853515625, 2.592041015625, 2.685546875, 2.779052734375, 2.87255859375, 2.966064453125, 3.0595703125, 3.153076171875, 3.24658203125, 3.340087890625, 3.43359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 2.0, 3.0, 4.0, 10.0, 9.0, 8.0, 3.0, 4.0, 8.0, 16.0, 22.0, 17.0, 21.0, 26.0, 32.0, 25.0, 47.0, 45.0, 53.0, 56.0, 74.0, 141.0, 1461.0, 372.0, 123.0, 79.0, 56.0, 46.0, 42.0, 33.0, 29.0, 31.0, 32.0, 32.0, 24.0, 11.0, 12.0, 9.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.921875, -9.64581298828125, -9.3697509765625, -9.09368896484375, -8.817626953125, -8.54156494140625, -8.2655029296875, -7.98944091796875, -7.71337890625, -7.43731689453125, -7.1612548828125, -6.88519287109375, -6.609130859375, -6.33306884765625, -6.0570068359375, -5.78094482421875, -5.5048828125, -5.22882080078125, -4.9527587890625, -4.67669677734375, -4.400634765625, -4.12457275390625, -3.8485107421875, -3.57244873046875, -3.29638671875, -3.02032470703125, -2.7442626953125, -2.46820068359375, -2.192138671875, -1.91607666015625, -1.6400146484375, -1.36395263671875, -1.087890625, -0.81182861328125, -0.5357666015625, -0.25970458984375, 0.016357421875, 0.29241943359375, 0.5684814453125, 0.84454345703125, 1.12060546875, 1.39666748046875, 1.6727294921875, 1.94879150390625, 2.224853515625, 2.50091552734375, 2.7769775390625, 3.05303955078125, 3.3291015625, 3.60516357421875, 3.8812255859375, 4.15728759765625, 4.433349609375, 4.70941162109375, 4.9854736328125, 5.26153564453125, 5.53759765625, 5.81365966796875, 6.0897216796875, 6.36578369140625, 6.641845703125, 6.91790771484375, 7.1939697265625, 7.47003173828125, 7.74609375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 7.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 7.0, 6.0, 14.0, 22.0, 21.0, 46.0, 51.0, 61.0, 83.0, 104.0, 139.0, 214.0, 349.0, 1063.0, 11363.0, 735154.0, 2375581.0, 18699.0, 1408.0, 395.0, 228.0, 178.0, 112.0, 86.0, 62.0, 53.0, 38.0, 34.0, 27.0, 18.0, 13.0, 13.0, 5.0, 6.0, 12.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.3125, -14.7470703125, -14.181640625, -13.6162109375, -13.05078125, -12.4853515625, -11.919921875, -11.3544921875, -10.7890625, -10.2236328125, -9.658203125, -9.0927734375, -8.52734375, -7.9619140625, -7.396484375, -6.8310546875, -6.265625, -5.7001953125, -5.134765625, -4.5693359375, -4.00390625, -3.4384765625, -2.873046875, -2.3076171875, -1.7421875, -1.1767578125, -0.611328125, -0.0458984375, 0.51953125, 1.0849609375, 1.650390625, 2.2158203125, 2.78125, 3.3466796875, 3.912109375, 4.4775390625, 5.04296875, 5.6083984375, 6.173828125, 6.7392578125, 7.3046875, 7.8701171875, 8.435546875, 9.0009765625, 9.56640625, 10.1318359375, 10.697265625, 11.2626953125, 11.828125, 12.3935546875, 12.958984375, 13.5244140625, 14.08984375, 14.6552734375, 15.220703125, 15.7861328125, 16.3515625, 16.9169921875, 17.482421875, 18.0478515625, 18.61328125, 19.1787109375, 19.744140625, 20.3095703125, 20.875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 113.0, 800.0, 101.0, 4.0], "bins": [-266.6261291503906, -262.2872619628906, -257.9483947753906, -253.60952758789062, -249.27066040039062, -244.93177795410156, -240.59291076660156, -236.25404357910156, -231.91517639160156, -227.57630920410156, -223.23744201660156, -218.89857482910156, -214.5596923828125, -210.2208251953125, -205.8819580078125, -201.5430908203125, -197.2042236328125, -192.8653564453125, -188.5264892578125, -184.1876220703125, -179.8487548828125, -175.50987243652344, -171.17100524902344, -166.83213806152344, -162.49327087402344, -158.15440368652344, -153.81553649902344, -149.47666931152344, -145.13778686523438, -140.79891967773438, -136.46005249023438, -132.12118530273438, -127.78233337402344, -123.44346618652344, -119.10459899902344, -114.7657241821289, -110.4268569946289, -106.0879898071289, -101.74911499023438, -97.41024780273438, -93.07138061523438, -88.73251342773438, -84.39364624023438, -80.05477142333984, -75.71590423583984, -71.37703704833984, -67.03816223144531, -62.69929504394531, -58.36042785644531, -54.02156066894531, -49.68268966674805, -45.34381866455078, -41.00495147705078, -36.66608428955078, -32.327213287353516, -27.988344192504883, -23.64947509765625, -19.310606002807617, -14.971736907958984, -10.632867813110352, -6.293998718261719, -1.955129623413086, 2.383739471435547, 6.72260856628418, 11.061477661132812]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 7.0, 13.0, 12.0, 10.0, 14.0, 16.0, 18.0, 20.0, 32.0, 22.0, 31.0, 36.0, 32.0, 38.0, 36.0, 43.0, 39.0, 33.0, 32.0, 36.0, 35.0, 34.0, 46.0, 35.0, 37.0, 26.0, 33.0, 25.0, 26.0, 18.0, 19.0, 22.0, 14.0, 18.0, 10.0, 8.0, 13.0, 7.0, 10.0, 2.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.844926834106445, -24.092288970947266, -23.339649200439453, -22.58700942993164, -21.83437156677246, -21.08173370361328, -20.32909393310547, -19.576454162597656, -18.823816299438477, -18.071178436279297, -17.318538665771484, -16.565898895263672, -15.813261032104492, -15.060622215270996, -14.3079833984375, -13.555344581604004, -12.802705764770508, -12.050066947937012, -11.297428131103516, -10.54478931427002, -9.792150497436523, -9.039511680603027, -8.286872863769531, -7.534234046936035, -6.781595230102539, -6.028956413269043, -5.276317596435547, -4.523678779602051, -3.7710399627685547, -3.0184011459350586, -2.2657623291015625, -1.5131235122680664, -0.7604827880859375, -0.007843971252441406, 0.7447948455810547, 1.4974336624145508, 2.250072479248047, 3.002711296081543, 3.755350112915039, 4.507988929748535, 5.260627746582031, 6.013266563415527, 6.765905380249023, 7.5185441970825195, 8.271183013916016, 9.023821830749512, 9.776460647583008, 10.529099464416504, 11.28173828125, 12.034377098083496, 12.787015914916992, 13.539654731750488, 14.292293548583984, 15.04493236541748, 15.797571182250977, 16.550209045410156, 17.30284881591797, 18.05548858642578, 18.80812644958496, 19.56076431274414, 20.313404083251953, 21.066043853759766, 21.818681716918945, 22.571319580078125, 23.323959350585938]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 9.0, 4.0, 8.0, 13.0, 11.0, 6.0, 7.0, 14.0, 18.0, 15.0, 17.0, 23.0, 39.0, 30.0, 37.0, 34.0, 31.0, 36.0, 39.0, 39.0, 30.0, 38.0, 45.0, 46.0, 34.0, 40.0, 35.0, 31.0, 30.0, 18.0, 40.0, 27.0, 25.0, 23.0, 24.0, 17.0, 12.0, 6.0, 9.0, 10.0, 7.0, 3.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.2818603515625, -2.202392578125, -2.1229248046875, -2.04345703125, -1.9639892578125, -1.884521484375, -1.8050537109375, -1.7255859375, -1.6461181640625, -1.566650390625, -1.4871826171875, -1.40771484375, -1.3282470703125, -1.248779296875, -1.1693115234375, -1.08984375, -1.0103759765625, -0.930908203125, -0.8514404296875, -0.77197265625, -0.6925048828125, -0.613037109375, -0.5335693359375, -0.4541015625, -0.3746337890625, -0.295166015625, -0.2156982421875, -0.13623046875, -0.0567626953125, 0.022705078125, 0.1021728515625, 0.181640625, 0.2611083984375, 0.340576171875, 0.4200439453125, 0.49951171875, 0.5789794921875, 0.658447265625, 0.7379150390625, 0.8173828125, 0.8968505859375, 0.976318359375, 1.0557861328125, 1.13525390625, 1.2147216796875, 1.294189453125, 1.3736572265625, 1.453125, 1.5325927734375, 1.612060546875, 1.6915283203125, 1.77099609375, 1.8504638671875, 1.929931640625, 2.0093994140625, 2.0888671875, 2.1683349609375, 2.247802734375, 2.3272705078125, 2.40673828125, 2.4862060546875, 2.565673828125, 2.6451416015625, 2.724609375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 13.0, 7.0, 11.0, 9.0, 12.0, 15.0, 9.0, 25.0, 30.0, 42.0, 46.0, 64.0, 126.0, 222.0, 447.0, 1253.0, 3876.0, 15484.0, 85891.0, 790957.0, 2676925.0, 536980.0, 63938.0, 12416.0, 3241.0, 1099.0, 496.0, 221.0, 129.0, 77.0, 61.0, 29.0, 23.0, 18.0, 16.0, 14.0, 10.0, 5.0, 10.0, 6.0, 2.0, 4.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.140625, -6.9058837890625, -6.671142578125, -6.4364013671875, -6.20166015625, -5.9669189453125, -5.732177734375, -5.4974365234375, -5.2626953125, -5.0279541015625, -4.793212890625, -4.5584716796875, -4.32373046875, -4.0889892578125, -3.854248046875, -3.6195068359375, -3.384765625, -3.1500244140625, -2.915283203125, -2.6805419921875, -2.44580078125, -2.2110595703125, -1.976318359375, -1.7415771484375, -1.5068359375, -1.2720947265625, -1.037353515625, -0.8026123046875, -0.56787109375, -0.3331298828125, -0.098388671875, 0.1363525390625, 0.37109375, 0.6058349609375, 0.840576171875, 1.0753173828125, 1.31005859375, 1.5447998046875, 1.779541015625, 2.0142822265625, 2.2490234375, 2.4837646484375, 2.718505859375, 2.9532470703125, 3.18798828125, 3.4227294921875, 3.657470703125, 3.8922119140625, 4.126953125, 4.3616943359375, 4.596435546875, 4.8311767578125, 5.06591796875, 5.3006591796875, 5.535400390625, 5.7701416015625, 6.0048828125, 6.2396240234375, 6.474365234375, 6.7091064453125, 6.94384765625, 7.1785888671875, 7.413330078125, 7.6480712890625, 7.8828125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 10.0, 13.0, 24.0, 30.0, 28.0, 41.0, 53.0, 67.0, 102.0, 139.0, 192.0, 246.0, 319.0, 372.0, 444.0, 455.0, 360.0, 272.0, 254.0, 172.0, 133.0, 93.0, 78.0, 40.0, 36.0, 24.0, 21.0, 18.0, 11.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.67578125, -5.49169921875, -5.3076171875, -5.12353515625, -4.939453125, -4.75537109375, -4.5712890625, -4.38720703125, -4.203125, -4.01904296875, -3.8349609375, -3.65087890625, -3.466796875, -3.28271484375, -3.0986328125, -2.91455078125, -2.73046875, -2.54638671875, -2.3623046875, -2.17822265625, -1.994140625, -1.81005859375, -1.6259765625, -1.44189453125, -1.2578125, -1.07373046875, -0.8896484375, -0.70556640625, -0.521484375, -0.33740234375, -0.1533203125, 0.03076171875, 0.21484375, 0.39892578125, 0.5830078125, 0.76708984375, 0.951171875, 1.13525390625, 1.3193359375, 1.50341796875, 1.6875, 1.87158203125, 2.0556640625, 2.23974609375, 2.423828125, 2.60791015625, 2.7919921875, 2.97607421875, 3.16015625, 3.34423828125, 3.5283203125, 3.71240234375, 3.896484375, 4.08056640625, 4.2646484375, 4.44873046875, 4.6328125, 4.81689453125, 5.0009765625, 5.18505859375, 5.369140625, 5.55322265625, 5.7373046875, 5.92138671875, 6.10546875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 14.0, 21.0, 16.0, 31.0, 31.0, 46.0, 83.0, 123.0, 146.0, 230.0, 333.0, 625.0, 3511.0, 106962.0, 3537351.0, 531688.0, 10913.0, 923.0, 375.0, 248.0, 158.0, 126.0, 83.0, 55.0, 45.0, 45.0, 30.0, 26.0, 11.0, 12.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.765625, -21.13818359375, -20.5107421875, -19.88330078125, -19.255859375, -18.62841796875, -18.0009765625, -17.37353515625, -16.74609375, -16.11865234375, -15.4912109375, -14.86376953125, -14.236328125, -13.60888671875, -12.9814453125, -12.35400390625, -11.7265625, -11.09912109375, -10.4716796875, -9.84423828125, -9.216796875, -8.58935546875, -7.9619140625, -7.33447265625, -6.70703125, -6.07958984375, -5.4521484375, -4.82470703125, -4.197265625, -3.56982421875, -2.9423828125, -2.31494140625, -1.6875, -1.06005859375, -0.4326171875, 0.19482421875, 0.822265625, 1.44970703125, 2.0771484375, 2.70458984375, 3.33203125, 3.95947265625, 4.5869140625, 5.21435546875, 5.841796875, 6.46923828125, 7.0966796875, 7.72412109375, 8.3515625, 8.97900390625, 9.6064453125, 10.23388671875, 10.861328125, 11.48876953125, 12.1162109375, 12.74365234375, 13.37109375, 13.99853515625, 14.6259765625, 15.25341796875, 15.880859375, 16.50830078125, 17.1357421875, 17.76318359375, 18.390625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 12.0, 73.0, 234.0, 379.0, 233.0, 75.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.6937713623047, -125.3545913696289, -122.01541137695312, -118.67623138427734, -115.33705139160156, -111.99787139892578, -108.65869140625, -105.31951904296875, -101.98033142089844, -98.64115142822266, -95.30197143554688, -91.9627914428711, -88.62361145019531, -85.28443145751953, -81.94525146484375, -78.6060791015625, -75.26689910888672, -71.92771911621094, -68.58853912353516, -65.24935913085938, -61.910179138183594, -58.57099914550781, -55.2318229675293, -51.892642974853516, -48.553462982177734, -45.21428298950195, -41.87510299682617, -38.535926818847656, -35.196746826171875, -31.85756492614746, -28.518386840820312, -25.17920684814453, -21.84003448486328, -18.5008544921875, -15.161675453186035, -11.82249641418457, -8.483316421508789, -5.144136428833008, -1.8049583435058594, 1.5342216491699219, 4.873401641845703, 8.212581634521484, 11.55176067352295, 14.890939712524414, 18.230119705200195, 21.569299697875977, 24.908477783203125, 28.247657775878906, 31.586837768554688, 34.92601776123047, 38.26519775390625, 41.60437774658203, 44.94355773925781, 48.282737731933594, 51.62191390991211, 54.96109390258789, 58.30027389526367, 61.63945388793945, 64.97863006591797, 68.31781005859375, 71.65699005126953, 74.99617004394531, 78.3353500366211, 81.67453002929688, 85.01371002197266]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 7.0, 6.0, 8.0, 8.0, 10.0, 19.0, 13.0, 9.0, 12.0, 26.0, 22.0, 29.0, 21.0, 29.0, 23.0, 29.0, 21.0, 30.0, 35.0, 34.0, 45.0, 42.0, 38.0, 33.0, 39.0, 41.0, 47.0, 21.0, 33.0, 30.0, 28.0, 32.0, 21.0, 20.0, 19.0, 12.0, 15.0, 13.0, 9.0, 11.0, 5.0, 7.0, 7.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.971534729003906, -15.46187686920166, -14.952219009399414, -14.442560195922852, -13.932902336120605, -13.42324447631836, -12.913585662841797, -12.40392780303955, -11.894269943237305, -11.384612083435059, -10.874954223632812, -10.36529541015625, -9.855637550354004, -9.345979690551758, -8.836320877075195, -8.32666301727295, -7.817005157470703, -7.307347297668457, -6.797688961029053, -6.288030624389648, -5.778372764587402, -5.268714904785156, -4.759056568145752, -4.249398231506348, -3.7397403717041016, -3.2300822734832764, -2.720424175262451, -2.210766077041626, -1.7011079788208008, -1.1914498805999756, -0.6817917823791504, -0.1721336841583252, 0.3375244140625, 0.8471825122833252, 1.3568406105041504, 1.8664987087249756, 2.376156806945801, 2.885814905166626, 3.395473003387451, 3.9051311016082764, 4.414789199829102, 4.924447059631348, 5.434105396270752, 5.943763732910156, 6.453421592712402, 6.963079452514648, 7.472737789154053, 7.982396125793457, 8.492053985595703, 9.00171184539795, 9.511369705200195, 10.021028518676758, 10.530686378479004, 11.04034423828125, 11.550003051757812, 12.059660911560059, 12.569318771362305, 13.07897663116455, 13.588634490966797, 14.09829330444336, 14.607951164245605, 15.117609024047852, 15.627267837524414, 16.136924743652344, 16.646583557128906]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 8.0, 8.0, 4.0, 12.0, 9.0, 15.0, 13.0, 16.0, 19.0, 24.0, 19.0, 32.0, 30.0, 34.0, 36.0, 45.0, 38.0, 33.0, 43.0, 50.0, 41.0, 43.0, 42.0, 37.0, 36.0, 39.0, 36.0, 30.0, 36.0, 30.0, 26.0, 18.0, 21.0, 15.0, 10.0, 7.0, 10.0, 7.0, 5.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.51953125, -2.436309814453125, -2.35308837890625, -2.269866943359375, -2.1866455078125, -2.103424072265625, -2.02020263671875, -1.936981201171875, -1.853759765625, -1.770538330078125, -1.68731689453125, -1.604095458984375, -1.5208740234375, -1.437652587890625, -1.35443115234375, -1.271209716796875, -1.18798828125, -1.104766845703125, -1.02154541015625, -0.938323974609375, -0.8551025390625, -0.771881103515625, -0.68865966796875, -0.605438232421875, -0.522216796875, -0.438995361328125, -0.35577392578125, -0.272552490234375, -0.1893310546875, -0.106109619140625, -0.02288818359375, 0.060333251953125, 0.1435546875, 0.226776123046875, 0.30999755859375, 0.393218994140625, 0.4764404296875, 0.559661865234375, 0.64288330078125, 0.726104736328125, 0.809326171875, 0.892547607421875, 0.97576904296875, 1.058990478515625, 1.1422119140625, 1.225433349609375, 1.30865478515625, 1.391876220703125, 1.47509765625, 1.558319091796875, 1.64154052734375, 1.724761962890625, 1.8079833984375, 1.891204833984375, 1.97442626953125, 2.057647705078125, 2.140869140625, 2.224090576171875, 2.30731201171875, 2.390533447265625, 2.4737548828125, 2.556976318359375, 2.64019775390625, 2.723419189453125, 2.806640625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 5.0, 9.0, 19.0, 35.0, 29.0, 49.0, 83.0, 106.0, 143.0, 230.0, 335.0, 465.0, 750.0, 1063.0, 1589.0, 2379.0, 3690.0, 5789.0, 9255.0, 14929.0, 24838.0, 42883.0, 79056.0, 168009.0, 350266.0, 159941.0, 76681.0, 41970.0, 24190.0, 14406.0, 8832.0, 5615.0, 3643.0, 2362.0, 1638.0, 1047.0, 711.0, 480.0, 327.0, 243.0, 140.0, 108.0, 75.0, 41.0, 28.0, 25.0, 15.0, 10.0, 6.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01617431640625, -0.015676259994506836, -0.015178203582763672, -0.014680147171020508, -0.014182090759277344, -0.01368403434753418, -0.013185977935791016, -0.012687921524047852, -0.012189865112304688, -0.011691808700561523, -0.01119375228881836, -0.010695695877075195, -0.010197639465332031, -0.009699583053588867, -0.009201526641845703, -0.008703470230102539, -0.008205413818359375, -0.007707357406616211, -0.007209300994873047, -0.006711244583129883, -0.006213188171386719, -0.005715131759643555, -0.005217075347900391, -0.0047190189361572266, -0.0042209625244140625, -0.0037229061126708984, -0.0032248497009277344, -0.0027267932891845703, -0.0022287368774414062, -0.0017306804656982422, -0.0012326240539550781, -0.0007345676422119141, -0.00023651123046875, 0.00026154518127441406, 0.0007596015930175781, 0.0012576580047607422, 0.0017557144165039062, 0.0022537708282470703, 0.0027518272399902344, 0.0032498836517333984, 0.0037479400634765625, 0.0042459964752197266, 0.004744052886962891, 0.005242109298706055, 0.005740165710449219, 0.006238222122192383, 0.006736278533935547, 0.007234334945678711, 0.007732391357421875, 0.008230447769165039, 0.008728504180908203, 0.009226560592651367, 0.009724617004394531, 0.010222673416137695, 0.01072072982788086, 0.011218786239624023, 0.011716842651367188, 0.012214899063110352, 0.012712955474853516, 0.01321101188659668, 0.013709068298339844, 0.014207124710083008, 0.014705181121826172, 0.015203237533569336, 0.0157012939453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 10.0, 11.0, 12.0, 17.0, 9.0, 20.0, 13.0, 34.0, 21.0, 31.0, 20.0, 39.0, 35.0, 28.0, 39.0, 35.0, 38.0, 35.0, 1062.0, 37.0, 48.0, 44.0, 42.0, 33.0, 26.0, 31.0, 42.0, 40.0, 28.0, 26.0, 19.0, 24.0, 12.0, 19.0, 6.0, 9.0, 11.0, 7.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.806640625, -1.7514190673828125, -1.696197509765625, -1.6409759521484375, -1.58575439453125, -1.5305328369140625, -1.475311279296875, -1.4200897216796875, -1.3648681640625, -1.3096466064453125, -1.254425048828125, -1.1992034912109375, -1.14398193359375, -1.0887603759765625, -1.033538818359375, -0.9783172607421875, -0.923095703125, -0.8678741455078125, -0.812652587890625, -0.7574310302734375, -0.70220947265625, -0.6469879150390625, -0.591766357421875, -0.5365447998046875, -0.4813232421875, -0.4261016845703125, -0.370880126953125, -0.3156585693359375, -0.26043701171875, -0.2052154541015625, -0.149993896484375, -0.0947723388671875, -0.03955078125, 0.0156707763671875, 0.070892333984375, 0.1261138916015625, 0.18133544921875, 0.2365570068359375, 0.291778564453125, 0.3470001220703125, 0.4022216796875, 0.4574432373046875, 0.512664794921875, 0.5678863525390625, 0.62310791015625, 0.6783294677734375, 0.733551025390625, 0.7887725830078125, 0.843994140625, 0.8992156982421875, 0.954437255859375, 1.0096588134765625, 1.06488037109375, 1.1201019287109375, 1.175323486328125, 1.2305450439453125, 1.2857666015625, 1.3409881591796875, 1.396209716796875, 1.4514312744140625, 1.50665283203125, 1.5618743896484375, 1.617095947265625, 1.6723175048828125, 1.7275390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 14.0, 11.0, 24.0, 33.0, 50.0, 71.0, 122.0, 187.0, 265.0, 399.0, 563.0, 982.0, 1543.0, 2188.0, 3621.0, 5786.0, 9224.0, 15008.0, 24491.0, 40315.0, 67074.0, 123018.0, 1316240.0, 227594.0, 104741.0, 59905.0, 35452.0, 22248.0, 13300.0, 8323.0, 5233.0, 3255.0, 2016.0, 1365.0, 868.0, 543.0, 353.0, 229.0, 166.0, 110.0, 62.0, 46.0, 31.0, 18.0, 18.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0105743408203125, -0.010242700576782227, -0.009911060333251953, -0.00957942008972168, -0.009247779846191406, -0.008916139602661133, -0.00858449935913086, -0.008252859115600586, -0.007921218872070312, -0.007589578628540039, -0.007257938385009766, -0.006926298141479492, -0.006594657897949219, -0.006263017654418945, -0.005931377410888672, -0.0055997371673583984, -0.005268096923828125, -0.0049364566802978516, -0.004604816436767578, -0.004273176193237305, -0.003941535949707031, -0.003609895706176758, -0.0032782554626464844, -0.002946615219116211, -0.0026149749755859375, -0.002283334732055664, -0.0019516944885253906, -0.0016200542449951172, -0.0012884140014648438, -0.0009567737579345703, -0.0006251335144042969, -0.00029349327087402344, 3.814697265625e-05, 0.00036978721618652344, 0.0007014274597167969, 0.0010330677032470703, 0.0013647079467773438, 0.0016963481903076172, 0.0020279884338378906, 0.002359628677368164, 0.0026912689208984375, 0.003022909164428711, 0.0033545494079589844, 0.003686189651489258, 0.004017829895019531, 0.004349470138549805, 0.004681110382080078, 0.0050127506256103516, 0.005344390869140625, 0.0056760311126708984, 0.006007671356201172, 0.006339311599731445, 0.006670951843261719, 0.007002592086791992, 0.007334232330322266, 0.007665872573852539, 0.007997512817382812, 0.008329153060913086, 0.00866079330444336, 0.008992433547973633, 0.009324073791503906, 0.00965571403503418, 0.009987354278564453, 0.010318994522094727, 0.010650634765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 45.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 920.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 4.0, 5.0, 8.0, 0.0, 28.0, 0.0, 2.0, 6.0, 45.0, 56.0, 468.0, 3761.0, 1013982.0, 25755.0, 4200.0, 114.0, 29.0, 41.0, 4.0, 0.0, 14.0, 17.0, 5.0, 3.0, 0.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-06, -3.6582350730895996e-06, -3.56137752532959e-06, -3.46451997756958e-06, -3.3676624298095703e-06, -3.2708048820495605e-06, -3.1739473342895508e-06, -3.077089786529541e-06, -2.9802322387695312e-06, -2.8833746910095215e-06, -2.7865171432495117e-06, -2.689659595489502e-06, -2.592802047729492e-06, -2.4959444999694824e-06, -2.3990869522094727e-06, -2.302229404449463e-06, -2.205371856689453e-06, -2.1085143089294434e-06, -2.0116567611694336e-06, -1.914799213409424e-06, -1.817941665649414e-06, -1.7210841178894043e-06, -1.6242265701293945e-06, -1.5273690223693848e-06, -1.430511474609375e-06, -1.3336539268493652e-06, -1.2367963790893555e-06, -1.1399388313293457e-06, -1.043081283569336e-06, -9.462237358093262e-07, -8.493661880493164e-07, -7.525086402893066e-07, -6.556510925292969e-07, -5.587935447692871e-07, -4.6193599700927734e-07, -3.650784492492676e-07, -2.682209014892578e-07, -1.7136335372924805e-07, -7.450580596923828e-08, 2.2351741790771484e-08, 1.1920928955078125e-07, 2.1606683731079102e-07, 3.129243850708008e-07, 4.0978193283081055e-07, 5.066394805908203e-07, 6.034970283508301e-07, 7.003545761108398e-07, 7.972121238708496e-07, 8.940696716308594e-07, 9.909272193908691e-07, 1.087784767150879e-06, 1.1846423149108887e-06, 1.2814998626708984e-06, 1.3783574104309082e-06, 1.475214958190918e-06, 1.5720725059509277e-06, 1.6689300537109375e-06, 1.7657876014709473e-06, 1.862645149230957e-06, 1.959502696990967e-06, 2.0563602447509766e-06, 2.1532177925109863e-06, 2.250075340270996e-06, 2.346932888031006e-06, 2.4437904357910156e-06]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 8.0, 8.0, 4.0, 12.0, 9.0, 15.0, 13.0, 16.0, 19.0, 24.0, 19.0, 32.0, 30.0, 34.0, 36.0, 45.0, 38.0, 33.0, 43.0, 50.0, 41.0, 43.0, 42.0, 37.0, 36.0, 39.0, 36.0, 30.0, 36.0, 30.0, 26.0, 18.0, 21.0, 15.0, 10.0, 7.0, 10.0, 7.0, 5.0, 4.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.51953125, -2.436309814453125, -2.35308837890625, -2.269866943359375, -2.1866455078125, -2.103424072265625, -2.02020263671875, -1.936981201171875, -1.853759765625, -1.770538330078125, -1.68731689453125, -1.604095458984375, -1.5208740234375, -1.437652587890625, -1.35443115234375, -1.271209716796875, -1.18798828125, -1.104766845703125, -1.02154541015625, -0.938323974609375, -0.8551025390625, -0.771881103515625, -0.68865966796875, -0.605438232421875, -0.522216796875, -0.438995361328125, -0.35577392578125, -0.272552490234375, -0.1893310546875, -0.106109619140625, -0.02288818359375, 0.060333251953125, 0.1435546875, 0.226776123046875, 0.30999755859375, 0.393218994140625, 0.4764404296875, 0.559661865234375, 0.64288330078125, 0.726104736328125, 0.809326171875, 0.892547607421875, 0.97576904296875, 1.058990478515625, 1.1422119140625, 1.225433349609375, 1.30865478515625, 1.391876220703125, 1.47509765625, 1.558319091796875, 1.64154052734375, 1.724761962890625, 1.8079833984375, 1.891204833984375, 1.97442626953125, 2.057647705078125, 2.140869140625, 2.224090576171875, 2.30731201171875, 2.390533447265625, 2.4737548828125, 2.556976318359375, 2.64019775390625, 2.723419189453125, 2.806640625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 7.0, 14.0, 8.0, 18.0, 28.0, 50.0, 79.0, 117.0, 214.0, 294.0, 482.0, 700.0, 1053.0, 1685.0, 2555.0, 3662.0, 5641.0, 8608.0, 13509.0, 23390.0, 45808.0, 110490.0, 331359.0, 297673.0, 99670.0, 42131.0, 21985.0, 12964.0, 8418.0, 5465.0, 3564.0, 2361.0, 1609.0, 1016.0, 647.0, 459.0, 305.0, 193.0, 119.0, 82.0, 52.0, 25.0, 21.0, 12.0, 12.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9248046875, -1.8506317138671875, -1.776458740234375, -1.7022857666015625, -1.62811279296875, -1.5539398193359375, -1.479766845703125, -1.4055938720703125, -1.3314208984375, -1.2572479248046875, -1.183074951171875, -1.1089019775390625, -1.03472900390625, -0.9605560302734375, -0.886383056640625, -0.8122100830078125, -0.738037109375, -0.6638641357421875, -0.589691162109375, -0.5155181884765625, -0.44134521484375, -0.3671722412109375, -0.292999267578125, -0.2188262939453125, -0.1446533203125, -0.0704803466796875, 0.003692626953125, 0.0778656005859375, 0.15203857421875, 0.2262115478515625, 0.300384521484375, 0.3745574951171875, 0.44873046875, 0.5229034423828125, 0.597076416015625, 0.6712493896484375, 0.74542236328125, 0.8195953369140625, 0.893768310546875, 0.9679412841796875, 1.0421142578125, 1.1162872314453125, 1.190460205078125, 1.2646331787109375, 1.33880615234375, 1.4129791259765625, 1.487152099609375, 1.5613250732421875, 1.635498046875, 1.7096710205078125, 1.783843994140625, 1.8580169677734375, 1.93218994140625, 2.0063629150390625, 2.080535888671875, 2.1547088623046875, 2.2288818359375, 2.3030548095703125, 2.377227783203125, 2.4514007568359375, 2.52557373046875, 2.5997467041015625, 2.673919677734375, 2.7480926513671875, 2.822265625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 11.0, 4.0, 6.0, 7.0, 8.0, 10.0, 22.0, 22.0, 31.0, 27.0, 30.0, 34.0, 41.0, 49.0, 33.0, 74.0, 102.0, 226.0, 1545.0, 208.0, 107.0, 58.0, 67.0, 56.0, 38.0, 32.0, 43.0, 27.0, 25.0, 22.0, 13.0, 13.0, 17.0, 9.0, 8.0, 5.0, 4.0, 1.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.0234375, -9.741455078125, -9.45947265625, -9.177490234375, -8.8955078125, -8.613525390625, -8.33154296875, -8.049560546875, -7.767578125, -7.485595703125, -7.20361328125, -6.921630859375, -6.6396484375, -6.357666015625, -6.07568359375, -5.793701171875, -5.51171875, -5.229736328125, -4.94775390625, -4.665771484375, -4.3837890625, -4.101806640625, -3.81982421875, -3.537841796875, -3.255859375, -2.973876953125, -2.69189453125, -2.409912109375, -2.1279296875, -1.845947265625, -1.56396484375, -1.281982421875, -1.0, -0.718017578125, -0.43603515625, -0.154052734375, 0.1279296875, 0.409912109375, 0.69189453125, 0.973876953125, 1.255859375, 1.537841796875, 1.81982421875, 2.101806640625, 2.3837890625, 2.665771484375, 2.94775390625, 3.229736328125, 3.51171875, 3.793701171875, 4.07568359375, 4.357666015625, 4.6396484375, 4.921630859375, 5.20361328125, 5.485595703125, 5.767578125, 6.049560546875, 6.33154296875, 6.613525390625, 6.8955078125, 7.177490234375, 7.45947265625, 7.741455078125, 8.0234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 3.0, 4.0, 7.0, 12.0, 12.0, 14.0, 25.0, 32.0, 38.0, 53.0, 62.0, 68.0, 108.0, 134.0, 174.0, 241.0, 399.0, 1074.0, 7221.0, 225166.0, 2880887.0, 25974.0, 2355.0, 489.0, 279.0, 206.0, 167.0, 98.0, 88.0, 70.0, 59.0, 42.0, 36.0, 17.0, 14.0, 20.0, 11.0, 9.0, 16.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.8885498046875, -13.378662109375, -12.8687744140625, -12.35888671875, -11.8489990234375, -11.339111328125, -10.8292236328125, -10.3193359375, -9.8094482421875, -9.299560546875, -8.7896728515625, -8.27978515625, -7.7698974609375, -7.260009765625, -6.7501220703125, -6.240234375, -5.7303466796875, -5.220458984375, -4.7105712890625, -4.20068359375, -3.6907958984375, -3.180908203125, -2.6710205078125, -2.1611328125, -1.6512451171875, -1.141357421875, -0.6314697265625, -0.12158203125, 0.3883056640625, 0.898193359375, 1.4080810546875, 1.91796875, 2.4278564453125, 2.937744140625, 3.4476318359375, 3.95751953125, 4.4674072265625, 4.977294921875, 5.4871826171875, 5.9970703125, 6.5069580078125, 7.016845703125, 7.5267333984375, 8.03662109375, 8.5465087890625, 9.056396484375, 9.5662841796875, 10.076171875, 10.5860595703125, 11.095947265625, 11.6058349609375, 12.11572265625, 12.6256103515625, 13.135498046875, 13.6453857421875, 14.1552734375, 14.6651611328125, 15.175048828125, 15.6849365234375, 16.19482421875, 16.7047119140625, 17.214599609375, 17.7244873046875, 18.234375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 25.0, 122.0, 291.0, 340.0, 182.0, 48.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.730520248413086, -7.510559558868408, -6.2905988693237305, -5.0706377029418945, -3.850677013397217, -2.630716323852539, -1.4107551574707031, -0.1907949447631836, 1.0291662216186523, 2.24912691116333, 3.469087839126587, 4.689048767089844, 5.9090094566345215, 7.128970146179199, 8.348931312561035, 9.568891525268555, 10.78885269165039, 12.008813858032227, 13.228774070739746, 14.448735237121582, 15.668695449829102, 16.888656616210938, 18.108617782592773, 19.32857894897461, 20.548538208007812, 21.76849937438965, 22.988460540771484, 24.208419799804688, 25.428380966186523, 26.64834213256836, 27.868303298950195, 29.08826446533203, 30.308223724365234, 31.52818489074707, 32.748146057128906, 33.96810531616211, 35.18806838989258, 36.40802764892578, 37.62799072265625, 38.84794998168945, 40.067909240722656, 41.28786849975586, 42.50783157348633, 43.72779083251953, 44.94775390625, 46.1677131652832, 47.387672424316406, 48.607635498046875, 49.827598571777344, 51.04755783081055, 52.267520904541016, 53.48748016357422, 54.70744323730469, 55.92740249633789, 57.147361755371094, 58.36732482910156, 59.587284088134766, 60.80724334716797, 62.02720642089844, 63.24716567993164, 64.46712493896484, 65.68708801269531, 66.90705108642578, 68.12700653076172, 69.34696960449219]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 2.0, 4.0, 7.0, 9.0, 7.0, 9.0, 20.0, 14.0, 20.0, 17.0, 21.0, 24.0, 30.0, 31.0, 41.0, 41.0, 30.0, 40.0, 49.0, 37.0, 46.0, 55.0, 47.0, 51.0, 36.0, 38.0, 36.0, 40.0, 31.0, 33.0, 17.0, 18.0, 17.0, 13.0, 12.0, 13.0, 10.0, 9.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.985671997070312, -23.186918258666992, -22.388166427612305, -21.589412689208984, -20.790658950805664, -19.991907119750977, -19.193153381347656, -18.39440155029297, -17.59564781188965, -16.796894073486328, -15.998141288757324, -15.19938850402832, -14.400635719299316, -13.601882934570312, -12.803129196166992, -12.004376411437988, -11.205622673034668, -10.406869888305664, -9.608116149902344, -8.80936336517334, -8.010610580444336, -7.211857318878174, -6.413104057312012, -5.614351272583008, -4.815598011016846, -4.016844749450684, -3.2180919647216797, -2.4193387031555176, -1.6205856800079346, -0.8218326568603516, -0.023079395294189453, 0.7756733894348145, 1.5744266510009766, 2.3731796741485596, 3.1719326972961426, 3.9706859588623047, 4.769438743591309, 5.568192005157471, 6.366945266723633, 7.165698051452637, 7.964451313018799, 8.763204574584961, 9.561957359313965, 10.360710144042969, 11.159463882446289, 11.958216667175293, 12.756969451904297, 13.555723190307617, 14.354475975036621, 15.153228759765625, 15.951982498168945, 16.750736236572266, 17.549488067626953, 18.348241806030273, 19.146995544433594, 19.94574737548828, 20.7445011138916, 21.543254852294922, 22.34200668334961, 23.14076042175293, 23.93951416015625, 24.738265991210938, 25.537019729614258, 26.335773468017578, 27.134525299072266]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 9.0, 8.0, 7.0, 10.0, 12.0, 12.0, 16.0, 22.0, 21.0, 25.0, 28.0, 31.0, 30.0, 34.0, 40.0, 34.0, 44.0, 41.0, 47.0, 53.0, 29.0, 41.0, 44.0, 39.0, 35.0, 38.0, 31.0, 27.0, 30.0, 29.0, 18.0, 26.0, 12.0, 12.0, 13.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6015625, -2.516021728515625, -2.43048095703125, -2.344940185546875, -2.2593994140625, -2.173858642578125, -2.08831787109375, -2.002777099609375, -1.917236328125, -1.831695556640625, -1.74615478515625, -1.660614013671875, -1.5750732421875, -1.489532470703125, -1.40399169921875, -1.318450927734375, -1.23291015625, -1.147369384765625, -1.06182861328125, -0.976287841796875, -0.8907470703125, -0.805206298828125, -0.71966552734375, -0.634124755859375, -0.548583984375, -0.463043212890625, -0.37750244140625, -0.291961669921875, -0.2064208984375, -0.120880126953125, -0.03533935546875, 0.050201416015625, 0.1357421875, 0.221282958984375, 0.30682373046875, 0.392364501953125, 0.4779052734375, 0.563446044921875, 0.64898681640625, 0.734527587890625, 0.820068359375, 0.905609130859375, 0.99114990234375, 1.076690673828125, 1.1622314453125, 1.247772216796875, 1.33331298828125, 1.418853759765625, 1.50439453125, 1.589935302734375, 1.67547607421875, 1.761016845703125, 1.8465576171875, 1.932098388671875, 2.01763916015625, 2.103179931640625, 2.188720703125, 2.274261474609375, 2.35980224609375, 2.445343017578125, 2.5308837890625, 2.616424560546875, 2.70196533203125, 2.787506103515625, 2.873046875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 6.0, 17.0, 7.0, 9.0, 24.0, 39.0, 35.0, 68.0, 99.0, 233.0, 383.0, 828.0, 1741.0, 4370.0, 12456.0, 43219.0, 190694.0, 1057691.0, 2141286.0, 588223.0, 110633.0, 27777.0, 8451.0, 3151.0, 1368.0, 633.0, 303.0, 180.0, 100.0, 71.0, 56.0, 25.0, 19.0, 13.0, 14.0, 7.0, 6.0, 3.0, 3.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.1373291015625, -4.962158203125, -4.7869873046875, -4.61181640625, -4.4366455078125, -4.261474609375, -4.0863037109375, -3.9111328125, -3.7359619140625, -3.560791015625, -3.3856201171875, -3.21044921875, -3.0352783203125, -2.860107421875, -2.6849365234375, -2.509765625, -2.3345947265625, -2.159423828125, -1.9842529296875, -1.80908203125, -1.6339111328125, -1.458740234375, -1.2835693359375, -1.1083984375, -0.9332275390625, -0.758056640625, -0.5828857421875, -0.40771484375, -0.2325439453125, -0.057373046875, 0.1177978515625, 0.29296875, 0.4681396484375, 0.643310546875, 0.8184814453125, 0.99365234375, 1.1688232421875, 1.343994140625, 1.5191650390625, 1.6943359375, 1.8695068359375, 2.044677734375, 2.2198486328125, 2.39501953125, 2.5701904296875, 2.745361328125, 2.9205322265625, 3.095703125, 3.2708740234375, 3.446044921875, 3.6212158203125, 3.79638671875, 3.9715576171875, 4.146728515625, 4.3218994140625, 4.4970703125, 4.6722412109375, 4.847412109375, 5.0225830078125, 5.19775390625, 5.3729248046875, 5.548095703125, 5.7232666015625, 5.8984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 11.0, 5.0, 13.0, 22.0, 27.0, 51.0, 56.0, 73.0, 83.0, 133.0, 206.0, 253.0, 310.0, 380.0, 442.0, 448.0, 380.0, 325.0, 247.0, 167.0, 123.0, 84.0, 73.0, 44.0, 34.0, 18.0, 16.0, 10.0, 13.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3125, -5.13507080078125, -4.9576416015625, -4.78021240234375, -4.602783203125, -4.42535400390625, -4.2479248046875, -4.07049560546875, -3.89306640625, -3.71563720703125, -3.5382080078125, -3.36077880859375, -3.183349609375, -3.00592041015625, -2.8284912109375, -2.65106201171875, -2.4736328125, -2.29620361328125, -2.1187744140625, -1.94134521484375, -1.763916015625, -1.58648681640625, -1.4090576171875, -1.23162841796875, -1.05419921875, -0.87677001953125, -0.6993408203125, -0.52191162109375, -0.344482421875, -0.16705322265625, 0.0103759765625, 0.18780517578125, 0.365234375, 0.54266357421875, 0.7200927734375, 0.89752197265625, 1.074951171875, 1.25238037109375, 1.4298095703125, 1.60723876953125, 1.78466796875, 1.96209716796875, 2.1395263671875, 2.31695556640625, 2.494384765625, 2.67181396484375, 2.8492431640625, 3.02667236328125, 3.2041015625, 3.38153076171875, 3.5589599609375, 3.73638916015625, 3.913818359375, 4.09124755859375, 4.2686767578125, 4.44610595703125, 4.62353515625, 4.80096435546875, 4.9783935546875, 5.15582275390625, 5.333251953125, 5.51068115234375, 5.6881103515625, 5.86553955078125, 6.04296875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 10.0, 3.0, 14.0, 30.0, 36.0, 56.0, 71.0, 98.0, 154.0, 199.0, 345.0, 671.0, 3431.0, 74683.0, 3127225.0, 963465.0, 20616.0, 1644.0, 513.0, 314.0, 201.0, 134.0, 83.0, 80.0, 57.0, 50.0, 33.0, 15.0, 8.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.046875, -19.4541015625, -18.861328125, -18.2685546875, -17.67578125, -17.0830078125, -16.490234375, -15.8974609375, -15.3046875, -14.7119140625, -14.119140625, -13.5263671875, -12.93359375, -12.3408203125, -11.748046875, -11.1552734375, -10.5625, -9.9697265625, -9.376953125, -8.7841796875, -8.19140625, -7.5986328125, -7.005859375, -6.4130859375, -5.8203125, -5.2275390625, -4.634765625, -4.0419921875, -3.44921875, -2.8564453125, -2.263671875, -1.6708984375, -1.078125, -0.4853515625, 0.107421875, 0.7001953125, 1.29296875, 1.8857421875, 2.478515625, 3.0712890625, 3.6640625, 4.2568359375, 4.849609375, 5.4423828125, 6.03515625, 6.6279296875, 7.220703125, 7.8134765625, 8.40625, 8.9990234375, 9.591796875, 10.1845703125, 10.77734375, 11.3701171875, 11.962890625, 12.5556640625, 13.1484375, 13.7412109375, 14.333984375, 14.9267578125, 15.51953125, 16.1123046875, 16.705078125, 17.2978515625, 17.890625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 14.0, 26.0, 37.0, 71.0, 99.0, 114.0, 132.0, 155.0, 136.0, 85.0, 54.0, 39.0, 24.0, 14.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.38740158081055, -34.17501449584961, -32.962623596191406, -31.75023651123047, -30.5378475189209, -29.325458526611328, -28.11307144165039, -26.90068244934082, -25.68829345703125, -24.47590446472168, -23.26351547241211, -22.051128387451172, -20.8387393951416, -19.62635040283203, -18.413963317871094, -17.201574325561523, -15.989185333251953, -14.776796340942383, -13.564408302307129, -12.352020263671875, -11.139631271362305, -9.927242279052734, -8.71485424041748, -7.502466201782227, -6.290077209472656, -5.077688694000244, -3.865300178527832, -2.65291166305542, -1.4405231475830078, -0.2281346321105957, 0.9842538833618164, 2.1966419219970703, 3.409027099609375, 4.621415615081787, 5.833804130554199, 7.046192646026611, 8.258581161499023, 9.470970153808594, 10.683358192443848, 11.895746231079102, 13.108135223388672, 14.320524215698242, 15.532912254333496, 16.74530029296875, 17.95768928527832, 19.17007827758789, 20.382465362548828, 21.5948543548584, 22.80724334716797, 24.01963233947754, 25.23202133178711, 26.444408416748047, 27.656797409057617, 28.869186401367188, 30.081573486328125, 31.293962478637695, 32.506351470947266, 33.7187385559082, 34.931129455566406, 36.143516540527344, 37.35590362548828, 38.568294525146484, 39.78068161010742, 40.993072509765625, 42.20545959472656]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 9.0, 11.0, 9.0, 19.0, 16.0, 17.0, 22.0, 27.0, 33.0, 23.0, 21.0, 28.0, 34.0, 30.0, 47.0, 31.0, 34.0, 45.0, 44.0, 35.0, 50.0, 39.0, 39.0, 32.0, 42.0, 32.0, 24.0, 24.0, 37.0, 25.0, 12.0, 17.0, 16.0, 14.0, 14.0, 3.0, 6.0, 4.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.936317443847656, -17.336288452148438, -16.73625946044922, -16.13623046875, -15.536201477050781, -14.936172485351562, -14.336143493652344, -13.736114501953125, -13.136085510253906, -12.536056518554688, -11.936027526855469, -11.33599853515625, -10.735969543457031, -10.135940551757812, -9.535911560058594, -8.935882568359375, -8.335853576660156, -7.7358245849609375, -7.135795593261719, -6.5357666015625, -5.935737609863281, -5.3357086181640625, -4.735679626464844, -4.135650634765625, -3.5356216430664062, -2.9355926513671875, -2.3355636596679688, -1.73553466796875, -1.1355056762695312, -0.5354766845703125, 0.06455230712890625, 0.664581298828125, 1.2646102905273438, 1.8646392822265625, 2.4646682739257812, 3.064697265625, 3.6647262573242188, 4.2647552490234375, 4.864784240722656, 5.464813232421875, 6.064842224121094, 6.6648712158203125, 7.264900207519531, 7.86492919921875, 8.464958190917969, 9.064987182617188, 9.665016174316406, 10.265045166015625, 10.865074157714844, 11.465103149414062, 12.065132141113281, 12.6651611328125, 13.265190124511719, 13.865219116210938, 14.465248107910156, 15.065277099609375, 15.665306091308594, 16.265335083007812, 16.86536407470703, 17.46539306640625, 18.06542205810547, 18.665451049804688, 19.265480041503906, 19.865509033203125, 20.465538024902344]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 14.0, 18.0, 20.0, 19.0, 12.0, 21.0, 25.0, 30.0, 24.0, 27.0, 25.0, 40.0, 43.0, 38.0, 54.0, 34.0, 55.0, 38.0, 43.0, 42.0, 46.0, 32.0, 34.0, 36.0, 31.0, 27.0, 15.0, 26.0, 18.0, 15.0, 15.0, 9.0, 14.0, 6.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.481689453125, -2.39501953125, -2.308349609375, -2.2216796875, -2.135009765625, -2.04833984375, -1.961669921875, -1.875, -1.788330078125, -1.70166015625, -1.614990234375, -1.5283203125, -1.441650390625, -1.35498046875, -1.268310546875, -1.181640625, -1.094970703125, -1.00830078125, -0.921630859375, -0.8349609375, -0.748291015625, -0.66162109375, -0.574951171875, -0.48828125, -0.401611328125, -0.31494140625, -0.228271484375, -0.1416015625, -0.054931640625, 0.03173828125, 0.118408203125, 0.205078125, 0.291748046875, 0.37841796875, 0.465087890625, 0.5517578125, 0.638427734375, 0.72509765625, 0.811767578125, 0.8984375, 0.985107421875, 1.07177734375, 1.158447265625, 1.2451171875, 1.331787109375, 1.41845703125, 1.505126953125, 1.591796875, 1.678466796875, 1.76513671875, 1.851806640625, 1.9384765625, 2.025146484375, 2.11181640625, 2.198486328125, 2.28515625, 2.371826171875, 2.45849609375, 2.545166015625, 2.6318359375, 2.718505859375, 2.80517578125, 2.891845703125, 2.978515625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 14.0, 9.0, 18.0, 22.0, 44.0, 55.0, 88.0, 127.0, 171.0, 271.0, 344.0, 555.0, 821.0, 1236.0, 1791.0, 2620.0, 3814.0, 5661.0, 8678.0, 12995.0, 19501.0, 30771.0, 49934.0, 87234.0, 189151.0, 312299.0, 134232.0, 68983.0, 40954.0, 25738.0, 16615.0, 11204.0, 7446.0, 4840.0, 3219.0, 2326.0, 1543.0, 1045.0, 708.0, 451.0, 321.0, 239.0, 130.0, 112.0, 80.0, 47.0, 39.0, 21.0, 17.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0141143798828125, -0.013663530349731445, -0.01321268081665039, -0.012761831283569336, -0.012310981750488281, -0.011860132217407227, -0.011409282684326172, -0.010958433151245117, -0.010507583618164062, -0.010056734085083008, -0.009605884552001953, -0.009155035018920898, -0.008704185485839844, -0.008253335952758789, -0.007802486419677734, -0.00735163688659668, -0.006900787353515625, -0.00644993782043457, -0.005999088287353516, -0.005548238754272461, -0.005097389221191406, -0.0046465396881103516, -0.004195690155029297, -0.003744840621948242, -0.0032939910888671875, -0.002843141555786133, -0.002392292022705078, -0.0019414424896240234, -0.0014905929565429688, -0.001039743423461914, -0.0005888938903808594, -0.0001380443572998047, 0.00031280517578125, 0.0007636547088623047, 0.0012145042419433594, 0.001665353775024414, 0.0021162033081054688, 0.0025670528411865234, 0.003017902374267578, 0.003468751907348633, 0.0039196014404296875, 0.004370450973510742, 0.004821300506591797, 0.0052721500396728516, 0.005722999572753906, 0.006173849105834961, 0.006624698638916016, 0.00707554817199707, 0.007526397705078125, 0.00797724723815918, 0.008428096771240234, 0.008878946304321289, 0.009329795837402344, 0.009780645370483398, 0.010231494903564453, 0.010682344436645508, 0.011133193969726562, 0.011584043502807617, 0.012034893035888672, 0.012485742568969727, 0.012936592102050781, 0.013387441635131836, 0.01383829116821289, 0.014289140701293945, 0.014739990234375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 12.0, 4.0, 3.0, 11.0, 17.0, 11.0, 17.0, 13.0, 12.0, 27.0, 29.0, 33.0, 31.0, 26.0, 24.0, 29.0, 36.0, 42.0, 35.0, 34.0, 47.0, 1071.0, 36.0, 37.0, 41.0, 37.0, 23.0, 30.0, 31.0, 33.0, 21.0, 28.0, 15.0, 19.0, 16.0, 11.0, 17.0, 10.0, 11.0, 11.0, 10.0, 5.0, 7.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.7587890625, -1.7071685791015625, -1.655548095703125, -1.6039276123046875, -1.55230712890625, -1.5006866455078125, -1.449066162109375, -1.3974456787109375, -1.3458251953125, -1.2942047119140625, -1.242584228515625, -1.1909637451171875, -1.13934326171875, -1.0877227783203125, -1.036102294921875, -0.9844818115234375, -0.932861328125, -0.8812408447265625, -0.829620361328125, -0.7779998779296875, -0.72637939453125, -0.6747589111328125, -0.623138427734375, -0.5715179443359375, -0.5198974609375, -0.4682769775390625, -0.416656494140625, -0.3650360107421875, -0.31341552734375, -0.2617950439453125, -0.210174560546875, -0.1585540771484375, -0.10693359375, -0.0553131103515625, -0.003692626953125, 0.0479278564453125, 0.09954833984375, 0.1511688232421875, 0.202789306640625, 0.2544097900390625, 0.3060302734375, 0.3576507568359375, 0.409271240234375, 0.4608917236328125, 0.51251220703125, 0.5641326904296875, 0.615753173828125, 0.6673736572265625, 0.718994140625, 0.7706146240234375, 0.822235107421875, 0.8738555908203125, 0.92547607421875, 0.9770965576171875, 1.028717041015625, 1.0803375244140625, 1.1319580078125, 1.1835784912109375, 1.235198974609375, 1.2868194580078125, 1.33843994140625, 1.3900604248046875, 1.441680908203125, 1.4933013916015625, 1.544921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 11.0, 9.0, 16.0, 31.0, 47.0, 62.0, 100.0, 137.0, 219.0, 298.0, 537.0, 724.0, 1084.0, 1675.0, 2488.0, 3649.0, 5660.0, 8604.0, 13041.0, 20521.0, 31927.0, 51204.0, 86162.0, 179175.0, 1342780.0, 145159.0, 75069.0, 45057.0, 28705.0, 18420.0, 11851.0, 7598.0, 4977.0, 3347.0, 2238.0, 1476.0, 1027.0, 647.0, 426.0, 325.0, 227.0, 131.0, 95.0, 62.0, 46.0, 32.0, 22.0, 7.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.009490966796875, -0.009178519248962402, -0.008866071701049805, -0.008553624153137207, -0.00824117660522461, -0.007928729057312012, -0.007616281509399414, -0.007303833961486816, -0.006991386413574219, -0.006678938865661621, -0.0063664913177490234, -0.006054043769836426, -0.005741596221923828, -0.0054291486740112305, -0.005116701126098633, -0.004804253578186035, -0.0044918060302734375, -0.00417935848236084, -0.003866910934448242, -0.0035544633865356445, -0.003242015838623047, -0.0029295682907104492, -0.0026171207427978516, -0.002304673194885254, -0.0019922256469726562, -0.0016797780990600586, -0.001367330551147461, -0.0010548830032348633, -0.0007424354553222656, -0.00042998790740966797, -0.00011754035949707031, 0.00019490718841552734, 0.000507354736328125, 0.0008198022842407227, 0.0011322498321533203, 0.001444697380065918, 0.0017571449279785156, 0.0020695924758911133, 0.002382040023803711, 0.0026944875717163086, 0.0030069351196289062, 0.003319382667541504, 0.0036318302154541016, 0.003944277763366699, 0.004256725311279297, 0.0045691728591918945, 0.004881620407104492, 0.00519406795501709, 0.0055065155029296875, 0.005818963050842285, 0.006131410598754883, 0.0064438581466674805, 0.006756305694580078, 0.007068753242492676, 0.0073812007904052734, 0.007693648338317871, 0.008006095886230469, 0.008318543434143066, 0.008630990982055664, 0.008943438529968262, 0.00925588607788086, 0.009568333625793457, 0.009880781173706055, 0.010193228721618652, 0.01050567626953125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 931.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 11.0, 4.0, 0.0, 1.0, 20.0, 4.0, 0.0, 1.0, 1.0, 0.0, 47.0, 19.0, 21.0, 304.0, 2163.0, 20974.0, 1001317.0, 23287.0, 151.0, 98.0, 58.0, 26.0, 10.0, 1.0, 1.0, 1.0, 0.0, 11.0, 0.0, 0.0, 5.0, 0.0, 16.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.187676727771759e-06, -2.1103769540786743e-06, -2.0330771803855896e-06, -1.955777406692505e-06, -1.8784776329994202e-06, -1.8011778593063354e-06, -1.7238780856132507e-06, -1.646578311920166e-06, -1.5692785382270813e-06, -1.4919787645339966e-06, -1.4146789908409119e-06, -1.3373792171478271e-06, -1.2600794434547424e-06, -1.1827796697616577e-06, -1.105479896068573e-06, -1.0281801223754883e-06, -9.508803486824036e-07, -8.735805749893188e-07, -7.962808012962341e-07, -7.189810276031494e-07, -6.416812539100647e-07, -5.6438148021698e-07, -4.870817065238953e-07, -4.0978193283081055e-07, -3.3248215913772583e-07, -2.551823854446411e-07, -1.778826117515564e-07, -1.0058283805847168e-07, -2.3283064365386963e-08, 5.4016709327697754e-08, 1.3131648302078247e-07, 2.086162567138672e-07, 2.859160304069519e-07, 3.632158041000366e-07, 4.4051557779312134e-07, 5.178153514862061e-07, 5.951151251792908e-07, 6.724148988723755e-07, 7.497146725654602e-07, 8.270144462585449e-07, 9.043142199516296e-07, 9.816139936447144e-07, 1.058913767337799e-06, 1.1362135410308838e-06, 1.2135133147239685e-06, 1.2908130884170532e-06, 1.368112862110138e-06, 1.4454126358032227e-06, 1.5227124094963074e-06, 1.600012183189392e-06, 1.6773119568824768e-06, 1.7546117305755615e-06, 1.8319115042686462e-06, 1.909211277961731e-06, 1.9865110516548157e-06, 2.0638108253479004e-06, 2.141110599040985e-06, 2.21841037273407e-06, 2.2957101464271545e-06, 2.3730099201202393e-06, 2.450309693813324e-06, 2.5276094675064087e-06, 2.6049092411994934e-06, 2.682209014892578e-06]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 6.0, 14.0, 18.0, 20.0, 19.0, 12.0, 21.0, 25.0, 30.0, 24.0, 27.0, 25.0, 40.0, 43.0, 38.0, 54.0, 34.0, 55.0, 38.0, 43.0, 42.0, 46.0, 32.0, 34.0, 36.0, 31.0, 27.0, 15.0, 26.0, 18.0, 15.0, 15.0, 9.0, 14.0, 6.0, 11.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.568359375, -2.481689453125, -2.39501953125, -2.308349609375, -2.2216796875, -2.135009765625, -2.04833984375, -1.961669921875, -1.875, -1.788330078125, -1.70166015625, -1.614990234375, -1.5283203125, -1.441650390625, -1.35498046875, -1.268310546875, -1.181640625, -1.094970703125, -1.00830078125, -0.921630859375, -0.8349609375, -0.748291015625, -0.66162109375, -0.574951171875, -0.48828125, -0.401611328125, -0.31494140625, -0.228271484375, -0.1416015625, -0.054931640625, 0.03173828125, 0.118408203125, 0.205078125, 0.291748046875, 0.37841796875, 0.465087890625, 0.5517578125, 0.638427734375, 0.72509765625, 0.811767578125, 0.8984375, 0.985107421875, 1.07177734375, 1.158447265625, 1.2451171875, 1.331787109375, 1.41845703125, 1.505126953125, 1.591796875, 1.678466796875, 1.76513671875, 1.851806640625, 1.9384765625, 2.025146484375, 2.11181640625, 2.198486328125, 2.28515625, 2.371826171875, 2.45849609375, 2.545166015625, 2.6318359375, 2.718505859375, 2.80517578125, 2.891845703125, 2.978515625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 4.0, 19.0, 21.0, 28.0, 43.0, 67.0, 100.0, 142.0, 179.0, 271.0, 442.0, 661.0, 1022.0, 1445.0, 2268.0, 3553.0, 6085.0, 11404.0, 24282.0, 59980.0, 168454.0, 403906.0, 221807.0, 79166.0, 30564.0, 13773.0, 7207.0, 4191.0, 2528.0, 1666.0, 1050.0, 719.0, 493.0, 332.0, 209.0, 152.0, 93.0, 65.0, 45.0, 32.0, 28.0, 23.0, 8.0, 7.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.08160400390625, -2.0089111328125, -1.93621826171875, -1.863525390625, -1.79083251953125, -1.7181396484375, -1.64544677734375, -1.57275390625, -1.50006103515625, -1.4273681640625, -1.35467529296875, -1.281982421875, -1.20928955078125, -1.1365966796875, -1.06390380859375, -0.9912109375, -0.91851806640625, -0.8458251953125, -0.77313232421875, -0.700439453125, -0.62774658203125, -0.5550537109375, -0.48236083984375, -0.40966796875, -0.33697509765625, -0.2642822265625, -0.19158935546875, -0.118896484375, -0.04620361328125, 0.0264892578125, 0.09918212890625, 0.171875, 0.24456787109375, 0.3172607421875, 0.38995361328125, 0.462646484375, 0.53533935546875, 0.6080322265625, 0.68072509765625, 0.75341796875, 0.82611083984375, 0.8988037109375, 0.97149658203125, 1.044189453125, 1.11688232421875, 1.1895751953125, 1.26226806640625, 1.3349609375, 1.40765380859375, 1.4803466796875, 1.55303955078125, 1.625732421875, 1.69842529296875, 1.7711181640625, 1.84381103515625, 1.91650390625, 1.98919677734375, 2.0618896484375, 2.13458251953125, 2.207275390625, 2.27996826171875, 2.3526611328125, 2.42535400390625, 2.498046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 10.0, 11.0, 9.0, 13.0, 21.0, 12.0, 17.0, 29.0, 23.0, 42.0, 32.0, 41.0, 37.0, 42.0, 70.0, 129.0, 352.0, 1559.0, 173.0, 63.0, 62.0, 48.0, 38.0, 39.0, 26.0, 28.0, 20.0, 23.0, 12.0, 10.0, 9.0, 11.0, 10.0, 4.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.593017578125, -9.26416015625, -8.935302734375, -8.6064453125, -8.277587890625, -7.94873046875, -7.619873046875, -7.291015625, -6.962158203125, -6.63330078125, -6.304443359375, -5.9755859375, -5.646728515625, -5.31787109375, -4.989013671875, -4.66015625, -4.331298828125, -4.00244140625, -3.673583984375, -3.3447265625, -3.015869140625, -2.68701171875, -2.358154296875, -2.029296875, -1.700439453125, -1.37158203125, -1.042724609375, -0.7138671875, -0.385009765625, -0.05615234375, 0.272705078125, 0.6015625, 0.930419921875, 1.25927734375, 1.588134765625, 1.9169921875, 2.245849609375, 2.57470703125, 2.903564453125, 3.232421875, 3.561279296875, 3.89013671875, 4.218994140625, 4.5478515625, 4.876708984375, 5.20556640625, 5.534423828125, 5.86328125, 6.192138671875, 6.52099609375, 6.849853515625, 7.1787109375, 7.507568359375, 7.83642578125, 8.165283203125, 8.494140625, 8.822998046875, 9.15185546875, 9.480712890625, 9.8095703125, 10.138427734375, 10.46728515625, 10.796142578125, 11.125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 5.0, 7.0, 7.0, 16.0, 12.0, 15.0, 16.0, 20.0, 38.0, 45.0, 64.0, 77.0, 108.0, 183.0, 262.0, 487.0, 1729.0, 25190.0, 3073128.0, 40612.0, 2150.0, 548.0, 279.0, 177.0, 140.0, 112.0, 69.0, 52.0, 23.0, 25.0, 17.0, 27.0, 10.0, 13.0, 13.0, 10.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.90625, -20.283203125, -19.66015625, -19.037109375, -18.4140625, -17.791015625, -17.16796875, -16.544921875, -15.921875, -15.298828125, -14.67578125, -14.052734375, -13.4296875, -12.806640625, -12.18359375, -11.560546875, -10.9375, -10.314453125, -9.69140625, -9.068359375, -8.4453125, -7.822265625, -7.19921875, -6.576171875, -5.953125, -5.330078125, -4.70703125, -4.083984375, -3.4609375, -2.837890625, -2.21484375, -1.591796875, -0.96875, -0.345703125, 0.27734375, 0.900390625, 1.5234375, 2.146484375, 2.76953125, 3.392578125, 4.015625, 4.638671875, 5.26171875, 5.884765625, 6.5078125, 7.130859375, 7.75390625, 8.376953125, 9.0, 9.623046875, 10.24609375, 10.869140625, 11.4921875, 12.115234375, 12.73828125, 13.361328125, 13.984375, 14.607421875, 15.23046875, 15.853515625, 16.4765625, 17.099609375, 17.72265625, 18.345703125, 18.96875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 15.0, 53.0, 163.0, 300.0, 271.0, 146.0, 54.0, 12.0, 3.0], "bins": [-49.93052673339844, -49.08224105834961, -48.23395919799805, -47.38567352294922, -46.537391662597656, -45.68910598754883, -44.840824127197266, -43.99253845214844, -43.144256591796875, -42.29597091674805, -41.447689056396484, -40.599403381347656, -39.751121520996094, -38.902835845947266, -38.0545539855957, -37.206268310546875, -36.35798645019531, -35.509700775146484, -34.66141891479492, -33.813133239746094, -32.96485137939453, -32.1165657043457, -31.26828384399414, -30.420000076293945, -29.571714401245117, -28.723430633544922, -27.875146865844727, -27.02686309814453, -26.178579330444336, -25.33029556274414, -24.482011795043945, -23.63372802734375, -22.785446166992188, -21.937162399291992, -21.088878631591797, -20.2405948638916, -19.392311096191406, -18.54402732849121, -17.695743560791016, -16.84745979309082, -15.999174118041992, -15.150890350341797, -14.302606582641602, -13.454322814941406, -12.606039047241211, -11.757755279541016, -10.90947151184082, -10.061187744140625, -9.21290397644043, -8.364620208740234, -7.516336441040039, -6.668052673339844, -5.819768905639648, -4.971484661102295, -4.1232008934021, -3.2749171257019043, -2.426633358001709, -1.5783495903015137, -0.7300657033920288, 0.11821818351745605, 0.9665019512176514, 1.8147859573364258, 2.663069725036621, 3.5113534927368164, 4.359637260437012]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 8.0, 7.0, 6.0, 9.0, 11.0, 6.0, 12.0, 14.0, 15.0, 22.0, 22.0, 24.0, 30.0, 30.0, 18.0, 31.0, 21.0, 35.0, 41.0, 50.0, 39.0, 47.0, 43.0, 34.0, 40.0, 38.0, 41.0, 51.0, 50.0, 27.0, 32.0, 21.0, 17.0, 24.0, 12.0, 16.0, 10.0, 9.0, 8.0, 8.0, 6.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.588218688964844, -21.821998596191406, -21.05577850341797, -20.2895565032959, -19.52333641052246, -18.757116317749023, -17.990896224975586, -17.224674224853516, -16.458454132080078, -15.69223403930664, -14.926012992858887, -14.15979290008545, -13.393571853637695, -12.627351760864258, -11.86113166809082, -11.094910621643066, -10.328690528869629, -9.562470436096191, -8.796249389648438, -8.030029296875, -7.263808250427246, -6.497588157653809, -5.731367588043213, -4.965147018432617, -4.1989264488220215, -3.432705879211426, -2.66648530960083, -1.9002649784088135, -1.1340444087982178, -0.36782383918762207, 0.39839649200439453, 1.1646170616149902, 1.930837631225586, 2.6970582008361816, 3.4632787704467773, 4.229498863220215, 4.995719909667969, 5.761940002441406, 6.528160572052002, 7.294381141662598, 8.060602188110352, 8.826822280883789, 9.593043327331543, 10.35926342010498, 11.125484466552734, 11.891704559326172, 12.65792465209961, 13.424145698547363, 14.1903657913208, 14.956585884094238, 15.722806930541992, 16.48902702331543, 17.255247116088867, 18.021469116210938, 18.787689208984375, 19.553909301757812, 20.32012939453125, 21.086349487304688, 21.852569580078125, 22.618791580200195, 23.385011672973633, 24.15123176574707, 24.917451858520508, 25.683673858642578, 26.449893951416016]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 3.0, 4.0, 21.0, 16.0, 12.0, 17.0, 26.0, 17.0, 19.0, 31.0, 25.0, 29.0, 40.0, 34.0, 41.0, 41.0, 51.0, 55.0, 26.0, 53.0, 53.0, 33.0, 41.0, 41.0, 32.0, 27.0, 29.0, 31.0, 17.0, 20.0, 19.0, 19.0, 7.0, 15.0, 11.0, 10.0, 9.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.4912109375, -2.400390625, -2.3095703125, -2.21875, -2.1279296875, -2.037109375, -1.9462890625, -1.85546875, -1.7646484375, -1.673828125, -1.5830078125, -1.4921875, -1.4013671875, -1.310546875, -1.2197265625, -1.12890625, -1.0380859375, -0.947265625, -0.8564453125, -0.765625, -0.6748046875, -0.583984375, -0.4931640625, -0.40234375, -0.3115234375, -0.220703125, -0.1298828125, -0.0390625, 0.0517578125, 0.142578125, 0.2333984375, 0.32421875, 0.4150390625, 0.505859375, 0.5966796875, 0.6875, 0.7783203125, 0.869140625, 0.9599609375, 1.05078125, 1.1416015625, 1.232421875, 1.3232421875, 1.4140625, 1.5048828125, 1.595703125, 1.6865234375, 1.77734375, 1.8681640625, 1.958984375, 2.0498046875, 2.140625, 2.2314453125, 2.322265625, 2.4130859375, 2.50390625, 2.5947265625, 2.685546875, 2.7763671875, 2.8671875, 2.9580078125, 3.048828125, 3.1396484375, 3.23046875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 3.0, 10.0, 9.0, 17.0, 26.0, 23.0, 39.0, 45.0, 79.0, 93.0, 128.0, 225.0, 365.0, 749.0, 1821.0, 4851.0, 15661.0, 60400.0, 315908.0, 1685059.0, 1706224.0, 317064.0, 60947.0, 15781.0, 5065.0, 1802.0, 808.0, 361.0, 221.0, 121.0, 92.0, 70.0, 48.0, 45.0, 30.0, 21.0, 20.0, 11.0, 8.0, 8.0, 4.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.275146484375, -5.09326171875, -4.911376953125, -4.7294921875, -4.547607421875, -4.36572265625, -4.183837890625, -4.001953125, -3.820068359375, -3.63818359375, -3.456298828125, -3.2744140625, -3.092529296875, -2.91064453125, -2.728759765625, -2.546875, -2.364990234375, -2.18310546875, -2.001220703125, -1.8193359375, -1.637451171875, -1.45556640625, -1.273681640625, -1.091796875, -0.909912109375, -0.72802734375, -0.546142578125, -0.3642578125, -0.182373046875, -0.00048828125, 0.181396484375, 0.36328125, 0.545166015625, 0.72705078125, 0.908935546875, 1.0908203125, 1.272705078125, 1.45458984375, 1.636474609375, 1.818359375, 2.000244140625, 2.18212890625, 2.364013671875, 2.5458984375, 2.727783203125, 2.90966796875, 3.091552734375, 3.2734375, 3.455322265625, 3.63720703125, 3.819091796875, 4.0009765625, 4.182861328125, 4.36474609375, 4.546630859375, 4.728515625, 4.910400390625, 5.09228515625, 5.274169921875, 5.4560546875, 5.637939453125, 5.81982421875, 6.001708984375, 6.18359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 6.0, 6.0, 7.0, 6.0, 10.0, 11.0, 19.0, 19.0, 25.0, 32.0, 45.0, 56.0, 80.0, 89.0, 92.0, 138.0, 151.0, 158.0, 220.0, 301.0, 311.0, 322.0, 344.0, 312.0, 209.0, 218.0, 168.0, 133.0, 122.0, 88.0, 66.0, 61.0, 45.0, 43.0, 25.0, 28.0, 20.0, 22.0, 17.0, 8.0, 11.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.820556640625, -3.69189453125, -3.563232421875, -3.4345703125, -3.305908203125, -3.17724609375, -3.048583984375, -2.919921875, -2.791259765625, -2.66259765625, -2.533935546875, -2.4052734375, -2.276611328125, -2.14794921875, -2.019287109375, -1.890625, -1.761962890625, -1.63330078125, -1.504638671875, -1.3759765625, -1.247314453125, -1.11865234375, -0.989990234375, -0.861328125, -0.732666015625, -0.60400390625, -0.475341796875, -0.3466796875, -0.218017578125, -0.08935546875, 0.039306640625, 0.16796875, 0.296630859375, 0.42529296875, 0.553955078125, 0.6826171875, 0.811279296875, 0.93994140625, 1.068603515625, 1.197265625, 1.325927734375, 1.45458984375, 1.583251953125, 1.7119140625, 1.840576171875, 1.96923828125, 2.097900390625, 2.2265625, 2.355224609375, 2.48388671875, 2.612548828125, 2.7412109375, 2.869873046875, 2.99853515625, 3.127197265625, 3.255859375, 3.384521484375, 3.51318359375, 3.641845703125, 3.7705078125, 3.899169921875, 4.02783203125, 4.156494140625, 4.28515625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 2.0, 5.0, 8.0, 13.0, 12.0, 18.0, 15.0, 22.0, 32.0, 29.0, 57.0, 61.0, 81.0, 85.0, 137.0, 162.0, 221.0, 261.0, 459.0, 1990.0, 45640.0, 2631462.0, 1484296.0, 26174.0, 1508.0, 371.0, 245.0, 183.0, 160.0, 122.0, 112.0, 101.0, 47.0, 39.0, 34.0, 23.0, 26.0, 10.0, 12.0, 6.0, 11.0, 10.0, 3.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-20.671875, -20.0625, -19.453125, -18.84375, -18.234375, -17.625, -17.015625, -16.40625, -15.796875, -15.1875, -14.578125, -13.96875, -13.359375, -12.75, -12.140625, -11.53125, -10.921875, -10.3125, -9.703125, -9.09375, -8.484375, -7.875, -7.265625, -6.65625, -6.046875, -5.4375, -4.828125, -4.21875, -3.609375, -3.0, -2.390625, -1.78125, -1.171875, -0.5625, 0.046875, 0.65625, 1.265625, 1.875, 2.484375, 3.09375, 3.703125, 4.3125, 4.921875, 5.53125, 6.140625, 6.75, 7.359375, 7.96875, 8.578125, 9.1875, 9.796875, 10.40625, 11.015625, 11.625, 12.234375, 12.84375, 13.453125, 14.0625, 14.671875, 15.28125, 15.890625, 16.5, 17.109375, 17.71875, 18.328125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 11.0, 22.0, 56.0, 118.0, 188.0, 249.0, 182.0, 105.0, 55.0, 21.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.02879333496094, -81.19861602783203, -79.36843872070312, -77.53826141357422, -75.70808410644531, -73.8779067993164, -72.0477294921875, -70.21754455566406, -68.38737487792969, -66.55719757080078, -64.72702026367188, -62.89684295654297, -61.06666564941406, -59.236488342285156, -57.406307220458984, -55.57612991333008, -53.745948791503906, -51.915771484375, -50.085594177246094, -48.25541687011719, -46.42523956298828, -44.595062255859375, -42.7648811340332, -40.9347038269043, -39.10452651977539, -37.274349212646484, -35.44417190551758, -33.61399459838867, -31.783815383911133, -29.953638076782227, -28.123458862304688, -26.29328155517578, -24.46310043334961, -22.632923126220703, -20.802745819091797, -18.972566604614258, -17.14238929748535, -15.312211990356445, -13.482033729553223, -11.65185546875, -9.821678161621094, -7.991500377655029, -6.161322593688965, -4.3311448097229, -2.500967025756836, -0.6707897186279297, 1.159388542175293, 2.9895668029785156, 4.819744110107422, 6.649921894073486, 8.48009967803955, 10.310277938842773, 12.14045524597168, 13.970632553100586, 15.800810813903809, 17.63098907470703, 19.461166381835938, 21.291343688964844, 23.12152099609375, 24.95170021057129, 26.781877517700195, 28.6120548248291, 30.44223403930664, 32.27241134643555, 34.10258865356445]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 9.0, 7.0, 8.0, 7.0, 10.0, 10.0, 10.0, 11.0, 22.0, 33.0, 27.0, 26.0, 27.0, 22.0, 26.0, 33.0, 48.0, 40.0, 34.0, 42.0, 34.0, 39.0, 34.0, 43.0, 37.0, 29.0, 42.0, 34.0, 22.0, 32.0, 27.0, 23.0, 28.0, 13.0, 17.0, 15.0, 10.0, 13.0, 7.0, 8.0, 9.0, 5.0, 4.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.77703857421875, -16.23661994934082, -15.69620132446289, -15.155782699584961, -14.615364074707031, -14.074945449829102, -13.534526824951172, -12.994108200073242, -12.453689575195312, -11.913270950317383, -11.372852325439453, -10.832433700561523, -10.292015075683594, -9.751596450805664, -9.211177825927734, -8.670759201049805, -8.130340576171875, -7.589921951293945, -7.049503326416016, -6.509084701538086, -5.968666076660156, -5.428247451782227, -4.887828826904297, -4.347410202026367, -3.8069915771484375, -3.266572952270508, -2.726154327392578, -2.1857357025146484, -1.6453170776367188, -1.104898452758789, -0.5644798278808594, -0.024061203002929688, 0.516357421875, 1.0567760467529297, 1.5971946716308594, 2.137613296508789, 2.6780319213867188, 3.2184505462646484, 3.758869171142578, 4.299287796020508, 4.8397064208984375, 5.380125045776367, 5.920543670654297, 6.460962295532227, 7.001380920410156, 7.541799545288086, 8.082218170166016, 8.622636795043945, 9.163055419921875, 9.703474044799805, 10.243892669677734, 10.784311294555664, 11.324729919433594, 11.865148544311523, 12.405567169189453, 12.945985794067383, 13.486404418945312, 14.026823043823242, 14.567241668701172, 15.107660293579102, 15.648078918457031, 16.18849754333496, 16.72891616821289, 17.26933479309082, 17.80975341796875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 7.0, 5.0, 14.0, 18.0, 11.0, 14.0, 30.0, 40.0, 26.0, 36.0, 30.0, 35.0, 34.0, 32.0, 38.0, 52.0, 44.0, 56.0, 44.0, 39.0, 46.0, 34.0, 33.0, 34.0, 25.0, 20.0, 27.0, 26.0, 17.0, 16.0, 20.0, 8.0, 11.0, 12.0, 13.0, 4.0, 6.0, 8.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.75390625, -2.66571044921875, -2.5775146484375, -2.48931884765625, -2.401123046875, -2.31292724609375, -2.2247314453125, -2.13653564453125, -2.04833984375, -1.96014404296875, -1.8719482421875, -1.78375244140625, -1.695556640625, -1.60736083984375, -1.5191650390625, -1.43096923828125, -1.3427734375, -1.25457763671875, -1.1663818359375, -1.07818603515625, -0.989990234375, -0.90179443359375, -0.8135986328125, -0.72540283203125, -0.63720703125, -0.54901123046875, -0.4608154296875, -0.37261962890625, -0.284423828125, -0.19622802734375, -0.1080322265625, -0.01983642578125, 0.068359375, 0.15655517578125, 0.2447509765625, 0.33294677734375, 0.421142578125, 0.50933837890625, 0.5975341796875, 0.68572998046875, 0.77392578125, 0.86212158203125, 0.9503173828125, 1.03851318359375, 1.126708984375, 1.21490478515625, 1.3031005859375, 1.39129638671875, 1.4794921875, 1.56768798828125, 1.6558837890625, 1.74407958984375, 1.832275390625, 1.92047119140625, 2.0086669921875, 2.09686279296875, 2.18505859375, 2.27325439453125, 2.3614501953125, 2.44964599609375, 2.537841796875, 2.62603759765625, 2.7142333984375, 2.80242919921875, 2.890625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 12.0, 12.0, 18.0, 42.0, 56.0, 79.0, 122.0, 176.0, 282.0, 431.0, 581.0, 876.0, 1344.0, 2039.0, 2975.0, 4507.0, 6917.0, 10704.0, 16764.0, 26411.0, 42110.0, 70216.0, 135766.0, 322124.0, 184042.0, 84473.0, 49321.0, 30772.0, 19492.0, 12337.0, 7922.0, 5230.0, 3476.0, 2248.0, 1548.0, 1058.0, 680.0, 459.0, 338.0, 192.0, 139.0, 89.0, 62.0, 31.0, 29.0, 22.0, 13.0, 7.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01522064208984375, -0.014754652976989746, -0.014288663864135742, -0.013822674751281738, -0.013356685638427734, -0.01289069652557373, -0.012424707412719727, -0.011958718299865723, -0.011492729187011719, -0.011026740074157715, -0.010560750961303711, -0.010094761848449707, -0.009628772735595703, -0.0091627836227417, -0.008696794509887695, -0.008230805397033691, -0.0077648162841796875, -0.007298827171325684, -0.00683283805847168, -0.006366848945617676, -0.005900859832763672, -0.005434870719909668, -0.004968881607055664, -0.00450289249420166, -0.004036903381347656, -0.0035709142684936523, -0.0031049251556396484, -0.0026389360427856445, -0.0021729469299316406, -0.0017069578170776367, -0.0012409687042236328, -0.0007749795913696289, -0.000308990478515625, 0.0001569986343383789, 0.0006229877471923828, 0.0010889768600463867, 0.0015549659729003906, 0.0020209550857543945, 0.0024869441986083984, 0.0029529333114624023, 0.0034189224243164062, 0.00388491153717041, 0.004350900650024414, 0.004816889762878418, 0.005282878875732422, 0.005748867988586426, 0.00621485710144043, 0.006680846214294434, 0.0071468353271484375, 0.007612824440002441, 0.008078813552856445, 0.00854480266571045, 0.009010791778564453, 0.009476780891418457, 0.009942770004272461, 0.010408759117126465, 0.010874748229980469, 0.011340737342834473, 0.011806726455688477, 0.01227271556854248, 0.012738704681396484, 0.013204693794250488, 0.013670682907104492, 0.014136672019958496, 0.0146026611328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 9.0, 11.0, 8.0, 20.0, 11.0, 24.0, 23.0, 24.0, 37.0, 30.0, 37.0, 34.0, 34.0, 41.0, 40.0, 47.0, 45.0, 1068.0, 37.0, 46.0, 36.0, 44.0, 35.0, 28.0, 30.0, 42.0, 33.0, 23.0, 19.0, 20.0, 20.0, 14.0, 11.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.21875, -2.15606689453125, -2.0933837890625, -2.03070068359375, -1.968017578125, -1.90533447265625, -1.8426513671875, -1.77996826171875, -1.71728515625, -1.65460205078125, -1.5919189453125, -1.52923583984375, -1.466552734375, -1.40386962890625, -1.3411865234375, -1.27850341796875, -1.2158203125, -1.15313720703125, -1.0904541015625, -1.02777099609375, -0.965087890625, -0.90240478515625, -0.8397216796875, -0.77703857421875, -0.71435546875, -0.65167236328125, -0.5889892578125, -0.52630615234375, -0.463623046875, -0.40093994140625, -0.3382568359375, -0.27557373046875, -0.212890625, -0.15020751953125, -0.0875244140625, -0.02484130859375, 0.037841796875, 0.10052490234375, 0.1632080078125, 0.22589111328125, 0.28857421875, 0.35125732421875, 0.4139404296875, 0.47662353515625, 0.539306640625, 0.60198974609375, 0.6646728515625, 0.72735595703125, 0.7900390625, 0.85272216796875, 0.9154052734375, 0.97808837890625, 1.040771484375, 1.10345458984375, 1.1661376953125, 1.22882080078125, 1.29150390625, 1.35418701171875, 1.4168701171875, 1.47955322265625, 1.542236328125, 1.60491943359375, 1.6676025390625, 1.73028564453125, 1.79296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 9.0, 7.0, 6.0, 21.0, 23.0, 26.0, 49.0, 94.0, 111.0, 174.0, 243.0, 436.0, 637.0, 1105.0, 1766.0, 2642.0, 4671.0, 7694.0, 13119.0, 22561.0, 39368.0, 69282.0, 134906.0, 1366793.0, 212532.0, 94432.0, 52037.0, 29769.0, 17200.0, 10004.0, 6030.0, 3504.0, 2226.0, 1362.0, 835.0, 525.0, 324.0, 195.0, 157.0, 94.0, 66.0, 32.0, 25.0, 22.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01184844970703125, -0.01145017147064209, -0.01105189323425293, -0.01065361499786377, -0.01025533676147461, -0.00985705852508545, -0.009458780288696289, -0.009060502052307129, -0.008662223815917969, -0.008263945579528809, -0.007865667343139648, -0.007467389106750488, -0.007069110870361328, -0.006670832633972168, -0.006272554397583008, -0.005874276161193848, -0.0054759979248046875, -0.005077719688415527, -0.004679441452026367, -0.004281163215637207, -0.003882884979248047, -0.0034846067428588867, -0.0030863285064697266, -0.0026880502700805664, -0.0022897720336914062, -0.001891493797302246, -0.001493215560913086, -0.0010949373245239258, -0.0006966590881347656, -0.00029838085174560547, 9.989738464355469e-05, 0.0004981756210327148, 0.000896453857421875, 0.0012947320938110352, 0.0016930103302001953, 0.0020912885665893555, 0.0024895668029785156, 0.0028878450393676758, 0.003286123275756836, 0.003684401512145996, 0.004082679748535156, 0.004480957984924316, 0.0048792362213134766, 0.005277514457702637, 0.005675792694091797, 0.006074070930480957, 0.006472349166870117, 0.006870627403259277, 0.0072689056396484375, 0.007667183876037598, 0.008065462112426758, 0.008463740348815918, 0.008862018585205078, 0.009260296821594238, 0.009658575057983398, 0.010056853294372559, 0.010455131530761719, 0.010853409767150879, 0.011251688003540039, 0.0116499662399292, 0.01204824447631836, 0.01244652271270752, 0.01284480094909668, 0.01324307918548584, 0.013641357421875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 927.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.0], "bins": [-1.1920928955078125e-07, -1.1641532182693481e-07, -1.1362135410308838e-07, -1.1082738637924194e-07, -1.0803341865539551e-07, -1.0523945093154907e-07, -1.0244548320770264e-07, -9.96515154838562e-08, -9.685754776000977e-08, -9.406358003616333e-08, -9.12696123123169e-08, -8.847564458847046e-08, -8.568167686462402e-08, -8.288770914077759e-08, -8.009374141693115e-08, -7.729977369308472e-08, -7.450580596923828e-08, -7.171183824539185e-08, -6.891787052154541e-08, -6.612390279769897e-08, -6.332993507385254e-08, -6.05359673500061e-08, -5.774199962615967e-08, -5.494803190231323e-08, -5.21540641784668e-08, -4.936009645462036e-08, -4.6566128730773926e-08, -4.377216100692749e-08, -4.0978193283081055e-08, -3.818422555923462e-08, -3.5390257835388184e-08, -3.259629011154175e-08, -2.9802322387695312e-08, -2.7008354663848877e-08, -2.421438694000244e-08, -2.1420419216156006e-08, -1.862645149230957e-08, -1.5832483768463135e-08, -1.30385160446167e-08, -1.0244548320770264e-08, -7.450580596923828e-09, -4.6566128730773926e-09, -1.862645149230957e-09, 9.313225746154785e-10, 3.725290298461914e-09, 6.51925802230835e-09, 9.313225746154785e-09, 1.210719347000122e-08, 1.4901161193847656e-08, 1.7695128917694092e-08, 2.0489096641540527e-08, 2.3283064365386963e-08, 2.60770320892334e-08, 2.8870999813079834e-08, 3.166496753692627e-08, 3.4458935260772705e-08, 3.725290298461914e-08, 4.0046870708465576e-08, 4.284083843231201e-08, 4.563480615615845e-08, 4.842877388000488e-08, 5.122274160385132e-08, 5.4016709327697754e-08, 5.681067705154419e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [11.0, 0.0, 0.0, 0.0, 1.0, 0.0, 22.0, 0.0, 13.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 22.0, 26.0, 23.0, 23.0, 89.0, 212.0, 2942.0, 0.0, 23400.0, 994937.0, 23486.0, 2909.0, 224.0, 97.0, 13.0, 0.0, 24.0, 24.0, 22.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 21.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3113021850585938e-06, -1.259148120880127e-06, -1.2069940567016602e-06, -1.1548399925231934e-06, -1.1026859283447266e-06, -1.0505318641662598e-06, -9.98377799987793e-07, -9.462237358093262e-07, -8.940696716308594e-07, -8.419156074523926e-07, -7.897615432739258e-07, -7.37607479095459e-07, -6.854534149169922e-07, -6.332993507385254e-07, -5.811452865600586e-07, -5.289912223815918e-07, -4.76837158203125e-07, -4.246830940246582e-07, -3.725290298461914e-07, -3.203749656677246e-07, -2.682209014892578e-07, -2.1606683731079102e-07, -1.6391277313232422e-07, -1.1175870895385742e-07, -5.960464477539063e-08, -7.450580596923828e-09, 4.470348358154297e-08, 9.685754776000977e-08, 1.4901161193847656e-07, 2.0116567611694336e-07, 2.5331974029541016e-07, 3.0547380447387695e-07, 3.5762786865234375e-07, 4.0978193283081055e-07, 4.6193599700927734e-07, 5.140900611877441e-07, 5.662441253662109e-07, 6.183981895446777e-07, 6.705522537231445e-07, 7.227063179016113e-07, 7.748603820800781e-07, 8.270144462585449e-07, 8.791685104370117e-07, 9.313225746154785e-07, 9.834766387939453e-07, 1.0356307029724121e-06, 1.087784767150879e-06, 1.1399388313293457e-06, 1.1920928955078125e-06, 1.2442469596862793e-06, 1.296401023864746e-06, 1.3485550880432129e-06, 1.4007091522216797e-06, 1.4528632164001465e-06, 1.5050172805786133e-06, 1.55717134475708e-06, 1.6093254089355469e-06, 1.6614794731140137e-06, 1.7136335372924805e-06, 1.7657876014709473e-06, 1.817941665649414e-06, 1.8700957298278809e-06, 1.9222497940063477e-06, 1.9744038581848145e-06, 2.0265579223632812e-06]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 7.0, 5.0, 14.0, 18.0, 11.0, 14.0, 30.0, 40.0, 26.0, 36.0, 30.0, 35.0, 34.0, 32.0, 38.0, 52.0, 44.0, 56.0, 44.0, 39.0, 46.0, 34.0, 33.0, 34.0, 25.0, 20.0, 27.0, 26.0, 17.0, 16.0, 20.0, 8.0, 11.0, 12.0, 13.0, 4.0, 6.0, 8.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.75390625, -2.66571044921875, -2.5775146484375, -2.48931884765625, -2.401123046875, -2.31292724609375, -2.2247314453125, -2.13653564453125, -2.04833984375, -1.96014404296875, -1.8719482421875, -1.78375244140625, -1.695556640625, -1.60736083984375, -1.5191650390625, -1.43096923828125, -1.3427734375, -1.25457763671875, -1.1663818359375, -1.07818603515625, -0.989990234375, -0.90179443359375, -0.8135986328125, -0.72540283203125, -0.63720703125, -0.54901123046875, -0.4608154296875, -0.37261962890625, -0.284423828125, -0.19622802734375, -0.1080322265625, -0.01983642578125, 0.068359375, 0.15655517578125, 0.2447509765625, 0.33294677734375, 0.421142578125, 0.50933837890625, 0.5975341796875, 0.68572998046875, 0.77392578125, 0.86212158203125, 0.9503173828125, 1.03851318359375, 1.126708984375, 1.21490478515625, 1.3031005859375, 1.39129638671875, 1.4794921875, 1.56768798828125, 1.6558837890625, 1.74407958984375, 1.832275390625, 1.92047119140625, 2.0086669921875, 2.09686279296875, 2.18505859375, 2.27325439453125, 2.3614501953125, 2.44964599609375, 2.537841796875, 2.62603759765625, 2.7142333984375, 2.80242919921875, 2.890625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 7.0, 7.0, 12.0, 24.0, 23.0, 58.0, 74.0, 115.0, 219.0, 307.0, 553.0, 942.0, 1611.0, 2909.0, 4965.0, 8927.0, 17020.0, 34403.0, 83773.0, 320838.0, 396891.0, 96053.0, 37849.0, 18234.0, 9954.0, 5441.0, 3086.0, 1755.0, 938.0, 575.0, 365.0, 217.0, 147.0, 75.0, 57.0, 46.0, 33.0, 19.0, 15.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.90625, -2.81561279296875, -2.7249755859375, -2.63433837890625, -2.543701171875, -2.45306396484375, -2.3624267578125, -2.27178955078125, -2.18115234375, -2.09051513671875, -1.9998779296875, -1.90924072265625, -1.818603515625, -1.72796630859375, -1.6373291015625, -1.54669189453125, -1.4560546875, -1.36541748046875, -1.2747802734375, -1.18414306640625, -1.093505859375, -1.00286865234375, -0.9122314453125, -0.82159423828125, -0.73095703125, -0.64031982421875, -0.5496826171875, -0.45904541015625, -0.368408203125, -0.27777099609375, -0.1871337890625, -0.09649658203125, -0.005859375, 0.08477783203125, 0.1754150390625, 0.26605224609375, 0.356689453125, 0.44732666015625, 0.5379638671875, 0.62860107421875, 0.71923828125, 0.80987548828125, 0.9005126953125, 0.99114990234375, 1.081787109375, 1.17242431640625, 1.2630615234375, 1.35369873046875, 1.4443359375, 1.53497314453125, 1.6256103515625, 1.71624755859375, 1.806884765625, 1.89752197265625, 1.9881591796875, 2.07879638671875, 2.16943359375, 2.26007080078125, 2.3507080078125, 2.44134521484375, 2.531982421875, 2.62261962890625, 2.7132568359375, 2.80389404296875, 2.89453125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 6.0, 4.0, 11.0, 10.0, 12.0, 19.0, 16.0, 20.0, 21.0, 24.0, 37.0, 41.0, 42.0, 44.0, 55.0, 46.0, 77.0, 171.0, 1653.0, 215.0, 100.0, 58.0, 48.0, 42.0, 40.0, 31.0, 34.0, 20.0, 29.0, 28.0, 9.0, 13.0, 17.0, 10.0, 10.0, 10.0, 11.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.6171875, -10.3006591796875, -9.984130859375, -9.6676025390625, -9.35107421875, -9.0345458984375, -8.718017578125, -8.4014892578125, -8.0849609375, -7.7684326171875, -7.451904296875, -7.1353759765625, -6.81884765625, -6.5023193359375, -6.185791015625, -5.8692626953125, -5.552734375, -5.2362060546875, -4.919677734375, -4.6031494140625, -4.28662109375, -3.9700927734375, -3.653564453125, -3.3370361328125, -3.0205078125, -2.7039794921875, -2.387451171875, -2.0709228515625, -1.75439453125, -1.4378662109375, -1.121337890625, -0.8048095703125, -0.48828125, -0.1717529296875, 0.144775390625, 0.4613037109375, 0.77783203125, 1.0943603515625, 1.410888671875, 1.7274169921875, 2.0439453125, 2.3604736328125, 2.677001953125, 2.9935302734375, 3.31005859375, 3.6265869140625, 3.943115234375, 4.2596435546875, 4.576171875, 4.8927001953125, 5.209228515625, 5.5257568359375, 5.84228515625, 6.1588134765625, 6.475341796875, 6.7918701171875, 7.1083984375, 7.4249267578125, 7.741455078125, 8.0579833984375, 8.37451171875, 8.6910400390625, 9.007568359375, 9.3240966796875, 9.640625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 11.0, 12.0, 14.0, 11.0, 19.0, 16.0, 18.0, 35.0, 43.0, 53.0, 79.0, 86.0, 119.0, 148.0, 233.0, 455.0, 1725.0, 39345.0, 3068999.0, 31416.0, 1505.0, 435.0, 254.0, 146.0, 122.0, 100.0, 84.0, 55.0, 26.0, 35.0, 16.0, 29.0, 13.0, 15.0, 7.0, 5.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.14208984375, -20.4248046875, -19.70751953125, -18.990234375, -18.27294921875, -17.5556640625, -16.83837890625, -16.12109375, -15.40380859375, -14.6865234375, -13.96923828125, -13.251953125, -12.53466796875, -11.8173828125, -11.10009765625, -10.3828125, -9.66552734375, -8.9482421875, -8.23095703125, -7.513671875, -6.79638671875, -6.0791015625, -5.36181640625, -4.64453125, -3.92724609375, -3.2099609375, -2.49267578125, -1.775390625, -1.05810546875, -0.3408203125, 0.37646484375, 1.09375, 1.81103515625, 2.5283203125, 3.24560546875, 3.962890625, 4.68017578125, 5.3974609375, 6.11474609375, 6.83203125, 7.54931640625, 8.2666015625, 8.98388671875, 9.701171875, 10.41845703125, 11.1357421875, 11.85302734375, 12.5703125, 13.28759765625, 14.0048828125, 14.72216796875, 15.439453125, 16.15673828125, 16.8740234375, 17.59130859375, 18.30859375, 19.02587890625, 19.7431640625, 20.46044921875, 21.177734375, 21.89501953125, 22.6123046875, 23.32958984375, 24.046875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [195.0, 808.0, 15.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.190304756164551, -1.1983695030212402, 2.7935657501220703, 6.785500526428223, 10.777436256408691, 14.76937198638916, 18.761306762695312, 22.75324249267578, 26.74517822265625, 30.73711395263672, 34.72904968261719, 38.720985412597656, 42.712921142578125, 46.704856872558594, 50.6967887878418, 54.688724517822266, 58.680660247802734, 62.6725959777832, 66.6645278930664, 70.65646362304688, 74.64839935302734, 78.64033508300781, 82.63227081298828, 86.62420654296875, 90.61614227294922, 94.60807800292969, 98.60001373291016, 102.59194946289062, 106.5838851928711, 110.57582092285156, 114.5677490234375, 118.5596923828125, 122.55162048339844, 126.5435562133789, 130.53549194335938, 134.5274200439453, 138.5193634033203, 142.51129150390625, 146.50323486328125, 150.4951629638672, 154.4871063232422, 158.47903442382812, 162.47097778320312, 166.46290588378906, 170.45484924316406, 174.44677734375, 178.438720703125, 182.43064880371094, 186.42257690429688, 190.4145050048828, 194.4064483642578, 198.39837646484375, 202.39031982421875, 206.3822479248047, 210.3741912841797, 214.36611938476562, 218.35806274414062, 222.34999084472656, 226.34193420410156, 230.3338623046875, 234.3258056640625, 238.31773376464844, 242.30967712402344, 246.30160522460938, 250.29354858398438]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 5.0, 3.0, 8.0, 7.0, 12.0, 15.0, 12.0, 17.0, 13.0, 22.0, 32.0, 23.0, 25.0, 31.0, 34.0, 46.0, 30.0, 36.0, 32.0, 33.0, 51.0, 37.0, 52.0, 33.0, 31.0, 31.0, 30.0, 36.0, 28.0, 27.0, 26.0, 22.0, 24.0, 17.0, 14.0, 16.0, 13.0, 16.0, 6.0, 4.0, 17.0, 7.0, 3.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-24.78132438659668, -24.04560089111328, -23.309879302978516, -22.574155807495117, -21.83843231201172, -21.10270881652832, -20.366985321044922, -19.631263732910156, -18.895540237426758, -18.15981674194336, -17.424095153808594, -16.688371658325195, -15.952648162841797, -15.216924667358398, -14.481202125549316, -13.745479583740234, -13.009756088256836, -12.274032592773438, -11.538310050964355, -10.802587509155273, -10.066864013671875, -9.331140518188477, -8.595417976379395, -7.859694957733154, -7.123971939086914, -6.388248920440674, -5.652525901794434, -4.916802883148193, -4.181079864501953, -3.445356845855713, -2.7096338272094727, -1.9739108085632324, -1.2381877899169922, -0.502464771270752, 0.23325824737548828, 0.9689812660217285, 1.7047042846679688, 2.440427303314209, 3.176150321960449, 3.9118733406066895, 4.64759635925293, 5.38331937789917, 6.11904239654541, 6.85476541519165, 7.590488433837891, 8.326211929321289, 9.061934471130371, 9.797657012939453, 10.533380508422852, 11.26910400390625, 12.004826545715332, 12.740549087524414, 13.476272583007812, 14.211996078491211, 14.947718620300293, 15.683441162109375, 16.419164657592773, 17.154888153076172, 17.890609741210938, 18.626333236694336, 19.362056732177734, 20.097780227661133, 20.83350372314453, 21.569225311279297, 22.304948806762695]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 3.0, 10.0, 10.0, 10.0, 16.0, 17.0, 22.0, 25.0, 24.0, 39.0, 36.0, 20.0, 40.0, 37.0, 48.0, 46.0, 47.0, 40.0, 44.0, 49.0, 50.0, 42.0, 29.0, 32.0, 30.0, 31.0, 25.0, 21.0, 24.0, 19.0, 15.0, 11.0, 11.0, 18.0, 13.0, 7.0, 4.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.892578125, -2.79925537109375, -2.7059326171875, -2.61260986328125, -2.519287109375, -2.42596435546875, -2.3326416015625, -2.23931884765625, -2.14599609375, -2.05267333984375, -1.9593505859375, -1.86602783203125, -1.772705078125, -1.67938232421875, -1.5860595703125, -1.49273681640625, -1.3994140625, -1.30609130859375, -1.2127685546875, -1.11944580078125, -1.026123046875, -0.93280029296875, -0.8394775390625, -0.74615478515625, -0.65283203125, -0.55950927734375, -0.4661865234375, -0.37286376953125, -0.279541015625, -0.18621826171875, -0.0928955078125, 0.00042724609375, 0.09375, 0.18707275390625, 0.2803955078125, 0.37371826171875, 0.467041015625, 0.56036376953125, 0.6536865234375, 0.74700927734375, 0.84033203125, 0.93365478515625, 1.0269775390625, 1.12030029296875, 1.213623046875, 1.30694580078125, 1.4002685546875, 1.49359130859375, 1.5869140625, 1.68023681640625, 1.7735595703125, 1.86688232421875, 1.960205078125, 2.05352783203125, 2.1468505859375, 2.24017333984375, 2.33349609375, 2.42681884765625, 2.5201416015625, 2.61346435546875, 2.706787109375, 2.80010986328125, 2.8934326171875, 2.98675537109375, 3.080078125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 1.0, 8.0, 10.0, 16.0, 18.0, 21.0, 28.0, 35.0, 59.0, 78.0, 121.0, 299.0, 704.0, 1765.0, 5808.0, 24413.0, 139936.0, 1240918.0, 2380134.0, 336585.0, 48048.0, 10392.0, 2907.0, 1006.0, 428.0, 186.0, 100.0, 66.0, 43.0, 31.0, 13.0, 17.0, 17.0, 10.0, 11.0, 6.0, 8.0, 5.0, 2.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.015625, -6.78338623046875, -6.5511474609375, -6.31890869140625, -6.086669921875, -5.85443115234375, -5.6221923828125, -5.38995361328125, -5.15771484375, -4.92547607421875, -4.6932373046875, -4.46099853515625, -4.228759765625, -3.99652099609375, -3.7642822265625, -3.53204345703125, -3.2998046875, -3.06756591796875, -2.8353271484375, -2.60308837890625, -2.370849609375, -2.13861083984375, -1.9063720703125, -1.67413330078125, -1.44189453125, -1.20965576171875, -0.9774169921875, -0.74517822265625, -0.512939453125, -0.28070068359375, -0.0484619140625, 0.18377685546875, 0.416015625, 0.64825439453125, 0.8804931640625, 1.11273193359375, 1.344970703125, 1.57720947265625, 1.8094482421875, 2.04168701171875, 2.27392578125, 2.50616455078125, 2.7384033203125, 2.97064208984375, 3.202880859375, 3.43511962890625, 3.6673583984375, 3.89959716796875, 4.1318359375, 4.36407470703125, 4.5963134765625, 4.82855224609375, 5.060791015625, 5.29302978515625, 5.5252685546875, 5.75750732421875, 5.98974609375, 6.22198486328125, 6.4542236328125, 6.68646240234375, 6.918701171875, 7.15093994140625, 7.3831787109375, 7.61541748046875, 7.84765625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 2.0, 9.0, 8.0, 14.0, 18.0, 25.0, 37.0, 36.0, 67.0, 86.0, 106.0, 150.0, 158.0, 254.0, 380.0, 396.0, 488.0, 440.0, 340.0, 238.0, 207.0, 171.0, 118.0, 90.0, 65.0, 45.0, 36.0, 36.0, 16.0, 11.0, 7.0, 2.0, 6.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.36737060546875, -5.1917724609375, -5.01617431640625, -4.840576171875, -4.66497802734375, -4.4893798828125, -4.31378173828125, -4.13818359375, -3.96258544921875, -3.7869873046875, -3.61138916015625, -3.435791015625, -3.26019287109375, -3.0845947265625, -2.90899658203125, -2.7333984375, -2.55780029296875, -2.3822021484375, -2.20660400390625, -2.031005859375, -1.85540771484375, -1.6798095703125, -1.50421142578125, -1.32861328125, -1.15301513671875, -0.9774169921875, -0.80181884765625, -0.626220703125, -0.45062255859375, -0.2750244140625, -0.09942626953125, 0.076171875, 0.25177001953125, 0.4273681640625, 0.60296630859375, 0.778564453125, 0.95416259765625, 1.1297607421875, 1.30535888671875, 1.48095703125, 1.65655517578125, 1.8321533203125, 2.00775146484375, 2.183349609375, 2.35894775390625, 2.5345458984375, 2.71014404296875, 2.8857421875, 3.06134033203125, 3.2369384765625, 3.41253662109375, 3.588134765625, 3.76373291015625, 3.9393310546875, 4.11492919921875, 4.29052734375, 4.46612548828125, 4.6417236328125, 4.81732177734375, 4.992919921875, 5.16851806640625, 5.3441162109375, 5.51971435546875, 5.6953125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 10.0, 16.0, 9.0, 25.0, 33.0, 28.0, 75.0, 87.0, 122.0, 166.0, 249.0, 309.0, 482.0, 2192.0, 109337.0, 3897362.0, 179165.0, 2906.0, 565.0, 300.0, 248.0, 154.0, 122.0, 90.0, 55.0, 41.0, 32.0, 29.0, 21.0, 11.0, 10.0, 6.0, 5.0, 4.0, 8.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.640625, -23.859619140625, -23.07861328125, -22.297607421875, -21.5166015625, -20.735595703125, -19.95458984375, -19.173583984375, -18.392578125, -17.611572265625, -16.83056640625, -16.049560546875, -15.2685546875, -14.487548828125, -13.70654296875, -12.925537109375, -12.14453125, -11.363525390625, -10.58251953125, -9.801513671875, -9.0205078125, -8.239501953125, -7.45849609375, -6.677490234375, -5.896484375, -5.115478515625, -4.33447265625, -3.553466796875, -2.7724609375, -1.991455078125, -1.21044921875, -0.429443359375, 0.3515625, 1.132568359375, 1.91357421875, 2.694580078125, 3.4755859375, 4.256591796875, 5.03759765625, 5.818603515625, 6.599609375, 7.380615234375, 8.16162109375, 8.942626953125, 9.7236328125, 10.504638671875, 11.28564453125, 12.066650390625, 12.84765625, 13.628662109375, 14.40966796875, 15.190673828125, 15.9716796875, 16.752685546875, 17.53369140625, 18.314697265625, 19.095703125, 19.876708984375, 20.65771484375, 21.438720703125, 22.2197265625, 23.000732421875, 23.78173828125, 24.562744140625, 25.34375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 9.0, 18.0, 49.0, 60.0, 113.0, 172.0, 179.0, 142.0, 109.0, 86.0, 43.0, 17.0, 10.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.216331481933594, -14.920907020568848, -13.625482559204102, -12.330058097839355, -11.03463363647461, -9.739209175109863, -8.443784713745117, -7.148360252380371, -5.852935791015625, -4.557511329650879, -3.262086868286133, -1.9666624069213867, -0.6712379455566406, 0.6241865158081055, 1.9196109771728516, 3.2150354385375977, 4.510459899902344, 5.80588436126709, 7.101308822631836, 8.396733283996582, 9.692157745361328, 10.987582206726074, 12.28300666809082, 13.578431129455566, 14.873855590820312, 16.169281005859375, 17.464704513549805, 18.760128021240234, 20.055553436279297, 21.35097885131836, 22.64640235900879, 23.94182586669922, 25.23725128173828, 26.532676696777344, 27.828100204467773, 29.123523712158203, 30.418949127197266, 31.714374542236328, 33.009796142578125, 34.30522155761719, 35.60064697265625, 36.89607238769531, 38.191497802734375, 39.48691940307617, 40.782344818115234, 42.0777702331543, 43.373191833496094, 44.668617248535156, 45.96404266357422, 47.25946807861328, 48.554893493652344, 49.85031509399414, 51.1457405090332, 52.441165924072266, 53.73658752441406, 55.032012939453125, 56.32743835449219, 57.62286376953125, 58.91828918457031, 60.21371078491211, 61.50913619995117, 62.804561614990234, 64.09998321533203, 65.3954086303711, 66.69083404541016]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 9.0, 4.0, 6.0, 8.0, 7.0, 21.0, 18.0, 17.0, 30.0, 26.0, 23.0, 32.0, 37.0, 36.0, 42.0, 58.0, 47.0, 55.0, 42.0, 47.0, 46.0, 49.0, 54.0, 26.0, 32.0, 34.0, 24.0, 13.0, 32.0, 24.0, 20.0, 15.0, 12.0, 12.0, 6.0, 11.0, 7.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.41748046875, -18.791841506958008, -18.166202545166016, -17.540563583374023, -16.91492462158203, -16.289287567138672, -15.66364860534668, -15.038009643554688, -14.412370681762695, -13.786731719970703, -13.161092758178711, -12.535454750061035, -11.909815788269043, -11.28417682647705, -10.658538818359375, -10.032899856567383, -9.40726089477539, -8.781621932983398, -8.155982971191406, -7.5303449630737305, -6.904706001281738, -6.279067039489746, -5.653428554534912, -5.027790069580078, -4.402151107788086, -3.776512384414673, -3.1508736610412598, -2.5252349376678467, -1.8995962142944336, -1.2739574909210205, -0.6483187675476074, -0.022680282592773438, 0.6029586791992188, 1.2285974025726318, 1.854236125946045, 2.479874849319458, 3.105513572692871, 3.731152296066284, 4.356791019439697, 4.982429504394531, 5.608068466186523, 6.233707427978516, 6.85934591293335, 7.484984397888184, 8.110623359680176, 8.736262321472168, 9.361900329589844, 9.987539291381836, 10.613178253173828, 11.23881721496582, 11.864456176757812, 12.490094184875488, 13.11573314666748, 13.741372108459473, 14.367010116577148, 14.99264907836914, 15.618288040161133, 16.243927001953125, 16.869565963745117, 17.49520492553711, 18.12084197998047, 18.74648094177246, 19.372119903564453, 19.997758865356445, 20.623397827148438]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 11.0, 11.0, 18.0, 20.0, 12.0, 25.0, 25.0, 33.0, 17.0, 22.0, 27.0, 34.0, 37.0, 44.0, 38.0, 55.0, 47.0, 44.0, 33.0, 37.0, 43.0, 32.0, 45.0, 32.0, 31.0, 25.0, 19.0, 23.0, 28.0, 20.0, 19.0, 11.0, 10.0, 9.0, 9.0, 11.0, 7.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.955078125, -2.86663818359375, -2.7781982421875, -2.68975830078125, -2.601318359375, -2.51287841796875, -2.4244384765625, -2.33599853515625, -2.24755859375, -2.15911865234375, -2.0706787109375, -1.98223876953125, -1.893798828125, -1.80535888671875, -1.7169189453125, -1.62847900390625, -1.5400390625, -1.45159912109375, -1.3631591796875, -1.27471923828125, -1.186279296875, -1.09783935546875, -1.0093994140625, -0.92095947265625, -0.83251953125, -0.74407958984375, -0.6556396484375, -0.56719970703125, -0.478759765625, -0.39031982421875, -0.3018798828125, -0.21343994140625, -0.125, -0.03656005859375, 0.0518798828125, 0.14031982421875, 0.228759765625, 0.31719970703125, 0.4056396484375, 0.49407958984375, 0.58251953125, 0.67095947265625, 0.7593994140625, 0.84783935546875, 0.936279296875, 1.02471923828125, 1.1131591796875, 1.20159912109375, 1.2900390625, 1.37847900390625, 1.4669189453125, 1.55535888671875, 1.643798828125, 1.73223876953125, 1.8206787109375, 1.90911865234375, 1.99755859375, 2.08599853515625, 2.1744384765625, 2.26287841796875, 2.351318359375, 2.43975830078125, 2.5281982421875, 2.61663818359375, 2.705078125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 20.0, 22.0, 31.0, 46.0, 62.0, 103.0, 141.0, 194.0, 264.0, 391.0, 559.0, 723.0, 1131.0, 1519.0, 2231.0, 3094.0, 4395.0, 6449.0, 9088.0, 12969.0, 18412.0, 26455.0, 38911.0, 61798.0, 105708.0, 231272.0, 229154.0, 105630.0, 60819.0, 38741.0, 26600.0, 18530.0, 12963.0, 9026.0, 6216.0, 4353.0, 3027.0, 2180.0, 1464.0, 1118.0, 772.0, 567.0, 417.0, 280.0, 209.0, 142.0, 114.0, 78.0, 47.0, 36.0, 30.0, 15.0, 11.0, 8.0, 5.0, 2.0, 2.0], "bins": [-0.0134124755859375, -0.013005971908569336, -0.012599468231201172, -0.012192964553833008, -0.011786460876464844, -0.01137995719909668, -0.010973453521728516, -0.010566949844360352, -0.010160446166992188, -0.009753942489624023, -0.00934743881225586, -0.008940935134887695, -0.008534431457519531, -0.008127927780151367, -0.007721424102783203, -0.007314920425415039, -0.006908416748046875, -0.006501913070678711, -0.006095409393310547, -0.005688905715942383, -0.005282402038574219, -0.004875898361206055, -0.004469394683837891, -0.0040628910064697266, -0.0036563873291015625, -0.0032498836517333984, -0.0028433799743652344, -0.0024368762969970703, -0.0020303726196289062, -0.0016238689422607422, -0.0012173652648925781, -0.0008108615875244141, -0.00040435791015625, 2.1457672119140625e-06, 0.0004086494445800781, 0.0008151531219482422, 0.0012216567993164062, 0.0016281604766845703, 0.0020346641540527344, 0.0024411678314208984, 0.0028476715087890625, 0.0032541751861572266, 0.0036606788635253906, 0.004067182540893555, 0.004473686218261719, 0.004880189895629883, 0.005286693572998047, 0.005693197250366211, 0.006099700927734375, 0.006506204605102539, 0.006912708282470703, 0.007319211959838867, 0.007725715637207031, 0.008132219314575195, 0.00853872299194336, 0.008945226669311523, 0.009351730346679688, 0.009758234024047852, 0.010164737701416016, 0.01057124137878418, 0.010977745056152344, 0.011384248733520508, 0.011790752410888672, 0.012197256088256836, 0.012603759765625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 8.0, 2.0, 6.0, 13.0, 20.0, 25.0, 23.0, 20.0, 25.0, 24.0, 35.0, 38.0, 52.0, 46.0, 42.0, 54.0, 50.0, 53.0, 1066.0, 39.0, 36.0, 41.0, 42.0, 31.0, 38.0, 27.0, 23.0, 27.0, 25.0, 19.0, 20.0, 10.0, 11.0, 12.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.18359375, -2.115631103515625, -2.04766845703125, -1.979705810546875, -1.9117431640625, -1.843780517578125, -1.77581787109375, -1.707855224609375, -1.639892578125, -1.571929931640625, -1.50396728515625, -1.436004638671875, -1.3680419921875, -1.300079345703125, -1.23211669921875, -1.164154052734375, -1.09619140625, -1.028228759765625, -0.96026611328125, -0.892303466796875, -0.8243408203125, -0.756378173828125, -0.68841552734375, -0.620452880859375, -0.552490234375, -0.484527587890625, -0.41656494140625, -0.348602294921875, -0.2806396484375, -0.212677001953125, -0.14471435546875, -0.076751708984375, -0.0087890625, 0.059173583984375, 0.12713623046875, 0.195098876953125, 0.2630615234375, 0.331024169921875, 0.39898681640625, 0.466949462890625, 0.534912109375, 0.602874755859375, 0.67083740234375, 0.738800048828125, 0.8067626953125, 0.874725341796875, 0.94268798828125, 1.010650634765625, 1.07861328125, 1.146575927734375, 1.21453857421875, 1.282501220703125, 1.3504638671875, 1.418426513671875, 1.48638916015625, 1.554351806640625, 1.622314453125, 1.690277099609375, 1.75823974609375, 1.826202392578125, 1.8941650390625, 1.962127685546875, 2.03009033203125, 2.098052978515625, 2.166015625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 11.0, 13.0, 22.0, 41.0, 33.0, 70.0, 119.0, 181.0, 263.0, 407.0, 635.0, 1027.0, 1726.0, 2865.0, 4354.0, 7653.0, 12496.0, 21738.0, 37289.0, 67708.0, 134305.0, 1364971.0, 221020.0, 96199.0, 51020.0, 28958.0, 16738.0, 9940.0, 5922.0, 3583.0, 2166.0, 1381.0, 771.0, 498.0, 363.0, 217.0, 150.0, 95.0, 58.0, 40.0, 29.0, 17.0, 9.0, 18.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01311492919921875, -0.012702107429504395, -0.012289285659790039, -0.011876463890075684, -0.011463642120361328, -0.011050820350646973, -0.010637998580932617, -0.010225176811218262, -0.009812355041503906, -0.00939953327178955, -0.008986711502075195, -0.00857388973236084, -0.008161067962646484, -0.007748246192932129, -0.0073354244232177734, -0.006922602653503418, -0.0065097808837890625, -0.006096959114074707, -0.0056841373443603516, -0.005271315574645996, -0.004858493804931641, -0.004445672035217285, -0.00403285026550293, -0.0036200284957885742, -0.0032072067260742188, -0.0027943849563598633, -0.002381563186645508, -0.0019687414169311523, -0.0015559196472167969, -0.0011430978775024414, -0.0007302761077880859, -0.00031745433807373047, 9.5367431640625e-05, 0.0005081892013549805, 0.0009210109710693359, 0.0013338327407836914, 0.0017466545104980469, 0.0021594762802124023, 0.002572298049926758, 0.0029851198196411133, 0.0033979415893554688, 0.0038107633590698242, 0.00422358512878418, 0.004636406898498535, 0.005049228668212891, 0.005462050437927246, 0.0058748722076416016, 0.006287693977355957, 0.0067005157470703125, 0.007113337516784668, 0.0075261592864990234, 0.007938981056213379, 0.008351802825927734, 0.00876462459564209, 0.009177446365356445, 0.0095902681350708, 0.010003089904785156, 0.010415911674499512, 0.010828733444213867, 0.011241555213928223, 0.011654376983642578, 0.012067198753356934, 0.012480020523071289, 0.012892842292785645, 0.0133056640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 73.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 881.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 61.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 13.0, 2.0, 24.0, 17.0, 2.0, 0.0, 2.0, 6.0, 67.0, 51.0, 157.0, 3992.0, 32987.0, 1006890.0, 3978.0, 138.0, 72.0, 76.0, 3.0, 4.0, 1.0, 0.0, 11.0, 31.0, 1.0, 19.0, 12.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.993511199951172e-06, -3.893859684467316e-06, -3.7942081689834595e-06, -3.6945566534996033e-06, -3.594905138015747e-06, -3.495253622531891e-06, -3.3956021070480347e-06, -3.2959505915641785e-06, -3.1962990760803223e-06, -3.096647560596466e-06, -2.99699604511261e-06, -2.8973445296287537e-06, -2.7976930141448975e-06, -2.6980414986610413e-06, -2.598389983177185e-06, -2.498738467693329e-06, -2.3990869522094727e-06, -2.2994354367256165e-06, -2.1997839212417603e-06, -2.100132405757904e-06, -2.000480890274048e-06, -1.9008293747901917e-06, -1.8011778593063354e-06, -1.7015263438224792e-06, -1.601874828338623e-06, -1.5022233128547668e-06, -1.4025717973709106e-06, -1.3029202818870544e-06, -1.2032687664031982e-06, -1.103617250919342e-06, -1.0039657354354858e-06, -9.043142199516296e-07, -8.046627044677734e-07, -7.050111889839172e-07, -6.05359673500061e-07, -5.057081580162048e-07, -4.0605664253234863e-07, -3.0640512704849243e-07, -2.0675361156463623e-07, -1.0710209608078003e-07, -7.450580596923828e-09, 9.220093488693237e-08, 1.9185245037078857e-07, 2.915039658546448e-07, 3.91155481338501e-07, 4.908069968223572e-07, 5.904585123062134e-07, 6.901100277900696e-07, 7.897615432739258e-07, 8.89413058757782e-07, 9.890645742416382e-07, 1.0887160897254944e-06, 1.1883676052093506e-06, 1.2880191206932068e-06, 1.387670636177063e-06, 1.4873221516609192e-06, 1.5869736671447754e-06, 1.6866251826286316e-06, 1.7862766981124878e-06, 1.885928213596344e-06, 1.9855797290802e-06, 2.0852312445640564e-06, 2.1848827600479126e-06, 2.284534275531769e-06, 2.384185791015625e-06]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.063336747772155e-10, 1.812667349554431e-09, 2.7190010243316465e-09, 3.625334699108862e-09, 4.5316683738860775e-09, 5.438002048663293e-09, 6.3443357234405084e-09, 7.250669398217724e-09, 8.15700307299494e-09, 9.063336747772155e-09, 9.96967042254937e-09, 1.0876004097326586e-08, 1.1782337772103801e-08, 1.2688671446881017e-08, 1.3595005121658232e-08, 1.4501338796435448e-08, 1.5407671583034244e-08, 1.631400614598988e-08, 1.7220340708945514e-08, 1.812667349554431e-08, 1.9033006282143106e-08, 1.993934084509874e-08, 2.0845675408054376e-08, 2.1752008194653172e-08, 2.2658340981251968e-08, 2.3564675544207603e-08, 2.4471010107163238e-08, 2.5377342893762034e-08, 2.628367568036083e-08, 2.7190010243316465e-08, 2.80963448062721e-08, 2.9002677592870896e-08, 2.990901037946969e-08, 3.081534316606849e-08, 3.172167950538096e-08, 3.262801229197976e-08, 3.3534345078578554e-08, 3.444068141789103e-08, 3.5347014204489824e-08, 3.625334699108862e-08, 3.7159679777687415e-08, 3.806601256428621e-08, 3.8972348903598686e-08, 3.987868169019748e-08, 4.078501447679628e-08, 4.169135081610875e-08, 4.259768360270755e-08, 4.3504016389306344e-08, 4.441034917590514e-08, 4.5316681962503935e-08, 4.622301830181641e-08, 4.7129351088415206e-08, 4.8035683875014e-08, 4.8942020214326476e-08, 4.984835300092527e-08, 5.075468578752407e-08, 5.1661018574122863e-08, 5.256735136072166e-08, 5.3473687700034134e-08, 5.438002048663293e-08, 5.5286353273231725e-08, 5.61926896125442e-08, 5.7099022399142996e-08, 5.800535518574179e-08]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1022.0], "bins": [-5.960464477539063e-08, -5.8673322200775146e-08, -5.774199962615967e-08, -5.681067705154419e-08, -5.587935447692871e-08, -5.494803190231323e-08, -5.4016709327697754e-08, -5.3085386753082275e-08, -5.21540641784668e-08, -5.122274160385132e-08, -5.029141902923584e-08, -4.936009645462036e-08, -4.842877388000488e-08, -4.7497451305389404e-08, -4.6566128730773926e-08, -4.563480615615845e-08, -4.470348358154297e-08, -4.377216100692749e-08, -4.284083843231201e-08, -4.190951585769653e-08, -4.0978193283081055e-08, -4.0046870708465576e-08, -3.91155481338501e-08, -3.818422555923462e-08, -3.725290298461914e-08, -3.632158041000366e-08, -3.5390257835388184e-08, -3.4458935260772705e-08, -3.3527612686157227e-08, -3.259629011154175e-08, -3.166496753692627e-08, -3.073364496231079e-08, -2.9802322387695312e-08, -2.8870999813079834e-08, -2.7939677238464355e-08, -2.7008354663848877e-08, -2.60770320892334e-08, -2.514570951461792e-08, -2.421438694000244e-08, -2.3283064365386963e-08, -2.2351741790771484e-08, -2.1420419216156006e-08, -2.0489096641540527e-08, -1.955777406692505e-08, -1.862645149230957e-08, -1.7695128917694092e-08, -1.6763806343078613e-08, -1.5832483768463135e-08, -1.4901161193847656e-08, -1.3969838619232178e-08, -1.30385160446167e-08, -1.210719347000122e-08, -1.1175870895385742e-08, -1.0244548320770264e-08, -9.313225746154785e-09, -8.381903171539307e-09, -7.450580596923828e-09, -6.51925802230835e-09, -5.587935447692871e-09, -4.6566128730773926e-09, -3.725290298461914e-09, -2.7939677238464355e-09, -1.862645149230957e-09, -9.313225746154785e-10, 0.0]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 4.0, 11.0, 11.0, 18.0, 20.0, 12.0, 25.0, 25.0, 33.0, 17.0, 22.0, 27.0, 34.0, 37.0, 44.0, 38.0, 55.0, 47.0, 44.0, 33.0, 37.0, 43.0, 32.0, 45.0, 32.0, 31.0, 25.0, 19.0, 23.0, 28.0, 20.0, 19.0, 11.0, 10.0, 9.0, 9.0, 11.0, 7.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-2.955078125, -2.86663818359375, -2.7781982421875, -2.68975830078125, -2.601318359375, -2.51287841796875, -2.4244384765625, -2.33599853515625, -2.24755859375, -2.15911865234375, -2.0706787109375, -1.98223876953125, -1.893798828125, -1.80535888671875, -1.7169189453125, -1.62847900390625, -1.5400390625, -1.45159912109375, -1.3631591796875, -1.27471923828125, -1.186279296875, -1.09783935546875, -1.0093994140625, -0.92095947265625, -0.83251953125, -0.74407958984375, -0.6556396484375, -0.56719970703125, -0.478759765625, -0.39031982421875, -0.3018798828125, -0.21343994140625, -0.125, -0.03656005859375, 0.0518798828125, 0.14031982421875, 0.228759765625, 0.31719970703125, 0.4056396484375, 0.49407958984375, 0.58251953125, 0.67095947265625, 0.7593994140625, 0.84783935546875, 0.936279296875, 1.02471923828125, 1.1131591796875, 1.20159912109375, 1.2900390625, 1.37847900390625, 1.4669189453125, 1.55535888671875, 1.643798828125, 1.73223876953125, 1.8206787109375, 1.90911865234375, 1.99755859375, 2.08599853515625, 2.1744384765625, 2.26287841796875, 2.351318359375, 2.43975830078125, 2.5281982421875, 2.61663818359375, 2.705078125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 6.0, 8.0, 4.0, 8.0, 11.0, 15.0, 24.0, 27.0, 38.0, 75.0, 112.0, 165.0, 286.0, 486.0, 757.0, 1297.0, 2229.0, 3887.0, 6853.0, 11985.0, 21515.0, 40704.0, 85746.0, 237032.0, 395872.0, 122653.0, 53959.0, 27429.0, 15174.0, 8462.0, 4966.0, 2741.0, 1555.0, 961.0, 553.0, 334.0, 186.0, 148.0, 99.0, 57.0, 44.0, 19.0, 18.0, 26.0, 13.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.814453125, -2.7242431640625, -2.634033203125, -2.5438232421875, -2.45361328125, -2.3634033203125, -2.273193359375, -2.1829833984375, -2.0927734375, -2.0025634765625, -1.912353515625, -1.8221435546875, -1.73193359375, -1.6417236328125, -1.551513671875, -1.4613037109375, -1.37109375, -1.2808837890625, -1.190673828125, -1.1004638671875, -1.01025390625, -0.9200439453125, -0.829833984375, -0.7396240234375, -0.6494140625, -0.5592041015625, -0.468994140625, -0.3787841796875, -0.28857421875, -0.1983642578125, -0.108154296875, -0.0179443359375, 0.072265625, 0.1624755859375, 0.252685546875, 0.3428955078125, 0.43310546875, 0.5233154296875, 0.613525390625, 0.7037353515625, 0.7939453125, 0.8841552734375, 0.974365234375, 1.0645751953125, 1.15478515625, 1.2449951171875, 1.335205078125, 1.4254150390625, 1.515625, 1.6058349609375, 1.696044921875, 1.7862548828125, 1.87646484375, 1.9666748046875, 2.056884765625, 2.1470947265625, 2.2373046875, 2.3275146484375, 2.417724609375, 2.5079345703125, 2.59814453125, 2.6883544921875, 2.778564453125, 2.8687744140625, 2.958984375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 9.0, 3.0, 7.0, 10.0, 14.0, 8.0, 10.0, 17.0, 16.0, 17.0, 38.0, 17.0, 31.0, 53.0, 46.0, 52.0, 64.0, 89.0, 214.0, 1598.0, 209.0, 85.0, 59.0, 49.0, 50.0, 51.0, 39.0, 36.0, 19.0, 31.0, 21.0, 14.0, 11.0, 23.0, 8.0, 13.0, 8.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1796875, -8.8885498046875, -8.597412109375, -8.3062744140625, -8.01513671875, -7.7239990234375, -7.432861328125, -7.1417236328125, -6.8505859375, -6.5594482421875, -6.268310546875, -5.9771728515625, -5.68603515625, -5.3948974609375, -5.103759765625, -4.8126220703125, -4.521484375, -4.2303466796875, -3.939208984375, -3.6480712890625, -3.35693359375, -3.0657958984375, -2.774658203125, -2.4835205078125, -2.1923828125, -1.9012451171875, -1.610107421875, -1.3189697265625, -1.02783203125, -0.7366943359375, -0.445556640625, -0.1544189453125, 0.13671875, 0.4278564453125, 0.718994140625, 1.0101318359375, 1.30126953125, 1.5924072265625, 1.883544921875, 2.1746826171875, 2.4658203125, 2.7569580078125, 3.048095703125, 3.3392333984375, 3.63037109375, 3.9215087890625, 4.212646484375, 4.5037841796875, 4.794921875, 5.0860595703125, 5.377197265625, 5.6683349609375, 5.95947265625, 6.2506103515625, 6.541748046875, 6.8328857421875, 7.1240234375, 7.4151611328125, 7.706298828125, 7.9974365234375, 8.28857421875, 8.5797119140625, 8.870849609375, 9.1619873046875, 9.453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 6.0, 10.0, 13.0, 17.0, 25.0, 22.0, 30.0, 50.0, 61.0, 63.0, 99.0, 146.0, 182.0, 272.0, 452.0, 1532.0, 15282.0, 960764.0, 2142126.0, 21138.0, 1901.0, 463.0, 281.0, 195.0, 129.0, 98.0, 66.0, 58.0, 40.0, 34.0, 24.0, 20.0, 15.0, 19.0, 15.0, 8.0, 6.0, 7.0, 8.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.78125, -16.2735595703125, -15.765869140625, -15.2581787109375, -14.75048828125, -14.2427978515625, -13.735107421875, -13.2274169921875, -12.7197265625, -12.2120361328125, -11.704345703125, -11.1966552734375, -10.68896484375, -10.1812744140625, -9.673583984375, -9.1658935546875, -8.658203125, -8.1505126953125, -7.642822265625, -7.1351318359375, -6.62744140625, -6.1197509765625, -5.612060546875, -5.1043701171875, -4.5966796875, -4.0889892578125, -3.581298828125, -3.0736083984375, -2.56591796875, -2.0582275390625, -1.550537109375, -1.0428466796875, -0.53515625, -0.0274658203125, 0.480224609375, 0.9879150390625, 1.49560546875, 2.0032958984375, 2.510986328125, 3.0186767578125, 3.5263671875, 4.0340576171875, 4.541748046875, 5.0494384765625, 5.55712890625, 6.0648193359375, 6.572509765625, 7.0802001953125, 7.587890625, 8.0955810546875, 8.603271484375, 9.1109619140625, 9.61865234375, 10.1263427734375, 10.634033203125, 11.1417236328125, 11.6494140625, 12.1571044921875, 12.664794921875, 13.1724853515625, 13.68017578125, 14.1878662109375, 14.695556640625, 15.2032470703125, 15.7109375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 60.0, 284.0, 454.0, 193.0, 17.0, 2.0, 1.0], "bins": [-98.02595520019531, -96.37340545654297, -94.7208480834961, -93.06829833984375, -91.4157485961914, -89.76319885253906, -88.11064147949219, -86.45809173583984, -84.8055419921875, -83.15299224853516, -81.50043487548828, -79.84788513183594, -78.1953353881836, -76.54278564453125, -74.89022827148438, -73.23767852783203, -71.58512115478516, -69.93257141113281, -68.28001403808594, -66.6274642944336, -64.97491455078125, -63.32236099243164, -61.66980743408203, -60.01725769042969, -58.36470413208008, -56.71215057373047, -55.059600830078125, -53.407047271728516, -51.754493713378906, -50.10194396972656, -48.44939041137695, -46.796836853027344, -45.144290924072266, -43.491737365722656, -41.83918762207031, -40.1866340637207, -38.534080505371094, -36.88153076171875, -35.22897720336914, -33.57642364501953, -31.923873901367188, -30.27132225036621, -28.618770599365234, -26.966217041015625, -25.31366539001465, -23.661113739013672, -22.008560180664062, -20.356008529663086, -18.70345687866211, -17.050905227661133, -15.39835262298584, -13.745800018310547, -12.09324836730957, -10.440696716308594, -8.7881441116333, -7.135591506958008, -5.483038902282715, -3.83048677444458, -2.1779346466064453, -0.5253825187683105, 1.1271696090698242, 2.779721260070801, 4.432273864746094, 6.084826469421387, 7.737378120422363]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 4.0, 8.0, 10.0, 6.0, 9.0, 16.0, 17.0, 17.0, 18.0, 27.0, 19.0, 32.0, 40.0, 31.0, 40.0, 31.0, 37.0, 43.0, 49.0, 44.0, 51.0, 38.0, 39.0, 41.0, 46.0, 33.0, 32.0, 34.0, 31.0, 25.0, 27.0, 18.0, 18.0, 13.0, 12.0, 7.0, 8.0, 7.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.095500946044922, -20.347705841064453, -19.59990882873535, -18.85211181640625, -18.10431671142578, -17.356521606445312, -16.60872459411621, -15.860928535461426, -15.11313247680664, -14.365336418151855, -13.61754035949707, -12.869744300842285, -12.1219482421875, -11.374152183532715, -10.62635612487793, -9.878560066223145, -9.13076400756836, -8.382967948913574, -7.635171890258789, -6.887375831604004, -6.139579772949219, -5.391783714294434, -4.643987655639648, -3.8961915969848633, -3.148395538330078, -2.400599479675293, -1.6528034210205078, -0.9050073623657227, -0.1572113037109375, 0.5905847549438477, 1.3383808135986328, 2.086176872253418, 2.833972930908203, 3.5817689895629883, 4.329565048217773, 5.077361106872559, 5.825157165527344, 6.572953224182129, 7.320749282836914, 8.0685453414917, 8.816341400146484, 9.56413745880127, 10.311933517456055, 11.05972957611084, 11.807525634765625, 12.55532169342041, 13.303117752075195, 14.05091381072998, 14.798709869384766, 15.54650592803955, 16.294301986694336, 17.042098999023438, 17.789894104003906, 18.537689208984375, 19.285486221313477, 20.033283233642578, 20.781078338623047, 21.528873443603516, 22.276670455932617, 23.02446746826172, 23.772262573242188, 24.520057678222656, 25.267854690551758, 26.01565170288086, 26.763446807861328]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 18.0, 18.0, 16.0, 23.0, 19.0, 25.0, 27.0, 28.0, 40.0, 41.0, 40.0, 45.0, 36.0, 50.0, 40.0, 48.0, 41.0, 41.0, 38.0, 37.0, 36.0, 39.0, 28.0, 26.0, 26.0, 30.0, 17.0, 19.0, 20.0, 10.0, 6.0, 8.0, 8.0, 12.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.19140625, -3.09185791015625, -2.9923095703125, -2.89276123046875, -2.793212890625, -2.69366455078125, -2.5941162109375, -2.49456787109375, -2.39501953125, -2.29547119140625, -2.1959228515625, -2.09637451171875, -1.996826171875, -1.89727783203125, -1.7977294921875, -1.69818115234375, -1.5986328125, -1.49908447265625, -1.3995361328125, -1.29998779296875, -1.200439453125, -1.10089111328125, -1.0013427734375, -0.90179443359375, -0.80224609375, -0.70269775390625, -0.6031494140625, -0.50360107421875, -0.404052734375, -0.30450439453125, -0.2049560546875, -0.10540771484375, -0.005859375, 0.09368896484375, 0.1932373046875, 0.29278564453125, 0.392333984375, 0.49188232421875, 0.5914306640625, 0.69097900390625, 0.79052734375, 0.89007568359375, 0.9896240234375, 1.08917236328125, 1.188720703125, 1.28826904296875, 1.3878173828125, 1.48736572265625, 1.5869140625, 1.68646240234375, 1.7860107421875, 1.88555908203125, 1.985107421875, 2.08465576171875, 2.1842041015625, 2.28375244140625, 2.38330078125, 2.48284912109375, 2.5823974609375, 2.68194580078125, 2.781494140625, 2.88104248046875, 2.9805908203125, 3.08013916015625, 3.1796875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 15.0, 15.0, 15.0, 22.0, 29.0, 41.0, 75.0, 105.0, 281.0, 868.0, 3163.0, 16501.0, 131020.0, 1822234.0, 2046196.0, 149737.0, 18582.0, 3672.0, 960.0, 299.0, 129.0, 66.0, 53.0, 34.0, 20.0, 27.0, 19.0, 12.0, 8.0, 11.0, 10.0, 7.0, 7.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.25, -8.961181640625, -8.67236328125, -8.383544921875, -8.0947265625, -7.805908203125, -7.51708984375, -7.228271484375, -6.939453125, -6.650634765625, -6.36181640625, -6.072998046875, -5.7841796875, -5.495361328125, -5.20654296875, -4.917724609375, -4.62890625, -4.340087890625, -4.05126953125, -3.762451171875, -3.4736328125, -3.184814453125, -2.89599609375, -2.607177734375, -2.318359375, -2.029541015625, -1.74072265625, -1.451904296875, -1.1630859375, -0.874267578125, -0.58544921875, -0.296630859375, -0.0078125, 0.281005859375, 0.56982421875, 0.858642578125, 1.1474609375, 1.436279296875, 1.72509765625, 2.013916015625, 2.302734375, 2.591552734375, 2.88037109375, 3.169189453125, 3.4580078125, 3.746826171875, 4.03564453125, 4.324462890625, 4.61328125, 4.902099609375, 5.19091796875, 5.479736328125, 5.7685546875, 6.057373046875, 6.34619140625, 6.635009765625, 6.923828125, 7.212646484375, 7.50146484375, 7.790283203125, 8.0791015625, 8.367919921875, 8.65673828125, 8.945556640625, 9.234375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 8.0, 13.0, 17.0, 6.0, 17.0, 34.0, 27.0, 48.0, 48.0, 67.0, 73.0, 84.0, 150.0, 177.0, 231.0, 278.0, 348.0, 416.0, 361.0, 354.0, 308.0, 225.0, 171.0, 128.0, 83.0, 86.0, 73.0, 49.0, 37.0, 43.0, 20.0, 22.0, 16.0, 14.0, 14.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.3125, -4.169189453125, -4.02587890625, -3.882568359375, -3.7392578125, -3.595947265625, -3.45263671875, -3.309326171875, -3.166015625, -3.022705078125, -2.87939453125, -2.736083984375, -2.5927734375, -2.449462890625, -2.30615234375, -2.162841796875, -2.01953125, -1.876220703125, -1.73291015625, -1.589599609375, -1.4462890625, -1.302978515625, -1.15966796875, -1.016357421875, -0.873046875, -0.729736328125, -0.58642578125, -0.443115234375, -0.2998046875, -0.156494140625, -0.01318359375, 0.130126953125, 0.2734375, 0.416748046875, 0.56005859375, 0.703369140625, 0.8466796875, 0.989990234375, 1.13330078125, 1.276611328125, 1.419921875, 1.563232421875, 1.70654296875, 1.849853515625, 1.9931640625, 2.136474609375, 2.27978515625, 2.423095703125, 2.56640625, 2.709716796875, 2.85302734375, 2.996337890625, 3.1396484375, 3.282958984375, 3.42626953125, 3.569580078125, 3.712890625, 3.856201171875, 3.99951171875, 4.142822265625, 4.2861328125, 4.429443359375, 4.57275390625, 4.716064453125, 4.859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 6.0, 16.0, 13.0, 18.0, 21.0, 25.0, 26.0, 51.0, 63.0, 82.0, 111.0, 125.0, 189.0, 252.0, 345.0, 1056.0, 24246.0, 3364574.0, 794177.0, 6955.0, 627.0, 329.0, 241.0, 196.0, 138.0, 81.0, 75.0, 65.0, 43.0, 38.0, 23.0, 19.0, 8.0, 9.0, 15.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.109375, -27.27880859375, -26.4482421875, -25.61767578125, -24.787109375, -23.95654296875, -23.1259765625, -22.29541015625, -21.46484375, -20.63427734375, -19.8037109375, -18.97314453125, -18.142578125, -17.31201171875, -16.4814453125, -15.65087890625, -14.8203125, -13.98974609375, -13.1591796875, -12.32861328125, -11.498046875, -10.66748046875, -9.8369140625, -9.00634765625, -8.17578125, -7.34521484375, -6.5146484375, -5.68408203125, -4.853515625, -4.02294921875, -3.1923828125, -2.36181640625, -1.53125, -0.70068359375, 0.1298828125, 0.96044921875, 1.791015625, 2.62158203125, 3.4521484375, 4.28271484375, 5.11328125, 5.94384765625, 6.7744140625, 7.60498046875, 8.435546875, 9.26611328125, 10.0966796875, 10.92724609375, 11.7578125, 12.58837890625, 13.4189453125, 14.24951171875, 15.080078125, 15.91064453125, 16.7412109375, 17.57177734375, 18.40234375, 19.23291015625, 20.0634765625, 20.89404296875, 21.724609375, 22.55517578125, 23.3857421875, 24.21630859375, 25.046875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 15.0, 16.0, 23.0, 34.0, 45.0, 66.0, 102.0, 103.0, 103.0, 103.0, 96.0, 93.0, 71.0, 52.0, 29.0, 23.0, 10.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.040903091430664, -24.22721290588379, -23.413524627685547, -22.599834442138672, -21.786144256591797, -20.972455978393555, -20.15876579284668, -19.345077514648438, -18.531387329101562, -17.717697143554688, -16.904008865356445, -16.09031867980957, -15.276629447937012, -14.462940216064453, -13.649250030517578, -12.83556079864502, -12.021871566772461, -11.208182334899902, -10.394493103027344, -9.580802917480469, -8.76711368560791, -7.953424453735352, -7.139734745025635, -6.326045036315918, -5.512355804443359, -4.698666572570801, -3.884976863861084, -3.0712873935699463, -2.2575979232788086, -1.44390869140625, -0.6302189826965332, 0.1834707260131836, 0.997161865234375, 1.8108513355255127, 2.6245408058166504, 3.438230276107788, 4.251919746398926, 5.065608978271484, 5.879298686981201, 6.692988395690918, 7.506677627563477, 8.320366859436035, 9.134056091308594, 9.947746276855469, 10.761435508728027, 11.575124740600586, 12.388814926147461, 13.20250415802002, 14.016193389892578, 14.829882621765137, 15.643571853637695, 16.45726203918457, 17.270950317382812, 18.084640502929688, 18.898330688476562, 19.712020874023438, 20.52570915222168, 21.339399337768555, 22.153087615966797, 22.966777801513672, 23.780467987060547, 24.59415626525879, 25.407846450805664, 26.221534729003906, 27.03522491455078]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 9.0, 3.0, 8.0, 9.0, 9.0, 12.0, 20.0, 18.0, 23.0, 27.0, 34.0, 35.0, 35.0, 43.0, 43.0, 45.0, 38.0, 46.0, 30.0, 46.0, 47.0, 46.0, 40.0, 35.0, 42.0, 39.0, 33.0, 29.0, 23.0, 26.0, 25.0, 17.0, 16.0, 16.0, 8.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.3619384765625, -21.730127334594727, -21.098318099975586, -20.466506958007812, -19.834697723388672, -19.2028865814209, -18.571075439453125, -17.939266204833984, -17.30745506286621, -16.675643920898438, -16.043834686279297, -15.412023544311523, -14.780213356018066, -14.14840316772461, -13.516592025756836, -12.884781837463379, -12.252971649169922, -11.621161460876465, -10.989351272583008, -10.357540130615234, -9.725729942321777, -9.09391975402832, -8.462108612060547, -7.83029842376709, -7.198488235473633, -6.566678047180176, -5.9348673820495605, -5.303056716918945, -4.671246528625488, -4.039436340332031, -3.407625675201416, -2.775815010070801, -2.1440048217773438, -1.5121943950653076, -0.8803839683532715, -0.24857354164123535, 0.3832368850708008, 1.015047311782837, 1.646857738494873, 2.2786684036254883, 2.9104785919189453, 3.5422890186309814, 4.174099445343018, 4.805910110473633, 5.43772029876709, 6.069530487060547, 6.701341152191162, 7.333151817321777, 7.964962005615234, 8.596772193908691, 9.228582382202148, 9.860393524169922, 10.492203712463379, 11.124013900756836, 11.75582504272461, 12.387635231018066, 13.019445419311523, 13.65125560760498, 14.283065795898438, 14.914876937866211, 15.546687126159668, 16.178497314453125, 16.8103084564209, 17.442119598388672, 18.073928833007812]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 7.0, 16.0, 25.0, 35.0, 22.0, 41.0, 31.0, 30.0, 41.0, 38.0, 38.0, 47.0, 58.0, 54.0, 55.0, 53.0, 46.0, 40.0, 43.0, 40.0, 36.0, 32.0, 19.0, 31.0, 26.0, 20.0, 9.0, 8.0, 10.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.919189453125, -3.80322265625, -3.687255859375, -3.5712890625, -3.455322265625, -3.33935546875, -3.223388671875, -3.107421875, -2.991455078125, -2.87548828125, -2.759521484375, -2.6435546875, -2.527587890625, -2.41162109375, -2.295654296875, -2.1796875, -2.063720703125, -1.94775390625, -1.831787109375, -1.7158203125, -1.599853515625, -1.48388671875, -1.367919921875, -1.251953125, -1.135986328125, -1.02001953125, -0.904052734375, -0.7880859375, -0.672119140625, -0.55615234375, -0.440185546875, -0.32421875, -0.208251953125, -0.09228515625, 0.023681640625, 0.1396484375, 0.255615234375, 0.37158203125, 0.487548828125, 0.603515625, 0.719482421875, 0.83544921875, 0.951416015625, 1.0673828125, 1.183349609375, 1.29931640625, 1.415283203125, 1.53125, 1.647216796875, 1.76318359375, 1.879150390625, 1.9951171875, 2.111083984375, 2.22705078125, 2.343017578125, 2.458984375, 2.574951171875, 2.69091796875, 2.806884765625, 2.9228515625, 3.038818359375, 3.15478515625, 3.270751953125, 3.38671875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 16.0, 15.0, 22.0, 34.0, 60.0, 82.0, 145.0, 216.0, 321.0, 610.0, 960.0, 1604.0, 2674.0, 4767.0, 8167.0, 14516.0, 25665.0, 47695.0, 94517.0, 229987.0, 352576.0, 126914.0, 61727.0, 32694.0, 18127.0, 10178.0, 6031.0, 3317.0, 1916.0, 1157.0, 715.0, 395.0, 235.0, 187.0, 93.0, 81.0, 41.0, 27.0, 22.0, 14.0, 14.0, 7.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0242767333984375, -0.02358698844909668, -0.02289724349975586, -0.02220749855041504, -0.02151775360107422, -0.0208280086517334, -0.020138263702392578, -0.019448518753051758, -0.018758773803710938, -0.018069028854370117, -0.017379283905029297, -0.016689538955688477, -0.015999794006347656, -0.015310049057006836, -0.014620304107666016, -0.013930559158325195, -0.013240814208984375, -0.012551069259643555, -0.011861324310302734, -0.011171579360961914, -0.010481834411621094, -0.009792089462280273, -0.009102344512939453, -0.008412599563598633, -0.0077228546142578125, -0.007033109664916992, -0.006343364715576172, -0.0056536197662353516, -0.004963874816894531, -0.004274129867553711, -0.0035843849182128906, -0.0028946399688720703, -0.00220489501953125, -0.0015151500701904297, -0.0008254051208496094, -0.00013566017150878906, 0.0005540847778320312, 0.0012438297271728516, 0.0019335746765136719, 0.002623319625854492, 0.0033130645751953125, 0.004002809524536133, 0.004692554473876953, 0.0053822994232177734, 0.006072044372558594, 0.006761789321899414, 0.007451534271240234, 0.008141279220581055, 0.008831024169921875, 0.009520769119262695, 0.010210514068603516, 0.010900259017944336, 0.011590003967285156, 0.012279748916625977, 0.012969493865966797, 0.013659238815307617, 0.014348983764648438, 0.015038728713989258, 0.015728473663330078, 0.0164182186126709, 0.01710796356201172, 0.01779770851135254, 0.01848745346069336, 0.01917719841003418, 0.019866943359375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 8.0, 8.0, 16.0, 16.0, 12.0, 19.0, 27.0, 24.0, 27.0, 21.0, 32.0, 39.0, 36.0, 29.0, 34.0, 27.0, 30.0, 46.0, 1061.0, 42.0, 42.0, 32.0, 37.0, 28.0, 39.0, 38.0, 27.0, 33.0, 31.0, 23.0, 26.0, 17.0, 13.0, 13.0, 12.0, 12.0, 6.0, 11.0, 4.0, 6.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8183441162109375, -1.758758544921875, -1.6991729736328125, -1.63958740234375, -1.5800018310546875, -1.520416259765625, -1.4608306884765625, -1.4012451171875, -1.3416595458984375, -1.282073974609375, -1.2224884033203125, -1.16290283203125, -1.1033172607421875, -1.043731689453125, -0.9841461181640625, -0.924560546875, -0.8649749755859375, -0.805389404296875, -0.7458038330078125, -0.68621826171875, -0.6266326904296875, -0.567047119140625, -0.5074615478515625, -0.4478759765625, -0.3882904052734375, -0.328704833984375, -0.2691192626953125, -0.20953369140625, -0.1499481201171875, -0.090362548828125, -0.0307769775390625, 0.02880859375, 0.0883941650390625, 0.147979736328125, 0.2075653076171875, 0.26715087890625, 0.3267364501953125, 0.386322021484375, 0.4459075927734375, 0.5054931640625, 0.5650787353515625, 0.624664306640625, 0.6842498779296875, 0.74383544921875, 0.8034210205078125, 0.863006591796875, 0.9225921630859375, 0.982177734375, 1.0417633056640625, 1.101348876953125, 1.1609344482421875, 1.22052001953125, 1.2801055908203125, 1.339691162109375, 1.3992767333984375, 1.4588623046875, 1.5184478759765625, 1.578033447265625, 1.6376190185546875, 1.69720458984375, 1.7567901611328125, 1.816375732421875, 1.8759613037109375, 1.935546875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 14.0, 29.0, 35.0, 46.0, 48.0, 95.0, 168.0, 247.0, 358.0, 506.0, 797.0, 1264.0, 1928.0, 2914.0, 4449.0, 7161.0, 11035.0, 17574.0, 28485.0, 46274.0, 77277.0, 142260.0, 1338332.0, 182168.0, 91030.0, 53894.0, 32694.0, 20331.0, 12802.0, 8132.0, 5059.0, 3361.0, 2196.0, 1377.0, 918.0, 610.0, 451.0, 276.0, 185.0, 119.0, 89.0, 43.0, 30.0, 23.0, 19.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0118408203125, -0.011478185653686523, -0.011115550994873047, -0.01075291633605957, -0.010390281677246094, -0.010027647018432617, -0.00966501235961914, -0.009302377700805664, -0.008939743041992188, -0.008577108383178711, -0.008214473724365234, -0.007851839065551758, -0.007489204406738281, -0.007126569747924805, -0.006763935089111328, -0.0064013004302978516, -0.006038665771484375, -0.0056760311126708984, -0.005313396453857422, -0.004950761795043945, -0.004588127136230469, -0.004225492477416992, -0.0038628578186035156, -0.003500223159790039, -0.0031375885009765625, -0.002774953842163086, -0.0024123191833496094, -0.002049684524536133, -0.0016870498657226562, -0.0013244152069091797, -0.0009617805480957031, -0.0005991458892822266, -0.00023651123046875, 0.00012612342834472656, 0.0004887580871582031, 0.0008513927459716797, 0.0012140274047851562, 0.0015766620635986328, 0.0019392967224121094, 0.002301931381225586, 0.0026645660400390625, 0.003027200698852539, 0.0033898353576660156, 0.003752470016479492, 0.004115104675292969, 0.004477739334106445, 0.004840373992919922, 0.0052030086517333984, 0.005565643310546875, 0.0059282779693603516, 0.006290912628173828, 0.006653547286987305, 0.007016181945800781, 0.007378816604614258, 0.007741451263427734, 0.008104085922241211, 0.008466720581054688, 0.008829355239868164, 0.00919198989868164, 0.009554624557495117, 0.009917259216308594, 0.01027989387512207, 0.010642528533935547, 0.011005163192749023, 0.0113677978515625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 87.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 839.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 86.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 14.0, 25.0, 30.0, 22.0, 1.0, 2.0, 11.0, 85.0, 116.0, 558.0, 46634.0, 1000180.0, 573.0, 112.0, 52.0, 50.0, 3.0, 0.0, 21.0, 19.0, 34.0, 17.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-06, -4.636123776435852e-06, -4.503875970840454e-06, -4.371628165245056e-06, -4.239380359649658e-06, -4.10713255405426e-06, -3.974884748458862e-06, -3.842636942863464e-06, -3.7103891372680664e-06, -3.5781413316726685e-06, -3.4458935260772705e-06, -3.3136457204818726e-06, -3.1813979148864746e-06, -3.0491501092910767e-06, -2.9169023036956787e-06, -2.7846544981002808e-06, -2.652406692504883e-06, -2.520158886909485e-06, -2.387911081314087e-06, -2.255663275718689e-06, -2.123415470123291e-06, -1.991167664527893e-06, -1.8589198589324951e-06, -1.7266720533370972e-06, -1.5944242477416992e-06, -1.4621764421463013e-06, -1.3299286365509033e-06, -1.1976808309555054e-06, -1.0654330253601074e-06, -9.331852197647095e-07, -8.009374141693115e-07, -6.686896085739136e-07, -5.364418029785156e-07, -4.041939973831177e-07, -2.7194619178771973e-07, -1.3969838619232178e-07, -7.450580596923828e-09, 1.2479722499847412e-07, 2.5704503059387207e-07, 3.8929283618927e-07, 5.21540641784668e-07, 6.537884473800659e-07, 7.860362529754639e-07, 9.182840585708618e-07, 1.0505318641662598e-06, 1.1827796697616577e-06, 1.3150274753570557e-06, 1.4472752809524536e-06, 1.5795230865478516e-06, 1.7117708921432495e-06, 1.8440186977386475e-06, 1.9762665033340454e-06, 2.1085143089294434e-06, 2.2407621145248413e-06, 2.3730099201202393e-06, 2.505257725715637e-06, 2.637505531311035e-06, 2.769753336906433e-06, 2.902001142501831e-06, 3.034248948097229e-06, 3.166496753692627e-06, 3.298744559288025e-06, 3.430992364883423e-06, 3.563240170478821e-06, 3.6954879760742188e-06]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 2.3011285932295067e-10, 4.6022571864590134e-10, 6.903385640910642e-10, 9.204514372918027e-10, 1.1505643104925412e-09, 1.3806771281821284e-09, 1.6107900568940181e-09, 1.8409028745836054e-09, 2.071015803295495e-09, 2.3011286209850823e-09, 2.5312414386746696e-09, 2.761354256364257e-09, 2.991467074053844e-09, 3.2215798917434313e-09, 3.4516929314776235e-09, 3.6818057491672107e-09, 3.911918788901403e-09, 4.14203160659099e-09, 4.372144424280577e-09, 4.602257241970165e-09, 4.832370059659752e-09, 5.062482877349339e-09, 5.292595695038926e-09, 5.522708512728514e-09, 5.752821330418101e-09, 5.982934148107688e-09, 6.213046965797275e-09, 6.4431597834868626e-09, 6.67327260117645e-09, 6.903385418866037e-09, 7.133498680644834e-09, 7.363611498334421e-09, 7.593724760113219e-09, 7.823837577802806e-09, 8.053950395492393e-09, 8.28406321318198e-09, 8.514176030871567e-09, 8.744288848561155e-09, 8.974401666250742e-09, 9.20451448394033e-09, 9.434627301629916e-09, 9.664740119319504e-09, 9.894852937009091e-09, 1.0124965754698678e-08, 1.0355078572388265e-08, 1.0585191390077853e-08, 1.081530420776744e-08, 1.1045417025457027e-08, 1.1275529843146614e-08, 1.1505642660836202e-08, 1.1735755478525789e-08, 1.1965868296215376e-08, 1.2195981113904963e-08, 1.242609393159455e-08, 1.2656206749284138e-08, 1.2886320455152145e-08, 1.3116433272841732e-08, 1.334654609053132e-08, 1.3576658908220907e-08, 1.3806771725910494e-08, 1.4036884543600081e-08, 1.4266997361289668e-08, 1.4497110178979256e-08, 1.4727222996668843e-08]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1023.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 11.0, 7.0, 16.0, 25.0, 35.0, 22.0, 41.0, 31.0, 30.0, 41.0, 38.0, 38.0, 47.0, 58.0, 54.0, 55.0, 53.0, 46.0, 40.0, 43.0, 40.0, 36.0, 32.0, 19.0, 31.0, 26.0, 20.0, 9.0, 8.0, 10.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03515625, -3.919189453125, -3.80322265625, -3.687255859375, -3.5712890625, -3.455322265625, -3.33935546875, -3.223388671875, -3.107421875, -2.991455078125, -2.87548828125, -2.759521484375, -2.6435546875, -2.527587890625, -2.41162109375, -2.295654296875, -2.1796875, -2.063720703125, -1.94775390625, -1.831787109375, -1.7158203125, -1.599853515625, -1.48388671875, -1.367919921875, -1.251953125, -1.135986328125, -1.02001953125, -0.904052734375, -0.7880859375, -0.672119140625, -0.55615234375, -0.440185546875, -0.32421875, -0.208251953125, -0.09228515625, 0.023681640625, 0.1396484375, 0.255615234375, 0.37158203125, 0.487548828125, 0.603515625, 0.719482421875, 0.83544921875, 0.951416015625, 1.0673828125, 1.183349609375, 1.29931640625, 1.415283203125, 1.53125, 1.647216796875, 1.76318359375, 1.879150390625, 1.9951171875, 2.111083984375, 2.22705078125, 2.343017578125, 2.458984375, 2.574951171875, 2.69091796875, 2.806884765625, 2.9228515625, 3.038818359375, 3.15478515625, 3.270751953125, 3.38671875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 13.0, 15.0, 14.0, 27.0, 49.0, 62.0, 85.0, 132.0, 216.0, 442.0, 1056.0, 2814.0, 7952.0, 22928.0, 100084.0, 715148.0, 152961.0, 28944.0, 9695.0, 3434.0, 1301.0, 503.0, 252.0, 135.0, 77.0, 53.0, 51.0, 28.0, 16.0, 16.0, 11.0, 9.0, 6.0, 10.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.53448486328125, -5.3697509765625, -5.20501708984375, -5.040283203125, -4.87554931640625, -4.7108154296875, -4.54608154296875, -4.38134765625, -4.21661376953125, -4.0518798828125, -3.88714599609375, -3.722412109375, -3.55767822265625, -3.3929443359375, -3.22821044921875, -3.0634765625, -2.89874267578125, -2.7340087890625, -2.56927490234375, -2.404541015625, -2.23980712890625, -2.0750732421875, -1.91033935546875, -1.74560546875, -1.58087158203125, -1.4161376953125, -1.25140380859375, -1.086669921875, -0.92193603515625, -0.7572021484375, -0.59246826171875, -0.427734375, -0.26300048828125, -0.0982666015625, 0.06646728515625, 0.231201171875, 0.39593505859375, 0.5606689453125, 0.72540283203125, 0.89013671875, 1.05487060546875, 1.2196044921875, 1.38433837890625, 1.549072265625, 1.71380615234375, 1.8785400390625, 2.04327392578125, 2.2080078125, 2.37274169921875, 2.5374755859375, 2.70220947265625, 2.866943359375, 3.03167724609375, 3.1964111328125, 3.36114501953125, 3.52587890625, 3.69061279296875, 3.8553466796875, 4.02008056640625, 4.184814453125, 4.34954833984375, 4.5142822265625, 4.67901611328125, 4.84375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 7.0, 6.0, 9.0, 8.0, 7.0, 5.0, 17.0, 11.0, 17.0, 10.0, 12.0, 17.0, 25.0, 28.0, 33.0, 38.0, 31.0, 33.0, 58.0, 55.0, 97.0, 221.0, 1656.0, 163.0, 75.0, 48.0, 35.0, 40.0, 35.0, 38.0, 22.0, 19.0, 31.0, 23.0, 20.0, 16.0, 20.0, 14.0, 10.0, 12.0, 11.0, 8.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.78125, -8.4920654296875, -8.202880859375, -7.9136962890625, -7.62451171875, -7.3353271484375, -7.046142578125, -6.7569580078125, -6.4677734375, -6.1785888671875, -5.889404296875, -5.6002197265625, -5.31103515625, -5.0218505859375, -4.732666015625, -4.4434814453125, -4.154296875, -3.8651123046875, -3.575927734375, -3.2867431640625, -2.99755859375, -2.7083740234375, -2.419189453125, -2.1300048828125, -1.8408203125, -1.5516357421875, -1.262451171875, -0.9732666015625, -0.68408203125, -0.3948974609375, -0.105712890625, 0.1834716796875, 0.47265625, 0.7618408203125, 1.051025390625, 1.3402099609375, 1.62939453125, 1.9185791015625, 2.207763671875, 2.4969482421875, 2.7861328125, 3.0753173828125, 3.364501953125, 3.6536865234375, 3.94287109375, 4.2320556640625, 4.521240234375, 4.8104248046875, 5.099609375, 5.3887939453125, 5.677978515625, 5.9671630859375, 6.25634765625, 6.5455322265625, 6.834716796875, 7.1239013671875, 7.4130859375, 7.7022705078125, 7.991455078125, 8.2806396484375, 8.56982421875, 8.8590087890625, 9.148193359375, 9.4373779296875, 9.7265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 5.0, 4.0, 6.0, 14.0, 8.0, 15.0, 12.0, 24.0, 18.0, 23.0, 40.0, 29.0, 35.0, 49.0, 65.0, 115.0, 140.0, 255.0, 650.0, 4288.0, 703249.0, 2428852.0, 6155.0, 778.0, 262.0, 162.0, 109.0, 77.0, 51.0, 43.0, 27.0, 21.0, 14.0, 13.0, 16.0, 14.0, 14.0, 13.0, 6.0, 6.0, 12.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.53125, -22.84033203125, -22.1494140625, -21.45849609375, -20.767578125, -20.07666015625, -19.3857421875, -18.69482421875, -18.00390625, -17.31298828125, -16.6220703125, -15.93115234375, -15.240234375, -14.54931640625, -13.8583984375, -13.16748046875, -12.4765625, -11.78564453125, -11.0947265625, -10.40380859375, -9.712890625, -9.02197265625, -8.3310546875, -7.64013671875, -6.94921875, -6.25830078125, -5.5673828125, -4.87646484375, -4.185546875, -3.49462890625, -2.8037109375, -2.11279296875, -1.421875, -0.73095703125, -0.0400390625, 0.65087890625, 1.341796875, 2.03271484375, 2.7236328125, 3.41455078125, 4.10546875, 4.79638671875, 5.4873046875, 6.17822265625, 6.869140625, 7.56005859375, 8.2509765625, 8.94189453125, 9.6328125, 10.32373046875, 11.0146484375, 11.70556640625, 12.396484375, 13.08740234375, 13.7783203125, 14.46923828125, 15.16015625, 15.85107421875, 16.5419921875, 17.23291015625, 17.923828125, 18.61474609375, 19.3056640625, 19.99658203125, 20.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 18.0, 39.0, 70.0, 96.0, 116.0, 152.0, 154.0, 139.0, 81.0, 65.0, 30.0, 23.0, 8.0, 8.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.624663352966309, -5.2265753746032715, -4.828487396240234, -4.4303998947143555, -4.032311916351318, -3.6342239379882812, -3.2361361980438232, -2.8380484580993652, -2.439960479736328, -2.041872501373291, -1.643784761428833, -1.2456969022750854, -0.8476090431213379, -0.44952118396759033, -0.05143332481384277, 0.34665441513061523, 0.7447423934936523, 1.1428302526474, 1.5409181118011475, 1.939005970954895, 2.3370938301086426, 2.7351818084716797, 3.1332695484161377, 3.5313572883605957, 3.929445266723633, 4.32753324508667, 4.725621223449707, 5.123708724975586, 5.521796703338623, 5.91988468170166, 6.317972183227539, 6.716060161590576, 7.11414909362793, 7.512237071990967, 7.910325050354004, 8.308412551879883, 8.706501007080078, 9.104588508605957, 9.502676010131836, 9.900764465332031, 10.29885196685791, 10.696939468383789, 11.095027923583984, 11.493115425109863, 11.891202926635742, 12.289291381835938, 12.687378883361816, 13.085466384887695, 13.48355484008789, 13.88164234161377, 14.279730796813965, 14.677818298339844, 15.075906753540039, 15.473994255065918, 15.872081756591797, 16.270170211791992, 16.668258666992188, 17.066347122192383, 17.464433670043945, 17.86252212524414, 18.260610580444336, 18.6586971282959, 19.056785583496094, 19.45487403869629, 19.85296058654785]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 9.0, 4.0, 9.0, 17.0, 14.0, 19.0, 17.0, 29.0, 22.0, 38.0, 29.0, 30.0, 38.0, 47.0, 49.0, 44.0, 44.0, 53.0, 44.0, 41.0, 44.0, 43.0, 46.0, 33.0, 44.0, 33.0, 25.0, 20.0, 19.0, 22.0, 15.0, 13.0, 8.0, 12.0, 5.0, 3.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.866119384765625, -33.842620849609375, -32.81912612915039, -31.79562759399414, -30.77212905883789, -29.748632431030273, -28.725135803222656, -27.701637268066406, -26.67814064025879, -25.654644012451172, -24.631145477294922, -23.607648849487305, -22.584152221679688, -21.560653686523438, -20.53715705871582, -19.513660430908203, -18.490161895751953, -17.466665267944336, -16.443166732788086, -15.419670104980469, -14.396172523498535, -13.372674942016602, -12.349178314208984, -11.32568073272705, -10.302183151245117, -9.278685569763184, -8.25518798828125, -7.231691360473633, -6.208193778991699, -5.184696197509766, -4.16119909286499, -3.137701988220215, -2.114208221435547, -1.0907108783721924, -0.06721353530883789, 0.9562838077545166, 1.979781150817871, 3.0032787322998047, 4.02677583694458, 5.0502729415893555, 6.073770523071289, 7.097268104553223, 8.120765686035156, 9.144262313842773, 10.167759895324707, 11.19125747680664, 12.214754104614258, 13.238251686096191, 14.261749267578125, 15.285246849060059, 16.308744430541992, 17.33224105834961, 18.35573959350586, 19.379236221313477, 20.402732849121094, 21.426231384277344, 22.44972801208496, 23.473224639892578, 24.496723175048828, 25.520219802856445, 26.543716430664062, 27.567214965820312, 28.59071159362793, 29.614208221435547, 30.637706756591797]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 6.0, 5.0, 12.0, 9.0, 20.0, 32.0, 33.0, 26.0, 37.0, 34.0, 37.0, 41.0, 46.0, 40.0, 52.0, 57.0, 53.0, 48.0, 47.0, 52.0, 42.0, 30.0, 38.0, 28.0, 31.0, 30.0, 25.0, 29.0, 14.0, 8.0, 10.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.083953857421875, -3.96087646484375, -3.837799072265625, -3.7147216796875, -3.591644287109375, -3.46856689453125, -3.345489501953125, -3.222412109375, -3.099334716796875, -2.97625732421875, -2.853179931640625, -2.7301025390625, -2.607025146484375, -2.48394775390625, -2.360870361328125, -2.23779296875, -2.114715576171875, -1.99163818359375, -1.868560791015625, -1.7454833984375, -1.622406005859375, -1.49932861328125, -1.376251220703125, -1.253173828125, -1.130096435546875, -1.00701904296875, -0.883941650390625, -0.7608642578125, -0.637786865234375, -0.51470947265625, -0.391632080078125, -0.2685546875, -0.145477294921875, -0.02239990234375, 0.100677490234375, 0.2237548828125, 0.346832275390625, 0.46990966796875, 0.592987060546875, 0.716064453125, 0.839141845703125, 0.96221923828125, 1.085296630859375, 1.2083740234375, 1.331451416015625, 1.45452880859375, 1.577606201171875, 1.70068359375, 1.823760986328125, 1.94683837890625, 2.069915771484375, 2.1929931640625, 2.316070556640625, 2.43914794921875, 2.562225341796875, 2.685302734375, 2.808380126953125, 2.93145751953125, 3.054534912109375, 3.1776123046875, 3.300689697265625, 3.42376708984375, 3.546844482421875, 3.669921875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 22.0, 23.0, 33.0, 48.0, 75.0, 130.0, 212.0, 318.0, 485.0, 852.0, 1439.0, 2629.0, 5074.0, 10092.0, 20514.0, 44757.0, 104572.0, 266941.0, 675883.0, 1258672.0, 1037679.0, 452914.0, 175046.0, 72178.0, 31965.0, 15352.0, 7430.0, 3914.0, 2116.0, 1094.0, 678.0, 424.0, 254.0, 169.0, 97.0, 62.0, 43.0, 26.0, 22.0, 12.0, 7.0, 5.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.625, -3.520782470703125, -3.41656494140625, -3.312347412109375, -3.2081298828125, -3.103912353515625, -2.99969482421875, -2.895477294921875, -2.791259765625, -2.687042236328125, -2.58282470703125, -2.478607177734375, -2.3743896484375, -2.270172119140625, -2.16595458984375, -2.061737060546875, -1.95751953125, -1.853302001953125, -1.74908447265625, -1.644866943359375, -1.5406494140625, -1.436431884765625, -1.33221435546875, -1.227996826171875, -1.123779296875, -1.019561767578125, -0.91534423828125, -0.811126708984375, -0.7069091796875, -0.602691650390625, -0.49847412109375, -0.394256591796875, -0.2900390625, -0.185821533203125, -0.08160400390625, 0.022613525390625, 0.1268310546875, 0.231048583984375, 0.33526611328125, 0.439483642578125, 0.543701171875, 0.647918701171875, 0.75213623046875, 0.856353759765625, 0.9605712890625, 1.064788818359375, 1.16900634765625, 1.273223876953125, 1.37744140625, 1.481658935546875, 1.58587646484375, 1.690093994140625, 1.7943115234375, 1.898529052734375, 2.00274658203125, 2.106964111328125, 2.211181640625, 2.315399169921875, 2.41961669921875, 2.523834228515625, 2.6280517578125, 2.732269287109375, 2.83648681640625, 2.940704345703125, 3.044921875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 6.0, 14.0, 15.0, 17.0, 28.0, 38.0, 38.0, 64.0, 69.0, 85.0, 102.0, 135.0, 180.0, 251.0, 272.0, 337.0, 372.0, 399.0, 318.0, 249.0, 228.0, 167.0, 132.0, 106.0, 92.0, 74.0, 50.0, 51.0, 42.0, 28.0, 13.0, 18.0, 19.0, 12.0, 4.0, 10.0, 11.0, 4.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.77734375, -4.62762451171875, -4.4779052734375, -4.32818603515625, -4.178466796875, -4.02874755859375, -3.8790283203125, -3.72930908203125, -3.57958984375, -3.42987060546875, -3.2801513671875, -3.13043212890625, -2.980712890625, -2.83099365234375, -2.6812744140625, -2.53155517578125, -2.3818359375, -2.23211669921875, -2.0823974609375, -1.93267822265625, -1.782958984375, -1.63323974609375, -1.4835205078125, -1.33380126953125, -1.18408203125, -1.03436279296875, -0.8846435546875, -0.73492431640625, -0.585205078125, -0.43548583984375, -0.2857666015625, -0.13604736328125, 0.013671875, 0.16339111328125, 0.3131103515625, 0.46282958984375, 0.612548828125, 0.76226806640625, 0.9119873046875, 1.06170654296875, 1.21142578125, 1.36114501953125, 1.5108642578125, 1.66058349609375, 1.810302734375, 1.96002197265625, 2.1097412109375, 2.25946044921875, 2.4091796875, 2.55889892578125, 2.7086181640625, 2.85833740234375, 3.008056640625, 3.15777587890625, 3.3074951171875, 3.45721435546875, 3.60693359375, 3.75665283203125, 3.9063720703125, 4.05609130859375, 4.205810546875, 4.35552978515625, 4.5052490234375, 4.65496826171875, 4.8046875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 5.0, 4.0, 9.0, 16.0, 6.0, 20.0, 21.0, 31.0, 29.0, 51.0, 64.0, 92.0, 98.0, 149.0, 197.0, 265.0, 379.0, 722.0, 3108.0, 76417.0, 3370893.0, 724153.0, 14518.0, 1361.0, 496.0, 325.0, 240.0, 136.0, 118.0, 103.0, 63.0, 50.0, 42.0, 28.0, 22.0, 16.0, 10.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.337158203125, -17.72119140625, -17.105224609375, -16.4892578125, -15.873291015625, -15.25732421875, -14.641357421875, -14.025390625, -13.409423828125, -12.79345703125, -12.177490234375, -11.5615234375, -10.945556640625, -10.32958984375, -9.713623046875, -9.09765625, -8.481689453125, -7.86572265625, -7.249755859375, -6.6337890625, -6.017822265625, -5.40185546875, -4.785888671875, -4.169921875, -3.553955078125, -2.93798828125, -2.322021484375, -1.7060546875, -1.090087890625, -0.47412109375, 0.141845703125, 0.7578125, 1.373779296875, 1.98974609375, 2.605712890625, 3.2216796875, 3.837646484375, 4.45361328125, 5.069580078125, 5.685546875, 6.301513671875, 6.91748046875, 7.533447265625, 8.1494140625, 8.765380859375, 9.38134765625, 9.997314453125, 10.61328125, 11.229248046875, 11.84521484375, 12.461181640625, 13.0771484375, 13.693115234375, 14.30908203125, 14.925048828125, 15.541015625, 16.156982421875, 16.77294921875, 17.388916015625, 18.0048828125, 18.620849609375, 19.23681640625, 19.852783203125, 20.46875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 12.0, 47.0, 166.0, 322.0, 263.0, 148.0, 38.0, 15.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.80194091796875, -109.36416625976562, -106.92639923095703, -104.4886245727539, -102.05085754394531, -99.61308288574219, -97.17530822753906, -94.73754119873047, -92.29976654052734, -89.86199188232422, -87.42422485351562, -84.9864501953125, -82.5486831665039, -80.11090850830078, -77.67314147949219, -75.23536682128906, -72.79759216308594, -70.35981750488281, -67.92205047607422, -65.4842758178711, -63.046504974365234, -60.608734130859375, -58.170963287353516, -55.733192443847656, -53.29542541503906, -50.8576545715332, -48.419883728027344, -45.98210906982422, -43.54433822631836, -41.1065673828125, -38.66879653930664, -36.23102569580078, -33.793251037597656, -31.355480194091797, -28.917707443237305, -26.479936599731445, -24.042163848876953, -21.604393005371094, -19.166622161865234, -16.728849411010742, -14.291078567504883, -11.853306770324707, -9.415534973144531, -6.977764129638672, -4.539992332458496, -2.1022205352783203, 0.33555030822753906, 2.7733230590820312, 5.211093902587891, 7.648865699768066, 10.086637496948242, 12.524408340454102, 14.962180137634277, 17.399951934814453, 19.837722778320312, 22.275495529174805, 24.713266372680664, 27.151037216186523, 29.588809967041016, 32.026580810546875, 34.464351654052734, 36.902122497558594, 39.33989715576172, 41.77766799926758, 44.21543884277344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 1.0, 5.0, 10.0, 3.0, 9.0, 7.0, 18.0, 13.0, 14.0, 20.0, 20.0, 13.0, 23.0, 24.0, 36.0, 28.0, 34.0, 52.0, 38.0, 37.0, 38.0, 54.0, 39.0, 41.0, 38.0, 46.0, 41.0, 42.0, 36.0, 34.0, 32.0, 30.0, 21.0, 25.0, 17.0, 5.0, 12.0, 8.0, 9.0, 9.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5845947265625, -18.91526222229004, -18.245929718017578, -17.576597213745117, -16.907264709472656, -16.237934112548828, -15.568601608276367, -14.899269104003906, -14.229936599731445, -13.560604095458984, -12.891271591186523, -12.221940040588379, -11.552607536315918, -10.883275032043457, -10.213943481445312, -9.544610977172852, -8.87527847290039, -8.20594596862793, -7.536613941192627, -6.867281913757324, -6.197949409484863, -5.528616905212402, -4.8592848777771, -4.189952850341797, -3.520620346069336, -2.851288080215454, -2.1819558143615723, -1.5126235485076904, -0.8432912826538086, -0.17395901679992676, 0.4953732490539551, 1.1647052764892578, 1.8340377807617188, 2.5033700466156006, 3.1727023124694824, 3.8420345783233643, 4.511366844177246, 5.180699348449707, 5.85003137588501, 6.5193634033203125, 7.188695907592773, 7.858028411865234, 8.527360916137695, 9.19669246673584, 9.8660249710083, 10.535357475280762, 11.204689025878906, 11.874021530151367, 12.543354034423828, 13.212686538696289, 13.88201904296875, 14.551350593566895, 15.220683097839355, 15.890015602111816, 16.55934715270996, 17.228679656982422, 17.898012161254883, 18.567344665527344, 19.236677169799805, 19.906009674072266, 20.575340270996094, 21.244672775268555, 21.914005279541016, 22.583337783813477, 23.252670288085938]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 11.0, 7.0, 21.0, 12.0, 24.0, 45.0, 32.0, 25.0, 39.0, 42.0, 33.0, 35.0, 41.0, 58.0, 58.0, 55.0, 43.0, 42.0, 45.0, 45.0, 45.0, 37.0, 29.0, 28.0, 23.0, 23.0, 19.0, 19.0, 12.0, 15.0, 6.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.08984375, -3.97320556640625, -3.8565673828125, -3.73992919921875, -3.623291015625, -3.50665283203125, -3.3900146484375, -3.27337646484375, -3.15673828125, -3.04010009765625, -2.9234619140625, -2.80682373046875, -2.690185546875, -2.57354736328125, -2.4569091796875, -2.34027099609375, -2.2236328125, -2.10699462890625, -1.9903564453125, -1.87371826171875, -1.757080078125, -1.64044189453125, -1.5238037109375, -1.40716552734375, -1.29052734375, -1.17388916015625, -1.0572509765625, -0.94061279296875, -0.823974609375, -0.70733642578125, -0.5906982421875, -0.47406005859375, -0.357421875, -0.24078369140625, -0.1241455078125, -0.00750732421875, 0.109130859375, 0.22576904296875, 0.3424072265625, 0.45904541015625, 0.57568359375, 0.69232177734375, 0.8089599609375, 0.92559814453125, 1.042236328125, 1.15887451171875, 1.2755126953125, 1.39215087890625, 1.5087890625, 1.62542724609375, 1.7420654296875, 1.85870361328125, 1.975341796875, 2.09197998046875, 2.2086181640625, 2.32525634765625, 2.44189453125, 2.55853271484375, 2.6751708984375, 2.79180908203125, 2.908447265625, 3.02508544921875, 3.1417236328125, 3.25836181640625, 3.375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 9.0, 20.0, 25.0, 32.0, 43.0, 63.0, 115.0, 155.0, 227.0, 309.0, 528.0, 805.0, 1330.0, 2078.0, 3358.0, 5349.0, 8659.0, 13979.0, 22794.0, 37245.0, 62672.0, 113493.0, 280613.0, 243714.0, 102683.0, 57764.0, 34673.0, 21025.0, 13150.0, 8210.0, 4954.0, 3078.0, 1933.0, 1244.0, 771.0, 459.0, 334.0, 213.0, 131.0, 94.0, 59.0, 47.0, 24.0, 26.0, 25.0, 14.0, 8.0, 6.0, 7.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.018951416015625, -0.01839280128479004, -0.017834186553955078, -0.017275571823120117, -0.016716957092285156, -0.016158342361450195, -0.015599727630615234, -0.015041112899780273, -0.014482498168945312, -0.013923883438110352, -0.01336526870727539, -0.01280665397644043, -0.012248039245605469, -0.011689424514770508, -0.011130809783935547, -0.010572195053100586, -0.010013580322265625, -0.009454965591430664, -0.008896350860595703, -0.008337736129760742, -0.007779121398925781, -0.00722050666809082, -0.006661891937255859, -0.0061032772064208984, -0.0055446624755859375, -0.0049860477447509766, -0.004427433013916016, -0.0038688182830810547, -0.0033102035522460938, -0.002751588821411133, -0.002192974090576172, -0.001634359359741211, -0.00107574462890625, -0.0005171298980712891, 4.1484832763671875e-05, 0.0006000995635986328, 0.0011587142944335938, 0.0017173290252685547, 0.0022759437561035156, 0.0028345584869384766, 0.0033931732177734375, 0.0039517879486083984, 0.004510402679443359, 0.00506901741027832, 0.005627632141113281, 0.006186246871948242, 0.006744861602783203, 0.007303476333618164, 0.007862091064453125, 0.008420705795288086, 0.008979320526123047, 0.009537935256958008, 0.010096549987792969, 0.01065516471862793, 0.01121377944946289, 0.011772394180297852, 0.012331008911132812, 0.012889623641967773, 0.013448238372802734, 0.014006853103637695, 0.014565467834472656, 0.015124082565307617, 0.015682697296142578, 0.01624131202697754, 0.0167999267578125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 6.0, 0.0, 6.0, 6.0, 9.0, 8.0, 14.0, 17.0, 16.0, 21.0, 28.0, 26.0, 30.0, 38.0, 37.0, 36.0, 37.0, 50.0, 45.0, 50.0, 1075.0, 38.0, 47.0, 47.0, 35.0, 37.0, 31.0, 39.0, 32.0, 22.0, 21.0, 19.0, 14.0, 22.0, 13.0, 9.0, 7.0, 10.0, 8.0, 7.0, 4.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9892578125, -1.9214935302734375, -1.853729248046875, -1.7859649658203125, -1.71820068359375, -1.6504364013671875, -1.582672119140625, -1.5149078369140625, -1.4471435546875, -1.3793792724609375, -1.311614990234375, -1.2438507080078125, -1.17608642578125, -1.1083221435546875, -1.040557861328125, -0.9727935791015625, -0.905029296875, -0.8372650146484375, -0.769500732421875, -0.7017364501953125, -0.63397216796875, -0.5662078857421875, -0.498443603515625, -0.4306793212890625, -0.3629150390625, -0.2951507568359375, -0.227386474609375, -0.1596221923828125, -0.09185791015625, -0.0240936279296875, 0.043670654296875, 0.1114349365234375, 0.17919921875, 0.2469635009765625, 0.314727783203125, 0.3824920654296875, 0.45025634765625, 0.5180206298828125, 0.585784912109375, 0.6535491943359375, 0.7213134765625, 0.7890777587890625, 0.856842041015625, 0.9246063232421875, 0.99237060546875, 1.0601348876953125, 1.127899169921875, 1.1956634521484375, 1.263427734375, 1.3311920166015625, 1.398956298828125, 1.4667205810546875, 1.53448486328125, 1.6022491455078125, 1.670013427734375, 1.7377777099609375, 1.8055419921875, 1.8733062744140625, 1.941070556640625, 2.0088348388671875, 2.07659912109375, 2.1443634033203125, 2.212127685546875, 2.2798919677734375, 2.34765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 11.0, 15.0, 32.0, 26.0, 50.0, 64.0, 109.0, 218.0, 326.0, 480.0, 742.0, 1237.0, 2025.0, 3129.0, 5036.0, 8290.0, 13582.0, 22869.0, 39567.0, 71621.0, 148211.0, 1388718.0, 192988.0, 84839.0, 46151.0, 26424.0, 15471.0, 9598.0, 5488.0, 3618.0, 2255.0, 1408.0, 908.0, 594.0, 367.0, 239.0, 168.0, 107.0, 44.0, 31.0, 26.0, 17.0, 15.0, 8.0, 9.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.014434814453125, -0.014005661010742188, -0.013576507568359375, -0.013147354125976562, -0.01271820068359375, -0.012289047241210938, -0.011859893798828125, -0.011430740356445312, -0.0110015869140625, -0.010572433471679688, -0.010143280029296875, -0.009714126586914062, -0.00928497314453125, -0.008855819702148438, -0.008426666259765625, -0.007997512817382812, -0.007568359375, -0.0071392059326171875, -0.006710052490234375, -0.0062808990478515625, -0.00585174560546875, -0.0054225921630859375, -0.004993438720703125, -0.0045642852783203125, -0.0041351318359375, -0.0037059783935546875, -0.003276824951171875, -0.0028476715087890625, -0.00241851806640625, -0.0019893646240234375, -0.001560211181640625, -0.0011310577392578125, -0.000701904296875, -0.0002727508544921875, 0.000156402587890625, 0.0005855560302734375, 0.00101470947265625, 0.0014438629150390625, 0.001873016357421875, 0.0023021697998046875, 0.0027313232421875, 0.0031604766845703125, 0.003589630126953125, 0.0040187835693359375, 0.00444793701171875, 0.0048770904541015625, 0.005306243896484375, 0.0057353973388671875, 0.00616455078125, 0.0065937042236328125, 0.007022857666015625, 0.0074520111083984375, 0.00788116455078125, 0.008310317993164062, 0.008739471435546875, 0.009168624877929688, 0.0095977783203125, 0.010026931762695312, 0.010456085205078125, 0.010885238647460938, 0.01131439208984375, 0.011743545532226562, 0.012172698974609375, 0.012601852416992188, 0.013031005859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 815.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 90.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 13.0, 44.0, 15.0, 23.0, 10.0, 0.0, 7.0, 41.0, 67.0, 65.0, 257.0, 4954.0, 991059.0, 51461.0, 257.0, 48.0, 75.0, 41.0, 4.0, 2.0, 6.0, 21.0, 21.0, 37.0, 16.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.7513673305511475e-06, -3.6284327507019043e-06, -3.505498170852661e-06, -3.382563591003418e-06, -3.259629011154175e-06, -3.1366944313049316e-06, -3.0137598514556885e-06, -2.8908252716064453e-06, -2.767890691757202e-06, -2.644956111907959e-06, -2.522021532058716e-06, -2.3990869522094727e-06, -2.2761523723602295e-06, -2.1532177925109863e-06, -2.030283212661743e-06, -1.9073486328125e-06, -1.7844140529632568e-06, -1.6614794731140137e-06, -1.5385448932647705e-06, -1.4156103134155273e-06, -1.2926757335662842e-06, -1.169741153717041e-06, -1.0468065738677979e-06, -9.238719940185547e-07, -8.009374141693115e-07, -6.780028343200684e-07, -5.550682544708252e-07, -4.3213367462158203e-07, -3.0919909477233887e-07, -1.862645149230957e-07, -6.332993507385254e-08, 5.960464477539063e-08, 1.825392246246338e-07, 3.0547380447387695e-07, 4.284083843231201e-07, 5.513429641723633e-07, 6.742775440216064e-07, 7.972121238708496e-07, 9.201467037200928e-07, 1.043081283569336e-06, 1.166015863418579e-06, 1.2889504432678223e-06, 1.4118850231170654e-06, 1.5348196029663086e-06, 1.6577541828155518e-06, 1.780688762664795e-06, 1.903623342514038e-06, 2.0265579223632812e-06, 2.1494925022125244e-06, 2.2724270820617676e-06, 2.3953616619110107e-06, 2.518296241760254e-06, 2.641230821609497e-06, 2.7641654014587402e-06, 2.8870999813079834e-06, 3.0100345611572266e-06, 3.1329691410064697e-06, 3.255903720855713e-06, 3.378838300704956e-06, 3.5017728805541992e-06, 3.6247074604034424e-06, 3.7476420402526855e-06, 3.870576620101929e-06, 3.993511199951172e-06]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.357754773172019e-08, -5.245936307574084e-08, -5.134118197247517e-08, -5.022299731649582e-08, -4.910481266051647e-08, -4.7986628004537124e-08, -4.6868446901271454e-08, -4.5750262245292106e-08, -4.463207758931276e-08, -4.351389293333341e-08, -4.239571183006774e-08, -4.127752717408839e-08, -4.015934251810904e-08, -3.9041157862129694e-08, -3.7922976758864024e-08, -3.6804792102884676e-08, -3.5686610999619006e-08, -3.456842634363966e-08, -3.345024524037399e-08, -3.233206058439464e-08, -3.121387592841529e-08, -3.009569127243594e-08, -2.8977510169170273e-08, -2.7859325513190925e-08, -2.6741140857211576e-08, -2.5622957977589067e-08, -2.450477332160972e-08, -2.338659044198721e-08, -2.226840578600786e-08, -2.1150222906385352e-08, -2.0032040026762843e-08, -1.8913855370783494e-08, -1.7795668938447307e-08, -1.6677486058824798e-08, -1.555930140284545e-08, -1.444111852322294e-08, -1.3322933867243592e-08, -1.2204750987621082e-08, -1.1086567219820154e-08, -9.968383452019225e-09, -8.850199684218296e-09, -7.732015916417367e-09, -6.613832148616439e-09, -5.49564882490472e-09, -4.377465057103791e-09, -3.259281289302862e-09, -2.1410979655911433e-09, -1.0229141977902145e-09, 9.526957001071423e-11, 1.2134532267893405e-09, 2.331636883567967e-09, 3.4498204293242907e-09, 4.5680041971252194e-09, 5.686187964926148e-09, 6.804371288637867e-09, 7.922555056438796e-09, 9.040738824239725e-09, 1.0158922592040653e-08, 1.1277106359841582e-08, 1.2395290127642511e-08, 1.351347300726502e-08, 1.4631657663244368e-08, 1.5749840542866878e-08, 1.6868025198846226e-08, 1.7986208078468735e-08]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1022.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [0.0, 9.313225746154785e-10, 1.862645149230957e-09, 2.7939677238464355e-09, 3.725290298461914e-09, 4.6566128730773926e-09, 5.587935447692871e-09, 6.51925802230835e-09, 7.450580596923828e-09, 8.381903171539307e-09, 9.313225746154785e-09, 1.0244548320770264e-08, 1.1175870895385742e-08, 1.210719347000122e-08, 1.30385160446167e-08, 1.3969838619232178e-08, 1.4901161193847656e-08, 1.5832483768463135e-08, 1.6763806343078613e-08, 1.7695128917694092e-08, 1.862645149230957e-08, 1.955777406692505e-08, 2.0489096641540527e-08, 2.1420419216156006e-08, 2.2351741790771484e-08, 2.3283064365386963e-08, 2.421438694000244e-08, 2.514570951461792e-08, 2.60770320892334e-08, 2.7008354663848877e-08, 2.7939677238464355e-08, 2.8870999813079834e-08, 2.9802322387695312e-08, 3.073364496231079e-08, 3.166496753692627e-08, 3.259629011154175e-08, 3.3527612686157227e-08, 3.4458935260772705e-08, 3.5390257835388184e-08, 3.632158041000366e-08, 3.725290298461914e-08, 3.818422555923462e-08, 3.91155481338501e-08, 4.0046870708465576e-08, 4.0978193283081055e-08, 4.190951585769653e-08, 4.284083843231201e-08, 4.377216100692749e-08, 4.470348358154297e-08, 4.563480615615845e-08, 4.6566128730773926e-08, 4.7497451305389404e-08, 4.842877388000488e-08, 4.936009645462036e-08, 5.029141902923584e-08, 5.122274160385132e-08, 5.21540641784668e-08, 5.3085386753082275e-08, 5.4016709327697754e-08, 5.494803190231323e-08, 5.587935447692871e-08, 5.681067705154419e-08, 5.774199962615967e-08, 5.8673322200775146e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 11.0, 7.0, 21.0, 12.0, 24.0, 45.0, 32.0, 25.0, 39.0, 42.0, 33.0, 35.0, 41.0, 58.0, 58.0, 55.0, 43.0, 42.0, 45.0, 45.0, 45.0, 37.0, 29.0, 28.0, 23.0, 23.0, 19.0, 19.0, 12.0, 15.0, 6.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.08984375, -3.97320556640625, -3.8565673828125, -3.73992919921875, -3.623291015625, -3.50665283203125, -3.3900146484375, -3.27337646484375, -3.15673828125, -3.04010009765625, -2.9234619140625, -2.80682373046875, -2.690185546875, -2.57354736328125, -2.4569091796875, -2.34027099609375, -2.2236328125, -2.10699462890625, -1.9903564453125, -1.87371826171875, -1.757080078125, -1.64044189453125, -1.5238037109375, -1.40716552734375, -1.29052734375, -1.17388916015625, -1.0572509765625, -0.94061279296875, -0.823974609375, -0.70733642578125, -0.5906982421875, -0.47406005859375, -0.357421875, -0.24078369140625, -0.1241455078125, -0.00750732421875, 0.109130859375, 0.22576904296875, 0.3424072265625, 0.45904541015625, 0.57568359375, 0.69232177734375, 0.8089599609375, 0.92559814453125, 1.042236328125, 1.15887451171875, 1.2755126953125, 1.39215087890625, 1.5087890625, 1.62542724609375, 1.7420654296875, 1.85870361328125, 1.975341796875, 2.09197998046875, 2.2086181640625, 2.32525634765625, 2.44189453125, 2.55853271484375, 2.6751708984375, 2.79180908203125, 2.908447265625, 3.02508544921875, 3.1417236328125, 3.25836181640625, 3.375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 10.0, 22.0, 27.0, 48.0, 47.0, 89.0, 134.0, 244.0, 343.0, 551.0, 834.0, 1221.0, 1916.0, 2766.0, 4489.0, 6857.0, 10968.0, 18066.0, 29198.0, 50138.0, 92572.0, 191853.0, 287498.0, 157782.0, 78270.0, 43655.0, 25924.0, 15704.0, 9562.0, 6251.0, 4081.0, 2633.0, 1638.0, 1104.0, 695.0, 457.0, 324.0, 207.0, 116.0, 101.0, 57.0, 34.0, 19.0, 16.0, 9.0, 8.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0], "bins": [-2.546875, -2.4727783203125, -2.398681640625, -2.3245849609375, -2.25048828125, -2.1763916015625, -2.102294921875, -2.0281982421875, -1.9541015625, -1.8800048828125, -1.805908203125, -1.7318115234375, -1.65771484375, -1.5836181640625, -1.509521484375, -1.4354248046875, -1.361328125, -1.2872314453125, -1.213134765625, -1.1390380859375, -1.06494140625, -0.9908447265625, -0.916748046875, -0.8426513671875, -0.7685546875, -0.6944580078125, -0.620361328125, -0.5462646484375, -0.47216796875, -0.3980712890625, -0.323974609375, -0.2498779296875, -0.17578125, -0.1016845703125, -0.027587890625, 0.0465087890625, 0.12060546875, 0.1947021484375, 0.268798828125, 0.3428955078125, 0.4169921875, 0.4910888671875, 0.565185546875, 0.6392822265625, 0.71337890625, 0.7874755859375, 0.861572265625, 0.9356689453125, 1.009765625, 1.0838623046875, 1.157958984375, 1.2320556640625, 1.30615234375, 1.3802490234375, 1.454345703125, 1.5284423828125, 1.6025390625, 1.6766357421875, 1.750732421875, 1.8248291015625, 1.89892578125, 1.9730224609375, 2.047119140625, 2.1212158203125, 2.1953125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 5.0, 3.0, 6.0, 8.0, 6.0, 7.0, 11.0, 5.0, 12.0, 12.0, 10.0, 13.0, 24.0, 25.0, 27.0, 32.0, 23.0, 24.0, 42.0, 35.0, 48.0, 58.0, 141.0, 329.0, 1411.0, 187.0, 85.0, 54.0, 49.0, 41.0, 34.0, 51.0, 28.0, 25.0, 21.0, 23.0, 17.0, 24.0, 24.0, 8.0, 11.0, 15.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.9375, -8.66796875, -8.3984375, -8.12890625, -7.859375, -7.58984375, -7.3203125, -7.05078125, -6.78125, -6.51171875, -6.2421875, -5.97265625, -5.703125, -5.43359375, -5.1640625, -4.89453125, -4.625, -4.35546875, -4.0859375, -3.81640625, -3.546875, -3.27734375, -3.0078125, -2.73828125, -2.46875, -2.19921875, -1.9296875, -1.66015625, -1.390625, -1.12109375, -0.8515625, -0.58203125, -0.3125, -0.04296875, 0.2265625, 0.49609375, 0.765625, 1.03515625, 1.3046875, 1.57421875, 1.84375, 2.11328125, 2.3828125, 2.65234375, 2.921875, 3.19140625, 3.4609375, 3.73046875, 4.0, 4.26953125, 4.5390625, 4.80859375, 5.078125, 5.34765625, 5.6171875, 5.88671875, 6.15625, 6.42578125, 6.6953125, 6.96484375, 7.234375, 7.50390625, 7.7734375, 8.04296875, 8.3125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 4.0, 13.0, 19.0, 18.0, 13.0, 16.0, 35.0, 30.0, 40.0, 36.0, 71.0, 74.0, 105.0, 165.0, 163.0, 300.0, 528.0, 1841.0, 11717.0, 136702.0, 2772118.0, 202294.0, 15721.0, 2064.0, 548.0, 297.0, 165.0, 120.0, 107.0, 75.0, 69.0, 52.0, 39.0, 24.0, 22.0, 21.0, 11.0, 7.0, 9.0, 9.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5078125, -11.1431884765625, -10.778564453125, -10.4139404296875, -10.04931640625, -9.6846923828125, -9.320068359375, -8.9554443359375, -8.5908203125, -8.2261962890625, -7.861572265625, -7.4969482421875, -7.13232421875, -6.7677001953125, -6.403076171875, -6.0384521484375, -5.673828125, -5.3092041015625, -4.944580078125, -4.5799560546875, -4.21533203125, -3.8507080078125, -3.486083984375, -3.1214599609375, -2.7568359375, -2.3922119140625, -2.027587890625, -1.6629638671875, -1.29833984375, -0.9337158203125, -0.569091796875, -0.2044677734375, 0.16015625, 0.5247802734375, 0.889404296875, 1.2540283203125, 1.61865234375, 1.9832763671875, 2.347900390625, 2.7125244140625, 3.0771484375, 3.4417724609375, 3.806396484375, 4.1710205078125, 4.53564453125, 4.9002685546875, 5.264892578125, 5.6295166015625, 5.994140625, 6.3587646484375, 6.723388671875, 7.0880126953125, 7.45263671875, 7.8172607421875, 8.181884765625, 8.5465087890625, 8.9111328125, 9.2757568359375, 9.640380859375, 10.0050048828125, 10.36962890625, 10.7342529296875, 11.098876953125, 11.4635009765625, 11.828125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [197.0, 780.0, 40.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.472397327423096, -1.4493160247802734, 2.573765277862549, 6.596847057342529, 10.619928359985352, 14.643009185791016, 18.666091918945312, 22.689172744750977, 26.71225357055664, 30.735334396362305, 34.75841522216797, 38.781497955322266, 42.80458068847656, 46.827659606933594, 50.85074234008789, 54.87382507324219, 58.89690399169922, 62.919986724853516, 66.94306945800781, 70.96614837646484, 74.98922729492188, 79.01231384277344, 83.03539276123047, 87.0584716796875, 91.08155059814453, 95.10462951660156, 99.12771606445312, 103.15079498291016, 107.17387390136719, 111.19696044921875, 115.22003936767578, 119.24311828613281, 123.26618957519531, 127.28926849365234, 131.31234741210938, 135.33543395996094, 139.3585205078125, 143.381591796875, 147.40467834472656, 151.42776489257812, 155.45083618164062, 159.4739227294922, 163.4969940185547, 167.52008056640625, 171.5431671142578, 175.5662384033203, 179.58932495117188, 183.61241149902344, 187.635498046875, 191.65858459472656, 195.68165588378906, 199.70474243164062, 203.7278289794922, 207.7509002685547, 211.77398681640625, 215.7970733642578, 219.8201446533203, 223.84323120117188, 227.86630249023438, 231.88938903808594, 235.9124755859375, 239.935546875, 243.95863342285156, 247.98171997070312, 252.00479125976562]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 7.0, 6.0, 4.0, 6.0, 6.0, 8.0, 8.0, 11.0, 12.0, 13.0, 14.0, 13.0, 24.0, 13.0, 15.0, 29.0, 26.0, 26.0, 25.0, 24.0, 28.0, 29.0, 35.0, 35.0, 26.0, 34.0, 54.0, 42.0, 35.0, 40.0, 24.0, 32.0, 22.0, 36.0, 29.0, 17.0, 21.0, 27.0, 21.0, 19.0, 18.0, 11.0, 16.0, 14.0, 10.0, 7.0, 4.0, 4.0, 8.0, 3.0, 6.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-21.229881286621094, -20.539918899536133, -19.84995460510254, -19.159992218017578, -18.470027923583984, -17.780065536499023, -17.090103149414062, -16.40013885498047, -15.710175514221191, -15.020212173461914, -14.330248832702637, -13.64028549194336, -12.950323104858398, -12.260358810424805, -11.570396423339844, -10.880433082580566, -10.190469741821289, -9.500506401062012, -8.810543060302734, -8.120580673217773, -7.430616855621338, -6.7406535148620605, -6.050690650939941, -5.360727310180664, -4.670763969421387, -3.9808006286621094, -3.290837526321411, -2.600874423980713, -1.9109110832214355, -1.2209477424621582, -0.5309848785400391, 0.15897846221923828, 0.8489437103271484, 1.5389069318771362, 2.228870153427124, 2.9188332557678223, 3.6087965965270996, 4.298759937286377, 4.988722801208496, 5.678686141967773, 6.368649482727051, 7.058612823486328, 7.7485761642456055, 8.438539505004883, 9.128501892089844, 9.818466186523438, 10.508428573608398, 11.198391914367676, 11.888355255126953, 12.57831859588623, 13.268281936645508, 13.958244323730469, 14.648208618164062, 15.338171005249023, 16.028133392333984, 16.718097686767578, 17.408061981201172, 18.098024368286133, 18.787988662719727, 19.477951049804688, 20.16791534423828, 20.857877731323242, 21.547840118408203, 22.237804412841797, 22.927766799926758]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 2.0, 10.0, 15.0, 14.0, 13.0, 28.0, 26.0, 34.0, 42.0, 27.0, 31.0, 42.0, 34.0, 45.0, 54.0, 46.0, 43.0, 62.0, 39.0, 42.0, 41.0, 43.0, 39.0, 38.0, 24.0, 22.0, 29.0, 21.0, 18.0, 18.0, 11.0, 9.0, 13.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.140625, -4.024261474609375, -3.90789794921875, -3.791534423828125, -3.6751708984375, -3.558807373046875, -3.44244384765625, -3.326080322265625, -3.209716796875, -3.093353271484375, -2.97698974609375, -2.860626220703125, -2.7442626953125, -2.627899169921875, -2.51153564453125, -2.395172119140625, -2.27880859375, -2.162445068359375, -2.04608154296875, -1.929718017578125, -1.8133544921875, -1.696990966796875, -1.58062744140625, -1.464263916015625, -1.347900390625, -1.231536865234375, -1.11517333984375, -0.998809814453125, -0.8824462890625, -0.766082763671875, -0.64971923828125, -0.533355712890625, -0.4169921875, -0.300628662109375, -0.18426513671875, -0.067901611328125, 0.0484619140625, 0.164825439453125, 0.28118896484375, 0.397552490234375, 0.513916015625, 0.630279541015625, 0.74664306640625, 0.863006591796875, 0.9793701171875, 1.095733642578125, 1.21209716796875, 1.328460693359375, 1.44482421875, 1.561187744140625, 1.67755126953125, 1.793914794921875, 1.9102783203125, 2.026641845703125, 2.14300537109375, 2.259368896484375, 2.375732421875, 2.492095947265625, 2.60845947265625, 2.724822998046875, 2.8411865234375, 2.957550048828125, 3.07391357421875, 3.190277099609375, 3.306640625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 5.0, 3.0, 1.0, 9.0, 7.0, 9.0, 13.0, 21.0, 20.0, 18.0, 23.0, 33.0, 36.0, 51.0, 96.0, 279.0, 823.0, 3291.0, 15294.0, 99169.0, 1134971.0, 2634752.0, 263464.0, 32956.0, 6483.0, 1566.0, 453.0, 152.0, 69.0, 56.0, 33.0, 20.0, 22.0, 14.0, 13.0, 12.0, 15.0, 13.0, 3.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.846923828125, -7.56884765625, -7.290771484375, -7.0126953125, -6.734619140625, -6.45654296875, -6.178466796875, -5.900390625, -5.622314453125, -5.34423828125, -5.066162109375, -4.7880859375, -4.510009765625, -4.23193359375, -3.953857421875, -3.67578125, -3.397705078125, -3.11962890625, -2.841552734375, -2.5634765625, -2.285400390625, -2.00732421875, -1.729248046875, -1.451171875, -1.173095703125, -0.89501953125, -0.616943359375, -0.3388671875, -0.060791015625, 0.21728515625, 0.495361328125, 0.7734375, 1.051513671875, 1.32958984375, 1.607666015625, 1.8857421875, 2.163818359375, 2.44189453125, 2.719970703125, 2.998046875, 3.276123046875, 3.55419921875, 3.832275390625, 4.1103515625, 4.388427734375, 4.66650390625, 4.944580078125, 5.22265625, 5.500732421875, 5.77880859375, 6.056884765625, 6.3349609375, 6.613037109375, 6.89111328125, 7.169189453125, 7.447265625, 7.725341796875, 8.00341796875, 8.281494140625, 8.5595703125, 8.837646484375, 9.11572265625, 9.393798828125, 9.671875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 13.0, 13.0, 27.0, 32.0, 47.0, 64.0, 94.0, 116.0, 137.0, 235.0, 318.0, 437.0, 540.0, 510.0, 408.0, 306.0, 212.0, 145.0, 110.0, 84.0, 59.0, 37.0, 27.0, 28.0, 25.0, 5.0, 7.0, 13.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.0078125, -6.8123779296875, -6.616943359375, -6.4215087890625, -6.22607421875, -6.0306396484375, -5.835205078125, -5.6397705078125, -5.4443359375, -5.2489013671875, -5.053466796875, -4.8580322265625, -4.66259765625, -4.4671630859375, -4.271728515625, -4.0762939453125, -3.880859375, -3.6854248046875, -3.489990234375, -3.2945556640625, -3.09912109375, -2.9036865234375, -2.708251953125, -2.5128173828125, -2.3173828125, -2.1219482421875, -1.926513671875, -1.7310791015625, -1.53564453125, -1.3402099609375, -1.144775390625, -0.9493408203125, -0.75390625, -0.5584716796875, -0.363037109375, -0.1676025390625, 0.02783203125, 0.2232666015625, 0.418701171875, 0.6141357421875, 0.8095703125, 1.0050048828125, 1.200439453125, 1.3958740234375, 1.59130859375, 1.7867431640625, 1.982177734375, 2.1776123046875, 2.373046875, 2.5684814453125, 2.763916015625, 2.9593505859375, 3.15478515625, 3.3502197265625, 3.545654296875, 3.7410888671875, 3.9365234375, 4.1319580078125, 4.327392578125, 4.5228271484375, 4.71826171875, 4.9136962890625, 5.109130859375, 5.3045654296875, 5.5]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 6.0, 7.0, 8.0, 21.0, 10.0, 25.0, 35.0, 42.0, 51.0, 65.0, 86.0, 127.0, 191.0, 199.0, 357.0, 740.0, 4168.0, 86896.0, 3520138.0, 564348.0, 13923.0, 1397.0, 468.0, 265.0, 181.0, 125.0, 105.0, 98.0, 55.0, 39.0, 38.0, 14.0, 20.0, 9.0, 11.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.875, -18.218017578125, -17.56103515625, -16.904052734375, -16.2470703125, -15.590087890625, -14.93310546875, -14.276123046875, -13.619140625, -12.962158203125, -12.30517578125, -11.648193359375, -10.9912109375, -10.334228515625, -9.67724609375, -9.020263671875, -8.36328125, -7.706298828125, -7.04931640625, -6.392333984375, -5.7353515625, -5.078369140625, -4.42138671875, -3.764404296875, -3.107421875, -2.450439453125, -1.79345703125, -1.136474609375, -0.4794921875, 0.177490234375, 0.83447265625, 1.491455078125, 2.1484375, 2.805419921875, 3.46240234375, 4.119384765625, 4.7763671875, 5.433349609375, 6.09033203125, 6.747314453125, 7.404296875, 8.061279296875, 8.71826171875, 9.375244140625, 10.0322265625, 10.689208984375, 11.34619140625, 12.003173828125, 12.66015625, 13.317138671875, 13.97412109375, 14.631103515625, 15.2880859375, 15.945068359375, 16.60205078125, 17.259033203125, 17.916015625, 18.572998046875, 19.22998046875, 19.886962890625, 20.5439453125, 21.200927734375, 21.85791015625, 22.514892578125, 23.171875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 19.0, 28.0, 59.0, 83.0, 116.0, 136.0, 144.0, 138.0, 110.0, 72.0, 49.0, 25.0, 12.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.35489273071289, -45.3507080078125, -44.346527099609375, -43.342342376708984, -42.338157653808594, -41.3339729309082, -40.32978820800781, -39.32560729980469, -38.3214225769043, -37.317237854003906, -36.31305694580078, -35.30887222290039, -34.3046875, -33.30050277709961, -32.29631805419922, -31.292137145996094, -30.287952423095703, -29.283767700195312, -28.279584884643555, -27.275402069091797, -26.271217346191406, -25.267032623291016, -24.262849807739258, -23.2586669921875, -22.25448226928711, -21.25029754638672, -20.24611473083496, -19.241931915283203, -18.237747192382812, -17.233562469482422, -16.229379653930664, -15.22519588470459, -14.22100830078125, -13.216824531555176, -12.212640762329102, -11.208456993103027, -10.204273223876953, -9.200089454650879, -8.195905685424805, -7.1917219161987305, -6.187538146972656, -5.183354377746582, -4.179170608520508, -3.1749868392944336, -2.1708030700683594, -1.1666193008422852, -0.16243553161621094, 0.8417482376098633, 1.8459320068359375, 2.8501157760620117, 3.854299545288086, 4.85848331451416, 5.862667083740234, 6.866850852966309, 7.871034622192383, 8.875218391418457, 9.879402160644531, 10.883585929870605, 11.88776969909668, 12.891953468322754, 13.896137237548828, 14.900321006774902, 15.904504776000977, 16.908687591552734, 17.912872314453125]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 11.0, 15.0, 19.0, 24.0, 22.0, 29.0, 21.0, 38.0, 39.0, 26.0, 33.0, 44.0, 39.0, 42.0, 50.0, 43.0, 36.0, 41.0, 38.0, 35.0, 28.0, 35.0, 43.0, 19.0, 26.0, 27.0, 20.0, 22.0, 14.0, 21.0, 17.0, 16.0, 7.0, 10.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.529922485351562, -18.9344539642334, -18.338987350463867, -17.743518829345703, -17.148052215576172, -16.552583694458008, -15.957115173339844, -15.361647605895996, -14.766180038452148, -14.1707124710083, -13.575244903564453, -12.979776382446289, -12.384308815002441, -11.788841247558594, -11.19337272644043, -10.597905158996582, -10.002437591552734, -9.406970024108887, -8.811502456665039, -8.216033935546875, -7.620566368103027, -7.02509880065918, -6.429630756378174, -5.834162712097168, -5.23869514465332, -4.643227577209473, -4.047759532928467, -3.45229172706604, -2.8568239212036133, -2.2613561153411865, -1.6658883094787598, -1.070420265197754, -0.47495269775390625, 0.12051510810852051, 0.7159829139709473, 1.311450719833374, 1.9069185256958008, 2.5023863315582275, 3.0978541374206543, 3.69332218170166, 4.288789749145508, 4.8842573165893555, 5.479725360870361, 6.075193405151367, 6.670660972595215, 7.2661285400390625, 7.861596584320068, 8.457064628601074, 9.052532196044922, 9.64799976348877, 10.243467330932617, 10.838935852050781, 11.434403419494629, 12.029870986938477, 12.62533950805664, 13.220807075500488, 13.816274642944336, 14.411742210388184, 15.007209777832031, 15.602678298950195, 16.19814682006836, 16.79361343383789, 17.389081954956055, 17.98455047607422, 18.58001708984375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 10.0, 15.0, 12.0, 17.0, 20.0, 29.0, 30.0, 29.0, 31.0, 41.0, 39.0, 42.0, 51.0, 51.0, 45.0, 43.0, 43.0, 40.0, 52.0, 45.0, 44.0, 34.0, 33.0, 31.0, 28.0, 18.0, 17.0, 18.0, 17.0, 14.0, 8.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.41796875, -4.300048828125, -4.18212890625, -4.064208984375, -3.9462890625, -3.828369140625, -3.71044921875, -3.592529296875, -3.474609375, -3.356689453125, -3.23876953125, -3.120849609375, -3.0029296875, -2.885009765625, -2.76708984375, -2.649169921875, -2.53125, -2.413330078125, -2.29541015625, -2.177490234375, -2.0595703125, -1.941650390625, -1.82373046875, -1.705810546875, -1.587890625, -1.469970703125, -1.35205078125, -1.234130859375, -1.1162109375, -0.998291015625, -0.88037109375, -0.762451171875, -0.64453125, -0.526611328125, -0.40869140625, -0.290771484375, -0.1728515625, -0.054931640625, 0.06298828125, 0.180908203125, 0.298828125, 0.416748046875, 0.53466796875, 0.652587890625, 0.7705078125, 0.888427734375, 1.00634765625, 1.124267578125, 1.2421875, 1.360107421875, 1.47802734375, 1.595947265625, 1.7138671875, 1.831787109375, 1.94970703125, 2.067626953125, 2.185546875, 2.303466796875, 2.42138671875, 2.539306640625, 2.6572265625, 2.775146484375, 2.89306640625, 3.010986328125, 3.12890625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 6.0, 10.0, 12.0, 23.0, 29.0, 56.0, 69.0, 90.0, 169.0, 248.0, 396.0, 578.0, 963.0, 1432.0, 2373.0, 3590.0, 5747.0, 9156.0, 14667.0, 24134.0, 39981.0, 69366.0, 134177.0, 312686.0, 202415.0, 93838.0, 51823.0, 30774.0, 18649.0, 11419.0, 7153.0, 4603.0, 2862.0, 1819.0, 1121.0, 756.0, 464.0, 330.0, 188.0, 135.0, 86.0, 55.0, 31.0, 30.0, 15.0, 13.0, 5.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 4.0], "bins": [-0.020111083984375, -0.019515037536621094, -0.018918991088867188, -0.01832294464111328, -0.017726898193359375, -0.01713085174560547, -0.016534805297851562, -0.015938758850097656, -0.01534271240234375, -0.014746665954589844, -0.014150619506835938, -0.013554573059082031, -0.012958526611328125, -0.012362480163574219, -0.011766433715820312, -0.011170387268066406, -0.0105743408203125, -0.009978294372558594, -0.009382247924804688, -0.008786201477050781, -0.008190155029296875, -0.007594108581542969, -0.0069980621337890625, -0.006402015686035156, -0.00580596923828125, -0.005209922790527344, -0.0046138763427734375, -0.004017829895019531, -0.003421783447265625, -0.0028257369995117188, -0.0022296905517578125, -0.0016336441040039062, -0.00103759765625, -0.00044155120849609375, 0.0001544952392578125, 0.0007505416870117188, 0.001346588134765625, 0.0019426345825195312, 0.0025386810302734375, 0.0031347274780273438, 0.00373077392578125, 0.004326820373535156, 0.0049228668212890625, 0.005518913269042969, 0.006114959716796875, 0.006711006164550781, 0.0073070526123046875, 0.007903099060058594, 0.0084991455078125, 0.009095191955566406, 0.009691238403320312, 0.010287284851074219, 0.010883331298828125, 0.011479377746582031, 0.012075424194335938, 0.012671470642089844, 0.01326751708984375, 0.013863563537597656, 0.014459609985351562, 0.015055656433105469, 0.015651702880859375, 0.01624774932861328, 0.016843795776367188, 0.017439842224121094, 0.018035888671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 11.0, 4.0, 9.0, 5.0, 2.0, 7.0, 11.0, 16.0, 24.0, 20.0, 31.0, 23.0, 26.0, 37.0, 33.0, 59.0, 41.0, 49.0, 40.0, 48.0, 1067.0, 45.0, 29.0, 48.0, 49.0, 34.0, 47.0, 30.0, 25.0, 32.0, 28.0, 18.0, 12.0, 13.0, 13.0, 14.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.23828125, -2.16455078125, -2.0908203125, -2.01708984375, -1.943359375, -1.86962890625, -1.7958984375, -1.72216796875, -1.6484375, -1.57470703125, -1.5009765625, -1.42724609375, -1.353515625, -1.27978515625, -1.2060546875, -1.13232421875, -1.05859375, -0.98486328125, -0.9111328125, -0.83740234375, -0.763671875, -0.68994140625, -0.6162109375, -0.54248046875, -0.46875, -0.39501953125, -0.3212890625, -0.24755859375, -0.173828125, -0.10009765625, -0.0263671875, 0.04736328125, 0.12109375, 0.19482421875, 0.2685546875, 0.34228515625, 0.416015625, 0.48974609375, 0.5634765625, 0.63720703125, 0.7109375, 0.78466796875, 0.8583984375, 0.93212890625, 1.005859375, 1.07958984375, 1.1533203125, 1.22705078125, 1.30078125, 1.37451171875, 1.4482421875, 1.52197265625, 1.595703125, 1.66943359375, 1.7431640625, 1.81689453125, 1.890625, 1.96435546875, 2.0380859375, 2.11181640625, 2.185546875, 2.25927734375, 2.3330078125, 2.40673828125, 2.48046875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 11.0, 15.0, 34.0, 49.0, 59.0, 98.0, 109.0, 191.0, 305.0, 456.0, 638.0, 1001.0, 1557.0, 2583.0, 3988.0, 6580.0, 10695.0, 18159.0, 31321.0, 55978.0, 106821.0, 251026.0, 1336967.0, 121379.0, 61876.0, 34422.0, 19891.0, 11864.0, 6995.0, 4352.0, 2743.0, 1705.0, 1141.0, 712.0, 483.0, 306.0, 181.0, 128.0, 79.0, 56.0, 46.0, 46.0, 29.0, 17.0, 11.0, 7.0, 7.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0148773193359375, -0.014427661895751953, -0.013978004455566406, -0.01352834701538086, -0.013078689575195312, -0.012629032135009766, -0.012179374694824219, -0.011729717254638672, -0.011280059814453125, -0.010830402374267578, -0.010380744934082031, -0.009931087493896484, -0.009481430053710938, -0.00903177261352539, -0.008582115173339844, -0.008132457733154297, -0.00768280029296875, -0.007233142852783203, -0.006783485412597656, -0.006333827972412109, -0.0058841705322265625, -0.005434513092041016, -0.004984855651855469, -0.004535198211669922, -0.004085540771484375, -0.003635883331298828, -0.0031862258911132812, -0.0027365684509277344, -0.0022869110107421875, -0.0018372535705566406, -0.0013875961303710938, -0.0009379386901855469, -0.00048828125, -3.8623809814453125e-05, 0.00041103363037109375, 0.0008606910705566406, 0.0013103485107421875, 0.0017600059509277344, 0.0022096633911132812, 0.002659320831298828, 0.003108978271484375, 0.003558635711669922, 0.004008293151855469, 0.004457950592041016, 0.0049076080322265625, 0.005357265472412109, 0.005806922912597656, 0.006256580352783203, 0.00670623779296875, 0.007155895233154297, 0.007605552673339844, 0.00805521011352539, 0.008504867553710938, 0.008954524993896484, 0.009404182434082031, 0.009853839874267578, 0.010303497314453125, 0.010753154754638672, 0.011202812194824219, 0.011652469635009766, 0.012102127075195312, 0.01255178451538086, 0.013001441955566406, 0.013451099395751953, 0.0139007568359375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 109.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 776.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 105.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 35.0, 44.0, 27.0, 6.0, 2.0, 0.0, 1.0, 85.0, 51.0, 89.0, 307.0, 4777.0, 986377.0, 55593.0, 464.0, 312.0, 93.0, 54.0, 82.0, 7.0, 0.0, 1.0, 21.0, 14.0, 31.0, 47.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9206275939941406e-06, -2.8079375624656677e-06, -2.695247530937195e-06, -2.582557499408722e-06, -2.469867467880249e-06, -2.357177436351776e-06, -2.2444874048233032e-06, -2.1317973732948303e-06, -2.0191073417663574e-06, -1.9064173102378845e-06, -1.7937272787094116e-06, -1.6810372471809387e-06, -1.5683472156524658e-06, -1.455657184123993e-06, -1.34296715259552e-06, -1.2302771210670471e-06, -1.1175870895385742e-06, -1.0048970580101013e-06, -8.922070264816284e-07, -7.795169949531555e-07, -6.668269634246826e-07, -5.541369318962097e-07, -4.414469003677368e-07, -3.287568688392639e-07, -2.1606683731079102e-07, -1.0337680578231812e-07, 9.313225746154785e-09, 1.2200325727462769e-07, 2.3469328880310059e-07, 3.473833203315735e-07, 4.600733518600464e-07, 5.727633833885193e-07, 6.854534149169922e-07, 7.981434464454651e-07, 9.10833477973938e-07, 1.0235235095024109e-06, 1.1362135410308838e-06, 1.2489035725593567e-06, 1.3615936040878296e-06, 1.4742836356163025e-06, 1.5869736671447754e-06, 1.6996636986732483e-06, 1.8123537302017212e-06, 1.925043761730194e-06, 2.037733793258667e-06, 2.15042382478714e-06, 2.263113856315613e-06, 2.3758038878440857e-06, 2.4884939193725586e-06, 2.6011839509010315e-06, 2.7138739824295044e-06, 2.8265640139579773e-06, 2.93925404548645e-06, 3.051944077014923e-06, 3.164634108543396e-06, 3.277324140071869e-06, 3.390014171600342e-06, 3.5027042031288147e-06, 3.6153942346572876e-06, 3.7280842661857605e-06, 3.840774297714233e-06, 3.953464329242706e-06, 4.066154360771179e-06, 4.178844392299652e-06, 4.291534423828125e-06]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 10.0, 15.0, 12.0, 17.0, 20.0, 29.0, 30.0, 29.0, 31.0, 41.0, 39.0, 42.0, 51.0, 51.0, 45.0, 43.0, 43.0, 40.0, 52.0, 45.0, 44.0, 34.0, 33.0, 31.0, 28.0, 18.0, 17.0, 18.0, 17.0, 14.0, 8.0, 12.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.41796875, -4.300048828125, -4.18212890625, -4.064208984375, -3.9462890625, -3.828369140625, -3.71044921875, -3.592529296875, -3.474609375, -3.356689453125, -3.23876953125, -3.120849609375, -3.0029296875, -2.885009765625, -2.76708984375, -2.649169921875, -2.53125, -2.413330078125, -2.29541015625, -2.177490234375, -2.0595703125, -1.941650390625, -1.82373046875, -1.705810546875, -1.587890625, -1.469970703125, -1.35205078125, -1.234130859375, -1.1162109375, -0.998291015625, -0.88037109375, -0.762451171875, -0.64453125, -0.526611328125, -0.40869140625, -0.290771484375, -0.1728515625, -0.054931640625, 0.06298828125, 0.180908203125, 0.298828125, 0.416748046875, 0.53466796875, 0.652587890625, 0.7705078125, 0.888427734375, 1.00634765625, 1.124267578125, 1.2421875, 1.360107421875, 1.47802734375, 1.595947265625, 1.7138671875, 1.831787109375, 1.94970703125, 2.067626953125, 2.185546875, 2.303466796875, 2.42138671875, 2.539306640625, 2.6572265625, 2.775146484375, 2.89306640625, 3.010986328125, 3.12890625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 17.0, 15.0, 21.0, 22.0, 48.0, 56.0, 95.0, 139.0, 248.0, 498.0, 1304.0, 3274.0, 8835.0, 25915.0, 96336.0, 645350.0, 203489.0, 41143.0, 13318.0, 4959.0, 1918.0, 724.0, 334.0, 172.0, 86.0, 61.0, 35.0, 28.0, 23.0, 20.0, 9.0, 18.0, 9.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-7.484375, -7.28582763671875, -7.0872802734375, -6.88873291015625, -6.690185546875, -6.49163818359375, -6.2930908203125, -6.09454345703125, -5.89599609375, -5.69744873046875, -5.4989013671875, -5.30035400390625, -5.101806640625, -4.90325927734375, -4.7047119140625, -4.50616455078125, -4.3076171875, -4.10906982421875, -3.9105224609375, -3.71197509765625, -3.513427734375, -3.31488037109375, -3.1163330078125, -2.91778564453125, -2.71923828125, -2.52069091796875, -2.3221435546875, -2.12359619140625, -1.925048828125, -1.72650146484375, -1.5279541015625, -1.32940673828125, -1.130859375, -0.93231201171875, -0.7337646484375, -0.53521728515625, -0.336669921875, -0.13812255859375, 0.0604248046875, 0.25897216796875, 0.45751953125, 0.65606689453125, 0.8546142578125, 1.05316162109375, 1.251708984375, 1.45025634765625, 1.6488037109375, 1.84735107421875, 2.0458984375, 2.24444580078125, 2.4429931640625, 2.64154052734375, 2.840087890625, 3.03863525390625, 3.2371826171875, 3.43572998046875, 3.63427734375, 3.83282470703125, 4.0313720703125, 4.22991943359375, 4.428466796875, 4.62701416015625, 4.8255615234375, 5.02410888671875, 5.22265625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 4.0, 5.0, 12.0, 11.0, 19.0, 17.0, 19.0, 30.0, 28.0, 37.0, 32.0, 36.0, 51.0, 52.0, 52.0, 108.0, 453.0, 1536.0, 119.0, 60.0, 69.0, 33.0, 31.0, 39.0, 34.0, 23.0, 21.0, 22.0, 21.0, 9.0, 15.0, 8.0, 16.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.7734375, -11.3946533203125, -11.015869140625, -10.6370849609375, -10.25830078125, -9.8795166015625, -9.500732421875, -9.1219482421875, -8.7431640625, -8.3643798828125, -7.985595703125, -7.6068115234375, -7.22802734375, -6.8492431640625, -6.470458984375, -6.0916748046875, -5.712890625, -5.3341064453125, -4.955322265625, -4.5765380859375, -4.19775390625, -3.8189697265625, -3.440185546875, -3.0614013671875, -2.6826171875, -2.3038330078125, -1.925048828125, -1.5462646484375, -1.16748046875, -0.7886962890625, -0.409912109375, -0.0311279296875, 0.34765625, 0.7264404296875, 1.105224609375, 1.4840087890625, 1.86279296875, 2.2415771484375, 2.620361328125, 2.9991455078125, 3.3779296875, 3.7567138671875, 4.135498046875, 4.5142822265625, 4.89306640625, 5.2718505859375, 5.650634765625, 6.0294189453125, 6.408203125, 6.7869873046875, 7.165771484375, 7.5445556640625, 7.92333984375, 8.3021240234375, 8.680908203125, 9.0596923828125, 9.4384765625, 9.8172607421875, 10.196044921875, 10.5748291015625, 10.95361328125, 11.3323974609375, 11.711181640625, 12.0899658203125, 12.46875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 7.0, 15.0, 7.0, 15.0, 10.0, 20.0, 27.0, 27.0, 44.0, 52.0, 60.0, 89.0, 124.0, 282.0, 830.0, 5757.0, 227039.0, 2892944.0, 15800.0, 1564.0, 358.0, 180.0, 104.0, 91.0, 60.0, 41.0, 28.0, 31.0, 25.0, 16.0, 17.0, 11.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.875, -22.185791015625, -21.49658203125, -20.807373046875, -20.1181640625, -19.428955078125, -18.73974609375, -18.050537109375, -17.361328125, -16.672119140625, -15.98291015625, -15.293701171875, -14.6044921875, -13.915283203125, -13.22607421875, -12.536865234375, -11.84765625, -11.158447265625, -10.46923828125, -9.780029296875, -9.0908203125, -8.401611328125, -7.71240234375, -7.023193359375, -6.333984375, -5.644775390625, -4.95556640625, -4.266357421875, -3.5771484375, -2.887939453125, -2.19873046875, -1.509521484375, -0.8203125, -0.131103515625, 0.55810546875, 1.247314453125, 1.9365234375, 2.625732421875, 3.31494140625, 4.004150390625, 4.693359375, 5.382568359375, 6.07177734375, 6.760986328125, 7.4501953125, 8.139404296875, 8.82861328125, 9.517822265625, 10.20703125, 10.896240234375, 11.58544921875, 12.274658203125, 12.9638671875, 13.653076171875, 14.34228515625, 15.031494140625, 15.720703125, 16.409912109375, 17.09912109375, 17.788330078125, 18.4775390625, 19.166748046875, 19.85595703125, 20.545166015625, 21.234375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [28.0, 143.0, 432.0, 319.0, 81.0, 14.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.330500602722168, -2.7925734519958496, -1.2546460628509521, 0.2832813262939453, 1.8212084770202637, 3.359135627746582, 4.897063255310059, 6.434989929199219, 7.972917556762695, 9.510845184326172, 11.048771858215332, 12.586699485778809, 14.124626159667969, 15.662553787231445, 17.200481414794922, 18.738407135009766, 20.276336669921875, 21.81426429748535, 23.352191925048828, 24.890117645263672, 26.42804527282715, 27.965972900390625, 29.5039005279541, 31.041828155517578, 32.57975387573242, 34.117679595947266, 35.655609130859375, 37.19353485107422, 38.73146438598633, 40.26939010620117, 41.80731964111328, 43.345245361328125, 44.883174896240234, 46.42110061645508, 47.95903015136719, 49.49695587158203, 51.03488540649414, 52.572811126708984, 54.110740661621094, 55.64866638183594, 57.18659210205078, 58.724517822265625, 60.262447357177734, 61.80037307739258, 63.33830261230469, 64.87622833251953, 66.41415405273438, 67.95207977294922, 69.4900131225586, 71.02793884277344, 72.56586456298828, 74.10379791259766, 75.6417236328125, 77.17964935302734, 78.71757507324219, 80.25550079345703, 81.79342651367188, 83.33135223388672, 84.86927795410156, 86.40721130371094, 87.94513702392578, 89.48306274414062, 91.02098846435547, 92.55891418457031, 94.09684753417969]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 16.0, 7.0, 12.0, 13.0, 13.0, 30.0, 34.0, 31.0, 46.0, 43.0, 51.0, 51.0, 46.0, 49.0, 54.0, 49.0, 46.0, 51.0, 45.0, 54.0, 45.0, 34.0, 37.0, 35.0, 26.0, 22.0, 8.0, 12.0, 6.0, 14.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.21537399291992, -39.067710876464844, -37.920047760009766, -36.77238082885742, -35.624717712402344, -34.477054595947266, -33.32939147949219, -32.181724548339844, -31.034061431884766, -29.886398315429688, -28.738733291625977, -27.5910701751709, -26.443405151367188, -25.29574203491211, -24.14807891845703, -23.00041389465332, -21.852750778198242, -20.705087661743164, -19.557422637939453, -18.409759521484375, -17.262094497680664, -16.114431381225586, -14.966767311096191, -13.819103240966797, -12.671439170837402, -11.523775100708008, -10.376111030578613, -9.228446960449219, -8.08078384399414, -6.933119297027588, -5.785455703735352, -4.637791633605957, -3.4901275634765625, -2.342463493347168, -1.1947996616363525, -0.04713582992553711, 1.1005282402038574, 2.248192310333252, 3.3958559036254883, 4.543519973754883, 5.691184043884277, 6.838848114013672, 7.986512184143066, 9.134176254272461, 10.281839370727539, 11.42950439453125, 12.577167510986328, 13.724831581115723, 14.872495651245117, 16.020158767700195, 17.167823791503906, 18.315486907958984, 19.463151931762695, 20.610815048217773, 21.758480072021484, 22.906143188476562, 24.05380630493164, 25.20146942138672, 26.34913444519043, 27.496797561645508, 28.64446258544922, 29.792125701904297, 30.939788818359375, 32.08745574951172, 33.2351188659668]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 7.0, 5.0, 11.0, 20.0, 22.0, 16.0, 19.0, 28.0, 23.0, 32.0, 34.0, 39.0, 46.0, 41.0, 48.0, 40.0, 44.0, 50.0, 40.0, 51.0, 48.0, 34.0, 34.0, 41.0, 36.0, 35.0, 19.0, 16.0, 15.0, 25.0, 17.0, 15.0, 10.0, 9.0, 12.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-4.48828125, -4.3675537109375, -4.246826171875, -4.1260986328125, -4.00537109375, -3.8846435546875, -3.763916015625, -3.6431884765625, -3.5224609375, -3.4017333984375, -3.281005859375, -3.1602783203125, -3.03955078125, -2.9188232421875, -2.798095703125, -2.6773681640625, -2.556640625, -2.4359130859375, -2.315185546875, -2.1944580078125, -2.07373046875, -1.9530029296875, -1.832275390625, -1.7115478515625, -1.5908203125, -1.4700927734375, -1.349365234375, -1.2286376953125, -1.10791015625, -0.9871826171875, -0.866455078125, -0.7457275390625, -0.625, -0.5042724609375, -0.383544921875, -0.2628173828125, -0.14208984375, -0.0213623046875, 0.099365234375, 0.2200927734375, 0.3408203125, 0.4615478515625, 0.582275390625, 0.7030029296875, 0.82373046875, 0.9444580078125, 1.065185546875, 1.1859130859375, 1.306640625, 1.4273681640625, 1.548095703125, 1.6688232421875, 1.78955078125, 1.9102783203125, 2.031005859375, 2.1517333984375, 2.2724609375, 2.3931884765625, 2.513916015625, 2.6346435546875, 2.75537109375, 2.8760986328125, 2.996826171875, 3.1175537109375, 3.23828125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 11.0, 16.0, 12.0, 18.0, 24.0, 22.0, 40.0, 37.0, 89.0, 152.0, 273.0, 722.0, 2000.0, 6019.0, 22149.0, 104480.0, 726278.0, 2583257.0, 623733.0, 94328.0, 21291.0, 5958.0, 1926.0, 708.0, 316.0, 146.0, 78.0, 37.0, 43.0, 28.0, 17.0, 11.0, 13.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.59765625, -7.3636474609375, -7.129638671875, -6.8956298828125, -6.66162109375, -6.4276123046875, -6.193603515625, -5.9595947265625, -5.7255859375, -5.4915771484375, -5.257568359375, -5.0235595703125, -4.78955078125, -4.5555419921875, -4.321533203125, -4.0875244140625, -3.853515625, -3.6195068359375, -3.385498046875, -3.1514892578125, -2.91748046875, -2.6834716796875, -2.449462890625, -2.2154541015625, -1.9814453125, -1.7474365234375, -1.513427734375, -1.2794189453125, -1.04541015625, -0.8114013671875, -0.577392578125, -0.3433837890625, -0.109375, 0.1246337890625, 0.358642578125, 0.5926513671875, 0.82666015625, 1.0606689453125, 1.294677734375, 1.5286865234375, 1.7626953125, 1.9967041015625, 2.230712890625, 2.4647216796875, 2.69873046875, 2.9327392578125, 3.166748046875, 3.4007568359375, 3.634765625, 3.8687744140625, 4.102783203125, 4.3367919921875, 4.57080078125, 4.8048095703125, 5.038818359375, 5.2728271484375, 5.5068359375, 5.7408447265625, 5.974853515625, 6.2088623046875, 6.44287109375, 6.6768798828125, 6.910888671875, 7.1448974609375, 7.37890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 4.0, 10.0, 15.0, 14.0, 14.0, 35.0, 39.0, 37.0, 48.0, 58.0, 102.0, 124.0, 147.0, 203.0, 265.0, 318.0, 420.0, 391.0, 399.0, 327.0, 247.0, 184.0, 160.0, 125.0, 78.0, 68.0, 61.0, 46.0, 32.0, 26.0, 18.0, 12.0, 9.0, 5.0, 8.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3671875, -5.21148681640625, -5.0557861328125, -4.90008544921875, -4.744384765625, -4.58868408203125, -4.4329833984375, -4.27728271484375, -4.12158203125, -3.96588134765625, -3.8101806640625, -3.65447998046875, -3.498779296875, -3.34307861328125, -3.1873779296875, -3.03167724609375, -2.8759765625, -2.72027587890625, -2.5645751953125, -2.40887451171875, -2.253173828125, -2.09747314453125, -1.9417724609375, -1.78607177734375, -1.63037109375, -1.47467041015625, -1.3189697265625, -1.16326904296875, -1.007568359375, -0.85186767578125, -0.6961669921875, -0.54046630859375, -0.384765625, -0.22906494140625, -0.0733642578125, 0.08233642578125, 0.238037109375, 0.39373779296875, 0.5494384765625, 0.70513916015625, 0.86083984375, 1.01654052734375, 1.1722412109375, 1.32794189453125, 1.483642578125, 1.63934326171875, 1.7950439453125, 1.95074462890625, 2.1064453125, 2.26214599609375, 2.4178466796875, 2.57354736328125, 2.729248046875, 2.88494873046875, 3.0406494140625, 3.19635009765625, 3.35205078125, 3.50775146484375, 3.6634521484375, 3.81915283203125, 3.974853515625, 4.13055419921875, 4.2862548828125, 4.44195556640625, 4.59765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 7.0, 13.0, 16.0, 20.0, 23.0, 34.0, 41.0, 67.0, 68.0, 103.0, 129.0, 184.0, 244.0, 477.0, 1327.0, 6561.0, 62774.0, 1332953.0, 2658710.0, 116775.0, 10319.0, 1814.0, 594.0, 281.0, 191.0, 132.0, 93.0, 90.0, 67.0, 36.0, 35.0, 25.0, 19.0, 9.0, 8.0, 8.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.473876953125, -12.99462890625, -12.515380859375, -12.0361328125, -11.556884765625, -11.07763671875, -10.598388671875, -10.119140625, -9.639892578125, -9.16064453125, -8.681396484375, -8.2021484375, -7.722900390625, -7.24365234375, -6.764404296875, -6.28515625, -5.805908203125, -5.32666015625, -4.847412109375, -4.3681640625, -3.888916015625, -3.40966796875, -2.930419921875, -2.451171875, -1.971923828125, -1.49267578125, -1.013427734375, -0.5341796875, -0.054931640625, 0.42431640625, 0.903564453125, 1.3828125, 1.862060546875, 2.34130859375, 2.820556640625, 3.2998046875, 3.779052734375, 4.25830078125, 4.737548828125, 5.216796875, 5.696044921875, 6.17529296875, 6.654541015625, 7.1337890625, 7.613037109375, 8.09228515625, 8.571533203125, 9.05078125, 9.530029296875, 10.00927734375, 10.488525390625, 10.9677734375, 11.447021484375, 11.92626953125, 12.405517578125, 12.884765625, 13.364013671875, 13.84326171875, 14.322509765625, 14.8017578125, 15.281005859375, 15.76025390625, 16.239501953125, 16.71875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 12.0, 28.0, 41.0, 83.0, 146.0, 188.0, 187.0, 143.0, 92.0, 53.0, 16.0, 13.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.303102493286133, -10.067081451416016, -8.831060409545898, -7.595038890838623, -6.359017848968506, -5.122996807098389, -3.8869752883911133, -2.650954246520996, -1.414933204650879, -0.17891204357147217, 1.0571091175079346, 2.293130397796631, 3.529151439666748, 4.765172481536865, 6.001194000244141, 7.237215042114258, 8.473236083984375, 9.709257125854492, 10.94527816772461, 12.181299209594727, 13.417320251464844, 14.653341293334961, 15.889363288879395, 17.125385284423828, 18.361404418945312, 19.59742546081543, 20.833446502685547, 22.069467544555664, 23.30548858642578, 24.5415096282959, 25.777530670166016, 27.013553619384766, 28.249576568603516, 29.485597610473633, 30.72161865234375, 31.957639694213867, 33.193660736083984, 34.429683685302734, 35.66570281982422, 36.90172576904297, 38.13774490356445, 39.3737678527832, 40.60978698730469, 41.84580993652344, 43.08182907104492, 44.31785202026367, 45.553871154785156, 46.789894104003906, 48.025917053222656, 49.261940002441406, 50.49795913696289, 51.73398208618164, 52.970001220703125, 54.206024169921875, 55.44204330444336, 56.67806625366211, 57.914085388183594, 59.150108337402344, 60.38612747192383, 61.62215042114258, 62.85816955566406, 64.09419250488281, 65.33021545410156, 66.56623077392578, 67.80225372314453]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 3.0, 11.0, 16.0, 10.0, 13.0, 20.0, 12.0, 23.0, 19.0, 25.0, 24.0, 32.0, 31.0, 27.0, 35.0, 42.0, 37.0, 45.0, 50.0, 33.0, 40.0, 46.0, 38.0, 50.0, 38.0, 30.0, 33.0, 21.0, 35.0, 31.0, 21.0, 14.0, 11.0, 12.0, 12.0, 14.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.468196868896484, -15.89360237121582, -15.319007873535156, -14.744413375854492, -14.169818878173828, -13.595224380493164, -13.0206298828125, -12.446035385131836, -11.871440887451172, -11.296846389770508, -10.722251892089844, -10.14765739440918, -9.573062896728516, -8.998468399047852, -8.423873901367188, -7.849279880523682, -7.274685859680176, -6.700091361999512, -6.125496864318848, -5.550902366638184, -4.9763078689575195, -4.4017133712768555, -3.8271193504333496, -3.2525248527526855, -2.6779303550720215, -2.1033358573913574, -1.528741478919983, -0.9541471004486084, -0.37955260276794434, 0.19504189491271973, 0.7696361541748047, 1.3442306518554688, 1.9188251495361328, 2.493419647216797, 3.068014144897461, 3.642608404159546, 4.217203140258789, 4.791797637939453, 5.366391658782959, 5.940986156463623, 6.515580654144287, 7.090175151824951, 7.664769649505615, 8.239363670349121, 8.813958168029785, 9.38855266571045, 9.963147163391113, 10.537741661071777, 11.112336158752441, 11.686930656433105, 12.26152515411377, 12.836119651794434, 13.410714149475098, 13.985308647155762, 14.55990219116211, 15.134496688842773, 15.709091186523438, 16.2836856842041, 16.858280181884766, 17.43287467956543, 18.007469177246094, 18.582063674926758, 19.156658172607422, 19.731252670288086, 20.30584716796875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 4.0, 15.0, 10.0, 16.0, 20.0, 12.0, 17.0, 23.0, 22.0, 23.0, 31.0, 29.0, 40.0, 41.0, 25.0, 45.0, 55.0, 42.0, 39.0, 40.0, 39.0, 34.0, 48.0, 28.0, 45.0, 33.0, 33.0, 25.0, 22.0, 24.0, 16.0, 18.0, 16.0, 20.0, 15.0, 3.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.625, -3.514434814453125, -3.40386962890625, -3.293304443359375, -3.1827392578125, -3.072174072265625, -2.96160888671875, -2.851043701171875, -2.740478515625, -2.629913330078125, -2.51934814453125, -2.408782958984375, -2.2982177734375, -2.187652587890625, -2.07708740234375, -1.966522216796875, -1.85595703125, -1.745391845703125, -1.63482666015625, -1.524261474609375, -1.4136962890625, -1.303131103515625, -1.19256591796875, -1.082000732421875, -0.971435546875, -0.860870361328125, -0.75030517578125, -0.639739990234375, -0.5291748046875, -0.418609619140625, -0.30804443359375, -0.197479248046875, -0.0869140625, 0.023651123046875, 0.13421630859375, 0.244781494140625, 0.3553466796875, 0.465911865234375, 0.57647705078125, 0.687042236328125, 0.797607421875, 0.908172607421875, 1.01873779296875, 1.129302978515625, 1.2398681640625, 1.350433349609375, 1.46099853515625, 1.571563720703125, 1.68212890625, 1.792694091796875, 1.90325927734375, 2.013824462890625, 2.1243896484375, 2.234954833984375, 2.34552001953125, 2.456085205078125, 2.566650390625, 2.677215576171875, 2.78778076171875, 2.898345947265625, 3.0089111328125, 3.119476318359375, 3.23004150390625, 3.340606689453125, 3.451171875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 6.0, 8.0, 9.0, 12.0, 30.0, 35.0, 50.0, 74.0, 103.0, 161.0, 181.0, 296.0, 383.0, 606.0, 758.0, 1221.0, 1636.0, 2405.0, 3604.0, 5046.0, 7224.0, 10639.0, 15811.0, 24064.0, 35783.0, 56084.0, 92623.0, 181005.0, 264275.0, 131486.0, 73998.0, 45826.0, 30291.0, 20135.0, 13322.0, 9001.0, 6068.0, 4445.0, 3001.0, 2176.0, 1327.0, 981.0, 693.0, 528.0, 332.0, 242.0, 171.0, 108.0, 102.0, 61.0, 47.0, 32.0, 21.0, 12.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0], "bins": [-0.016387939453125, -0.015880346298217773, -0.015372753143310547, -0.01486515998840332, -0.014357566833496094, -0.013849973678588867, -0.01334238052368164, -0.012834787368774414, -0.012327194213867188, -0.011819601058959961, -0.011312007904052734, -0.010804414749145508, -0.010296821594238281, -0.009789228439331055, -0.009281635284423828, -0.008774042129516602, -0.008266448974609375, -0.0077588558197021484, -0.007251262664794922, -0.006743669509887695, -0.006236076354980469, -0.005728483200073242, -0.005220890045166016, -0.004713296890258789, -0.0042057037353515625, -0.003698110580444336, -0.0031905174255371094, -0.002682924270629883, -0.0021753311157226562, -0.0016677379608154297, -0.0011601448059082031, -0.0006525516510009766, -0.00014495849609375, 0.00036263465881347656, 0.0008702278137207031, 0.0013778209686279297, 0.0018854141235351562, 0.002393007278442383, 0.0029006004333496094, 0.003408193588256836, 0.0039157867431640625, 0.004423379898071289, 0.004930973052978516, 0.005438566207885742, 0.005946159362792969, 0.006453752517700195, 0.006961345672607422, 0.0074689388275146484, 0.007976531982421875, 0.008484125137329102, 0.008991718292236328, 0.009499311447143555, 0.010006904602050781, 0.010514497756958008, 0.011022090911865234, 0.011529684066772461, 0.012037277221679688, 0.012544870376586914, 0.01305246353149414, 0.013560056686401367, 0.014067649841308594, 0.01457524299621582, 0.015082836151123047, 0.015590429306030273, 0.0160980224609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 6.0, 8.0, 8.0, 16.0, 16.0, 18.0, 17.0, 22.0, 22.0, 25.0, 34.0, 42.0, 39.0, 42.0, 38.0, 58.0, 50.0, 1073.0, 40.0, 57.0, 47.0, 43.0, 56.0, 38.0, 29.0, 27.0, 18.0, 31.0, 19.0, 13.0, 16.0, 11.0, 8.0, 6.0, 7.0, 2.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4296875, -2.351715087890625, -2.27374267578125, -2.195770263671875, -2.1177978515625, -2.039825439453125, -1.96185302734375, -1.883880615234375, -1.805908203125, -1.727935791015625, -1.64996337890625, -1.571990966796875, -1.4940185546875, -1.416046142578125, -1.33807373046875, -1.260101318359375, -1.18212890625, -1.104156494140625, -1.02618408203125, -0.948211669921875, -0.8702392578125, -0.792266845703125, -0.71429443359375, -0.636322021484375, -0.558349609375, -0.480377197265625, -0.40240478515625, -0.324432373046875, -0.2464599609375, -0.168487548828125, -0.09051513671875, -0.012542724609375, 0.0654296875, 0.143402099609375, 0.22137451171875, 0.299346923828125, 0.3773193359375, 0.455291748046875, 0.53326416015625, 0.611236572265625, 0.689208984375, 0.767181396484375, 0.84515380859375, 0.923126220703125, 1.0010986328125, 1.079071044921875, 1.15704345703125, 1.235015869140625, 1.31298828125, 1.390960693359375, 1.46893310546875, 1.546905517578125, 1.6248779296875, 1.702850341796875, 1.78082275390625, 1.858795166015625, 1.936767578125, 2.014739990234375, 2.09271240234375, 2.170684814453125, 2.2486572265625, 2.326629638671875, 2.40460205078125, 2.482574462890625, 2.560546875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 9.0, 16.0, 14.0, 24.0, 30.0, 52.0, 77.0, 109.0, 156.0, 270.0, 338.0, 542.0, 858.0, 1196.0, 2023.0, 3131.0, 4907.0, 7938.0, 12719.0, 21932.0, 37702.0, 70248.0, 147672.0, 1389621.0, 197703.0, 86475.0, 45386.0, 25706.0, 15262.0, 9143.0, 5855.0, 3469.0, 2287.0, 1481.0, 919.0, 597.0, 440.0, 292.0, 197.0, 111.0, 78.0, 51.0, 34.0, 24.0, 15.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01522064208984375, -0.014754533767700195, -0.01428842544555664, -0.013822317123413086, -0.013356208801269531, -0.012890100479125977, -0.012423992156982422, -0.011957883834838867, -0.011491775512695312, -0.011025667190551758, -0.010559558868408203, -0.010093450546264648, -0.009627342224121094, -0.009161233901977539, -0.008695125579833984, -0.00822901725769043, -0.007762908935546875, -0.00729680061340332, -0.006830692291259766, -0.006364583969116211, -0.005898475646972656, -0.0054323673248291016, -0.004966259002685547, -0.004500150680541992, -0.0040340423583984375, -0.003567934036254883, -0.003101825714111328, -0.0026357173919677734, -0.0021696090698242188, -0.001703500747680664, -0.0012373924255371094, -0.0007712841033935547, -0.00030517578125, 0.0001609325408935547, 0.0006270408630371094, 0.001093149185180664, 0.0015592575073242188, 0.0020253658294677734, 0.002491474151611328, 0.002957582473754883, 0.0034236907958984375, 0.003889799118041992, 0.004355907440185547, 0.0048220157623291016, 0.005288124084472656, 0.005754232406616211, 0.006220340728759766, 0.00668644905090332, 0.007152557373046875, 0.00761866569519043, 0.008084774017333984, 0.008550882339477539, 0.009016990661621094, 0.009483098983764648, 0.009949207305908203, 0.010415315628051758, 0.010881423950195312, 0.011347532272338867, 0.011813640594482422, 0.012279748916625977, 0.012745857238769531, 0.013211965560913086, 0.01367807388305664, 0.014144182205200195, 0.01461029052734375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 119.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 717.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 134.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.300366759300232e-07, -2.2165477275848389e-07, -2.1327286958694458e-07, -2.0489096641540527e-07, -1.9650906324386597e-07, -1.8812716007232666e-07, -1.7974525690078735e-07, -1.7136335372924805e-07, -1.6298145055770874e-07, -1.5459954738616943e-07, -1.4621764421463013e-07, -1.3783574104309082e-07, -1.2945383787155151e-07, -1.210719347000122e-07, -1.126900315284729e-07, -1.043081283569336e-07, -9.592622518539429e-08, -8.754432201385498e-08, -7.916241884231567e-08, -7.078051567077637e-08, -6.239861249923706e-08, -5.4016709327697754e-08, -4.563480615615845e-08, -3.725290298461914e-08, -2.8870999813079834e-08, -2.0489096641540527e-08, -1.210719347000122e-08, -3.725290298461914e-09, 4.6566128730773926e-09, 1.30385160446167e-08, 2.1420419216156006e-08, 2.9802322387695312e-08, 3.818422555923462e-08, 4.6566128730773926e-08, 5.494803190231323e-08, 6.332993507385254e-08, 7.171183824539185e-08, 8.009374141693115e-08, 8.847564458847046e-08, 9.685754776000977e-08, 1.0523945093154907e-07, 1.1362135410308838e-07, 1.2200325727462769e-07, 1.30385160446167e-07, 1.387670636177063e-07, 1.471489667892456e-07, 1.555308699607849e-07, 1.6391277313232422e-07, 1.7229467630386353e-07, 1.8067657947540283e-07, 1.8905848264694214e-07, 1.9744038581848145e-07, 2.0582228899002075e-07, 2.1420419216156006e-07, 2.2258609533309937e-07, 2.3096799850463867e-07, 2.39349901676178e-07, 2.477318048477173e-07, 2.561137080192566e-07, 2.644956111907959e-07, 2.728775143623352e-07, 2.812594175338745e-07, 2.896413207054138e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 10.0, 5.0, 2.0, 0.0, 4.0, 1.0, 17.0, 60.0, 77.0, 6.0, 6.0, 91.0, 113.0, 273.0, 8753.0, 1029750.0, 8736.0, 284.0, 103.0, 91.0, 5.0, 36.0, 88.0, 16.0, 2.0, 7.0, 1.0, 0.0, 3.0, 7.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.258487701416016e-06, -6.081536412239075e-06, -5.904585123062134e-06, -5.727633833885193e-06, -5.550682544708252e-06, -5.373731255531311e-06, -5.19677996635437e-06, -5.019828677177429e-06, -4.842877388000488e-06, -4.665926098823547e-06, -4.4889748096466064e-06, -4.3120235204696655e-06, -4.135072231292725e-06, -3.958120942115784e-06, -3.7811696529388428e-06, -3.604218363761902e-06, -3.427267074584961e-06, -3.25031578540802e-06, -3.073364496231079e-06, -2.896413207054138e-06, -2.7194619178771973e-06, -2.5425106287002563e-06, -2.3655593395233154e-06, -2.1886080503463745e-06, -2.0116567611694336e-06, -1.8347054719924927e-06, -1.6577541828155518e-06, -1.4808028936386108e-06, -1.30385160446167e-06, -1.126900315284729e-06, -9.499490261077881e-07, -7.729977369308472e-07, -5.960464477539062e-07, -4.1909515857696533e-07, -2.421438694000244e-07, -6.51925802230835e-08, 1.1175870895385742e-07, 2.8870999813079834e-07, 4.6566128730773926e-07, 6.426125764846802e-07, 8.195638656616211e-07, 9.96515154838562e-07, 1.173466444015503e-06, 1.3504177331924438e-06, 1.5273690223693848e-06, 1.7043203115463257e-06, 1.8812716007232666e-06, 2.0582228899002075e-06, 2.2351741790771484e-06, 2.4121254682540894e-06, 2.5890767574310303e-06, 2.766028046607971e-06, 2.942979335784912e-06, 3.119930624961853e-06, 3.296881914138794e-06, 3.473833203315735e-06, 3.6507844924926758e-06, 3.827735781669617e-06, 4.004687070846558e-06, 4.1816383600234985e-06, 4.3585896492004395e-06, 4.53554093837738e-06, 4.712492227554321e-06, 4.889443516731262e-06, 5.066394805908203e-06]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1004.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.492702908644787e-08, -5.963182303503345e-08, -5.4336616983619024e-08, -4.90414109322046e-08, -4.3746204880790174e-08, -3.845099882937575e-08, -3.3155792777961324e-08, -2.78605867265469e-08, -2.2565380675132474e-08, -1.727017462371805e-08, -1.1974968572303624e-08, -6.679762520889199e-09, -1.3845564694747736e-09, 3.910649581939651e-09, 9.205855633354076e-09, 1.4501061684768501e-08, 1.9796267736182926e-08, 2.509147378759735e-08, 3.0386679839011776e-08, 3.56818858904262e-08, 4.0977091941840627e-08, 4.627229799325505e-08, 5.1567504044669477e-08, 5.68627100960839e-08, 6.215791614749833e-08, 6.745312219891275e-08, 7.274832825032718e-08, 7.80435343017416e-08, 8.333874035315603e-08, 8.863394640457045e-08, 9.392915245598488e-08, 9.92243585073993e-08, 1.0451955745338637e-07, 1.098147635048008e-07, 1.1510996955621522e-07, 1.2040517560762964e-07, 1.2570038165904407e-07, 1.309955877104585e-07, 1.3629079376187292e-07, 1.4158599981328734e-07, 1.4688120586470177e-07, 1.521764119161162e-07, 1.5747161796753062e-07, 1.6276682401894504e-07, 1.6806203007035947e-07, 1.733572361217739e-07, 1.7865244217318832e-07, 1.8394764822460274e-07, 1.8924285427601717e-07, 1.945380603274316e-07, 1.9983326637884602e-07, 2.0512847243026044e-07, 2.1042367848167487e-07, 2.157188845330893e-07, 2.2101409058450372e-07, 2.2630929663591814e-07, 2.3160450268733257e-07, 2.36899708738747e-07, 2.421949147901614e-07, 2.4749010663072113e-07, 2.5278532689299027e-07, 2.580805471552594e-07, 2.633757389958191e-07, 2.6867093083637883e-07, 2.7396615109864797e-07]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1005.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0], "bins": [-5.960464477539063e-08, -5.774199962615967e-08, -5.587935447692871e-08, -5.4016709327697754e-08, -5.21540641784668e-08, -5.029141902923584e-08, -4.842877388000488e-08, -4.6566128730773926e-08, -4.470348358154297e-08, -4.284083843231201e-08, -4.0978193283081055e-08, -3.91155481338501e-08, -3.725290298461914e-08, -3.5390257835388184e-08, -3.3527612686157227e-08, -3.166496753692627e-08, -2.9802322387695312e-08, -2.7939677238464355e-08, -2.60770320892334e-08, -2.421438694000244e-08, -2.2351741790771484e-08, -2.0489096641540527e-08, -1.862645149230957e-08, -1.6763806343078613e-08, -1.4901161193847656e-08, -1.30385160446167e-08, -1.1175870895385742e-08, -9.313225746154785e-09, -7.450580596923828e-09, -5.587935447692871e-09, -3.725290298461914e-09, -1.862645149230957e-09, 0.0, 1.862645149230957e-09, 3.725290298461914e-09, 5.587935447692871e-09, 7.450580596923828e-09, 9.313225746154785e-09, 1.1175870895385742e-08, 1.30385160446167e-08, 1.4901161193847656e-08, 1.6763806343078613e-08, 1.862645149230957e-08, 2.0489096641540527e-08, 2.2351741790771484e-08, 2.421438694000244e-08, 2.60770320892334e-08, 2.7939677238464355e-08, 2.9802322387695312e-08, 3.166496753692627e-08, 3.3527612686157227e-08, 3.5390257835388184e-08, 3.725290298461914e-08, 3.91155481338501e-08, 4.0978193283081055e-08, 4.284083843231201e-08, 4.470348358154297e-08, 4.6566128730773926e-08, 4.842877388000488e-08, 5.029141902923584e-08, 5.21540641784668e-08, 5.4016709327697754e-08, 5.587935447692871e-08, 5.774199962615967e-08, 5.960464477539063e-08]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 4.0, 15.0, 10.0, 16.0, 20.0, 12.0, 17.0, 23.0, 22.0, 23.0, 31.0, 29.0, 40.0, 41.0, 25.0, 45.0, 55.0, 42.0, 39.0, 40.0, 39.0, 34.0, 48.0, 28.0, 45.0, 33.0, 33.0, 25.0, 22.0, 24.0, 16.0, 18.0, 16.0, 20.0, 15.0, 3.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.625, -3.514434814453125, -3.40386962890625, -3.293304443359375, -3.1827392578125, -3.072174072265625, -2.96160888671875, -2.851043701171875, -2.740478515625, -2.629913330078125, -2.51934814453125, -2.408782958984375, -2.2982177734375, -2.187652587890625, -2.07708740234375, -1.966522216796875, -1.85595703125, -1.745391845703125, -1.63482666015625, -1.524261474609375, -1.4136962890625, -1.303131103515625, -1.19256591796875, -1.082000732421875, -0.971435546875, -0.860870361328125, -0.75030517578125, -0.639739990234375, -0.5291748046875, -0.418609619140625, -0.30804443359375, -0.197479248046875, -0.0869140625, 0.023651123046875, 0.13421630859375, 0.244781494140625, 0.3553466796875, 0.465911865234375, 0.57647705078125, 0.687042236328125, 0.797607421875, 0.908172607421875, 1.01873779296875, 1.129302978515625, 1.2398681640625, 1.350433349609375, 1.46099853515625, 1.571563720703125, 1.68212890625, 1.792694091796875, 1.90325927734375, 2.013824462890625, 2.1243896484375, 2.234954833984375, 2.34552001953125, 2.456085205078125, 2.566650390625, 2.677215576171875, 2.78778076171875, 2.898345947265625, 3.0089111328125, 3.119476318359375, 3.23004150390625, 3.340606689453125, 3.451171875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 11.0, 0.0, 7.0, 8.0, 6.0, 24.0, 25.0, 38.0, 36.0, 50.0, 73.0, 92.0, 140.0, 188.0, 275.0, 521.0, 1042.0, 2021.0, 4326.0, 10607.0, 26822.0, 83991.0, 682849.0, 168543.0, 39908.0, 15031.0, 5978.0, 2722.0, 1330.0, 705.0, 401.0, 197.0, 136.0, 111.0, 72.0, 59.0, 44.0, 50.0, 34.0, 16.0, 17.0, 9.0, 9.0, 9.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.890625, -6.67987060546875, -6.4691162109375, -6.25836181640625, -6.047607421875, -5.83685302734375, -5.6260986328125, -5.41534423828125, -5.20458984375, -4.99383544921875, -4.7830810546875, -4.57232666015625, -4.361572265625, -4.15081787109375, -3.9400634765625, -3.72930908203125, -3.5185546875, -3.30780029296875, -3.0970458984375, -2.88629150390625, -2.675537109375, -2.46478271484375, -2.2540283203125, -2.04327392578125, -1.83251953125, -1.62176513671875, -1.4110107421875, -1.20025634765625, -0.989501953125, -0.77874755859375, -0.5679931640625, -0.35723876953125, -0.146484375, 0.06427001953125, 0.2750244140625, 0.48577880859375, 0.696533203125, 0.90728759765625, 1.1180419921875, 1.32879638671875, 1.53955078125, 1.75030517578125, 1.9610595703125, 2.17181396484375, 2.382568359375, 2.59332275390625, 2.8040771484375, 3.01483154296875, 3.2255859375, 3.43634033203125, 3.6470947265625, 3.85784912109375, 4.068603515625, 4.27935791015625, 4.4901123046875, 4.70086669921875, 4.91162109375, 5.12237548828125, 5.3331298828125, 5.54388427734375, 5.754638671875, 5.96539306640625, 6.1761474609375, 6.38690185546875, 6.59765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 9.0, 2.0, 2.0, 13.0, 11.0, 10.0, 24.0, 16.0, 30.0, 20.0, 30.0, 30.0, 45.0, 40.0, 49.0, 58.0, 61.0, 114.0, 1542.0, 401.0, 97.0, 52.0, 52.0, 47.0, 33.0, 43.0, 27.0, 30.0, 37.0, 25.0, 17.0, 25.0, 10.0, 6.0, 12.0, 9.0, 6.0, 7.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.9609375, -11.6185302734375, -11.276123046875, -10.9337158203125, -10.59130859375, -10.2489013671875, -9.906494140625, -9.5640869140625, -9.2216796875, -8.8792724609375, -8.536865234375, -8.1944580078125, -7.85205078125, -7.5096435546875, -7.167236328125, -6.8248291015625, -6.482421875, -6.1400146484375, -5.797607421875, -5.4552001953125, -5.11279296875, -4.7703857421875, -4.427978515625, -4.0855712890625, -3.7431640625, -3.4007568359375, -3.058349609375, -2.7159423828125, -2.37353515625, -2.0311279296875, -1.688720703125, -1.3463134765625, -1.00390625, -0.6614990234375, -0.319091796875, 0.0233154296875, 0.36572265625, 0.7081298828125, 1.050537109375, 1.3929443359375, 1.7353515625, 2.0777587890625, 2.420166015625, 2.7625732421875, 3.10498046875, 3.4473876953125, 3.789794921875, 4.1322021484375, 4.474609375, 4.8170166015625, 5.159423828125, 5.5018310546875, 5.84423828125, 6.1866455078125, 6.529052734375, 6.8714599609375, 7.2138671875, 7.5562744140625, 7.898681640625, 8.2410888671875, 8.58349609375, 8.9259033203125, 9.268310546875, 9.6107177734375, 9.953125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 4.0, 7.0, 14.0, 11.0, 17.0, 29.0, 15.0, 30.0, 40.0, 46.0, 56.0, 91.0, 113.0, 188.0, 343.0, 1026.0, 10175.0, 713567.0, 2404028.0, 13559.0, 1296.0, 363.0, 214.0, 120.0, 79.0, 53.0, 42.0, 35.0, 34.0, 28.0, 14.0, 18.0, 10.0, 12.0, 3.0, 3.0, 10.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.17578125, -18.4921875, -17.80859375, -17.125, -16.44140625, -15.7578125, -15.07421875, -14.390625, -13.70703125, -13.0234375, -12.33984375, -11.65625, -10.97265625, -10.2890625, -9.60546875, -8.921875, -8.23828125, -7.5546875, -6.87109375, -6.1875, -5.50390625, -4.8203125, -4.13671875, -3.453125, -2.76953125, -2.0859375, -1.40234375, -0.71875, -0.03515625, 0.6484375, 1.33203125, 2.015625, 2.69921875, 3.3828125, 4.06640625, 4.75, 5.43359375, 6.1171875, 6.80078125, 7.484375, 8.16796875, 8.8515625, 9.53515625, 10.21875, 10.90234375, 11.5859375, 12.26953125, 12.953125, 13.63671875, 14.3203125, 15.00390625, 15.6875, 16.37109375, 17.0546875, 17.73828125, 18.421875, 19.10546875, 19.7890625, 20.47265625, 21.15625, 21.83984375, 22.5234375, 23.20703125, 23.890625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 14.0, 31.0, 63.0, 181.0, 247.0, 248.0, 142.0, 61.0, 18.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.3286018371582, -34.506431579589844, -33.684261322021484, -32.862091064453125, -32.039920806884766, -31.21775245666504, -30.39558219909668, -29.573413848876953, -28.751243591308594, -27.929073333740234, -27.106903076171875, -26.28473472595215, -25.46256446838379, -24.64039421081543, -23.81822395324707, -22.996055603027344, -22.173885345458984, -21.351715087890625, -20.529544830322266, -19.70737648010254, -18.88520622253418, -18.06303596496582, -17.24086570739746, -16.418697357177734, -15.596525192260742, -14.774354934692383, -13.95218563079834, -13.13001537322998, -12.307846069335938, -11.485675811767578, -10.663505554199219, -9.841336250305176, -9.019166946411133, -8.196996688842773, -7.3748273849487305, -6.552657127380371, -5.730487823486328, -4.908317565917969, -4.086147785186768, -3.2639780044555664, -2.4418082237243652, -1.619638442993164, -0.7974685430526733, 0.024701356887817383, 0.8468711376190186, 1.6690411567687988, 2.4912109375, 3.313380718231201, 4.135550498962402, 4.9577202796936035, 5.779890060424805, 6.602060317993164, 7.424229621887207, 8.246399879455566, 9.06856918334961, 9.890739440917969, 10.712909698486328, 11.535079956054688, 12.35724925994873, 13.17941951751709, 14.001588821411133, 14.823759078979492, 15.645929336547852, 16.468097686767578, 17.290267944335938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 10.0, 17.0, 11.0, 23.0, 28.0, 20.0, 37.0, 25.0, 38.0, 34.0, 35.0, 53.0, 52.0, 38.0, 48.0, 42.0, 39.0, 45.0, 38.0, 48.0, 35.0, 35.0, 41.0, 29.0, 30.0, 21.0, 14.0, 15.0, 14.0, 14.0, 11.0, 13.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.01033592224121, -29.10943031311035, -28.208524703979492, -27.3076171875, -26.40671157836914, -25.50580596923828, -24.604900360107422, -23.703994750976562, -22.803089141845703, -21.902183532714844, -21.001277923583984, -20.100372314453125, -19.199464797973633, -18.298559188842773, -17.397653579711914, -16.496747970581055, -15.595840454101562, -14.694934844970703, -13.794028282165527, -12.893122673034668, -11.992216110229492, -11.091310501098633, -10.190404891967773, -9.289499282836914, -8.388592720031738, -7.487686634063721, -6.586780548095703, -5.685874938964844, -4.784968852996826, -3.8840627670288086, -2.983157157897949, -2.0822510719299316, -1.1813430786132812, -0.2804371118545532, 0.6204688549041748, 1.5213747024536133, 2.422280788421631, 3.3231868743896484, 4.224092483520508, 5.124998569488525, 6.025904655456543, 6.9268107414245605, 7.827716827392578, 8.728622436523438, 9.629528045654297, 10.530434608459473, 11.431340217590332, 12.332246780395508, 13.233152389526367, 14.134057998657227, 15.034964561462402, 15.935870170593262, 16.836776733398438, 17.737682342529297, 18.638587951660156, 19.539493560791016, 20.440399169921875, 21.341304779052734, 22.242210388183594, 23.143115997314453, 24.044023513793945, 24.944929122924805, 25.845834732055664, 26.746740341186523, 27.647647857666016]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 6.0, 11.0, 7.0, 15.0, 19.0, 10.0, 22.0, 18.0, 19.0, 24.0, 29.0, 27.0, 30.0, 35.0, 37.0, 37.0, 34.0, 43.0, 41.0, 49.0, 37.0, 42.0, 39.0, 39.0, 36.0, 36.0, 27.0, 31.0, 30.0, 27.0, 24.0, 17.0, 14.0, 16.0, 14.0, 9.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.50390625, -3.393096923828125, -3.28228759765625, -3.171478271484375, -3.0606689453125, -2.949859619140625, -2.83905029296875, -2.728240966796875, -2.617431640625, -2.506622314453125, -2.39581298828125, -2.285003662109375, -2.1741943359375, -2.063385009765625, -1.95257568359375, -1.841766357421875, -1.73095703125, -1.620147705078125, -1.50933837890625, -1.398529052734375, -1.2877197265625, -1.176910400390625, -1.06610107421875, -0.955291748046875, -0.844482421875, -0.733673095703125, -0.62286376953125, -0.512054443359375, -0.4012451171875, -0.290435791015625, -0.17962646484375, -0.068817138671875, 0.0419921875, 0.152801513671875, 0.26361083984375, 0.374420166015625, 0.4852294921875, 0.596038818359375, 0.70684814453125, 0.817657470703125, 0.928466796875, 1.039276123046875, 1.15008544921875, 1.260894775390625, 1.3717041015625, 1.482513427734375, 1.59332275390625, 1.704132080078125, 1.81494140625, 1.925750732421875, 2.03656005859375, 2.147369384765625, 2.2581787109375, 2.368988037109375, 2.47979736328125, 2.590606689453125, 2.701416015625, 2.812225341796875, 2.92303466796875, 3.033843994140625, 3.1446533203125, 3.255462646484375, 3.36627197265625, 3.477081298828125, 3.587890625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 8.0, 7.0, 9.0, 15.0, 18.0, 24.0, 40.0, 50.0, 98.0, 181.0, 317.0, 595.0, 1354.0, 3054.0, 7793.0, 22460.0, 76467.0, 364329.0, 2091854.0, 1338226.0, 209682.0, 50908.0, 16085.0, 5997.0, 2393.0, 1069.0, 571.0, 275.0, 135.0, 87.0, 37.0, 50.0, 17.0, 24.0, 13.0, 13.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.0703125, -7.84515380859375, -7.6199951171875, -7.39483642578125, -7.169677734375, -6.94451904296875, -6.7193603515625, -6.49420166015625, -6.26904296875, -6.04388427734375, -5.8187255859375, -5.59356689453125, -5.368408203125, -5.14324951171875, -4.9180908203125, -4.69293212890625, -4.4677734375, -4.24261474609375, -4.0174560546875, -3.79229736328125, -3.567138671875, -3.34197998046875, -3.1168212890625, -2.89166259765625, -2.66650390625, -2.44134521484375, -2.2161865234375, -1.99102783203125, -1.765869140625, -1.54071044921875, -1.3155517578125, -1.09039306640625, -0.865234375, -0.64007568359375, -0.4149169921875, -0.18975830078125, 0.035400390625, 0.26055908203125, 0.4857177734375, 0.71087646484375, 0.93603515625, 1.16119384765625, 1.3863525390625, 1.61151123046875, 1.836669921875, 2.06182861328125, 2.2869873046875, 2.51214599609375, 2.7373046875, 2.96246337890625, 3.1876220703125, 3.41278076171875, 3.637939453125, 3.86309814453125, 4.0882568359375, 4.31341552734375, 4.53857421875, 4.76373291015625, 4.9888916015625, 5.21405029296875, 5.439208984375, 5.66436767578125, 5.8895263671875, 6.11468505859375, 6.33984375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 7.0, 8.0, 18.0, 22.0, 20.0, 21.0, 43.0, 55.0, 70.0, 88.0, 117.0, 129.0, 218.0, 268.0, 299.0, 386.0, 452.0, 397.0, 310.0, 261.0, 202.0, 144.0, 112.0, 88.0, 70.0, 67.0, 40.0, 31.0, 33.0, 19.0, 13.0, 17.0, 10.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.87109375, -4.71136474609375, -4.5516357421875, -4.39190673828125, -4.232177734375, -4.07244873046875, -3.9127197265625, -3.75299072265625, -3.59326171875, -3.43353271484375, -3.2738037109375, -3.11407470703125, -2.954345703125, -2.79461669921875, -2.6348876953125, -2.47515869140625, -2.3154296875, -2.15570068359375, -1.9959716796875, -1.83624267578125, -1.676513671875, -1.51678466796875, -1.3570556640625, -1.19732666015625, -1.03759765625, -0.87786865234375, -0.7181396484375, -0.55841064453125, -0.398681640625, -0.23895263671875, -0.0792236328125, 0.08050537109375, 0.240234375, 0.39996337890625, 0.5596923828125, 0.71942138671875, 0.879150390625, 1.03887939453125, 1.1986083984375, 1.35833740234375, 1.51806640625, 1.67779541015625, 1.8375244140625, 1.99725341796875, 2.156982421875, 2.31671142578125, 2.4764404296875, 2.63616943359375, 2.7958984375, 2.95562744140625, 3.1153564453125, 3.27508544921875, 3.434814453125, 3.59454345703125, 3.7542724609375, 3.91400146484375, 4.07373046875, 4.23345947265625, 4.3931884765625, 4.55291748046875, 4.712646484375, 4.87237548828125, 5.0321044921875, 5.19183349609375, 5.3515625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 10.0, 9.0, 8.0, 18.0, 18.0, 21.0, 22.0, 37.0, 60.0, 51.0, 76.0, 113.0, 153.0, 179.0, 295.0, 647.0, 2187.0, 10393.0, 77808.0, 1108773.0, 2788851.0, 178739.0, 19953.0, 3698.0, 930.0, 413.0, 208.0, 154.0, 108.0, 92.0, 57.0, 41.0, 35.0, 33.0, 26.0, 10.0, 10.0, 12.0, 11.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.140625, -13.68701171875, -13.2333984375, -12.77978515625, -12.326171875, -11.87255859375, -11.4189453125, -10.96533203125, -10.51171875, -10.05810546875, -9.6044921875, -9.15087890625, -8.697265625, -8.24365234375, -7.7900390625, -7.33642578125, -6.8828125, -6.42919921875, -5.9755859375, -5.52197265625, -5.068359375, -4.61474609375, -4.1611328125, -3.70751953125, -3.25390625, -2.80029296875, -2.3466796875, -1.89306640625, -1.439453125, -0.98583984375, -0.5322265625, -0.07861328125, 0.375, 0.82861328125, 1.2822265625, 1.73583984375, 2.189453125, 2.64306640625, 3.0966796875, 3.55029296875, 4.00390625, 4.45751953125, 4.9111328125, 5.36474609375, 5.818359375, 6.27197265625, 6.7255859375, 7.17919921875, 7.6328125, 8.08642578125, 8.5400390625, 8.99365234375, 9.447265625, 9.90087890625, 10.3544921875, 10.80810546875, 11.26171875, 11.71533203125, 12.1689453125, 12.62255859375, 13.076171875, 13.52978515625, 13.9833984375, 14.43701171875, 14.890625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 13.0, 22.0, 30.0, 41.0, 52.0, 71.0, 82.0, 86.0, 86.0, 115.0, 89.0, 79.0, 76.0, 42.0, 31.0, 31.0, 20.0, 16.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.477941513061523, -24.74338150024414, -24.00882339477539, -23.274263381958008, -22.539703369140625, -21.805143356323242, -21.070585250854492, -20.33602523803711, -19.601465225219727, -18.866905212402344, -18.132347106933594, -17.39778709411621, -16.663227081298828, -15.928668022155762, -15.194108963012695, -14.459548950195312, -13.724989891052246, -12.99043083190918, -12.255870819091797, -11.52131175994873, -10.786751747131348, -10.052192687988281, -9.317632675170898, -8.583073616027832, -7.848514080047607, -7.113954544067383, -6.379395008087158, -5.644835472106934, -4.910276412963867, -4.175716400146484, -3.441157341003418, -2.7065978050231934, -1.9720382690429688, -1.2374787330627441, -0.5029193162918091, 0.23164010047912598, 0.9661996364593506, 1.7007591724395752, 2.4353184700012207, 3.1698780059814453, 3.90443754196167, 4.6389970779418945, 5.373556613922119, 6.108116149902344, 6.84267520904541, 7.577235221862793, 8.31179428100586, 9.046354293823242, 9.780913352966309, 10.515472412109375, 11.250032424926758, 11.984591484069824, 12.719151496887207, 13.453710556030273, 14.188270568847656, 14.922829627990723, 15.657388687133789, 16.391948699951172, 17.126506805419922, 17.861066818237305, 18.595626831054688, 19.33018684387207, 20.06474494934082, 20.799304962158203, 21.533864974975586]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 5.0, 10.0, 16.0, 11.0, 12.0, 12.0, 16.0, 16.0, 23.0, 22.0, 22.0, 37.0, 24.0, 35.0, 40.0, 35.0, 36.0, 50.0, 44.0, 37.0, 48.0, 45.0, 32.0, 35.0, 36.0, 46.0, 28.0, 34.0, 35.0, 28.0, 17.0, 11.0, 16.0, 20.0, 12.0, 14.0, 7.0, 10.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-21.35034942626953, -20.72182846069336, -20.093305587768555, -19.464784622192383, -18.836261749267578, -18.207740783691406, -17.5792179107666, -16.95069694519043, -16.322174072265625, -15.693652153015137, -15.065130233764648, -14.43660831451416, -13.808086395263672, -13.1795654296875, -12.551043510437012, -11.922521591186523, -11.294000625610352, -10.665478706359863, -10.036956787109375, -9.408434867858887, -8.779912948608398, -8.151391983032227, -7.522870063781738, -6.89434814453125, -6.265826225280762, -5.637304306030273, -5.008782386779785, -4.380260944366455, -3.751739025115967, -3.1232171058654785, -2.4946954250335693, -1.8661737442016602, -1.2376518249511719, -0.6091300249099731, 0.019391775131225586, 0.6479135751724243, 1.276435375213623, 1.9049572944641113, 2.5334789752960205, 3.1620006561279297, 3.790522575378418, 4.419044494628906, 5.0475664138793945, 5.676087856292725, 6.304609775543213, 6.933131694793701, 7.561653137207031, 8.19017505645752, 8.818696975708008, 9.447218894958496, 10.075740814208984, 10.704262733459473, 11.332784652709961, 11.961305618286133, 12.589827537536621, 13.21834945678711, 13.846871376037598, 14.475393295288086, 15.103915214538574, 15.732437133789062, 16.360958099365234, 16.98948097229004, 17.61800193786621, 18.246524810791016, 18.875045776367188]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 8.0, 8.0, 9.0, 19.0, 16.0, 21.0, 22.0, 16.0, 34.0, 23.0, 39.0, 37.0, 48.0, 41.0, 43.0, 36.0, 49.0, 43.0, 50.0, 47.0, 50.0, 39.0, 41.0, 32.0, 26.0, 34.0, 28.0, 19.0, 15.0, 20.0, 11.0, 13.0, 14.0, 11.0, 11.0, 5.0, 11.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.9375, -3.81298828125, -3.6884765625, -3.56396484375, -3.439453125, -3.31494140625, -3.1904296875, -3.06591796875, -2.94140625, -2.81689453125, -2.6923828125, -2.56787109375, -2.443359375, -2.31884765625, -2.1943359375, -2.06982421875, -1.9453125, -1.82080078125, -1.6962890625, -1.57177734375, -1.447265625, -1.32275390625, -1.1982421875, -1.07373046875, -0.94921875, -0.82470703125, -0.7001953125, -0.57568359375, -0.451171875, -0.32666015625, -0.2021484375, -0.07763671875, 0.046875, 0.17138671875, 0.2958984375, 0.42041015625, 0.544921875, 0.66943359375, 0.7939453125, 0.91845703125, 1.04296875, 1.16748046875, 1.2919921875, 1.41650390625, 1.541015625, 1.66552734375, 1.7900390625, 1.91455078125, 2.0390625, 2.16357421875, 2.2880859375, 2.41259765625, 2.537109375, 2.66162109375, 2.7861328125, 2.91064453125, 3.03515625, 3.15966796875, 3.2841796875, 3.40869140625, 3.533203125, 3.65771484375, 3.7822265625, 3.90673828125, 4.03125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 9.0, 15.0, 14.0, 27.0, 42.0, 50.0, 70.0, 110.0, 183.0, 293.0, 544.0, 949.0, 1673.0, 2784.0, 5041.0, 9262.0, 17215.0, 32718.0, 67378.0, 166938.0, 427891.0, 172627.0, 69866.0, 33304.0, 17802.0, 9638.0, 5358.0, 2895.0, 1554.0, 908.0, 500.0, 336.0, 226.0, 110.0, 90.0, 49.0, 28.0, 20.0, 17.0, 8.0, 1.0, 8.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0296630859375, -0.028750896453857422, -0.027838706970214844, -0.026926517486572266, -0.026014328002929688, -0.02510213851928711, -0.02418994903564453, -0.023277759552001953, -0.022365570068359375, -0.021453380584716797, -0.02054119110107422, -0.01962900161743164, -0.018716812133789062, -0.017804622650146484, -0.016892433166503906, -0.015980243682861328, -0.01506805419921875, -0.014155864715576172, -0.013243675231933594, -0.012331485748291016, -0.011419296264648438, -0.01050710678100586, -0.009594917297363281, -0.008682727813720703, -0.007770538330078125, -0.006858348846435547, -0.005946159362792969, -0.005033969879150391, -0.0041217803955078125, -0.0032095909118652344, -0.0022974014282226562, -0.0013852119445800781, -0.0004730224609375, 0.0004391670227050781, 0.0013513565063476562, 0.0022635459899902344, 0.0031757354736328125, 0.004087924957275391, 0.005000114440917969, 0.005912303924560547, 0.006824493408203125, 0.007736682891845703, 0.008648872375488281, 0.00956106185913086, 0.010473251342773438, 0.011385440826416016, 0.012297630310058594, 0.013209819793701172, 0.01412200927734375, 0.015034198760986328, 0.015946388244628906, 0.016858577728271484, 0.017770767211914062, 0.01868295669555664, 0.01959514617919922, 0.020507335662841797, 0.021419525146484375, 0.022331714630126953, 0.02324390411376953, 0.02415609359741211, 0.025068283081054688, 0.025980472564697266, 0.026892662048339844, 0.027804851531982422, 0.028717041015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 7.0, 10.0, 10.0, 17.0, 11.0, 14.0, 17.0, 14.0, 25.0, 26.0, 23.0, 27.0, 38.0, 37.0, 33.0, 36.0, 38.0, 33.0, 46.0, 1064.0, 40.0, 38.0, 49.0, 40.0, 37.0, 34.0, 32.0, 22.0, 24.0, 23.0, 24.0, 17.0, 21.0, 16.0, 15.0, 12.0, 12.0, 6.0, 4.0, 6.0, 4.0, 2.0, 7.0, 2.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.16015625, -2.087646484375, -2.01513671875, -1.942626953125, -1.8701171875, -1.797607421875, -1.72509765625, -1.652587890625, -1.580078125, -1.507568359375, -1.43505859375, -1.362548828125, -1.2900390625, -1.217529296875, -1.14501953125, -1.072509765625, -1.0, -0.927490234375, -0.85498046875, -0.782470703125, -0.7099609375, -0.637451171875, -0.56494140625, -0.492431640625, -0.419921875, -0.347412109375, -0.27490234375, -0.202392578125, -0.1298828125, -0.057373046875, 0.01513671875, 0.087646484375, 0.16015625, 0.232666015625, 0.30517578125, 0.377685546875, 0.4501953125, 0.522705078125, 0.59521484375, 0.667724609375, 0.740234375, 0.812744140625, 0.88525390625, 0.957763671875, 1.0302734375, 1.102783203125, 1.17529296875, 1.247802734375, 1.3203125, 1.392822265625, 1.46533203125, 1.537841796875, 1.6103515625, 1.682861328125, 1.75537109375, 1.827880859375, 1.900390625, 1.972900390625, 2.04541015625, 2.117919921875, 2.1904296875, 2.262939453125, 2.33544921875, 2.407958984375, 2.48046875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 14.0, 13.0, 15.0, 47.0, 45.0, 118.0, 107.0, 196.0, 262.0, 427.0, 650.0, 840.0, 1362.0, 2033.0, 2897.0, 4468.0, 6875.0, 10571.0, 16489.0, 26264.0, 41700.0, 70555.0, 134304.0, 1342258.0, 199441.0, 92175.0, 52988.0, 32344.0, 20256.0, 12847.0, 8248.0, 5457.0, 3564.0, 2393.0, 1606.0, 1006.0, 704.0, 474.0, 337.0, 250.0, 160.0, 105.0, 73.0, 55.0, 47.0, 32.0, 20.0, 10.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0], "bins": [-0.01480865478515625, -0.014369606971740723, -0.013930559158325195, -0.013491511344909668, -0.01305246353149414, -0.012613415718078613, -0.012174367904663086, -0.011735320091247559, -0.011296272277832031, -0.010857224464416504, -0.010418176651000977, -0.00997912883758545, -0.009540081024169922, -0.009101033210754395, -0.008661985397338867, -0.00822293758392334, -0.0077838897705078125, -0.007344841957092285, -0.006905794143676758, -0.0064667463302612305, -0.006027698516845703, -0.005588650703430176, -0.0051496028900146484, -0.004710555076599121, -0.004271507263183594, -0.0038324594497680664, -0.003393411636352539, -0.0029543638229370117, -0.0025153160095214844, -0.002076268196105957, -0.0016372203826904297, -0.0011981725692749023, -0.000759124755859375, -0.00032007694244384766, 0.00011897087097167969, 0.000558018684387207, 0.0009970664978027344, 0.0014361143112182617, 0.001875162124633789, 0.0023142099380493164, 0.0027532577514648438, 0.003192305564880371, 0.0036313533782958984, 0.004070401191711426, 0.004509449005126953, 0.0049484968185424805, 0.005387544631958008, 0.005826592445373535, 0.0062656402587890625, 0.00670468807220459, 0.007143735885620117, 0.0075827836990356445, 0.008021831512451172, 0.0084608793258667, 0.008899927139282227, 0.009338974952697754, 0.009778022766113281, 0.010217070579528809, 0.010656118392944336, 0.011095166206359863, 0.01153421401977539, 0.011973261833190918, 0.012412309646606445, 0.012851357460021973, 0.0132904052734375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 146.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 631.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 165.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0], "bins": [-2.980232238769531e-07, -2.905726432800293e-07, -2.8312206268310547e-07, -2.7567148208618164e-07, -2.682209014892578e-07, -2.60770320892334e-07, -2.5331974029541016e-07, -2.4586915969848633e-07, -2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 9.0, 11.0, 10.0, 5.0, 4.0, 0.0, 2.0, 14.0, 52.0, 68.0, 55.0, 11.0, 122.0, 115.0, 104.0, 409.0, 11468.0, 933672.0, 101177.0, 560.0, 213.0, 63.0, 174.0, 16.0, 8.0, 73.0, 54.0, 40.0, 8.0, 0.0, 0.0, 8.0, 4.0, 8.0, 8.0, 14.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.814697265625e-06, -3.666616976261139e-06, -3.518536686897278e-06, -3.3704563975334167e-06, -3.2223761081695557e-06, -3.0742958188056946e-06, -2.9262155294418335e-06, -2.7781352400779724e-06, -2.6300549507141113e-06, -2.4819746613502502e-06, -2.333894371986389e-06, -2.185814082622528e-06, -2.037733793258667e-06, -1.889653503894806e-06, -1.7415732145309448e-06, -1.5934929251670837e-06, -1.4454126358032227e-06, -1.2973323464393616e-06, -1.1492520570755005e-06, -1.0011717677116394e-06, -8.530914783477783e-07, -7.050111889839172e-07, -5.569308996200562e-07, -4.0885061025619507e-07, -2.60770320892334e-07, -1.126900315284729e-07, 3.5390257835388184e-08, 1.8347054719924927e-07, 3.3155083656311035e-07, 4.796311259269714e-07, 6.277114152908325e-07, 7.757917046546936e-07, 9.238719940185547e-07, 1.0719522833824158e-06, 1.2200325727462769e-06, 1.368112862110138e-06, 1.516193151473999e-06, 1.6642734408378601e-06, 1.8123537302017212e-06, 1.9604340195655823e-06, 2.1085143089294434e-06, 2.2565945982933044e-06, 2.4046748876571655e-06, 2.5527551770210266e-06, 2.7008354663848877e-06, 2.8489157557487488e-06, 2.99699604511261e-06, 3.145076334476471e-06, 3.293156623840332e-06, 3.441236913204193e-06, 3.589317202568054e-06, 3.7373974919319153e-06, 3.885477781295776e-06, 4.0335580706596375e-06, 4.1816383600234985e-06, 4.32971864938736e-06, 4.477798938751221e-06, 4.625879228115082e-06, 4.773959517478943e-06, 4.922039806842804e-06, 5.070120096206665e-06, 5.218200385570526e-06, 5.366280674934387e-06, 5.514360964298248e-06, 5.662441253662109e-06]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 978.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.877844320271834e-08, -9.563981251403675e-08, -9.25011747199278e-08, -8.936254403124622e-08, -8.622390623713727e-08, -8.308527554845568e-08, -7.99466448597741e-08, -7.680800706566515e-08, -7.36693692715562e-08, -7.053073858287462e-08, -6.739210078876567e-08, -6.425347010008409e-08, -6.111483230597514e-08, -5.7976201617293555e-08, -5.483756737589829e-08, -5.169893313450302e-08, -4.8560302445821435e-08, -4.542166820442617e-08, -4.22830339630309e-08, -3.9144403274349315e-08, -3.600576548024037e-08, -3.286713479155878e-08, -2.9728500550163517e-08, -2.658986630876825e-08, -2.3451232067372985e-08, -2.031259782597772e-08, -1.7173963584582452e-08, -1.4035331119544026e-08, -1.089669687814876e-08, -7.758062636753493e-09, -4.6194301717150665e-09, -1.4807959303198004e-09, 1.6578312056481082e-09, 4.7964650029541644e-09, 7.93509880026022e-09, 1.1073732153477067e-08, 1.4212366394872333e-08, 1.73510006362676e-08, 2.0489633101306026e-08, 2.3628267342701292e-08, 2.676690158409656e-08, 2.9905535825491825e-08, 3.304417006688709e-08, 3.618280430828236e-08, 3.9321434996963944e-08, 4.246007279107289e-08, 4.5598703479754477e-08, 4.873733772114974e-08, 5.187597196254501e-08, 5.5014606203940275e-08, 5.815324044533554e-08, 6.129187113401713e-08, 6.443050892812607e-08, 6.756913961680766e-08, 7.070777030548925e-08, 7.384640809959819e-08, 7.698504589370714e-08, 8.012367658238873e-08, 8.326231437649767e-08, 8.640094506517926e-08, 8.95395828592882e-08, 9.267821354796979e-08, 9.581684423665138e-08, 9.895548203076032e-08, 1.0209411271944191e-07]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [25.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 977.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.960464477539063e-08, -5.681067705154419e-08, -5.4016709327697754e-08, -5.122274160385132e-08, -4.842877388000488e-08, -4.563480615615845e-08, -4.284083843231201e-08, -4.0046870708465576e-08, -3.725290298461914e-08, -3.4458935260772705e-08, -3.166496753692627e-08, -2.8870999813079834e-08, -2.60770320892334e-08, -2.3283064365386963e-08, -2.0489096641540527e-08, -1.7695128917694092e-08, -1.4901161193847656e-08, -1.210719347000122e-08, -9.313225746154785e-09, -6.51925802230835e-09, -3.725290298461914e-09, -9.313225746154785e-10, 1.862645149230957e-09, 4.6566128730773926e-09, 7.450580596923828e-09, 1.0244548320770264e-08, 1.30385160446167e-08, 1.5832483768463135e-08, 1.862645149230957e-08, 2.1420419216156006e-08, 2.421438694000244e-08, 2.7008354663848877e-08, 2.9802322387695312e-08, 3.259629011154175e-08, 3.5390257835388184e-08, 3.818422555923462e-08, 4.0978193283081055e-08, 4.377216100692749e-08, 4.6566128730773926e-08, 4.936009645462036e-08, 5.21540641784668e-08, 5.494803190231323e-08, 5.774199962615967e-08, 6.05359673500061e-08, 6.332993507385254e-08, 6.612390279769897e-08, 6.891787052154541e-08, 7.171183824539185e-08, 7.450580596923828e-08, 7.729977369308472e-08, 8.009374141693115e-08, 8.288770914077759e-08, 8.568167686462402e-08, 8.847564458847046e-08, 9.12696123123169e-08, 9.406358003616333e-08, 9.685754776000977e-08, 9.96515154838562e-08, 1.0244548320770264e-07, 1.0523945093154907e-07, 1.0803341865539551e-07, 1.1082738637924194e-07, 1.1362135410308838e-07, 1.1641532182693481e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 8.0, 8.0, 9.0, 19.0, 16.0, 21.0, 22.0, 16.0, 34.0, 23.0, 39.0, 37.0, 48.0, 41.0, 43.0, 36.0, 49.0, 43.0, 50.0, 47.0, 50.0, 39.0, 41.0, 32.0, 26.0, 34.0, 28.0, 19.0, 15.0, 20.0, 11.0, 13.0, 14.0, 11.0, 11.0, 5.0, 11.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.9375, -3.81298828125, -3.6884765625, -3.56396484375, -3.439453125, -3.31494140625, -3.1904296875, -3.06591796875, -2.94140625, -2.81689453125, -2.6923828125, -2.56787109375, -2.443359375, -2.31884765625, -2.1943359375, -2.06982421875, -1.9453125, -1.82080078125, -1.6962890625, -1.57177734375, -1.447265625, -1.32275390625, -1.1982421875, -1.07373046875, -0.94921875, -0.82470703125, -0.7001953125, -0.57568359375, -0.451171875, -0.32666015625, -0.2021484375, -0.07763671875, 0.046875, 0.17138671875, 0.2958984375, 0.42041015625, 0.544921875, 0.66943359375, 0.7939453125, 0.91845703125, 1.04296875, 1.16748046875, 1.2919921875, 1.41650390625, 1.541015625, 1.66552734375, 1.7900390625, 1.91455078125, 2.0390625, 2.16357421875, 2.2880859375, 2.41259765625, 2.537109375, 2.66162109375, 2.7861328125, 2.91064453125, 3.03515625, 3.15966796875, 3.2841796875, 3.40869140625, 3.533203125, 3.65771484375, 3.7822265625, 3.90673828125, 4.03125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 0.0, 9.0, 8.0, 14.0, 29.0, 33.0, 62.0, 82.0, 106.0, 181.0, 306.0, 530.0, 844.0, 1457.0, 2428.0, 4069.0, 6887.0, 12559.0, 22621.0, 42413.0, 81115.0, 173816.0, 334426.0, 182509.0, 84458.0, 43596.0, 23404.0, 12897.0, 7334.0, 4106.0, 2456.0, 1492.0, 823.0, 544.0, 356.0, 208.0, 123.0, 92.0, 57.0, 37.0, 27.0, 11.0, 12.0, 5.0, 9.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0390625, -3.91094970703125, -3.7828369140625, -3.65472412109375, -3.526611328125, -3.39849853515625, -3.2703857421875, -3.14227294921875, -3.01416015625, -2.88604736328125, -2.7579345703125, -2.62982177734375, -2.501708984375, -2.37359619140625, -2.2454833984375, -2.11737060546875, -1.9892578125, -1.86114501953125, -1.7330322265625, -1.60491943359375, -1.476806640625, -1.34869384765625, -1.2205810546875, -1.09246826171875, -0.96435546875, -0.83624267578125, -0.7081298828125, -0.58001708984375, -0.451904296875, -0.32379150390625, -0.1956787109375, -0.06756591796875, 0.060546875, 0.18865966796875, 0.3167724609375, 0.44488525390625, 0.572998046875, 0.70111083984375, 0.8292236328125, 0.95733642578125, 1.08544921875, 1.21356201171875, 1.3416748046875, 1.46978759765625, 1.597900390625, 1.72601318359375, 1.8541259765625, 1.98223876953125, 2.1103515625, 2.23846435546875, 2.3665771484375, 2.49468994140625, 2.622802734375, 2.75091552734375, 2.8790283203125, 3.00714111328125, 3.13525390625, 3.26336669921875, 3.3914794921875, 3.51959228515625, 3.647705078125, 3.77581787109375, 3.9039306640625, 4.03204345703125, 4.16015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 11.0, 7.0, 7.0, 12.0, 17.0, 29.0, 13.0, 18.0, 30.0, 38.0, 30.0, 32.0, 57.0, 80.0, 94.0, 166.0, 1384.0, 406.0, 157.0, 102.0, 62.0, 48.0, 46.0, 30.0, 39.0, 29.0, 28.0, 21.0, 13.0, 13.0, 9.0, 11.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9296875, -11.518310546875, -11.10693359375, -10.695556640625, -10.2841796875, -9.872802734375, -9.46142578125, -9.050048828125, -8.638671875, -8.227294921875, -7.81591796875, -7.404541015625, -6.9931640625, -6.581787109375, -6.17041015625, -5.759033203125, -5.34765625, -4.936279296875, -4.52490234375, -4.113525390625, -3.7021484375, -3.290771484375, -2.87939453125, -2.468017578125, -2.056640625, -1.645263671875, -1.23388671875, -0.822509765625, -0.4111328125, 0.000244140625, 0.41162109375, 0.822998046875, 1.234375, 1.645751953125, 2.05712890625, 2.468505859375, 2.8798828125, 3.291259765625, 3.70263671875, 4.114013671875, 4.525390625, 4.936767578125, 5.34814453125, 5.759521484375, 6.1708984375, 6.582275390625, 6.99365234375, 7.405029296875, 7.81640625, 8.227783203125, 8.63916015625, 9.050537109375, 9.4619140625, 9.873291015625, 10.28466796875, 10.696044921875, 11.107421875, 11.518798828125, 11.93017578125, 12.341552734375, 12.7529296875, 13.164306640625, 13.57568359375, 13.987060546875, 14.3984375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 8.0, 10.0, 24.0, 29.0, 57.0, 103.0, 135.0, 293.0, 629.0, 2098.0, 14035.0, 217587.0, 2790941.0, 108166.0, 8829.0, 1554.0, 511.0, 261.0, 143.0, 96.0, 58.0, 41.0, 32.0, 13.0, 16.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.1160888671875, -14.583740234375, -14.0513916015625, -13.51904296875, -12.9866943359375, -12.454345703125, -11.9219970703125, -11.3896484375, -10.8572998046875, -10.324951171875, -9.7926025390625, -9.26025390625, -8.7279052734375, -8.195556640625, -7.6632080078125, -7.130859375, -6.5985107421875, -6.066162109375, -5.5338134765625, -5.00146484375, -4.4691162109375, -3.936767578125, -3.4044189453125, -2.8720703125, -2.3397216796875, -1.807373046875, -1.2750244140625, -0.74267578125, -0.2103271484375, 0.322021484375, 0.8543701171875, 1.38671875, 1.9190673828125, 2.451416015625, 2.9837646484375, 3.51611328125, 4.0484619140625, 4.580810546875, 5.1131591796875, 5.6455078125, 6.1778564453125, 6.710205078125, 7.2425537109375, 7.77490234375, 8.3072509765625, 8.839599609375, 9.3719482421875, 9.904296875, 10.4366455078125, 10.968994140625, 11.5013427734375, 12.03369140625, 12.5660400390625, 13.098388671875, 13.6307373046875, 14.1630859375, 14.6954345703125, 15.227783203125, 15.7601318359375, 16.29248046875, 16.8248291015625, 17.357177734375, 17.8895263671875, 18.421875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [2.0, 7.0, 214.0, 579.0, 207.0, 12.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.43085765838623, -8.188886642456055, -4.946916580200195, -1.7049455642700195, 1.5370244979858398, 4.778994560241699, 8.020966529846191, 11.26293659210205, 14.50490665435791, 17.746877670288086, 20.988847732543945, 24.230819702148438, 27.472789764404297, 30.714759826660156, 33.956729888916016, 37.198699951171875, 40.440670013427734, 43.682640075683594, 46.92461013793945, 50.16658020019531, 53.40855407714844, 56.65052032470703, 59.892494201660156, 63.134464263916016, 66.37643432617188, 69.618408203125, 72.8603744506836, 76.10234832763672, 79.34431457519531, 82.58628845214844, 85.82826232910156, 89.07022857666016, 92.31219482421875, 95.55416870117188, 98.79613494873047, 102.0381088256836, 105.28007507324219, 108.52204895019531, 111.76402282714844, 115.00598907470703, 118.24795532226562, 121.48992919921875, 124.73189544677734, 127.97386932373047, 131.21583557128906, 134.4578094482422, 137.6997833251953, 140.94174194335938, 144.1837158203125, 147.42568969726562, 150.66766357421875, 153.9096221923828, 157.15159606933594, 160.39356994628906, 163.6355438232422, 166.87750244140625, 170.11949157714844, 173.36146545410156, 176.6034393310547, 179.84539794921875, 183.08737182617188, 186.329345703125, 189.57131958007812, 192.81329345703125, 196.0552520751953]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 15.0, 7.0, 10.0, 16.0, 8.0, 11.0, 14.0, 17.0, 22.0, 19.0, 30.0, 24.0, 29.0, 39.0, 35.0, 39.0, 47.0, 35.0, 35.0, 50.0, 33.0, 38.0, 52.0, 33.0, 39.0, 21.0, 25.0, 32.0, 34.0, 22.0, 26.0, 24.0, 24.0, 21.0, 10.0, 8.0, 15.0, 3.0, 13.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-24.566593170166016, -23.82815170288086, -23.08970832824707, -22.351266860961914, -21.612823486328125, -20.87438201904297, -20.135940551757812, -19.397499084472656, -18.659055709838867, -17.92061424255371, -17.182170867919922, -16.443729400634766, -15.705286979675293, -14.96684455871582, -14.228403091430664, -13.489960670471191, -12.751518249511719, -12.013075828552246, -11.274633407592773, -10.536191940307617, -9.797749519348145, -9.059307098388672, -8.320865631103516, -7.582423210144043, -6.84398078918457, -6.105538368225098, -5.367096424102783, -4.628654479980469, -3.890212059020996, -3.1517698764801025, -2.413327693939209, -1.6748857498168945, -0.9364452362060547, -0.19800305366516113, 0.5404391288757324, 1.278881311416626, 2.0173234939575195, 2.755765676498413, 3.4942078590393066, 4.232649803161621, 4.971092224121094, 5.709534645080566, 6.447976589202881, 7.186418533325195, 7.924860954284668, 8.66330337524414, 9.401744842529297, 10.14018726348877, 10.878629684448242, 11.617072105407715, 12.355514526367188, 13.093955993652344, 13.832398414611816, 14.570840835571289, 15.309282302856445, 16.047725677490234, 16.78616714477539, 17.524608612060547, 18.263051986694336, 19.001493453979492, 19.73993682861328, 20.478378295898438, 21.216819763183594, 21.95526123046875, 22.69370460510254]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 7.0, 6.0, 8.0, 9.0, 9.0, 17.0, 18.0, 29.0, 22.0, 25.0, 22.0, 25.0, 45.0, 43.0, 40.0, 31.0, 47.0, 42.0, 38.0, 42.0, 44.0, 41.0, 55.0, 49.0, 32.0, 41.0, 22.0, 25.0, 28.0, 24.0, 20.0, 10.0, 20.0, 9.0, 11.0, 12.0, 6.0, 7.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.78125, -3.65606689453125, -3.5308837890625, -3.40570068359375, -3.280517578125, -3.15533447265625, -3.0301513671875, -2.90496826171875, -2.77978515625, -2.65460205078125, -2.5294189453125, -2.40423583984375, -2.279052734375, -2.15386962890625, -2.0286865234375, -1.90350341796875, -1.7783203125, -1.65313720703125, -1.5279541015625, -1.40277099609375, -1.277587890625, -1.15240478515625, -1.0272216796875, -0.90203857421875, -0.77685546875, -0.65167236328125, -0.5264892578125, -0.40130615234375, -0.276123046875, -0.15093994140625, -0.0257568359375, 0.09942626953125, 0.224609375, 0.34979248046875, 0.4749755859375, 0.60015869140625, 0.725341796875, 0.85052490234375, 0.9757080078125, 1.10089111328125, 1.22607421875, 1.35125732421875, 1.4764404296875, 1.60162353515625, 1.726806640625, 1.85198974609375, 1.9771728515625, 2.10235595703125, 2.2275390625, 2.35272216796875, 2.4779052734375, 2.60308837890625, 2.728271484375, 2.85345458984375, 2.9786376953125, 3.10382080078125, 3.22900390625, 3.35418701171875, 3.4793701171875, 3.60455322265625, 3.729736328125, 3.85491943359375, 3.9801025390625, 4.10528564453125, 4.23046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 22.0, 39.0, 66.0, 80.0, 153.0, 247.0, 420.0, 908.0, 2038.0, 5166.0, 14582.0, 49167.0, 250323.0, 2231264.0, 1431181.0, 153894.0, 35599.0, 11375.0, 4174.0, 1794.0, 812.0, 412.0, 177.0, 132.0, 75.0, 42.0, 33.0, 22.0, 10.0, 9.0, 8.0, 2.0, 3.0, 2.0, 6.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69921875, -7.41278076171875, -7.1263427734375, -6.83990478515625, -6.553466796875, -6.26702880859375, -5.9805908203125, -5.69415283203125, -5.40771484375, -5.12127685546875, -4.8348388671875, -4.54840087890625, -4.261962890625, -3.97552490234375, -3.6890869140625, -3.40264892578125, -3.1162109375, -2.82977294921875, -2.5433349609375, -2.25689697265625, -1.970458984375, -1.68402099609375, -1.3975830078125, -1.11114501953125, -0.82470703125, -0.53826904296875, -0.2518310546875, 0.03460693359375, 0.321044921875, 0.60748291015625, 0.8939208984375, 1.18035888671875, 1.466796875, 1.75323486328125, 2.0396728515625, 2.32611083984375, 2.612548828125, 2.89898681640625, 3.1854248046875, 3.47186279296875, 3.75830078125, 4.04473876953125, 4.3311767578125, 4.61761474609375, 4.904052734375, 5.19049072265625, 5.4769287109375, 5.76336669921875, 6.0498046875, 6.33624267578125, 6.6226806640625, 6.90911865234375, 7.195556640625, 7.48199462890625, 7.7684326171875, 8.05487060546875, 8.34130859375, 8.62774658203125, 8.9141845703125, 9.20062255859375, 9.487060546875, 9.77349853515625, 10.0599365234375, 10.34637451171875, 10.6328125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 11.0, 9.0, 17.0, 26.0, 44.0, 62.0, 73.0, 79.0, 121.0, 207.0, 291.0, 420.0, 599.0, 584.0, 476.0, 291.0, 216.0, 180.0, 95.0, 82.0, 63.0, 38.0, 31.0, 16.0, 12.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03125, -4.8131103515625, -4.594970703125, -4.3768310546875, -4.15869140625, -3.9405517578125, -3.722412109375, -3.5042724609375, -3.2861328125, -3.0679931640625, -2.849853515625, -2.6317138671875, -2.41357421875, -2.1954345703125, -1.977294921875, -1.7591552734375, -1.541015625, -1.3228759765625, -1.104736328125, -0.8865966796875, -0.66845703125, -0.4503173828125, -0.232177734375, -0.0140380859375, 0.2041015625, 0.4222412109375, 0.640380859375, 0.8585205078125, 1.07666015625, 1.2947998046875, 1.512939453125, 1.7310791015625, 1.94921875, 2.1673583984375, 2.385498046875, 2.6036376953125, 2.82177734375, 3.0399169921875, 3.258056640625, 3.4761962890625, 3.6943359375, 3.9124755859375, 4.130615234375, 4.3487548828125, 4.56689453125, 4.7850341796875, 5.003173828125, 5.2213134765625, 5.439453125, 5.6575927734375, 5.875732421875, 6.0938720703125, 6.31201171875, 6.5301513671875, 6.748291015625, 6.9664306640625, 7.1845703125, 7.4027099609375, 7.620849609375, 7.8389892578125, 8.05712890625, 8.2752685546875, 8.493408203125, 8.7115478515625, 8.9296875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 6.0, 10.0, 2.0, 11.0, 24.0, 22.0, 32.0, 41.0, 74.0, 104.0, 189.0, 362.0, 735.0, 1680.0, 4177.0, 12526.0, 44357.0, 187567.0, 1187573.0, 2318209.0, 334875.0, 72128.0, 19293.0, 6031.0, 2229.0, 972.0, 438.0, 243.0, 139.0, 63.0, 48.0, 34.0, 34.0, 19.0, 11.0, 10.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.875, -9.5860595703125, -9.297119140625, -9.0081787109375, -8.71923828125, -8.4302978515625, -8.141357421875, -7.8524169921875, -7.5634765625, -7.2745361328125, -6.985595703125, -6.6966552734375, -6.40771484375, -6.1187744140625, -5.829833984375, -5.5408935546875, -5.251953125, -4.9630126953125, -4.674072265625, -4.3851318359375, -4.09619140625, -3.8072509765625, -3.518310546875, -3.2293701171875, -2.9404296875, -2.6514892578125, -2.362548828125, -2.0736083984375, -1.78466796875, -1.4957275390625, -1.206787109375, -0.9178466796875, -0.62890625, -0.3399658203125, -0.051025390625, 0.2379150390625, 0.52685546875, 0.8157958984375, 1.104736328125, 1.3936767578125, 1.6826171875, 1.9715576171875, 2.260498046875, 2.5494384765625, 2.83837890625, 3.1273193359375, 3.416259765625, 3.7052001953125, 3.994140625, 4.2830810546875, 4.572021484375, 4.8609619140625, 5.14990234375, 5.4388427734375, 5.727783203125, 6.0167236328125, 6.3056640625, 6.5946044921875, 6.883544921875, 7.1724853515625, 7.46142578125, 7.7503662109375, 8.039306640625, 8.3282470703125, 8.6171875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 11.0, 22.0, 29.0, 30.0, 63.0, 90.0, 121.0, 115.0, 114.0, 118.0, 103.0, 66.0, 57.0, 25.0, 18.0, 11.0, 6.0, 4.0, 4.0], "bins": [-48.4801139831543, -47.56629180908203, -46.65247344970703, -45.738651275634766, -44.8248291015625, -43.9110107421875, -42.997188568115234, -42.08336639404297, -41.16954803466797, -40.2557258605957, -39.3419075012207, -38.42808532714844, -37.51426315307617, -36.60044479370117, -35.686622619628906, -34.772804260253906, -33.85898208618164, -32.945159912109375, -32.031341552734375, -31.11751937866211, -30.203699111938477, -29.289878845214844, -28.376056671142578, -27.462236404418945, -26.54841423034668, -25.634593963623047, -24.72077178955078, -23.80695152282715, -22.893131256103516, -21.97930908203125, -21.065488815307617, -20.151668548583984, -19.23784637451172, -18.324026107788086, -17.41020393371582, -16.496383666992188, -15.582563400268555, -14.668742179870605, -13.754920959472656, -12.841100692749023, -11.92728042602539, -11.013459205627441, -10.099638938903809, -9.18581771850586, -8.271997451782227, -7.358176231384277, -6.444355487823486, -5.530534744262695, -4.6167144775390625, -3.7028937339782715, -2.7890729904174805, -1.8752520084381104, -0.9614312648773193, -0.04761028289794922, 0.8662104606628418, 1.7800312042236328, 2.693851947784424, 3.607672691345215, 4.521493434906006, 5.435314178466797, 6.349135398864746, 7.262956142425537, 8.176776885986328, 9.090597152709961, 10.00441837310791]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 11.0, 10.0, 9.0, 14.0, 11.0, 25.0, 22.0, 24.0, 27.0, 15.0, 23.0, 32.0, 30.0, 40.0, 44.0, 37.0, 32.0, 26.0, 40.0, 34.0, 48.0, 37.0, 35.0, 32.0, 31.0, 34.0, 44.0, 30.0, 18.0, 32.0, 18.0, 18.0, 23.0, 17.0, 15.0, 6.0, 10.0, 14.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-19.134492874145508, -18.515792846679688, -17.897090911865234, -17.278390884399414, -16.659690856933594, -16.04098892211914, -15.42228889465332, -14.803587913513184, -14.184886932373047, -13.56618595123291, -12.947484970092773, -12.328784942626953, -11.710083961486816, -11.09138298034668, -10.47268295288086, -9.853981971740723, -9.235280990600586, -8.61658000946045, -7.997879505157471, -7.379179000854492, -6.7604780197143555, -6.141777038574219, -5.52307653427124, -4.904376029968262, -4.285675048828125, -3.6669743061065674, -3.0482735633850098, -2.429572820663452, -1.8108720779418945, -1.192171335220337, -0.5734705924987793, 0.04522991180419922, 0.6639328002929688, 1.2826335430145264, 1.901334285736084, 2.5200350284576416, 3.138735771179199, 3.757436513900757, 4.3761372566223145, 4.994837760925293, 5.61353874206543, 6.232239723205566, 6.850940227508545, 7.469640731811523, 8.08834171295166, 8.707042694091797, 9.325742721557617, 9.944443702697754, 10.56314468383789, 11.181845664978027, 11.800546646118164, 12.419246673583984, 13.037947654724121, 13.656648635864258, 14.275348663330078, 14.894049644470215, 15.512750625610352, 16.131450653076172, 16.750152587890625, 17.368852615356445, 17.987552642822266, 18.60625457763672, 19.22495460510254, 19.84365463256836, 20.462356567382812]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 5.0, 6.0, 12.0, 14.0, 12.0, 17.0, 29.0, 29.0, 25.0, 31.0, 31.0, 35.0, 41.0, 48.0, 48.0, 59.0, 39.0, 50.0, 33.0, 52.0, 29.0, 48.0, 28.0, 41.0, 37.0, 35.0, 29.0, 26.0, 19.0, 20.0, 26.0, 9.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -4.0076904296875, -3.866943359375, -3.7261962890625, -3.58544921875, -3.4447021484375, -3.303955078125, -3.1632080078125, -3.0224609375, -2.8817138671875, -2.740966796875, -2.6002197265625, -2.45947265625, -2.3187255859375, -2.177978515625, -2.0372314453125, -1.896484375, -1.7557373046875, -1.614990234375, -1.4742431640625, -1.33349609375, -1.1927490234375, -1.052001953125, -0.9112548828125, -0.7705078125, -0.6297607421875, -0.489013671875, -0.3482666015625, -0.20751953125, -0.0667724609375, 0.073974609375, 0.2147216796875, 0.35546875, 0.4962158203125, 0.636962890625, 0.7777099609375, 0.91845703125, 1.0592041015625, 1.199951171875, 1.3406982421875, 1.4814453125, 1.6221923828125, 1.762939453125, 1.9036865234375, 2.04443359375, 2.1851806640625, 2.325927734375, 2.4666748046875, 2.607421875, 2.7481689453125, 2.888916015625, 3.0296630859375, 3.17041015625, 3.3111572265625, 3.451904296875, 3.5926513671875, 3.7333984375, 3.8741455078125, 4.014892578125, 4.1556396484375, 4.29638671875, 4.4371337890625, 4.577880859375, 4.7186279296875, 4.859375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 4.0, 8.0, 10.0, 14.0, 21.0, 16.0, 39.0, 50.0, 70.0, 152.0, 172.0, 262.0, 473.0, 599.0, 1060.0, 1778.0, 2842.0, 4826.0, 8435.0, 14362.0, 24287.0, 42488.0, 75915.0, 154407.0, 334118.0, 182851.0, 85963.0, 47185.0, 27227.0, 15897.0, 9260.0, 5363.0, 3289.0, 1889.0, 1154.0, 737.0, 432.0, 298.0, 192.0, 148.0, 71.0, 49.0, 53.0, 33.0, 22.0, 10.0, 13.0, 6.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0], "bins": [-0.02764892578125, -0.026849746704101562, -0.026050567626953125, -0.025251388549804688, -0.02445220947265625, -0.023653030395507812, -0.022853851318359375, -0.022054672241210938, -0.0212554931640625, -0.020456314086914062, -0.019657135009765625, -0.018857955932617188, -0.01805877685546875, -0.017259597778320312, -0.016460418701171875, -0.015661239624023438, -0.014862060546875, -0.014062881469726562, -0.013263702392578125, -0.012464523315429688, -0.01166534423828125, -0.010866165161132812, -0.010066986083984375, -0.009267807006835938, -0.0084686279296875, -0.0076694488525390625, -0.006870269775390625, -0.0060710906982421875, -0.00527191162109375, -0.0044727325439453125, -0.003673553466796875, -0.0028743743896484375, -0.0020751953125, -0.0012760162353515625, -0.000476837158203125, 0.0003223419189453125, 0.00112152099609375, 0.0019207000732421875, 0.002719879150390625, 0.0035190582275390625, 0.0043182373046875, 0.0051174163818359375, 0.005916595458984375, 0.0067157745361328125, 0.00751495361328125, 0.008314132690429688, 0.009113311767578125, 0.009912490844726562, 0.010711669921875, 0.011510848999023438, 0.012310028076171875, 0.013109207153320312, 0.01390838623046875, 0.014707565307617188, 0.015506744384765625, 0.016305923461914062, 0.0171051025390625, 0.017904281616210938, 0.018703460693359375, 0.019502639770507812, 0.02030181884765625, 0.021100997924804688, 0.021900177001953125, 0.022699356079101562, 0.02349853515625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 4.0, 5.0, 5.0, 5.0, 7.0, 14.0, 11.0, 11.0, 11.0, 12.0, 15.0, 31.0, 28.0, 21.0, 29.0, 33.0, 42.0, 47.0, 37.0, 42.0, 37.0, 39.0, 1069.0, 51.0, 54.0, 31.0, 31.0, 38.0, 35.0, 35.0, 23.0, 17.0, 22.0, 16.0, 22.0, 12.0, 9.0, 17.0, 14.0, 14.0, 7.0, 6.0, 1.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-2.681640625, -2.601837158203125, -2.52203369140625, -2.442230224609375, -2.3624267578125, -2.282623291015625, -2.20281982421875, -2.123016357421875, -2.043212890625, -1.963409423828125, -1.88360595703125, -1.803802490234375, -1.7239990234375, -1.644195556640625, -1.56439208984375, -1.484588623046875, -1.40478515625, -1.324981689453125, -1.24517822265625, -1.165374755859375, -1.0855712890625, -1.005767822265625, -0.92596435546875, -0.846160888671875, -0.766357421875, -0.686553955078125, -0.60675048828125, -0.526947021484375, -0.4471435546875, -0.367340087890625, -0.28753662109375, -0.207733154296875, -0.1279296875, -0.048126220703125, 0.03167724609375, 0.111480712890625, 0.1912841796875, 0.271087646484375, 0.35089111328125, 0.430694580078125, 0.510498046875, 0.590301513671875, 0.67010498046875, 0.749908447265625, 0.8297119140625, 0.909515380859375, 0.98931884765625, 1.069122314453125, 1.14892578125, 1.228729248046875, 1.30853271484375, 1.388336181640625, 1.4681396484375, 1.547943115234375, 1.62774658203125, 1.707550048828125, 1.787353515625, 1.867156982421875, 1.94696044921875, 2.026763916015625, 2.1065673828125, 2.186370849609375, 2.26617431640625, 2.345977783203125, 2.42578125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 10.0, 5.0, 5.0, 4.0, 9.0, 21.0, 28.0, 51.0, 51.0, 85.0, 96.0, 178.0, 284.0, 369.0, 497.0, 729.0, 1137.0, 1607.0, 2429.0, 3687.0, 5499.0, 8515.0, 12992.0, 21024.0, 33881.0, 58086.0, 106366.0, 254792.0, 1316904.0, 111910.0, 60256.0, 34955.0, 21572.0, 13339.0, 8514.0, 5816.0, 3608.0, 2456.0, 1806.0, 1100.0, 748.0, 523.0, 397.0, 220.0, 152.0, 139.0, 119.0, 64.0, 33.0, 26.0, 11.0, 14.0, 11.0, 8.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01471710205078125, -0.014227032661437988, -0.013736963272094727, -0.013246893882751465, -0.012756824493408203, -0.012266755104064941, -0.01177668571472168, -0.011286616325378418, -0.010796546936035156, -0.010306477546691895, -0.009816408157348633, -0.009326338768005371, -0.00883626937866211, -0.008346199989318848, -0.007856130599975586, -0.007366061210632324, -0.0068759918212890625, -0.006385922431945801, -0.005895853042602539, -0.005405783653259277, -0.004915714263916016, -0.004425644874572754, -0.003935575485229492, -0.0034455060958862305, -0.0029554367065429688, -0.002465367317199707, -0.0019752979278564453, -0.0014852285385131836, -0.0009951591491699219, -0.0005050897598266602, -1.5020370483398438e-05, 0.0004750490188598633, 0.000965118408203125, 0.0014551877975463867, 0.0019452571868896484, 0.00243532657623291, 0.002925395965576172, 0.0034154653549194336, 0.0039055347442626953, 0.004395604133605957, 0.004885673522949219, 0.0053757429122924805, 0.005865812301635742, 0.006355881690979004, 0.006845951080322266, 0.007336020469665527, 0.007826089859008789, 0.00831615924835205, 0.008806228637695312, 0.009296298027038574, 0.009786367416381836, 0.010276436805725098, 0.01076650619506836, 0.011256575584411621, 0.011746644973754883, 0.012236714363098145, 0.012726783752441406, 0.013216853141784668, 0.01370692253112793, 0.014196991920471191, 0.014687061309814453, 0.015177130699157715, 0.015667200088500977, 0.01615726947784424, 0.0166473388671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 204.0, 0.0, 0.0, 0.0, 0.0, 0.0, 478.0, 0.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 8.0, 6.0, 2.0, 2.0, 35.0, 27.0, 14.0, 1.0, 53.0, 71.0, 50.0, 128.0, 302.0, 229.0, 1219.0, 895471.0, 149319.0, 765.0, 214.0, 273.0, 97.0, 96.0, 56.0, 30.0, 1.0, 16.0, 32.0, 13.0, 3.0, 2.0, 5.0, 3.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.812624633312225e-06, -6.591901183128357e-06, -6.3711777329444885e-06, -6.15045428276062e-06, -5.929730832576752e-06, -5.709007382392883e-06, -5.488283932209015e-06, -5.2675604820251465e-06, -5.046837031841278e-06, -4.82611358165741e-06, -4.605390131473541e-06, -4.384666681289673e-06, -4.1639432311058044e-06, -3.943219780921936e-06, -3.7224963307380676e-06, -3.5017728805541992e-06, -3.281049430370331e-06, -3.0603259801864624e-06, -2.839602530002594e-06, -2.6188790798187256e-06, -2.398155629634857e-06, -2.1774321794509888e-06, -1.9567087292671204e-06, -1.735985279083252e-06, -1.5152618288993835e-06, -1.2945383787155151e-06, -1.0738149285316467e-06, -8.530914783477783e-07, -6.323680281639099e-07, -4.116445779800415e-07, -1.909211277961731e-07, 2.9802322387695312e-08, 2.505257725715637e-07, 4.7124922275543213e-07, 6.919726729393005e-07, 9.126961231231689e-07, 1.1334195733070374e-06, 1.3541430234909058e-06, 1.5748664736747742e-06, 1.7955899238586426e-06, 2.016313374042511e-06, 2.2370368242263794e-06, 2.457760274410248e-06, 2.678483724594116e-06, 2.8992071747779846e-06, 3.119930624961853e-06, 3.3406540751457214e-06, 3.56137752532959e-06, 3.7821009755134583e-06, 4.002824425697327e-06, 4.223547875881195e-06, 4.4442713260650635e-06, 4.664994776248932e-06, 4.8857182264328e-06, 5.106441676616669e-06, 5.327165126800537e-06, 5.5478885769844055e-06, 5.768612027168274e-06, 5.989335477352142e-06, 6.210058927536011e-06, 6.430782377719879e-06, 6.6515058279037476e-06, 6.872229278087616e-06, 7.092952728271484e-06]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 40.0, 888.0, 65.0, 14.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3163825087758596e-06, -1.2823385304727708e-06, -1.248294552169682e-06, -1.2142505738665932e-06, -1.1802065955635044e-06, -1.1461626172604156e-06, -1.1121186389573268e-06, -1.0780745469674002e-06, -1.0440305686643114e-06, -1.0099865903612226e-06, -9.759426120581338e-07, -9.41898633755045e-07, -9.078546554519562e-07, -8.738106771488674e-07, -8.397666420023597e-07, -8.057226636992709e-07, -7.71678742239601e-07, -7.376347639365122e-07, -7.035907856334234e-07, -6.695468073303346e-07, -6.355028290272458e-07, -6.014588507241569e-07, -5.674148155776493e-07, -5.333708372745605e-07, -4.993268589714717e-07, -4.6528288066838286e-07, -4.3123890236529405e-07, -3.971948956404958e-07, -3.63150917337407e-07, -3.291069390343182e-07, -2.9506293230951997e-07, -2.6101895400643116e-07, -2.2697508939018007e-07, -1.9293111108709127e-07, -1.5888711857314775e-07, -1.2484312605920422e-07, -9.079914775611542e-08, -5.675516945302661e-08, -2.271117693908309e-08, 1.1332815574860433e-08, 4.537679387794924e-08, 7.94207792864654e-08, 1.1346476469498157e-07, 1.475087572089251e-07, 1.815527355120139e-07, 2.155967138151027e-07, 2.4964072053990094e-07, 2.8368469884298975e-07, 3.1772867714607855e-07, 3.5177265544916736e-07, 3.8581663375225617e-07, 4.198606404770544e-07, 4.539046187801432e-07, 4.879485686615226e-07, 5.219926038080303e-07, 5.560365821111191e-07, 5.900805604142079e-07, 6.241245387172967e-07, 6.581685170203855e-07, 6.922124953234743e-07, 7.26256530469982e-07, 7.603005087730708e-07, 7.943444870761596e-07, 8.283884653792484e-07, 8.624324436823372e-07]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 101.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 813.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 99.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 5.0, 5.0, 6.0, 12.0, 14.0, 12.0, 17.0, 29.0, 29.0, 25.0, 31.0, 31.0, 35.0, 41.0, 48.0, 48.0, 59.0, 39.0, 50.0, 33.0, 52.0, 29.0, 48.0, 28.0, 41.0, 37.0, 35.0, 29.0, 26.0, 19.0, 20.0, 26.0, 9.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -4.0076904296875, -3.866943359375, -3.7261962890625, -3.58544921875, -3.4447021484375, -3.303955078125, -3.1632080078125, -3.0224609375, -2.8817138671875, -2.740966796875, -2.6002197265625, -2.45947265625, -2.3187255859375, -2.177978515625, -2.0372314453125, -1.896484375, -1.7557373046875, -1.614990234375, -1.4742431640625, -1.33349609375, -1.1927490234375, -1.052001953125, -0.9112548828125, -0.7705078125, -0.6297607421875, -0.489013671875, -0.3482666015625, -0.20751953125, -0.0667724609375, 0.073974609375, 0.2147216796875, 0.35546875, 0.4962158203125, 0.636962890625, 0.7777099609375, 0.91845703125, 1.0592041015625, 1.199951171875, 1.3406982421875, 1.4814453125, 1.6221923828125, 1.762939453125, 1.9036865234375, 2.04443359375, 2.1851806640625, 2.325927734375, 2.4666748046875, 2.607421875, 2.7481689453125, 2.888916015625, 3.0296630859375, 3.17041015625, 3.3111572265625, 3.451904296875, 3.5926513671875, 3.7333984375, 3.8741455078125, 4.014892578125, 4.1556396484375, 4.29638671875, 4.4371337890625, 4.577880859375, 4.7186279296875, 4.859375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 13.0, 9.0, 22.0, 24.0, 43.0, 67.0, 99.0, 155.0, 230.0, 371.0, 670.0, 1113.0, 1836.0, 3270.0, 5642.0, 10505.0, 19370.0, 35581.0, 65358.0, 126624.0, 306979.0, 242079.0, 104726.0, 56128.0, 30368.0, 16526.0, 8890.0, 4939.0, 2865.0, 1568.0, 939.0, 554.0, 335.0, 223.0, 145.0, 77.0, 66.0, 34.0, 30.0, 17.0, 17.0, 12.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.32421875, -4.18853759765625, -4.0528564453125, -3.91717529296875, -3.781494140625, -3.64581298828125, -3.5101318359375, -3.37445068359375, -3.23876953125, -3.10308837890625, -2.9674072265625, -2.83172607421875, -2.696044921875, -2.56036376953125, -2.4246826171875, -2.28900146484375, -2.1533203125, -2.01763916015625, -1.8819580078125, -1.74627685546875, -1.610595703125, -1.47491455078125, -1.3392333984375, -1.20355224609375, -1.06787109375, -0.93218994140625, -0.7965087890625, -0.66082763671875, -0.525146484375, -0.38946533203125, -0.2537841796875, -0.11810302734375, 0.017578125, 0.15325927734375, 0.2889404296875, 0.42462158203125, 0.560302734375, 0.69598388671875, 0.8316650390625, 0.96734619140625, 1.10302734375, 1.23870849609375, 1.3743896484375, 1.51007080078125, 1.645751953125, 1.78143310546875, 1.9171142578125, 2.05279541015625, 2.1884765625, 2.32415771484375, 2.4598388671875, 2.59552001953125, 2.731201171875, 2.86688232421875, 3.0025634765625, 3.13824462890625, 3.27392578125, 3.40960693359375, 3.5452880859375, 3.68096923828125, 3.816650390625, 3.95233154296875, 4.0880126953125, 4.22369384765625, 4.359375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 7.0, 4.0, 8.0, 5.0, 18.0, 16.0, 16.0, 17.0, 22.0, 16.0, 38.0, 27.0, 45.0, 41.0, 44.0, 77.0, 114.0, 197.0, 1497.0, 262.0, 158.0, 74.0, 65.0, 40.0, 41.0, 45.0, 26.0, 17.0, 18.0, 18.0, 12.0, 15.0, 17.0, 7.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.03125, -11.6842041015625, -11.337158203125, -10.9901123046875, -10.64306640625, -10.2960205078125, -9.948974609375, -9.6019287109375, -9.2548828125, -8.9078369140625, -8.560791015625, -8.2137451171875, -7.86669921875, -7.5196533203125, -7.172607421875, -6.8255615234375, -6.478515625, -6.1314697265625, -5.784423828125, -5.4373779296875, -5.09033203125, -4.7432861328125, -4.396240234375, -4.0491943359375, -3.7021484375, -3.3551025390625, -3.008056640625, -2.6610107421875, -2.31396484375, -1.9669189453125, -1.619873046875, -1.2728271484375, -0.92578125, -0.5787353515625, -0.231689453125, 0.1153564453125, 0.46240234375, 0.8094482421875, 1.156494140625, 1.5035400390625, 1.8505859375, 2.1976318359375, 2.544677734375, 2.8917236328125, 3.23876953125, 3.5858154296875, 3.932861328125, 4.2799072265625, 4.626953125, 4.9739990234375, 5.321044921875, 5.6680908203125, 6.01513671875, 6.3621826171875, 6.709228515625, 7.0562744140625, 7.4033203125, 7.7503662109375, 8.097412109375, 8.4444580078125, 8.79150390625, 9.1385498046875, 9.485595703125, 9.8326416015625, 10.1796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 8.0, 8.0, 11.0, 8.0, 18.0, 21.0, 38.0, 39.0, 64.0, 67.0, 93.0, 135.0, 203.0, 372.0, 866.0, 3503.0, 24868.0, 307248.0, 2647200.0, 142961.0, 14082.0, 2219.0, 666.0, 298.0, 193.0, 116.0, 96.0, 78.0, 48.0, 33.0, 31.0, 25.0, 22.0, 19.0, 17.0, 8.0, 8.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.03125, -13.5977783203125, -13.164306640625, -12.7308349609375, -12.29736328125, -11.8638916015625, -11.430419921875, -10.9969482421875, -10.5634765625, -10.1300048828125, -9.696533203125, -9.2630615234375, -8.82958984375, -8.3961181640625, -7.962646484375, -7.5291748046875, -7.095703125, -6.6622314453125, -6.228759765625, -5.7952880859375, -5.36181640625, -4.9283447265625, -4.494873046875, -4.0614013671875, -3.6279296875, -3.1944580078125, -2.760986328125, -2.3275146484375, -1.89404296875, -1.4605712890625, -1.027099609375, -0.5936279296875, -0.16015625, 0.2733154296875, 0.706787109375, 1.1402587890625, 1.57373046875, 2.0072021484375, 2.440673828125, 2.8741455078125, 3.3076171875, 3.7410888671875, 4.174560546875, 4.6080322265625, 5.04150390625, 5.4749755859375, 5.908447265625, 6.3419189453125, 6.775390625, 7.2088623046875, 7.642333984375, 8.0758056640625, 8.50927734375, 8.9427490234375, 9.376220703125, 9.8096923828125, 10.2431640625, 10.6766357421875, 11.110107421875, 11.5435791015625, 11.97705078125, 12.4105224609375, 12.843994140625, 13.2774658203125, 13.7109375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 7.0, 42.0, 319.0, 486.0, 151.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.276069641113281, -9.38602352142334, -6.495977401733398, -3.605931282043457, -0.7158851623535156, 2.174160957336426, 5.064207077026367, 7.954254150390625, 10.84429931640625, 13.734345436096191, 16.624391555786133, 19.51443862915039, 22.404483795166016, 25.29452896118164, 28.1845760345459, 31.074623107910156, 33.96466827392578, 36.854713439941406, 39.74475860595703, 42.63480758666992, 45.52485275268555, 48.41489791870117, 51.30494689941406, 54.19499206542969, 57.08503723144531, 59.97508239746094, 62.86512756347656, 65.75517272949219, 68.64521789550781, 71.53527069091797, 74.4253158569336, 77.31536102294922, 80.20539855957031, 83.09544372558594, 85.98548889160156, 88.87553405761719, 91.76557922363281, 94.65563201904297, 97.5456771850586, 100.43572235107422, 103.32576751708984, 106.21581268310547, 109.1058578491211, 111.99590301513672, 114.88595581054688, 117.7760009765625, 120.66604614257812, 123.55609130859375, 126.44613647460938, 129.336181640625, 132.22622680664062, 135.11627197265625, 138.00631713867188, 140.8963623046875, 143.78640747070312, 146.67645263671875, 149.56649780273438, 152.45654296875, 155.34658813476562, 158.23663330078125, 161.12667846679688, 164.0167236328125, 166.90676879882812, 169.79681396484375, 172.68687438964844]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 2.0, 4.0, 10.0, 6.0, 9.0, 15.0, 9.0, 12.0, 15.0, 17.0, 20.0, 26.0, 25.0, 30.0, 34.0, 24.0, 37.0, 33.0, 35.0, 39.0, 39.0, 48.0, 44.0, 40.0, 38.0, 39.0, 31.0, 27.0, 28.0, 40.0, 23.0, 36.0, 27.0, 28.0, 13.0, 22.0, 13.0, 13.0, 13.0, 8.0, 4.0, 8.0, 3.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.122787475585938, -18.476417541503906, -17.830047607421875, -17.183677673339844, -16.537307739257812, -15.890938758850098, -15.244569778442383, -14.598199844360352, -13.95182991027832, -13.305459976196289, -12.659090042114258, -12.012721061706543, -11.366351127624512, -10.71998119354248, -10.073612213134766, -9.427242279052734, -8.780872344970703, -8.134502410888672, -7.488132953643799, -6.841763496398926, -6.1953935623168945, -5.549023628234863, -4.90265417098999, -4.256284713745117, -3.609914779663086, -2.963545083999634, -2.3171753883361816, -1.6708056926727295, -1.0244359970092773, -0.3780663013458252, 0.26830339431762695, 0.9146728515625, 1.5610427856445312, 2.2074124813079834, 2.8537821769714355, 3.5001518726348877, 4.14652156829834, 4.792891502380371, 5.439260959625244, 6.085630416870117, 6.732000350952148, 7.37837028503418, 8.024740219116211, 8.671109199523926, 9.317479133605957, 9.963849067687988, 10.610218048095703, 11.256587982177734, 11.902957916259766, 12.549327850341797, 13.195697784423828, 13.842066764831543, 14.488436698913574, 15.134806632995605, 15.78117561340332, 16.42754554748535, 17.073915481567383, 17.720285415649414, 18.366655349731445, 19.013025283813477, 19.659393310546875, 20.305763244628906, 20.952133178710938, 21.59850311279297, 22.244873046875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 8.0, 8.0, 9.0, 10.0, 14.0, 17.0, 27.0, 16.0, 20.0, 35.0, 27.0, 36.0, 59.0, 42.0, 45.0, 37.0, 52.0, 43.0, 48.0, 43.0, 44.0, 45.0, 47.0, 38.0, 27.0, 34.0, 33.0, 19.0, 23.0, 25.0, 13.0, 12.0, 15.0, 5.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.02685546875, -3.8818359375, -3.73681640625, -3.591796875, -3.44677734375, -3.3017578125, -3.15673828125, -3.01171875, -2.86669921875, -2.7216796875, -2.57666015625, -2.431640625, -2.28662109375, -2.1416015625, -1.99658203125, -1.8515625, -1.70654296875, -1.5615234375, -1.41650390625, -1.271484375, -1.12646484375, -0.9814453125, -0.83642578125, -0.69140625, -0.54638671875, -0.4013671875, -0.25634765625, -0.111328125, 0.03369140625, 0.1787109375, 0.32373046875, 0.46875, 0.61376953125, 0.7587890625, 0.90380859375, 1.048828125, 1.19384765625, 1.3388671875, 1.48388671875, 1.62890625, 1.77392578125, 1.9189453125, 2.06396484375, 2.208984375, 2.35400390625, 2.4990234375, 2.64404296875, 2.7890625, 2.93408203125, 3.0791015625, 3.22412109375, 3.369140625, 3.51416015625, 3.6591796875, 3.80419921875, 3.94921875, 4.09423828125, 4.2392578125, 4.38427734375, 4.529296875, 4.67431640625, 4.8193359375, 4.96435546875, 5.109375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 8.0, 12.0, 12.0, 19.0, 21.0, 28.0, 41.0, 49.0, 79.0, 90.0, 131.0, 229.0, 361.0, 558.0, 6080.0, 4179324.0, 5643.0, 534.0, 328.0, 219.0, 126.0, 93.0, 80.0, 51.0, 42.0, 32.0, 18.0, 20.0, 10.0, 14.0, 8.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3125, -64.8642578125, -62.416015625, -59.9677734375, -57.51953125, -55.0712890625, -52.623046875, -50.1748046875, -47.7265625, -45.2783203125, -42.830078125, -40.3818359375, -37.93359375, -35.4853515625, -33.037109375, -30.5888671875, -28.140625, -25.6923828125, -23.244140625, -20.7958984375, -18.34765625, -15.8994140625, -13.451171875, -11.0029296875, -8.5546875, -6.1064453125, -3.658203125, -1.2099609375, 1.23828125, 3.6865234375, 6.134765625, 8.5830078125, 11.03125, 13.4794921875, 15.927734375, 18.3759765625, 20.82421875, 23.2724609375, 25.720703125, 28.1689453125, 30.6171875, 33.0654296875, 35.513671875, 37.9619140625, 40.41015625, 42.8583984375, 45.306640625, 47.7548828125, 50.203125, 52.6513671875, 55.099609375, 57.5478515625, 59.99609375, 62.4443359375, 64.892578125, 67.3408203125, 69.7890625, 72.2373046875, 74.685546875, 77.1337890625, 79.58203125, 82.0302734375, 84.478515625, 86.9267578125, 89.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 5.0, 9.0, 13.0, 17.0, 19.0, 22.0, 34.0, 37.0, 50.0, 77.0, 87.0, 105.0, 159.0, 245.0, 330.0, 473.0, 607.0, 553.0, 352.0, 214.0, 162.0, 126.0, 90.0, 57.0, 54.0, 34.0, 24.0, 24.0, 19.0, 11.0, 14.0, 11.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.26953125, -5.08502197265625, -4.9005126953125, -4.71600341796875, -4.531494140625, -4.34698486328125, -4.1624755859375, -3.97796630859375, -3.79345703125, -3.60894775390625, -3.4244384765625, -3.23992919921875, -3.055419921875, -2.87091064453125, -2.6864013671875, -2.50189208984375, -2.3173828125, -2.13287353515625, -1.9483642578125, -1.76385498046875, -1.579345703125, -1.39483642578125, -1.2103271484375, -1.02581787109375, -0.84130859375, -0.65679931640625, -0.4722900390625, -0.28778076171875, -0.103271484375, 0.08123779296875, 0.2657470703125, 0.45025634765625, 0.634765625, 0.81927490234375, 1.0037841796875, 1.18829345703125, 1.372802734375, 1.55731201171875, 1.7418212890625, 1.92633056640625, 2.11083984375, 2.29534912109375, 2.4798583984375, 2.66436767578125, 2.848876953125, 3.03338623046875, 3.2178955078125, 3.40240478515625, 3.5869140625, 3.77142333984375, 3.9559326171875, 4.14044189453125, 4.324951171875, 4.50946044921875, 4.6939697265625, 4.87847900390625, 5.06298828125, 5.24749755859375, 5.4320068359375, 5.61651611328125, 5.801025390625, 5.98553466796875, 6.1700439453125, 6.35455322265625, 6.5390625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 5.0, 11.0, 7.0, 12.0, 13.0, 8.0, 15.0, 24.0, 27.0, 26.0, 44.0, 39.0, 55.0, 117.0, 258.0, 925.0, 11272.0, 487914.0, 3638439.0, 51561.0, 2545.0, 451.0, 162.0, 73.0, 62.0, 44.0, 36.0, 30.0, 17.0, 15.0, 14.0, 14.0, 11.0, 8.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.421875, -29.604736328125, -28.78759765625, -27.970458984375, -27.1533203125, -26.336181640625, -25.51904296875, -24.701904296875, -23.884765625, -23.067626953125, -22.25048828125, -21.433349609375, -20.6162109375, -19.799072265625, -18.98193359375, -18.164794921875, -17.34765625, -16.530517578125, -15.71337890625, -14.896240234375, -14.0791015625, -13.261962890625, -12.44482421875, -11.627685546875, -10.810546875, -9.993408203125, -9.17626953125, -8.359130859375, -7.5419921875, -6.724853515625, -5.90771484375, -5.090576171875, -4.2734375, -3.456298828125, -2.63916015625, -1.822021484375, -1.0048828125, -0.187744140625, 0.62939453125, 1.446533203125, 2.263671875, 3.080810546875, 3.89794921875, 4.715087890625, 5.5322265625, 6.349365234375, 7.16650390625, 7.983642578125, 8.80078125, 9.617919921875, 10.43505859375, 11.252197265625, 12.0693359375, 12.886474609375, 13.70361328125, 14.520751953125, 15.337890625, 16.155029296875, 16.97216796875, 17.789306640625, 18.6064453125, 19.423583984375, 20.24072265625, 21.057861328125, 21.875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 114.0, 447.0, 343.0, 94.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.72113037109375, -27.287437438964844, -23.853742599487305, -20.420047760009766, -16.98635482788086, -13.552661895751953, -10.118967056274414, -6.685272216796875, -3.2515792846679688, 0.1821146011352539, 3.6158084869384766, 7.049502372741699, 10.483196258544922, 13.916889190673828, 17.350584030151367, 20.784278869628906, 24.217971801757812, 27.65166473388672, 31.085359573364258, 34.5190544128418, 37.9527473449707, 41.38644027709961, 44.82013702392578, 48.25382995605469, 51.687522888183594, 55.1212158203125, 58.554908752441406, 61.98860549926758, 65.42230224609375, 68.85598754882812, 72.28968811035156, 75.72338104248047, 79.15707397460938, 82.59076690673828, 86.02445983886719, 89.4581527709961, 92.891845703125, 96.32554626464844, 99.75923919677734, 103.19293212890625, 106.62662506103516, 110.06031799316406, 113.49401092529297, 116.92770385742188, 120.36140441894531, 123.79508972167969, 127.22879028320312, 130.6624755859375, 134.09617614746094, 137.52987670898438, 140.96356201171875, 144.3972625732422, 147.83094787597656, 151.2646484375, 154.69833374023438, 158.1320343017578, 161.56573486328125, 164.9994354248047, 168.43312072753906, 171.8668212890625, 175.30050659179688, 178.7342071533203, 182.1678924560547, 185.60159301757812, 189.0352783203125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 3.0, 7.0, 13.0, 11.0, 15.0, 19.0, 17.0, 20.0, 17.0, 32.0, 40.0, 29.0, 48.0, 35.0, 45.0, 41.0, 32.0, 38.0, 56.0, 43.0, 36.0, 49.0, 48.0, 32.0, 35.0, 23.0, 27.0, 32.0, 29.0, 22.0, 21.0, 16.0, 16.0, 6.0, 16.0, 8.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.727737426757812, -20.0755615234375, -19.423385620117188, -18.771209716796875, -18.119033813476562, -17.46685791015625, -16.814682006835938, -16.162506103515625, -15.510330200195312, -14.858154296875, -14.205978393554688, -13.553802490234375, -12.901626586914062, -12.24945068359375, -11.597274780273438, -10.945098876953125, -10.292922973632812, -9.6407470703125, -8.988571166992188, -8.336395263671875, -7.6842193603515625, -7.03204345703125, -6.3798675537109375, -5.727691650390625, -5.0755157470703125, -4.42333984375, -3.7711639404296875, -3.118988037109375, -2.4668121337890625, -1.81463623046875, -1.1624603271484375, -0.510284423828125, 0.1418895721435547, 0.7940654754638672, 1.4462413787841797, 2.098417282104492, 2.7505931854248047, 3.402769088745117, 4.05494499206543, 4.707120895385742, 5.359296798706055, 6.011472702026367, 6.66364860534668, 7.315824508666992, 7.968000411987305, 8.620176315307617, 9.27235221862793, 9.924528121948242, 10.576704025268555, 11.228879928588867, 11.88105583190918, 12.533231735229492, 13.185407638549805, 13.837583541870117, 14.48975944519043, 15.141935348510742, 15.794111251831055, 16.446287155151367, 17.09846305847168, 17.750638961791992, 18.402814865112305, 19.054990768432617, 19.70716667175293, 20.359342575073242, 21.011518478393555]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 15.0, 13.0, 11.0, 24.0, 20.0, 25.0, 32.0, 29.0, 24.0, 30.0, 43.0, 40.0, 56.0, 51.0, 58.0, 41.0, 49.0, 56.0, 35.0, 47.0, 33.0, 37.0, 29.0, 31.0, 25.0, 28.0, 20.0, 17.0, 25.0, 10.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.30596923828125, -4.1627197265625, -4.01947021484375, -3.876220703125, -3.73297119140625, -3.5897216796875, -3.44647216796875, -3.30322265625, -3.15997314453125, -3.0167236328125, -2.87347412109375, -2.730224609375, -2.58697509765625, -2.4437255859375, -2.30047607421875, -2.1572265625, -2.01397705078125, -1.8707275390625, -1.72747802734375, -1.584228515625, -1.44097900390625, -1.2977294921875, -1.15447998046875, -1.01123046875, -0.86798095703125, -0.7247314453125, -0.58148193359375, -0.438232421875, -0.29498291015625, -0.1517333984375, -0.00848388671875, 0.134765625, 0.27801513671875, 0.4212646484375, 0.56451416015625, 0.707763671875, 0.85101318359375, 0.9942626953125, 1.13751220703125, 1.28076171875, 1.42401123046875, 1.5672607421875, 1.71051025390625, 1.853759765625, 1.99700927734375, 2.1402587890625, 2.28350830078125, 2.4267578125, 2.57000732421875, 2.7132568359375, 2.85650634765625, 2.999755859375, 3.14300537109375, 3.2862548828125, 3.42950439453125, 3.57275390625, 3.71600341796875, 3.8592529296875, 4.00250244140625, 4.145751953125, 4.28900146484375, 4.4322509765625, 4.57550048828125, 4.71875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 2.0, 11.0, 13.0, 25.0, 42.0, 42.0, 70.0, 107.0, 176.0, 250.0, 425.0, 666.0, 1018.0, 1805.0, 3108.0, 5240.0, 8930.0, 15730.0, 27060.0, 47339.0, 92936.0, 244275.0, 344691.0, 120125.0, 57798.0, 32042.0, 18570.0, 10673.0, 6211.0, 3529.0, 2168.0, 1309.0, 783.0, 499.0, 321.0, 210.0, 116.0, 80.0, 48.0, 39.0, 20.0, 22.0, 7.0, 11.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029083251953125, -0.028149843215942383, -0.027216434478759766, -0.02628302574157715, -0.02534961700439453, -0.024416208267211914, -0.023482799530029297, -0.02254939079284668, -0.021615982055664062, -0.020682573318481445, -0.019749164581298828, -0.01881575584411621, -0.017882347106933594, -0.016948938369750977, -0.01601552963256836, -0.015082120895385742, -0.014148712158203125, -0.013215303421020508, -0.01228189468383789, -0.011348485946655273, -0.010415077209472656, -0.009481668472290039, -0.008548259735107422, -0.007614850997924805, -0.0066814422607421875, -0.00574803352355957, -0.004814624786376953, -0.003881216049194336, -0.0029478073120117188, -0.0020143985748291016, -0.0010809898376464844, -0.0001475811004638672, 0.00078582763671875, 0.0017192363739013672, 0.0026526451110839844, 0.0035860538482666016, 0.004519462585449219, 0.005452871322631836, 0.006386280059814453, 0.00731968879699707, 0.008253097534179688, 0.009186506271362305, 0.010119915008544922, 0.011053323745727539, 0.011986732482910156, 0.012920141220092773, 0.01385354995727539, 0.014786958694458008, 0.015720367431640625, 0.016653776168823242, 0.01758718490600586, 0.018520593643188477, 0.019454002380371094, 0.02038741111755371, 0.021320819854736328, 0.022254228591918945, 0.023187637329101562, 0.02412104606628418, 0.025054454803466797, 0.025987863540649414, 0.02692127227783203, 0.02785468101501465, 0.028788089752197266, 0.029721498489379883, 0.0306549072265625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 14.0, 11.0, 12.0, 12.0, 15.0, 15.0, 15.0, 14.0, 24.0, 31.0, 16.0, 30.0, 28.0, 36.0, 22.0, 42.0, 41.0, 34.0, 28.0, 1075.0, 29.0, 35.0, 45.0, 42.0, 38.0, 29.0, 25.0, 33.0, 29.0, 20.0, 18.0, 25.0, 17.0, 13.0, 18.0, 15.0, 8.0, 12.0, 7.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.453125, -2.375396728515625, -2.29766845703125, -2.219940185546875, -2.1422119140625, -2.064483642578125, -1.98675537109375, -1.909027099609375, -1.831298828125, -1.753570556640625, -1.67584228515625, -1.598114013671875, -1.5203857421875, -1.442657470703125, -1.36492919921875, -1.287200927734375, -1.20947265625, -1.131744384765625, -1.05401611328125, -0.976287841796875, -0.8985595703125, -0.820831298828125, -0.74310302734375, -0.665374755859375, -0.587646484375, -0.509918212890625, -0.43218994140625, -0.354461669921875, -0.2767333984375, -0.199005126953125, -0.12127685546875, -0.043548583984375, 0.0341796875, 0.111907958984375, 0.18963623046875, 0.267364501953125, 0.3450927734375, 0.422821044921875, 0.50054931640625, 0.578277587890625, 0.656005859375, 0.733734130859375, 0.81146240234375, 0.889190673828125, 0.9669189453125, 1.044647216796875, 1.12237548828125, 1.200103759765625, 1.27783203125, 1.355560302734375, 1.43328857421875, 1.511016845703125, 1.5887451171875, 1.666473388671875, 1.74420166015625, 1.821929931640625, 1.899658203125, 1.977386474609375, 2.05511474609375, 2.132843017578125, 2.2105712890625, 2.288299560546875, 2.36602783203125, 2.443756103515625, 2.521484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 7.0, 9.0, 24.0, 44.0, 43.0, 78.0, 126.0, 166.0, 249.0, 350.0, 542.0, 864.0, 1233.0, 1739.0, 2597.0, 3975.0, 5844.0, 8817.0, 13572.0, 20499.0, 31746.0, 50160.0, 85867.0, 173841.0, 1339521.0, 147214.0, 76879.0, 45936.0, 29106.0, 18932.0, 12415.0, 8157.0, 5528.0, 3621.0, 2484.0, 1632.0, 1116.0, 767.0, 495.0, 291.0, 190.0, 134.0, 109.0, 77.0, 47.0, 34.0, 14.0, 15.0, 9.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.0153961181640625, -0.014920949935913086, -0.014445781707763672, -0.013970613479614258, -0.013495445251464844, -0.01302027702331543, -0.012545108795166016, -0.012069940567016602, -0.011594772338867188, -0.011119604110717773, -0.01064443588256836, -0.010169267654418945, -0.009694099426269531, -0.009218931198120117, -0.008743762969970703, -0.008268594741821289, -0.007793426513671875, -0.007318258285522461, -0.006843090057373047, -0.006367921829223633, -0.005892753601074219, -0.005417585372924805, -0.004942417144775391, -0.0044672489166259766, -0.0039920806884765625, -0.0035169124603271484, -0.0030417442321777344, -0.0025665760040283203, -0.0020914077758789062, -0.0016162395477294922, -0.0011410713195800781, -0.0006659030914306641, -0.00019073486328125, 0.00028443336486816406, 0.0007596015930175781, 0.0012347698211669922, 0.0017099380493164062, 0.0021851062774658203, 0.0026602745056152344, 0.0031354427337646484, 0.0036106109619140625, 0.0040857791900634766, 0.004560947418212891, 0.005036115646362305, 0.005511283874511719, 0.005986452102661133, 0.006461620330810547, 0.006936788558959961, 0.007411956787109375, 0.007887125015258789, 0.008362293243408203, 0.008837461471557617, 0.009312629699707031, 0.009787797927856445, 0.01026296615600586, 0.010738134384155273, 0.011213302612304688, 0.011688470840454102, 0.012163639068603516, 0.01263880729675293, 0.013113975524902344, 0.013589143753051758, 0.014064311981201172, 0.014539480209350586, 0.0150146484375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 65.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 200.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 467.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 193.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.300366759300232e-07, -2.2165477275848389e-07, -2.1327286958694458e-07, -2.0489096641540527e-07, -1.9650906324386597e-07, -1.8812716007232666e-07, -1.7974525690078735e-07, -1.7136335372924805e-07, -1.6298145055770874e-07, -1.5459954738616943e-07, -1.4621764421463013e-07, -1.3783574104309082e-07, -1.2945383787155151e-07, -1.210719347000122e-07, -1.126900315284729e-07, -1.043081283569336e-07, -9.592622518539429e-08, -8.754432201385498e-08, -7.916241884231567e-08, -7.078051567077637e-08, -6.239861249923706e-08, -5.4016709327697754e-08, -4.563480615615845e-08, -3.725290298461914e-08, -2.8870999813079834e-08, -2.0489096641540527e-08, -1.210719347000122e-08, -3.725290298461914e-09, 4.6566128730773926e-09, 1.30385160446167e-08, 2.1420419216156006e-08, 2.9802322387695312e-08, 3.818422555923462e-08, 4.6566128730773926e-08, 5.494803190231323e-08, 6.332993507385254e-08, 7.171183824539185e-08, 8.009374141693115e-08, 8.847564458847046e-08, 9.685754776000977e-08, 1.0523945093154907e-07, 1.1362135410308838e-07, 1.2200325727462769e-07, 1.30385160446167e-07, 1.387670636177063e-07, 1.471489667892456e-07, 1.555308699607849e-07, 1.6391277313232422e-07, 1.7229467630386353e-07, 1.8067657947540283e-07, 1.8905848264694214e-07, 1.9744038581848145e-07, 2.0582228899002075e-07, 2.1420419216156006e-07, 2.2258609533309937e-07, 2.3096799850463867e-07, 2.39349901676178e-07, 2.477318048477173e-07, 2.561137080192566e-07, 2.644956111907959e-07, 2.728775143623352e-07, 2.812594175338745e-07, 2.896413207054138e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 3.0, 9.0, 5.0, 4.0, 0.0, 0.0, 6.0, 28.0, 28.0, 3.0, 12.0, 5.0, 33.0, 18.0, 58.0, 96.0, 32.0, 119.0, 212.0, 172.0, 459.0, 3369.0, 145920.0, 893308.0, 3341.0, 464.0, 123.0, 196.0, 167.0, 50.0, 78.0, 74.0, 30.0, 40.0, 7.0, 9.0, 6.0, 17.0, 35.0, 4.0, 6.0, 2.0, 0.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.616806447505951e-06, -5.451962351799011e-06, -5.2871182560920715e-06, -5.122274160385132e-06, -4.957430064678192e-06, -4.7925859689712524e-06, -4.627741873264313e-06, -4.462897777557373e-06, -4.298053681850433e-06, -4.133209586143494e-06, -3.968365490436554e-06, -3.8035213947296143e-06, -3.6386772990226746e-06, -3.473833203315735e-06, -3.308989107608795e-06, -3.1441450119018555e-06, -2.9793009161949158e-06, -2.814456820487976e-06, -2.6496127247810364e-06, -2.4847686290740967e-06, -2.319924533367157e-06, -2.1550804376602173e-06, -1.9902363419532776e-06, -1.8253922462463379e-06, -1.6605481505393982e-06, -1.4957040548324585e-06, -1.3308599591255188e-06, -1.166015863418579e-06, -1.0011717677116394e-06, -8.363276720046997e-07, -6.7148357629776e-07, -5.066394805908203e-07, -3.417953848838806e-07, -1.7695128917694092e-07, -1.210719347000122e-08, 1.5273690223693848e-07, 3.175809979438782e-07, 4.824250936508179e-07, 6.472691893577576e-07, 8.121132850646973e-07, 9.76957380771637e-07, 1.1418014764785767e-06, 1.3066455721855164e-06, 1.471489667892456e-06, 1.6363337635993958e-06, 1.8011778593063354e-06, 1.966021955013275e-06, 2.130866050720215e-06, 2.2957101464271545e-06, 2.4605542421340942e-06, 2.625398337841034e-06, 2.7902424335479736e-06, 2.9550865292549133e-06, 3.119930624961853e-06, 3.2847747206687927e-06, 3.4496188163757324e-06, 3.614462912082672e-06, 3.779307007789612e-06, 3.9441511034965515e-06, 4.108995199203491e-06, 4.273839294910431e-06, 4.438683390617371e-06, 4.60352748632431e-06, 4.76837158203125e-06]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 10.0, 18.0, 15.0, 13.0, 26.0, 756.0, 25.0, 26.0, 22.0, 26.0, 13.0, 10.0, 6.0, 6.0, 3.0, 9.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6370029243262252e-07, -1.5685598953041335e-07, -1.500117008390589e-07, -1.4316739793684974e-07, -1.363231092454953e-07, -1.2947880634328612e-07, -1.2263450344107696e-07, -1.1579021474972251e-07, -1.089459189529407e-07, -1.021016231561589e-07, -9.525732735937709e-08, -8.841303156259528e-08, -8.156872866038611e-08, -7.472443996903166e-08, -6.78801370668225e-08, -6.103584127004069e-08, -5.4191545473258884e-08, -4.734724967647708e-08, -4.050295387969527e-08, -3.365865453019978e-08, -2.6814358733417976e-08, -1.9970062936636168e-08, -1.3125763587140682e-08, -6.2814677903588745e-09, 5.62828006422933e-10, 7.40712469138316e-09, 1.4251421376343387e-08, 2.1095718949482034e-08, 2.794001474626384e-08, 3.478431054304565e-08, 4.1628609892541135e-08, 4.847290568932294e-08, 5.531720148610475e-08, 6.216149728288656e-08, 6.900579307966836e-08, 7.585009598187753e-08, 8.269438467323198e-08, 8.953868757544114e-08, 9.638298337222295e-08, 1.0322727916900476e-07, 1.1007157496578657e-07, 1.1691587076256837e-07, 1.2376017366477754e-07, 1.30604462356132e-07, 1.3744876525834115e-07, 1.442930539496956e-07, 1.5113735685190477e-07, 1.5798164554325922e-07, 1.6482594844546838e-07, 1.7167025134767755e-07, 1.78514540039032e-07, 1.8535884294124116e-07, 1.9220313163259561e-07, 1.9904743453480478e-07, 2.0589172322615923e-07, 2.127360261283684e-07, 2.1958032903057756e-07, 2.2642463193278672e-07, 2.3326892062414117e-07, 2.4011322352635034e-07, 2.469575122177048e-07, 2.5380180090905924e-07, 2.606461180221231e-07, 2.6749040671347757e-07, 2.74334695404832e-07]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 127.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 736.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 129.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1920928955078125e-07, -1.1455267667770386e-07, -1.0989606380462646e-07, -1.0523945093154907e-07, -1.0058283805847168e-07, -9.592622518539429e-08, -9.12696123123169e-08, -8.66129994392395e-08, -8.195638656616211e-08, -7.729977369308472e-08, -7.264316082000732e-08, -6.798654794692993e-08, -6.332993507385254e-08, -5.8673322200775146e-08, -5.4016709327697754e-08, -4.936009645462036e-08, -4.470348358154297e-08, -4.0046870708465576e-08, -3.5390257835388184e-08, -3.073364496231079e-08, -2.60770320892334e-08, -2.1420419216156006e-08, -1.6763806343078613e-08, -1.210719347000122e-08, -7.450580596923828e-09, -2.7939677238464355e-09, 1.862645149230957e-09, 6.51925802230835e-09, 1.1175870895385742e-08, 1.5832483768463135e-08, 2.0489096641540527e-08, 2.514570951461792e-08, 2.9802322387695312e-08, 3.4458935260772705e-08, 3.91155481338501e-08, 4.377216100692749e-08, 4.842877388000488e-08, 5.3085386753082275e-08, 5.774199962615967e-08, 6.239861249923706e-08, 6.705522537231445e-08, 7.171183824539185e-08, 7.636845111846924e-08, 8.102506399154663e-08, 8.568167686462402e-08, 9.033828973770142e-08, 9.499490261077881e-08, 9.96515154838562e-08, 1.043081283569336e-07, 1.0896474123001099e-07, 1.1362135410308838e-07, 1.1827796697616577e-07, 1.2293457984924316e-07, 1.2759119272232056e-07, 1.3224780559539795e-07, 1.3690441846847534e-07, 1.4156103134155273e-07, 1.4621764421463013e-07, 1.5087425708770752e-07, 1.555308699607849e-07, 1.601874828338623e-07, 1.648440957069397e-07, 1.695007085800171e-07, 1.7415732145309448e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 15.0, 13.0, 11.0, 24.0, 20.0, 25.0, 32.0, 29.0, 24.0, 30.0, 43.0, 40.0, 56.0, 51.0, 58.0, 41.0, 49.0, 56.0, 35.0, 47.0, 33.0, 37.0, 29.0, 31.0, 25.0, 28.0, 20.0, 17.0, 25.0, 10.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.30596923828125, -4.1627197265625, -4.01947021484375, -3.876220703125, -3.73297119140625, -3.5897216796875, -3.44647216796875, -3.30322265625, -3.15997314453125, -3.0167236328125, -2.87347412109375, -2.730224609375, -2.58697509765625, -2.4437255859375, -2.30047607421875, -2.1572265625, -2.01397705078125, -1.8707275390625, -1.72747802734375, -1.584228515625, -1.44097900390625, -1.2977294921875, -1.15447998046875, -1.01123046875, -0.86798095703125, -0.7247314453125, -0.58148193359375, -0.438232421875, -0.29498291015625, -0.1517333984375, -0.00848388671875, 0.134765625, 0.27801513671875, 0.4212646484375, 0.56451416015625, 0.707763671875, 0.85101318359375, 0.9942626953125, 1.13751220703125, 1.28076171875, 1.42401123046875, 1.5672607421875, 1.71051025390625, 1.853759765625, 1.99700927734375, 2.1402587890625, 2.28350830078125, 2.4267578125, 2.57000732421875, 2.7132568359375, 2.85650634765625, 2.999755859375, 3.14300537109375, 3.2862548828125, 3.42950439453125, 3.57275390625, 3.71600341796875, 3.8592529296875, 4.00250244140625, 4.145751953125, 4.28900146484375, 4.4322509765625, 4.57550048828125, 4.71875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 13.0, 8.0, 15.0, 19.0, 25.0, 48.0, 57.0, 81.0, 129.0, 193.0, 289.0, 363.0, 564.0, 823.0, 1272.0, 2126.0, 3418.0, 6139.0, 11013.0, 21808.0, 45896.0, 110402.0, 324522.0, 318895.0, 107943.0, 44931.0, 21308.0, 10836.0, 5923.0, 3444.0, 2078.0, 1395.0, 802.0, 563.0, 411.0, 248.0, 188.0, 98.0, 85.0, 50.0, 40.0, 28.0, 16.0, 12.0, 8.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.22265625, -5.05938720703125, -4.8961181640625, -4.73284912109375, -4.569580078125, -4.40631103515625, -4.2430419921875, -4.07977294921875, -3.91650390625, -3.75323486328125, -3.5899658203125, -3.42669677734375, -3.263427734375, -3.10015869140625, -2.9368896484375, -2.77362060546875, -2.6103515625, -2.44708251953125, -2.2838134765625, -2.12054443359375, -1.957275390625, -1.79400634765625, -1.6307373046875, -1.46746826171875, -1.30419921875, -1.14093017578125, -0.9776611328125, -0.81439208984375, -0.651123046875, -0.48785400390625, -0.3245849609375, -0.16131591796875, 0.001953125, 0.16522216796875, 0.3284912109375, 0.49176025390625, 0.655029296875, 0.81829833984375, 0.9815673828125, 1.14483642578125, 1.30810546875, 1.47137451171875, 1.6346435546875, 1.79791259765625, 1.961181640625, 2.12445068359375, 2.2877197265625, 2.45098876953125, 2.6142578125, 2.77752685546875, 2.9407958984375, 3.10406494140625, 3.267333984375, 3.43060302734375, 3.5938720703125, 3.75714111328125, 3.92041015625, 4.08367919921875, 4.2469482421875, 4.41021728515625, 4.573486328125, 4.73675537109375, 4.9000244140625, 5.06329345703125, 5.2265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 12.0, 14.0, 14.0, 21.0, 27.0, 26.0, 41.0, 40.0, 52.0, 69.0, 78.0, 130.0, 290.0, 1539.0, 207.0, 109.0, 69.0, 56.0, 44.0, 41.0, 31.0, 28.0, 22.0, 22.0, 16.0, 9.0, 13.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.41357421875, -13.0224609375, -12.63134765625, -12.240234375, -11.84912109375, -11.4580078125, -11.06689453125, -10.67578125, -10.28466796875, -9.8935546875, -9.50244140625, -9.111328125, -8.72021484375, -8.3291015625, -7.93798828125, -7.546875, -7.15576171875, -6.7646484375, -6.37353515625, -5.982421875, -5.59130859375, -5.2001953125, -4.80908203125, -4.41796875, -4.02685546875, -3.6357421875, -3.24462890625, -2.853515625, -2.46240234375, -2.0712890625, -1.68017578125, -1.2890625, -0.89794921875, -0.5068359375, -0.11572265625, 0.275390625, 0.66650390625, 1.0576171875, 1.44873046875, 1.83984375, 2.23095703125, 2.6220703125, 3.01318359375, 3.404296875, 3.79541015625, 4.1865234375, 4.57763671875, 4.96875, 5.35986328125, 5.7509765625, 6.14208984375, 6.533203125, 6.92431640625, 7.3154296875, 7.70654296875, 8.09765625, 8.48876953125, 8.8798828125, 9.27099609375, 9.662109375, 10.05322265625, 10.4443359375, 10.83544921875, 11.2265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 9.0, 7.0, 7.0, 18.0, 23.0, 35.0, 75.0, 110.0, 174.0, 333.0, 934.0, 12484.0, 3113947.0, 15693.0, 996.0, 386.0, 168.0, 104.0, 62.0, 38.0, 27.0, 12.0, 12.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.8125, -42.54345703125, -41.2744140625, -40.00537109375, -38.736328125, -37.46728515625, -36.1982421875, -34.92919921875, -33.66015625, -32.39111328125, -31.1220703125, -29.85302734375, -28.583984375, -27.31494140625, -26.0458984375, -24.77685546875, -23.5078125, -22.23876953125, -20.9697265625, -19.70068359375, -18.431640625, -17.16259765625, -15.8935546875, -14.62451171875, -13.35546875, -12.08642578125, -10.8173828125, -9.54833984375, -8.279296875, -7.01025390625, -5.7412109375, -4.47216796875, -3.203125, -1.93408203125, -0.6650390625, 0.60400390625, 1.873046875, 3.14208984375, 4.4111328125, 5.68017578125, 6.94921875, 8.21826171875, 9.4873046875, 10.75634765625, 12.025390625, 13.29443359375, 14.5634765625, 15.83251953125, 17.1015625, 18.37060546875, 19.6396484375, 20.90869140625, 22.177734375, 23.44677734375, 24.7158203125, 25.98486328125, 27.25390625, 28.52294921875, 29.7919921875, 31.06103515625, 32.330078125, 33.59912109375, 34.8681640625, 36.13720703125, 37.40625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 49.0, 281.0, 427.0, 204.0, 39.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.09678268432617, -43.83516311645508, -41.57353973388672, -39.311920166015625, -37.05030059814453, -34.78867721557617, -32.52705764770508, -30.26543617248535, -28.003814697265625, -25.7421932220459, -23.480571746826172, -21.218952178955078, -18.95733070373535, -16.695709228515625, -14.434088706970215, -12.172468185424805, -9.910846710205078, -7.64922571182251, -5.387604713439941, -3.125983715057373, -0.8643627166748047, 1.3972587585449219, 3.658879280090332, 5.920499801635742, 8.182121276855469, 10.443742752075195, 12.705363273620605, 14.966983795166016, 17.228605270385742, 19.49022674560547, 21.751846313476562, 24.01346778869629, 26.27508544921875, 28.536706924438477, 30.798328399658203, 33.0599479675293, 35.321571350097656, 37.58319091796875, 39.844810485839844, 42.10643005371094, 44.3680534362793, 46.62967300415039, 48.89129638671875, 51.152915954589844, 53.41453552246094, 55.6761589050293, 57.93777847290039, 60.19940185546875, 62.461021423339844, 64.72264099121094, 66.98426055908203, 69.24588775634766, 71.50750732421875, 73.76912689208984, 76.03074645996094, 78.29236602783203, 80.55398559570312, 82.81560516357422, 85.07722473144531, 87.33885192871094, 89.60047149658203, 91.86209106445312, 94.12371063232422, 96.38533020019531, 98.64695739746094]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 13.0, 10.0, 6.0, 7.0, 11.0, 14.0, 21.0, 18.0, 21.0, 26.0, 30.0, 26.0, 33.0, 27.0, 33.0, 35.0, 33.0, 45.0, 44.0, 39.0, 40.0, 37.0, 49.0, 25.0, 42.0, 37.0, 28.0, 33.0, 31.0, 23.0, 25.0, 18.0, 26.0, 12.0, 11.0, 19.0, 12.0, 6.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.42755889892578, -23.595754623413086, -22.763952255249023, -21.932147979736328, -21.100343704223633, -20.268539428710938, -19.436737060546875, -18.60493278503418, -17.773128509521484, -16.94132423400879, -16.109521865844727, -15.277717590332031, -14.445913314819336, -13.614109992980957, -12.782306671142578, -11.950502395629883, -11.11870002746582, -10.286896705627441, -9.455092430114746, -8.623289108276367, -7.79148530960083, -6.959681510925293, -6.127878189086914, -5.296074390411377, -4.46427059173584, -3.6324667930603027, -2.8006632328033447, -1.9688596725463867, -1.1370558738708496, -0.3052520751953125, 0.5265512466430664, 1.3583550453186035, 2.1901588439941406, 3.0219626426696777, 3.8537662029266357, 4.685569763183594, 5.517373561859131, 6.349177360534668, 7.180980682373047, 8.012784957885742, 8.844588279724121, 9.6763916015625, 10.508195877075195, 11.339999198913574, 12.171802520751953, 13.003606796264648, 13.835410118103027, 14.667213439941406, 15.499017715454102, 16.330821990966797, 17.16262435913086, 17.994428634643555, 18.82623291015625, 19.658035278320312, 20.489839553833008, 21.321643829345703, 22.153446197509766, 22.98525047302246, 23.817052841186523, 24.64885711669922, 25.480661392211914, 26.31246566772461, 27.144268035888672, 27.976072311401367, 28.807876586914062]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 14.0, 9.0, 12.0, 15.0, 19.0, 26.0, 19.0, 27.0, 33.0, 34.0, 37.0, 41.0, 41.0, 49.0, 35.0, 64.0, 45.0, 53.0, 62.0, 36.0, 39.0, 33.0, 42.0, 31.0, 30.0, 21.0, 21.0, 22.0, 10.0, 16.0, 11.0, 12.0, 6.0, 7.0, 3.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -4.000732421875, -3.85693359375, -3.713134765625, -3.5693359375, -3.425537109375, -3.28173828125, -3.137939453125, -2.994140625, -2.850341796875, -2.70654296875, -2.562744140625, -2.4189453125, -2.275146484375, -2.13134765625, -1.987548828125, -1.84375, -1.699951171875, -1.55615234375, -1.412353515625, -1.2685546875, -1.124755859375, -0.98095703125, -0.837158203125, -0.693359375, -0.549560546875, -0.40576171875, -0.261962890625, -0.1181640625, 0.025634765625, 0.16943359375, 0.313232421875, 0.45703125, 0.600830078125, 0.74462890625, 0.888427734375, 1.0322265625, 1.176025390625, 1.31982421875, 1.463623046875, 1.607421875, 1.751220703125, 1.89501953125, 2.038818359375, 2.1826171875, 2.326416015625, 2.47021484375, 2.614013671875, 2.7578125, 2.901611328125, 3.04541015625, 3.189208984375, 3.3330078125, 3.476806640625, 3.62060546875, 3.764404296875, 3.908203125, 4.052001953125, 4.19580078125, 4.339599609375, 4.4833984375, 4.627197265625, 4.77099609375, 4.914794921875, 5.05859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 9.0, 14.0, 15.0, 21.0, 28.0, 41.0, 53.0, 63.0, 95.0, 144.0, 209.0, 374.0, 636.0, 1074.0, 2201.0, 4731.0, 12942.0, 52142.0, 429107.0, 2463962.0, 1074655.0, 116463.0, 21732.0, 7087.0, 2996.0, 1362.0, 774.0, 455.0, 284.0, 187.0, 118.0, 69.0, 55.0, 48.0, 33.0, 20.0, 19.0, 14.0, 14.0, 6.0, 5.0, 10.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.44384765625, -7.1845703125, -6.92529296875, -6.666015625, -6.40673828125, -6.1474609375, -5.88818359375, -5.62890625, -5.36962890625, -5.1103515625, -4.85107421875, -4.591796875, -4.33251953125, -4.0732421875, -3.81396484375, -3.5546875, -3.29541015625, -3.0361328125, -2.77685546875, -2.517578125, -2.25830078125, -1.9990234375, -1.73974609375, -1.48046875, -1.22119140625, -0.9619140625, -0.70263671875, -0.443359375, -0.18408203125, 0.0751953125, 0.33447265625, 0.59375, 0.85302734375, 1.1123046875, 1.37158203125, 1.630859375, 1.89013671875, 2.1494140625, 2.40869140625, 2.66796875, 2.92724609375, 3.1865234375, 3.44580078125, 3.705078125, 3.96435546875, 4.2236328125, 4.48291015625, 4.7421875, 5.00146484375, 5.2607421875, 5.52001953125, 5.779296875, 6.03857421875, 6.2978515625, 6.55712890625, 6.81640625, 7.07568359375, 7.3349609375, 7.59423828125, 7.853515625, 8.11279296875, 8.3720703125, 8.63134765625, 8.890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 7.0, 2.0, 5.0, 11.0, 12.0, 13.0, 19.0, 18.0, 32.0, 43.0, 37.0, 64.0, 81.0, 79.0, 128.0, 170.0, 191.0, 254.0, 309.0, 413.0, 417.0, 385.0, 317.0, 230.0, 155.0, 155.0, 96.0, 92.0, 67.0, 50.0, 42.0, 44.0, 37.0, 22.0, 13.0, 18.0, 14.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.11737060546875, -4.9534912109375, -4.78961181640625, -4.625732421875, -4.46185302734375, -4.2979736328125, -4.13409423828125, -3.97021484375, -3.80633544921875, -3.6424560546875, -3.47857666015625, -3.314697265625, -3.15081787109375, -2.9869384765625, -2.82305908203125, -2.6591796875, -2.49530029296875, -2.3314208984375, -2.16754150390625, -2.003662109375, -1.83978271484375, -1.6759033203125, -1.51202392578125, -1.34814453125, -1.18426513671875, -1.0203857421875, -0.85650634765625, -0.692626953125, -0.52874755859375, -0.3648681640625, -0.20098876953125, -0.037109375, 0.12677001953125, 0.2906494140625, 0.45452880859375, 0.618408203125, 0.78228759765625, 0.9461669921875, 1.11004638671875, 1.27392578125, 1.43780517578125, 1.6016845703125, 1.76556396484375, 1.929443359375, 2.09332275390625, 2.2572021484375, 2.42108154296875, 2.5849609375, 2.74884033203125, 2.9127197265625, 3.07659912109375, 3.240478515625, 3.40435791015625, 3.5682373046875, 3.73211669921875, 3.89599609375, 4.05987548828125, 4.2237548828125, 4.38763427734375, 4.551513671875, 4.71539306640625, 4.8792724609375, 5.04315185546875, 5.20703125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 18.0, 16.0, 36.0, 47.0, 70.0, 109.0, 146.0, 221.0, 360.0, 629.0, 1133.0, 2626.0, 7608.0, 34143.0, 221676.0, 2034447.0, 1662905.0, 186803.0, 29618.0, 6825.0, 2275.0, 984.0, 585.0, 337.0, 207.0, 125.0, 95.0, 67.0, 42.0, 20.0, 21.0, 16.0, 13.0, 11.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.33984375, -7.05706787109375, -6.7742919921875, -6.49151611328125, -6.208740234375, -5.92596435546875, -5.6431884765625, -5.36041259765625, -5.07763671875, -4.79486083984375, -4.5120849609375, -4.22930908203125, -3.946533203125, -3.66375732421875, -3.3809814453125, -3.09820556640625, -2.8154296875, -2.53265380859375, -2.2498779296875, -1.96710205078125, -1.684326171875, -1.40155029296875, -1.1187744140625, -0.83599853515625, -0.55322265625, -0.27044677734375, 0.0123291015625, 0.29510498046875, 0.577880859375, 0.86065673828125, 1.1434326171875, 1.42620849609375, 1.708984375, 1.99176025390625, 2.2745361328125, 2.55731201171875, 2.840087890625, 3.12286376953125, 3.4056396484375, 3.68841552734375, 3.97119140625, 4.25396728515625, 4.5367431640625, 4.81951904296875, 5.102294921875, 5.38507080078125, 5.6678466796875, 5.95062255859375, 6.2333984375, 6.51617431640625, 6.7989501953125, 7.08172607421875, 7.364501953125, 7.64727783203125, 7.9300537109375, 8.21282958984375, 8.49560546875, 8.77838134765625, 9.0611572265625, 9.34393310546875, 9.626708984375, 9.90948486328125, 10.1922607421875, 10.47503662109375, 10.7578125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 43.0, 409.0, 498.0, 61.0, 2.0, 1.0, 2.0], "bins": [-292.6775207519531, -287.7196044921875, -282.76165771484375, -277.8037414550781, -272.8457946777344, -267.88787841796875, -262.929931640625, -257.9720153808594, -253.01406860351562, -248.05613708496094, -243.09820556640625, -238.14027404785156, -233.18234252929688, -228.2244110107422, -223.2664794921875, -218.30856323242188, -213.3506317138672, -208.3927001953125, -203.4347686767578, -198.47683715820312, -193.51890563964844, -188.56097412109375, -183.60304260253906, -178.64511108398438, -173.68719482421875, -168.72926330566406, -163.77133178710938, -158.8134002685547, -153.85546875, -148.8975372314453, -143.93960571289062, -138.981689453125, -134.02374267578125, -129.06581115722656, -124.10787963867188, -119.14994812011719, -114.1920166015625, -109.23408508300781, -104.27616119384766, -99.31822967529297, -94.36029052734375, -89.40235900878906, -84.44442749023438, -79.48649597167969, -74.528564453125, -69.57063293457031, -64.61270904541016, -59.65477752685547, -54.69684600830078, -49.738914489746094, -44.780982971191406, -39.823055267333984, -34.8651237487793, -29.90719223022461, -24.949262619018555, -19.9913330078125, -15.033403396606445, -10.075472831726074, -5.117542266845703, -0.15961170196533203, 4.798318862915039, 9.756250381469727, 14.714179992675781, 19.672109603881836, 24.630041122436523]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 7.0, 8.0, 14.0, 14.0, 20.0, 19.0, 21.0, 15.0, 27.0, 25.0, 28.0, 35.0, 39.0, 48.0, 64.0, 35.0, 35.0, 47.0, 48.0, 49.0, 46.0, 42.0, 47.0, 34.0, 31.0, 29.0, 27.0, 20.0, 31.0, 17.0, 19.0, 17.0, 16.0, 13.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.451316833496094, -28.645355224609375, -27.839391708374023, -27.033430099487305, -26.227468490600586, -25.421504974365234, -24.615543365478516, -23.809581756591797, -23.003620147705078, -22.19765853881836, -21.391695022583008, -20.58573341369629, -19.77977180480957, -18.97380828857422, -18.1678466796875, -17.36188507080078, -16.555923461914062, -15.749960899353027, -14.943999290466309, -14.138036727905273, -13.332075119018555, -12.52611255645752, -11.720149993896484, -10.914188385009766, -10.108224868774414, -9.302262306213379, -8.49630069732666, -7.690338134765625, -6.884376525878906, -6.078413963317871, -5.272451877593994, -4.466489791870117, -3.6605281829833984, -2.8545660972595215, -2.0486040115356445, -1.2426416873931885, -0.4366796016693115, 0.36928272247314453, 1.1752448081970215, 1.9812068939208984, 2.7871689796447754, 3.5931310653686523, 4.399093151092529, 5.205055236816406, 6.011017799377441, 6.816979885101318, 7.622941970825195, 8.428903579711914, 9.23486614227295, 10.040828704833984, 10.846790313720703, 11.652752876281738, 12.458714485168457, 13.264677047729492, 14.070638656616211, 14.876601219177246, 15.682563781738281, 16.488525390625, 17.29448890686035, 18.10045051574707, 18.90641212463379, 19.71237564086914, 20.51833724975586, 21.324298858642578, 22.130260467529297]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 13.0, 8.0, 6.0, 15.0, 17.0, 18.0, 21.0, 15.0, 20.0, 27.0, 31.0, 28.0, 32.0, 34.0, 40.0, 31.0, 43.0, 47.0, 48.0, 50.0, 35.0, 37.0, 43.0, 40.0, 35.0, 27.0, 44.0, 18.0, 23.0, 21.0, 21.0, 25.0, 18.0, 7.0, 14.0, 5.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.396484375, -3.292022705078125, -3.18756103515625, -3.083099365234375, -2.9786376953125, -2.874176025390625, -2.76971435546875, -2.665252685546875, -2.560791015625, -2.456329345703125, -2.35186767578125, -2.247406005859375, -2.1429443359375, -2.038482666015625, -1.93402099609375, -1.829559326171875, -1.72509765625, -1.620635986328125, -1.51617431640625, -1.411712646484375, -1.3072509765625, -1.202789306640625, -1.09832763671875, -0.993865966796875, -0.889404296875, -0.784942626953125, -0.68048095703125, -0.576019287109375, -0.4715576171875, -0.367095947265625, -0.26263427734375, -0.158172607421875, -0.0537109375, 0.050750732421875, 0.15521240234375, 0.259674072265625, 0.3641357421875, 0.468597412109375, 0.57305908203125, 0.677520751953125, 0.781982421875, 0.886444091796875, 0.99090576171875, 1.095367431640625, 1.1998291015625, 1.304290771484375, 1.40875244140625, 1.513214111328125, 1.61767578125, 1.722137451171875, 1.82659912109375, 1.931060791015625, 2.0355224609375, 2.139984130859375, 2.24444580078125, 2.348907470703125, 2.453369140625, 2.557830810546875, 2.66229248046875, 2.766754150390625, 2.8712158203125, 2.975677490234375, 3.08013916015625, 3.184600830078125, 3.2890625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 12.0, 14.0, 19.0, 27.0, 42.0, 62.0, 85.0, 116.0, 185.0, 243.0, 362.0, 591.0, 816.0, 1223.0, 1803.0, 2725.0, 4216.0, 6717.0, 10286.0, 16616.0, 26882.0, 45928.0, 81924.0, 168388.0, 337297.0, 152923.0, 76635.0, 43126.0, 25343.0, 15656.0, 9800.0, 6378.0, 3998.0, 2671.0, 1747.0, 1200.0, 812.0, 494.0, 381.0, 234.0, 177.0, 118.0, 92.0, 62.0, 37.0, 29.0, 16.0, 19.0, 12.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0198974609375, -0.019264698028564453, -0.018631935119628906, -0.01799917221069336, -0.017366409301757812, -0.016733646392822266, -0.01610088348388672, -0.015468120574951172, -0.014835357666015625, -0.014202594757080078, -0.013569831848144531, -0.012937068939208984, -0.012304306030273438, -0.01167154312133789, -0.011038780212402344, -0.010406017303466797, -0.00977325439453125, -0.009140491485595703, -0.008507728576660156, -0.00787496566772461, -0.0072422027587890625, -0.006609439849853516, -0.005976676940917969, -0.005343914031982422, -0.004711151123046875, -0.004078388214111328, -0.0034456253051757812, -0.0028128623962402344, -0.0021800994873046875, -0.0015473365783691406, -0.0009145736694335938, -0.0002818107604980469, 0.0003509521484375, 0.0009837150573730469, 0.0016164779663085938, 0.0022492408752441406, 0.0028820037841796875, 0.0035147666931152344, 0.004147529602050781, 0.004780292510986328, 0.005413055419921875, 0.006045818328857422, 0.006678581237792969, 0.007311344146728516, 0.007944107055664062, 0.00857686996459961, 0.009209632873535156, 0.009842395782470703, 0.01047515869140625, 0.011107921600341797, 0.011740684509277344, 0.01237344741821289, 0.013006210327148438, 0.013638973236083984, 0.014271736145019531, 0.014904499053955078, 0.015537261962890625, 0.016170024871826172, 0.01680278778076172, 0.017435550689697266, 0.018068313598632812, 0.01870107650756836, 0.019333839416503906, 0.019966602325439453, 0.020599365234375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 8.0, 4.0, 8.0, 8.0, 6.0, 10.0, 18.0, 22.0, 22.0, 20.0, 31.0, 30.0, 37.0, 46.0, 59.0, 46.0, 58.0, 40.0, 1076.0, 46.0, 74.0, 46.0, 50.0, 39.0, 43.0, 23.0, 27.0, 32.0, 24.0, 26.0, 12.0, 13.0, 8.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.4327392578125, -2.340087890625, -2.2474365234375, -2.15478515625, -2.0621337890625, -1.969482421875, -1.8768310546875, -1.7841796875, -1.6915283203125, -1.598876953125, -1.5062255859375, -1.41357421875, -1.3209228515625, -1.228271484375, -1.1356201171875, -1.04296875, -0.9503173828125, -0.857666015625, -0.7650146484375, -0.67236328125, -0.5797119140625, -0.487060546875, -0.3944091796875, -0.3017578125, -0.2091064453125, -0.116455078125, -0.0238037109375, 0.06884765625, 0.1614990234375, 0.254150390625, 0.3468017578125, 0.439453125, 0.5321044921875, 0.624755859375, 0.7174072265625, 0.81005859375, 0.9027099609375, 0.995361328125, 1.0880126953125, 1.1806640625, 1.2733154296875, 1.365966796875, 1.4586181640625, 1.55126953125, 1.6439208984375, 1.736572265625, 1.8292236328125, 1.921875, 2.0145263671875, 2.107177734375, 2.1998291015625, 2.29248046875, 2.3851318359375, 2.477783203125, 2.5704345703125, 2.6630859375, 2.7557373046875, 2.848388671875, 2.9410400390625, 3.03369140625, 3.1263427734375, 3.218994140625, 3.3116455078125, 3.404296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 11.0, 12.0, 26.0, 31.0, 34.0, 72.0, 131.0, 187.0, 310.0, 559.0, 966.0, 1505.0, 2819.0, 4884.0, 9078.0, 16585.0, 31771.0, 63134.0, 143129.0, 1435359.0, 214457.0, 84159.0, 40976.0, 21011.0, 11405.0, 6330.0, 3413.0, 1958.0, 1134.0, 640.0, 428.0, 254.0, 103.0, 80.0, 63.0, 46.0, 23.0, 12.0, 4.0, 11.0, 8.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.020538330078125, -0.019928693771362305, -0.01931905746459961, -0.018709421157836914, -0.01809978485107422, -0.017490148544311523, -0.016880512237548828, -0.016270875930786133, -0.015661239624023438, -0.015051603317260742, -0.014441967010498047, -0.013832330703735352, -0.013222694396972656, -0.012613058090209961, -0.012003421783447266, -0.01139378547668457, -0.010784149169921875, -0.01017451286315918, -0.009564876556396484, -0.008955240249633789, -0.008345603942871094, -0.0077359676361083984, -0.007126331329345703, -0.006516695022583008, -0.0059070587158203125, -0.005297422409057617, -0.004687786102294922, -0.0040781497955322266, -0.0034685134887695312, -0.002858877182006836, -0.0022492408752441406, -0.0016396045684814453, -0.00102996826171875, -0.0004203319549560547, 0.00018930435180664062, 0.0007989406585693359, 0.0014085769653320312, 0.0020182132720947266, 0.002627849578857422, 0.003237485885620117, 0.0038471221923828125, 0.004456758499145508, 0.005066394805908203, 0.0056760311126708984, 0.006285667419433594, 0.006895303726196289, 0.007504940032958984, 0.00811457633972168, 0.008724212646484375, 0.00933384895324707, 0.009943485260009766, 0.010553121566772461, 0.011162757873535156, 0.011772394180297852, 0.012382030487060547, 0.012991666793823242, 0.013601303100585938, 0.014210939407348633, 0.014820575714111328, 0.015430212020874023, 0.01603984832763672, 0.016649484634399414, 0.01725912094116211, 0.017868757247924805, 0.0184783935546875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 46.0, 0.0, 0.0, 0.0, 0.0, 0.0, 217.0, 0.0, 0.0, 0.0, 0.0, 404.0, 0.0, 0.0, 0.0, 0.0, 0.0, 229.0, 0.0, 0.0, 0.0, 0.0, 0.0, 74.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.473833203315735e-07, -3.371387720108032e-07, -3.2689422369003296e-07, -3.166496753692627e-07, -3.0640512704849243e-07, -2.9616057872772217e-07, -2.859160304069519e-07, -2.7567148208618164e-07, -2.654269337654114e-07, -2.551823854446411e-07, -2.4493783712387085e-07, -2.3469328880310059e-07, -2.2444874048233032e-07, -2.1420419216156006e-07, -2.039596438407898e-07, -1.9371509552001953e-07, -1.8347054719924927e-07, -1.73225998878479e-07, -1.6298145055770874e-07, -1.5273690223693848e-07, -1.424923539161682e-07, -1.3224780559539795e-07, -1.2200325727462769e-07, -1.1175870895385742e-07, -1.0151416063308716e-07, -9.12696123123169e-08, -8.102506399154663e-08, -7.078051567077637e-08, -6.05359673500061e-08, -5.029141902923584e-08, -4.0046870708465576e-08, -2.9802322387695312e-08, -1.955777406692505e-08, -9.313225746154785e-09, 9.313225746154785e-10, 1.1175870895385742e-08, 2.1420419216156006e-08, 3.166496753692627e-08, 4.190951585769653e-08, 5.21540641784668e-08, 6.239861249923706e-08, 7.264316082000732e-08, 8.288770914077759e-08, 9.313225746154785e-08, 1.0337680578231812e-07, 1.1362135410308838e-07, 1.2386590242385864e-07, 1.341104507446289e-07, 1.4435499906539917e-07, 1.5459954738616943e-07, 1.648440957069397e-07, 1.7508864402770996e-07, 1.8533319234848022e-07, 1.955777406692505e-07, 2.0582228899002075e-07, 2.1606683731079102e-07, 2.2631138563156128e-07, 2.3655593395233154e-07, 2.468004822731018e-07, 2.5704503059387207e-07, 2.6728957891464233e-07, 2.775341272354126e-07, 2.8777867555618286e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 9.0, 10.0, 1.0, 0.0, 6.0, 28.0, 34.0, 17.0, 8.0, 61.0, 21.0, 114.0, 74.0, 135.0, 289.0, 160.0, 577.0, 16222.0, 1012800.0, 16565.0, 542.0, 188.0, 223.0, 126.0, 93.0, 92.0, 39.0, 21.0, 10.0, 6.0, 14.0, 35.0, 3.0, 1.0, 3.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-06, -5.398876965045929e-06, -5.194917321205139e-06, -4.990957677364349e-06, -4.7869980335235596e-06, -4.58303838968277e-06, -4.37907874584198e-06, -4.17511910200119e-06, -3.9711594581604e-06, -3.7671998143196106e-06, -3.563240170478821e-06, -3.359280526638031e-06, -3.155320882797241e-06, -2.9513612389564514e-06, -2.7474015951156616e-06, -2.543441951274872e-06, -2.339482307434082e-06, -2.1355226635932922e-06, -1.9315630197525024e-06, -1.7276033759117126e-06, -1.5236437320709229e-06, -1.319684088230133e-06, -1.1157244443893433e-06, -9.117648005485535e-07, -7.078051567077637e-07, -5.038455128669739e-07, -2.998858690261841e-07, -9.592622518539429e-08, 1.0803341865539551e-07, 3.119930624961853e-07, 5.159527063369751e-07, 7.199123501777649e-07, 9.238719940185547e-07, 1.1278316378593445e-06, 1.3317912817001343e-06, 1.535750925540924e-06, 1.7397105693817139e-06, 1.9436702132225037e-06, 2.1476298570632935e-06, 2.3515895009040833e-06, 2.555549144744873e-06, 2.759508788585663e-06, 2.9634684324264526e-06, 3.1674280762672424e-06, 3.3713877201080322e-06, 3.575347363948822e-06, 3.779307007789612e-06, 3.983266651630402e-06, 4.187226295471191e-06, 4.391185939311981e-06, 4.595145583152771e-06, 4.799105226993561e-06, 5.003064870834351e-06, 5.20702451467514e-06, 5.41098415851593e-06, 5.61494380235672e-06, 5.81890344619751e-06, 6.0228630900382996e-06, 6.226822733879089e-06, 6.430782377719879e-06, 6.634742021560669e-06, 6.838701665401459e-06, 7.0426613092422485e-06, 7.246620953083038e-06, 7.450580596923828e-06]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 9.0, 7.0, 9.0, 15.0, 18.0, 20.0, 17.0, 21.0, 21.0, 712.0, 19.0, 12.0, 16.0, 18.0, 20.0, 18.0, 11.0, 5.0, 5.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3966374012852611e-07, -1.359658341471004e-07, -1.3226792816567468e-07, -1.2857003639510367e-07, -1.2487213041367795e-07, -1.2117422443225223e-07, -1.1747631845082651e-07, -1.1377841246940079e-07, -1.1008050648797507e-07, -1.0638260050654935e-07, -1.0268470163055099e-07, -9.898679564912527e-08, -9.528888966769955e-08, -9.159099079170119e-08, -8.789308481027547e-08, -8.419517882884975e-08, -8.049727995285139e-08, -7.679937397142567e-08, -7.31014750954273e-08, -6.940356911400158e-08, -6.570566313257586e-08, -6.200775715115014e-08, -5.830985827515178e-08, -5.461195229372606e-08, -5.091404986501402e-08, -4.721614743630198e-08, -4.351824145487626e-08, -3.982033902616422e-08, -3.612243659745218e-08, -3.242453061602646e-08, -2.8726628187314418e-08, -2.5028723982245538e-08, -2.1330819777176657e-08, -1.7632915572107777e-08, -1.3935012255217316e-08, -1.0237108938326855e-08, -6.539204733257975e-09, -2.8413005281890946e-09, 8.566019005229464e-10, 4.554506105591827e-09, 8.252410310660707e-09, 1.1950314515729588e-08, 1.5648218720798468e-08, 1.934612114951051e-08, 2.304402535457939e-08, 2.674192955964827e-08, 3.043983198836031e-08, 3.413773441707235e-08, 3.783564039849807e-08, 4.153354282721011e-08, 4.523144880863583e-08, 4.8929351237347873e-08, 5.262725721877359e-08, 5.6325159647485634e-08, 6.002306207619768e-08, 6.37209680576234e-08, 6.741886693362176e-08, 7.111677291504748e-08, 7.481467179104584e-08, 7.851257777247156e-08, 8.221048375389728e-08, 8.590838262989564e-08, 8.960628861132136e-08, 9.330419459274708e-08, 9.70021005741728e-08]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 160.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 701.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 140.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 13.0, 8.0, 6.0, 15.0, 17.0, 18.0, 21.0, 15.0, 20.0, 27.0, 31.0, 28.0, 32.0, 34.0, 40.0, 31.0, 43.0, 47.0, 48.0, 50.0, 35.0, 37.0, 43.0, 40.0, 35.0, 27.0, 44.0, 18.0, 23.0, 21.0, 21.0, 25.0, 18.0, 7.0, 14.0, 5.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.396484375, -3.292022705078125, -3.18756103515625, -3.083099365234375, -2.9786376953125, -2.874176025390625, -2.76971435546875, -2.665252685546875, -2.560791015625, -2.456329345703125, -2.35186767578125, -2.247406005859375, -2.1429443359375, -2.038482666015625, -1.93402099609375, -1.829559326171875, -1.72509765625, -1.620635986328125, -1.51617431640625, -1.411712646484375, -1.3072509765625, -1.202789306640625, -1.09832763671875, -0.993865966796875, -0.889404296875, -0.784942626953125, -0.68048095703125, -0.576019287109375, -0.4715576171875, -0.367095947265625, -0.26263427734375, -0.158172607421875, -0.0537109375, 0.050750732421875, 0.15521240234375, 0.259674072265625, 0.3641357421875, 0.468597412109375, 0.57305908203125, 0.677520751953125, 0.781982421875, 0.886444091796875, 0.99090576171875, 1.095367431640625, 1.1998291015625, 1.304290771484375, 1.40875244140625, 1.513214111328125, 1.61767578125, 1.722137451171875, 1.82659912109375, 1.931060791015625, 2.0355224609375, 2.139984130859375, 2.24444580078125, 2.348907470703125, 2.453369140625, 2.557830810546875, 2.66229248046875, 2.766754150390625, 2.8712158203125, 2.975677490234375, 3.08013916015625, 3.184600830078125, 3.2890625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 11.0, 12.0, 20.0, 31.0, 29.0, 58.0, 73.0, 103.0, 148.0, 212.0, 312.0, 432.0, 678.0, 1140.0, 1780.0, 3288.0, 7013.0, 17314.0, 52078.0, 207796.0, 538560.0, 149254.0, 40761.0, 14192.0, 5894.0, 2844.0, 1595.0, 944.0, 588.0, 423.0, 265.0, 226.0, 137.0, 85.0, 77.0, 43.0, 31.0, 35.0, 14.0, 12.0, 7.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.96875, -5.77862548828125, -5.5885009765625, -5.39837646484375, -5.208251953125, -5.01812744140625, -4.8280029296875, -4.63787841796875, -4.44775390625, -4.25762939453125, -4.0675048828125, -3.87738037109375, -3.687255859375, -3.49713134765625, -3.3070068359375, -3.11688232421875, -2.9267578125, -2.73663330078125, -2.5465087890625, -2.35638427734375, -2.166259765625, -1.97613525390625, -1.7860107421875, -1.59588623046875, -1.40576171875, -1.21563720703125, -1.0255126953125, -0.83538818359375, -0.645263671875, -0.45513916015625, -0.2650146484375, -0.07489013671875, 0.115234375, 0.30535888671875, 0.4954833984375, 0.68560791015625, 0.875732421875, 1.06585693359375, 1.2559814453125, 1.44610595703125, 1.63623046875, 1.82635498046875, 2.0164794921875, 2.20660400390625, 2.396728515625, 2.58685302734375, 2.7769775390625, 2.96710205078125, 3.1572265625, 3.34735107421875, 3.5374755859375, 3.72760009765625, 3.917724609375, 4.10784912109375, 4.2979736328125, 4.48809814453125, 4.67822265625, 4.86834716796875, 5.0584716796875, 5.24859619140625, 5.438720703125, 5.62884521484375, 5.8189697265625, 6.00909423828125, 6.19921875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 11.0, 5.0, 3.0, 10.0, 15.0, 11.0, 11.0, 16.0, 23.0, 33.0, 46.0, 32.0, 41.0, 52.0, 58.0, 100.0, 246.0, 1563.0, 269.0, 141.0, 58.0, 50.0, 45.0, 23.0, 32.0, 31.0, 34.0, 19.0, 17.0, 14.0, 14.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3984375, -11.0867919921875, -10.775146484375, -10.4635009765625, -10.15185546875, -9.8402099609375, -9.528564453125, -9.2169189453125, -8.9052734375, -8.5936279296875, -8.281982421875, -7.9703369140625, -7.65869140625, -7.3470458984375, -7.035400390625, -6.7237548828125, -6.412109375, -6.1004638671875, -5.788818359375, -5.4771728515625, -5.16552734375, -4.8538818359375, -4.542236328125, -4.2305908203125, -3.9189453125, -3.6072998046875, -3.295654296875, -2.9840087890625, -2.67236328125, -2.3607177734375, -2.049072265625, -1.7374267578125, -1.42578125, -1.1141357421875, -0.802490234375, -0.4908447265625, -0.17919921875, 0.1324462890625, 0.444091796875, 0.7557373046875, 1.0673828125, 1.3790283203125, 1.690673828125, 2.0023193359375, 2.31396484375, 2.6256103515625, 2.937255859375, 3.2489013671875, 3.560546875, 3.8721923828125, 4.183837890625, 4.4954833984375, 4.80712890625, 5.1187744140625, 5.430419921875, 5.7420654296875, 6.0537109375, 6.3653564453125, 6.677001953125, 6.9886474609375, 7.30029296875, 7.6119384765625, 7.923583984375, 8.2352294921875, 8.546875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 10.0, 5.0, 4.0, 16.0, 12.0, 13.0, 25.0, 38.0, 40.0, 59.0, 78.0, 120.0, 165.0, 304.0, 508.0, 971.0, 5699.0, 2750349.0, 381818.0, 3302.0, 864.0, 441.0, 231.0, 179.0, 103.0, 86.0, 49.0, 57.0, 30.0, 23.0, 18.0, 19.0, 10.0, 9.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.71875, -19.059326171875, -18.39990234375, -17.740478515625, -17.0810546875, -16.421630859375, -15.76220703125, -15.102783203125, -14.443359375, -13.783935546875, -13.12451171875, -12.465087890625, -11.8056640625, -11.146240234375, -10.48681640625, -9.827392578125, -9.16796875, -8.508544921875, -7.84912109375, -7.189697265625, -6.5302734375, -5.870849609375, -5.21142578125, -4.552001953125, -3.892578125, -3.233154296875, -2.57373046875, -1.914306640625, -1.2548828125, -0.595458984375, 0.06396484375, 0.723388671875, 1.3828125, 2.042236328125, 2.70166015625, 3.361083984375, 4.0205078125, 4.679931640625, 5.33935546875, 5.998779296875, 6.658203125, 7.317626953125, 7.97705078125, 8.636474609375, 9.2958984375, 9.955322265625, 10.61474609375, 11.274169921875, 11.93359375, 12.593017578125, 13.25244140625, 13.911865234375, 14.5712890625, 15.230712890625, 15.89013671875, 16.549560546875, 17.208984375, 17.868408203125, 18.52783203125, 19.187255859375, 19.8466796875, 20.506103515625, 21.16552734375, 21.824951171875, 22.484375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 9.0, 145.0, 646.0, 201.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.77757263183594, -66.21517944335938, -62.652793884277344, -59.09040069580078, -55.528011322021484, -51.96562194824219, -48.403228759765625, -44.84083938598633, -41.27845001220703, -37.716060638427734, -34.15367126464844, -30.591278076171875, -27.028888702392578, -23.46649932861328, -19.90410804748535, -16.341716766357422, -12.779327392578125, -9.216937065124512, -5.654546737670898, -2.092156410217285, 1.4702339172363281, 5.032623291015625, 8.595014572143555, 12.157405853271484, 15.719795227050781, 19.282184600830078, 22.844575881958008, 26.406967163085938, 29.969356536865234, 33.53174591064453, 37.094139099121094, 40.65652847290039, 44.21891784667969, 47.781307220458984, 51.34369659423828, 54.906089782714844, 58.46847915649414, 62.03086853027344, 65.59326171875, 69.15565490722656, 72.7180404663086, 76.28043365478516, 79.84281921386719, 83.40521240234375, 86.96760559082031, 90.52999114990234, 94.0923843383789, 97.65476989746094, 101.2171630859375, 104.77955627441406, 108.3419418334961, 111.90433502197266, 115.46672058105469, 119.02911376953125, 122.59150695800781, 126.15390014648438, 129.71627807617188, 133.27867126464844, 136.841064453125, 140.4034423828125, 143.96583557128906, 147.52822875976562, 151.0906219482422, 154.65301513671875, 158.2154083251953]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 10.0, 7.0, 9.0, 17.0, 18.0, 22.0, 23.0, 28.0, 26.0, 25.0, 36.0, 28.0, 26.0, 43.0, 30.0, 39.0, 37.0, 44.0, 39.0, 45.0, 53.0, 36.0, 29.0, 31.0, 41.0, 25.0, 28.0, 31.0, 25.0, 24.0, 20.0, 18.0, 19.0, 8.0, 12.0, 11.0, 7.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.22344970703125, -20.473140716552734, -19.72283172607422, -18.972524642944336, -18.22221565246582, -17.471906661987305, -16.721599578857422, -15.971290588378906, -15.22098159790039, -14.470672607421875, -13.720364570617676, -12.970056533813477, -12.219747543334961, -11.469438552856445, -10.719130516052246, -9.968822479248047, -9.218513488769531, -8.468204498291016, -7.717896461486816, -6.967587947845459, -6.217279434204102, -5.466970920562744, -4.716662406921387, -3.9663538932800293, -3.216045379638672, -2.4657368659973145, -1.715428352355957, -0.9651198387145996, -0.2148113250732422, 0.5354971885681152, 1.2858057022094727, 2.03611421585083, 2.7864227294921875, 3.536731243133545, 4.287039756774902, 5.03734827041626, 5.787656784057617, 6.537965297698975, 7.288273811340332, 8.038581848144531, 8.788890838623047, 9.539199829101562, 10.289507865905762, 11.039815902709961, 11.790124893188477, 12.540433883666992, 13.290741920471191, 14.04104995727539, 14.791358947753906, 15.541667938232422, 16.291976928710938, 17.04228401184082, 17.792593002319336, 18.54290199279785, 19.293209075927734, 20.04351806640625, 20.793827056884766, 21.54413604736328, 22.294445037841797, 23.04475212097168, 23.795061111450195, 24.54537010192871, 25.295677185058594, 26.04598617553711, 26.796295166015625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 5.0, 11.0, 14.0, 12.0, 8.0, 17.0, 16.0, 18.0, 27.0, 21.0, 30.0, 28.0, 25.0, 33.0, 38.0, 48.0, 42.0, 39.0, 37.0, 46.0, 47.0, 51.0, 38.0, 39.0, 31.0, 35.0, 30.0, 35.0, 24.0, 19.0, 24.0, 21.0, 16.0, 9.0, 22.0, 10.0, 7.0, 9.0, 2.0, 3.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.556640625, -3.446624755859375, -3.33660888671875, -3.226593017578125, -3.1165771484375, -3.006561279296875, -2.89654541015625, -2.786529541015625, -2.676513671875, -2.566497802734375, -2.45648193359375, -2.346466064453125, -2.2364501953125, -2.126434326171875, -2.01641845703125, -1.906402587890625, -1.79638671875, -1.686370849609375, -1.57635498046875, -1.466339111328125, -1.3563232421875, -1.246307373046875, -1.13629150390625, -1.026275634765625, -0.916259765625, -0.806243896484375, -0.69622802734375, -0.586212158203125, -0.4761962890625, -0.366180419921875, -0.25616455078125, -0.146148681640625, -0.0361328125, 0.073883056640625, 0.18389892578125, 0.293914794921875, 0.4039306640625, 0.513946533203125, 0.62396240234375, 0.733978271484375, 0.843994140625, 0.954010009765625, 1.06402587890625, 1.174041748046875, 1.2840576171875, 1.394073486328125, 1.50408935546875, 1.614105224609375, 1.72412109375, 1.834136962890625, 1.94415283203125, 2.054168701171875, 2.1641845703125, 2.274200439453125, 2.38421630859375, 2.494232177734375, 2.604248046875, 2.714263916015625, 2.82427978515625, 2.934295654296875, 3.0443115234375, 3.154327392578125, 3.26434326171875, 3.374359130859375, 3.484375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 12.0, 19.0, 8.0, 30.0, 43.0, 50.0, 63.0, 102.0, 155.0, 204.0, 279.0, 434.0, 602.0, 1015.0, 1408.0, 2341.0, 3624.0, 6061.0, 10235.0, 20663.0, 62738.0, 324182.0, 1309965.0, 1762358.0, 527646.0, 101484.0, 26915.0, 12470.0, 6968.0, 4256.0, 2694.0, 1699.0, 1138.0, 776.0, 537.0, 334.0, 236.0, 154.0, 113.0, 81.0, 69.0, 39.0, 20.0, 17.0, 11.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-5.01953125, -4.87255859375, -4.7255859375, -4.57861328125, -4.431640625, -4.28466796875, -4.1376953125, -3.99072265625, -3.84375, -3.69677734375, -3.5498046875, -3.40283203125, -3.255859375, -3.10888671875, -2.9619140625, -2.81494140625, -2.66796875, -2.52099609375, -2.3740234375, -2.22705078125, -2.080078125, -1.93310546875, -1.7861328125, -1.63916015625, -1.4921875, -1.34521484375, -1.1982421875, -1.05126953125, -0.904296875, -0.75732421875, -0.6103515625, -0.46337890625, -0.31640625, -0.16943359375, -0.0224609375, 0.12451171875, 0.271484375, 0.41845703125, 0.5654296875, 0.71240234375, 0.859375, 1.00634765625, 1.1533203125, 1.30029296875, 1.447265625, 1.59423828125, 1.7412109375, 1.88818359375, 2.03515625, 2.18212890625, 2.3291015625, 2.47607421875, 2.623046875, 2.77001953125, 2.9169921875, 3.06396484375, 3.2109375, 3.35791015625, 3.5048828125, 3.65185546875, 3.798828125, 3.94580078125, 4.0927734375, 4.23974609375, 4.38671875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 2.0, 6.0, 7.0, 10.0, 21.0, 13.0, 26.0, 44.0, 54.0, 84.0, 90.0, 140.0, 170.0, 200.0, 290.0, 386.0, 436.0, 467.0, 382.0, 303.0, 210.0, 167.0, 133.0, 112.0, 69.0, 59.0, 51.0, 47.0, 27.0, 18.0, 12.0, 4.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.1754150390625, -4.026611328125, -3.8778076171875, -3.72900390625, -3.5802001953125, -3.431396484375, -3.2825927734375, -3.1337890625, -2.9849853515625, -2.836181640625, -2.6873779296875, -2.53857421875, -2.3897705078125, -2.240966796875, -2.0921630859375, -1.943359375, -1.7945556640625, -1.645751953125, -1.4969482421875, -1.34814453125, -1.1993408203125, -1.050537109375, -0.9017333984375, -0.7529296875, -0.6041259765625, -0.455322265625, -0.3065185546875, -0.15771484375, -0.0089111328125, 0.139892578125, 0.2886962890625, 0.4375, 0.5863037109375, 0.735107421875, 0.8839111328125, 1.03271484375, 1.1815185546875, 1.330322265625, 1.4791259765625, 1.6279296875, 1.7767333984375, 1.925537109375, 2.0743408203125, 2.22314453125, 2.3719482421875, 2.520751953125, 2.6695556640625, 2.818359375, 2.9671630859375, 3.115966796875, 3.2647705078125, 3.41357421875, 3.5623779296875, 3.711181640625, 3.8599853515625, 4.0087890625, 4.1575927734375, 4.306396484375, 4.4552001953125, 4.60400390625, 4.7528076171875, 4.901611328125, 5.0504150390625, 5.19921875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 3.0, 11.0, 8.0, 20.0, 19.0, 25.0, 51.0, 69.0, 94.0, 135.0, 227.0, 338.0, 576.0, 1358.0, 3852.0, 17046.0, 196039.0, 3015026.0, 896771.0, 51004.0, 7327.0, 2136.0, 866.0, 462.0, 271.0, 175.0, 109.0, 60.0, 44.0, 51.0, 25.0, 17.0, 17.0, 6.0, 11.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.5, -9.22662353515625, -8.9532470703125, -8.67987060546875, -8.406494140625, -8.13311767578125, -7.8597412109375, -7.58636474609375, -7.31298828125, -7.03961181640625, -6.7662353515625, -6.49285888671875, -6.219482421875, -5.94610595703125, -5.6727294921875, -5.39935302734375, -5.1259765625, -4.85260009765625, -4.5792236328125, -4.30584716796875, -4.032470703125, -3.75909423828125, -3.4857177734375, -3.21234130859375, -2.93896484375, -2.66558837890625, -2.3922119140625, -2.11883544921875, -1.845458984375, -1.57208251953125, -1.2987060546875, -1.02532958984375, -0.751953125, -0.47857666015625, -0.2052001953125, 0.06817626953125, 0.341552734375, 0.61492919921875, 0.8883056640625, 1.16168212890625, 1.43505859375, 1.70843505859375, 1.9818115234375, 2.25518798828125, 2.528564453125, 2.80194091796875, 3.0753173828125, 3.34869384765625, 3.6220703125, 3.89544677734375, 4.1688232421875, 4.44219970703125, 4.715576171875, 4.98895263671875, 5.2623291015625, 5.53570556640625, 5.80908203125, 6.08245849609375, 6.3558349609375, 6.62921142578125, 6.902587890625, 7.17596435546875, 7.4493408203125, 7.72271728515625, 7.99609375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 14.0, 39.0, 89.0, 209.0, 240.0, 221.0, 114.0, 47.0, 27.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.41825103759766, -66.94837188720703, -65.47850036621094, -64.00862121582031, -62.53874588012695, -61.068870544433594, -59.59899139404297, -58.12911605834961, -56.65924072265625, -55.18936538696289, -53.71949005126953, -52.249610900878906, -50.77973556518555, -49.30986022949219, -47.83998107910156, -46.3701057434082, -44.900230407714844, -43.430355072021484, -41.960479736328125, -40.4906005859375, -39.02072525024414, -37.55084991455078, -36.080970764160156, -34.6110954284668, -33.14122009277344, -31.671344757080078, -30.201467514038086, -28.731590270996094, -27.261714935302734, -25.791839599609375, -24.321962356567383, -22.85208511352539, -21.382213592529297, -19.912338256835938, -18.442461013793945, -16.972583770751953, -15.502708435058594, -14.032832145690918, -12.562955856323242, -11.093079566955566, -9.62320327758789, -8.153326988220215, -6.683450698852539, -5.213574409484863, -3.7436981201171875, -2.2738218307495117, -0.8039455413818359, 0.6659307479858398, 2.1358070373535156, 3.6056833267211914, 5.075559616088867, 6.545435905456543, 8.015312194824219, 9.485188484191895, 10.95506477355957, 12.424941062927246, 13.894817352294922, 15.364693641662598, 16.834569931030273, 18.304447174072266, 19.774322509765625, 21.244197845458984, 22.714075088500977, 24.18395233154297, 25.653827667236328]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 8.0, 4.0, 6.0, 18.0, 14.0, 19.0, 36.0, 25.0, 27.0, 28.0, 30.0, 48.0, 34.0, 39.0, 30.0, 50.0, 45.0, 42.0, 42.0, 39.0, 42.0, 35.0, 39.0, 39.0, 32.0, 30.0, 27.0, 27.0, 23.0, 21.0, 17.0, 17.0, 18.0, 4.0, 7.0, 8.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.364112854003906, -18.760364532470703, -18.156618118286133, -17.55286979675293, -16.94912338256836, -16.345375061035156, -15.74162769317627, -15.137880325317383, -14.53413200378418, -13.930384635925293, -13.326637268066406, -12.722888946533203, -12.119141578674316, -11.51539421081543, -10.911646842956543, -10.307899475097656, -9.70415210723877, -9.100404739379883, -8.496657371520996, -7.892909526824951, -7.289161682128906, -6.6854143142700195, -6.081666946411133, -5.477919101715088, -4.874171733856201, -4.2704243659973145, -3.6666765213012695, -3.062929153442383, -2.459181547164917, -1.8554339408874512, -1.2516865730285645, -0.6479387283325195, -0.04419136047363281, 0.5595561861991882, 1.1633037328720093, 1.7670512199401855, 2.3707988262176514, 2.974546432495117, 3.578293800354004, 4.182041645050049, 4.7857890129089355, 5.389536380767822, 5.993284225463867, 6.597031593322754, 7.200778961181641, 7.8045268058776855, 8.408273696899414, 9.012022018432617, 9.615769386291504, 10.21951675415039, 10.823264122009277, 11.427011489868164, 12.030759811401367, 12.634507179260254, 13.23825454711914, 13.842002868652344, 14.445749282836914, 15.0494966506958, 15.653244018554688, 16.25699234008789, 16.86073875427246, 17.464487075805664, 18.068233489990234, 18.671981811523438, 19.27573013305664]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 2.0, 12.0, 9.0, 17.0, 19.0, 11.0, 22.0, 23.0, 16.0, 28.0, 28.0, 32.0, 28.0, 37.0, 42.0, 29.0, 40.0, 36.0, 52.0, 36.0, 32.0, 45.0, 38.0, 34.0, 29.0, 39.0, 35.0, 20.0, 22.0, 27.0, 19.0, 24.0, 17.0, 19.0, 11.0, 17.0, 8.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0], "bins": [-3.029296875, -2.941070556640625, -2.85284423828125, -2.764617919921875, -2.6763916015625, -2.588165283203125, -2.49993896484375, -2.411712646484375, -2.323486328125, -2.235260009765625, -2.14703369140625, -2.058807373046875, -1.9705810546875, -1.882354736328125, -1.79412841796875, -1.705902099609375, -1.61767578125, -1.529449462890625, -1.44122314453125, -1.352996826171875, -1.2647705078125, -1.176544189453125, -1.08831787109375, -1.000091552734375, -0.911865234375, -0.823638916015625, -0.73541259765625, -0.647186279296875, -0.5589599609375, -0.470733642578125, -0.38250732421875, -0.294281005859375, -0.2060546875, -0.117828369140625, -0.02960205078125, 0.058624267578125, 0.1468505859375, 0.235076904296875, 0.32330322265625, 0.411529541015625, 0.499755859375, 0.587982177734375, 0.67620849609375, 0.764434814453125, 0.8526611328125, 0.940887451171875, 1.02911376953125, 1.117340087890625, 1.20556640625, 1.293792724609375, 1.38201904296875, 1.470245361328125, 1.5584716796875, 1.646697998046875, 1.73492431640625, 1.823150634765625, 1.911376953125, 1.999603271484375, 2.08782958984375, 2.176055908203125, 2.2642822265625, 2.352508544921875, 2.44073486328125, 2.528961181640625, 2.6171875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 9.0, 11.0, 13.0, 19.0, 33.0, 33.0, 52.0, 80.0, 119.0, 162.0, 226.0, 308.0, 429.0, 642.0, 892.0, 1370.0, 2018.0, 2982.0, 4198.0, 6332.0, 9563.0, 14720.0, 22831.0, 36483.0, 61853.0, 112841.0, 268656.0, 241313.0, 104588.0, 57631.0, 34511.0, 21469.0, 14150.0, 9182.0, 5935.0, 4000.0, 2704.0, 2002.0, 1246.0, 885.0, 580.0, 477.0, 266.0, 213.0, 159.0, 113.0, 82.0, 57.0, 40.0, 31.0, 23.0, 11.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0175933837890625, -0.017024755477905273, -0.016456127166748047, -0.01588749885559082, -0.015318870544433594, -0.014750242233276367, -0.01418161392211914, -0.013612985610961914, -0.013044357299804688, -0.012475728988647461, -0.011907100677490234, -0.011338472366333008, -0.010769844055175781, -0.010201215744018555, -0.009632587432861328, -0.009063959121704102, -0.008495330810546875, -0.007926702499389648, -0.007358074188232422, -0.006789445877075195, -0.006220817565917969, -0.005652189254760742, -0.005083560943603516, -0.004514932632446289, -0.0039463043212890625, -0.003377676010131836, -0.0028090476989746094, -0.002240419387817383, -0.0016717910766601562, -0.0011031627655029297, -0.0005345344543457031, 3.409385681152344e-05, 0.00060272216796875, 0.0011713504791259766, 0.0017399787902832031, 0.0023086071014404297, 0.0028772354125976562, 0.003445863723754883, 0.004014492034912109, 0.004583120346069336, 0.0051517486572265625, 0.005720376968383789, 0.006289005279541016, 0.006857633590698242, 0.007426261901855469, 0.007994890213012695, 0.008563518524169922, 0.009132146835327148, 0.009700775146484375, 0.010269403457641602, 0.010838031768798828, 0.011406660079956055, 0.011975288391113281, 0.012543916702270508, 0.013112545013427734, 0.013681173324584961, 0.014249801635742188, 0.014818429946899414, 0.01538705825805664, 0.015955686569213867, 0.016524314880371094, 0.01709294319152832, 0.017661571502685547, 0.018230199813842773, 0.018798828125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 5.0, 13.0, 8.0, 14.0, 15.0, 16.0, 15.0, 39.0, 35.0, 24.0, 29.0, 33.0, 25.0, 37.0, 40.0, 47.0, 36.0, 40.0, 1063.0, 46.0, 32.0, 39.0, 38.0, 39.0, 30.0, 29.0, 33.0, 29.0, 25.0, 20.0, 23.0, 22.0, 17.0, 7.0, 15.0, 9.0, 10.0, 6.0, 4.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.12890625, -2.06378173828125, -1.9986572265625, -1.93353271484375, -1.868408203125, -1.80328369140625, -1.7381591796875, -1.67303466796875, -1.60791015625, -1.54278564453125, -1.4776611328125, -1.41253662109375, -1.347412109375, -1.28228759765625, -1.2171630859375, -1.15203857421875, -1.0869140625, -1.02178955078125, -0.9566650390625, -0.89154052734375, -0.826416015625, -0.76129150390625, -0.6961669921875, -0.63104248046875, -0.56591796875, -0.50079345703125, -0.4356689453125, -0.37054443359375, -0.305419921875, -0.24029541015625, -0.1751708984375, -0.11004638671875, -0.044921875, 0.02020263671875, 0.0853271484375, 0.15045166015625, 0.215576171875, 0.28070068359375, 0.3458251953125, 0.41094970703125, 0.47607421875, 0.54119873046875, 0.6063232421875, 0.67144775390625, 0.736572265625, 0.80169677734375, 0.8668212890625, 0.93194580078125, 0.9970703125, 1.06219482421875, 1.1273193359375, 1.19244384765625, 1.257568359375, 1.32269287109375, 1.3878173828125, 1.45294189453125, 1.51806640625, 1.58319091796875, 1.6483154296875, 1.71343994140625, 1.778564453125, 1.84368896484375, 1.9088134765625, 1.97393798828125, 2.0390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 9.0, 11.0, 18.0, 32.0, 36.0, 53.0, 71.0, 132.0, 161.0, 261.0, 370.0, 599.0, 872.0, 1283.0, 2029.0, 3183.0, 4787.0, 7816.0, 11923.0, 19465.0, 31159.0, 50667.0, 84919.0, 171766.0, 1351274.0, 150326.0, 78786.0, 46948.0, 28839.0, 17881.0, 11363.0, 7018.0, 4582.0, 2882.0, 1858.0, 1284.0, 785.0, 534.0, 384.0, 234.0, 156.0, 101.0, 92.0, 63.0, 39.0, 30.0, 22.0, 11.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.012054443359375, -0.011670827865600586, -0.011287212371826172, -0.010903596878051758, -0.010519981384277344, -0.01013636589050293, -0.009752750396728516, -0.009369134902954102, -0.008985519409179688, -0.008601903915405273, -0.00821828842163086, -0.007834672927856445, -0.007451057434082031, -0.007067441940307617, -0.006683826446533203, -0.006300210952758789, -0.005916595458984375, -0.005532979965209961, -0.005149364471435547, -0.004765748977661133, -0.004382133483886719, -0.003998517990112305, -0.0036149024963378906, -0.0032312870025634766, -0.0028476715087890625, -0.0024640560150146484, -0.0020804405212402344, -0.0016968250274658203, -0.0013132095336914062, -0.0009295940399169922, -0.0005459785461425781, -0.00016236305236816406, 0.00022125244140625, 0.0006048679351806641, 0.0009884834289550781, 0.0013720989227294922, 0.0017557144165039062, 0.0021393299102783203, 0.0025229454040527344, 0.0029065608978271484, 0.0032901763916015625, 0.0036737918853759766, 0.004057407379150391, 0.004441022872924805, 0.004824638366699219, 0.005208253860473633, 0.005591869354248047, 0.005975484848022461, 0.006359100341796875, 0.006742715835571289, 0.007126331329345703, 0.007509946823120117, 0.007893562316894531, 0.008277177810668945, 0.00866079330444336, 0.009044408798217773, 0.009428024291992188, 0.009811639785766602, 0.010195255279541016, 0.01057887077331543, 0.010962486267089844, 0.011346101760864258, 0.011729717254638672, 0.012113332748413086, 0.0124969482421875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 44.0, 0.0, 0.0, 0.0, 0.0, 0.0, 166.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 528.0, 0.0, 0.0, 0.0, 0.0, 0.0, 178.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.980232238769531e-07, -2.8870999813079834e-07, -2.7939677238464355e-07, -2.7008354663848877e-07, -2.60770320892334e-07, -2.514570951461792e-07, -2.421438694000244e-07, -2.3283064365386963e-07, -2.2351741790771484e-07, -2.1420419216156006e-07, -2.0489096641540527e-07, -1.955777406692505e-07, -1.862645149230957e-07, -1.7695128917694092e-07, -1.6763806343078613e-07, -1.5832483768463135e-07, -1.4901161193847656e-07, -1.3969838619232178e-07, -1.30385160446167e-07, -1.210719347000122e-07, -1.1175870895385742e-07, -1.0244548320770264e-07, -9.313225746154785e-08, -8.381903171539307e-08, -7.450580596923828e-08, -6.51925802230835e-08, -5.587935447692871e-08, -4.6566128730773926e-08, -3.725290298461914e-08, -2.7939677238464355e-08, -1.862645149230957e-08, -9.313225746154785e-09, 0.0, 9.313225746154785e-09, 1.862645149230957e-08, 2.7939677238464355e-08, 3.725290298461914e-08, 4.6566128730773926e-08, 5.587935447692871e-08, 6.51925802230835e-08, 7.450580596923828e-08, 8.381903171539307e-08, 9.313225746154785e-08, 1.0244548320770264e-07, 1.1175870895385742e-07, 1.210719347000122e-07, 1.30385160446167e-07, 1.3969838619232178e-07, 1.4901161193847656e-07, 1.5832483768463135e-07, 1.6763806343078613e-07, 1.7695128917694092e-07, 1.862645149230957e-07, 1.955777406692505e-07, 2.0489096641540527e-07, 2.1420419216156006e-07, 2.2351741790771484e-07, 2.3283064365386963e-07, 2.421438694000244e-07, 2.514570951461792e-07, 2.60770320892334e-07, 2.7008354663848877e-07, 2.7939677238464355e-07, 2.8870999813079834e-07, 2.980232238769531e-07]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 4.0, 9.0, 6.0, 6.0, 22.0, 29.0, 40.0, 19.0, 7.0, 40.0, 92.0, 201.0, 182.0, 47.0, 411.0, 640.0, 123459.0, 920055.0, 2043.0, 446.0, 107.0, 90.0, 240.0, 114.0, 58.0, 7.0, 13.0, 36.0, 20.0, 18.0, 15.0, 7.0, 8.0, 8.0, 4.0, 7.0, 9.0, 5.0, 6.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7220458984375e-06, -5.544163286685944e-06, -5.366280674934387e-06, -5.188398063182831e-06, -5.010515451431274e-06, -4.832632839679718e-06, -4.654750227928162e-06, -4.476867616176605e-06, -4.298985004425049e-06, -4.1211023926734924e-06, -3.943219780921936e-06, -3.7653371691703796e-06, -3.5874545574188232e-06, -3.409571945667267e-06, -3.2316893339157104e-06, -3.053806722164154e-06, -2.8759241104125977e-06, -2.6980414986610413e-06, -2.520158886909485e-06, -2.3422762751579285e-06, -2.164393663406372e-06, -1.9865110516548157e-06, -1.8086284399032593e-06, -1.6307458281517029e-06, -1.4528632164001465e-06, -1.27498060464859e-06, -1.0970979928970337e-06, -9.192153811454773e-07, -7.413327693939209e-07, -5.634501576423645e-07, -3.855675458908081e-07, -2.076849341392517e-07, -2.9802322387695312e-08, 1.4808028936386108e-07, 3.259629011154175e-07, 5.038455128669739e-07, 6.817281246185303e-07, 8.596107363700867e-07, 1.037493348121643e-06, 1.2153759598731995e-06, 1.3932585716247559e-06, 1.5711411833763123e-06, 1.7490237951278687e-06, 1.926906406879425e-06, 2.1047890186309814e-06, 2.282671630382538e-06, 2.4605542421340942e-06, 2.6384368538856506e-06, 2.816319465637207e-06, 2.9942020773887634e-06, 3.17208468914032e-06, 3.3499673008918762e-06, 3.5278499126434326e-06, 3.705732524394989e-06, 3.883615136146545e-06, 4.061497747898102e-06, 4.239380359649658e-06, 4.417262971401215e-06, 4.595145583152771e-06, 4.773028194904327e-06, 4.950910806655884e-06, 5.12879341840744e-06, 5.306676030158997e-06, 5.484558641910553e-06, 5.662441253662109e-06]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 9.0, 6.0, 7.0, 4.0, 4.0, 9.0, 5.0, 864.0, 7.0, 7.0, 9.0, 10.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.1453262516170071e-07, -1.1141437994410808e-07, -1.0829613472651545e-07, -1.0517788950892282e-07, -1.0205964429133019e-07, -9.894139907373756e-08, -9.582315385614493e-08, -9.27049086385523e-08, -8.958666342095967e-08, -8.646841820336704e-08, -8.335017298577441e-08, -8.023192776818178e-08, -7.711368255058915e-08, -7.399543733299652e-08, -7.087719211540389e-08, -6.775894689781126e-08, -6.464070878564598e-08, -6.152246356805335e-08, -5.8404218350460724e-08, -5.5285973132868094e-08, -5.2167727915275464e-08, -4.9049482697682834e-08, -4.593124103280388e-08, -4.281299581521125e-08, -3.969475059761862e-08, -3.657650538002599e-08, -3.345826016243336e-08, -3.034001849755441e-08, -2.722177150360494e-08, -2.410352628601231e-08, -2.098528284477652e-08, -1.786703762718389e-08, -1.4748785304163903e-08, -1.1630540086571273e-08, -8.512295757157062e-09, -5.394051427742852e-09, -2.275806210150222e-09, 8.424390074424082e-10, 3.960682448678199e-09, 7.078927666270829e-09, 1.0197172883863459e-08, 1.3315418101456089e-08, 1.643366331904872e-08, 1.955190676028451e-08, 2.267015197787714e-08, 2.578839719546977e-08, 2.890664063670556e-08, 3.202488585429819e-08, 3.514313107189082e-08, 3.826137628948345e-08, 4.137962150707608e-08, 4.449786672466871e-08, 4.761611194226134e-08, 5.073435715985397e-08, 5.385259882473292e-08, 5.697084404232555e-08, 6.008909281263186e-08, 6.320733803022449e-08, 6.632558324781712e-08, 6.944382846540975e-08, 7.256207368300238e-08, 7.568031890059501e-08, 7.879856411818764e-08, 8.191680933578027e-08, 8.503504744794554e-08]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 78.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 861.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 81.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 2.0, 12.0, 9.0, 17.0, 19.0, 11.0, 22.0, 23.0, 16.0, 28.0, 28.0, 32.0, 28.0, 37.0, 42.0, 29.0, 40.0, 36.0, 52.0, 36.0, 32.0, 45.0, 38.0, 34.0, 29.0, 39.0, 35.0, 20.0, 22.0, 27.0, 19.0, 24.0, 17.0, 19.0, 11.0, 17.0, 8.0, 8.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0], "bins": [-3.029296875, -2.941070556640625, -2.85284423828125, -2.764617919921875, -2.6763916015625, -2.588165283203125, -2.49993896484375, -2.411712646484375, -2.323486328125, -2.235260009765625, -2.14703369140625, -2.058807373046875, -1.9705810546875, -1.882354736328125, -1.79412841796875, -1.705902099609375, -1.61767578125, -1.529449462890625, -1.44122314453125, -1.352996826171875, -1.2647705078125, -1.176544189453125, -1.08831787109375, -1.000091552734375, -0.911865234375, -0.823638916015625, -0.73541259765625, -0.647186279296875, -0.5589599609375, -0.470733642578125, -0.38250732421875, -0.294281005859375, -0.2060546875, -0.117828369140625, -0.02960205078125, 0.058624267578125, 0.1468505859375, 0.235076904296875, 0.32330322265625, 0.411529541015625, 0.499755859375, 0.587982177734375, 0.67620849609375, 0.764434814453125, 0.8526611328125, 0.940887451171875, 1.02911376953125, 1.117340087890625, 1.20556640625, 1.293792724609375, 1.38201904296875, 1.470245361328125, 1.5584716796875, 1.646697998046875, 1.73492431640625, 1.823150634765625, 1.911376953125, 1.999603271484375, 2.08782958984375, 2.176055908203125, 2.2642822265625, 2.352508544921875, 2.44073486328125, 2.528961181640625, 2.6171875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 12.0, 8.0, 11.0, 20.0, 19.0, 24.0, 37.0, 37.0, 51.0, 84.0, 121.0, 149.0, 231.0, 351.0, 605.0, 1070.0, 2217.0, 5289.0, 16021.0, 66148.0, 328596.0, 474613.0, 114100.0, 24934.0, 7513.0, 2866.0, 1409.0, 724.0, 378.0, 251.0, 163.0, 117.0, 76.0, 62.0, 38.0, 43.0, 32.0, 27.0, 18.0, 13.0, 17.0, 16.0, 7.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0], "bins": [-4.55078125, -4.41357421875, -4.2763671875, -4.13916015625, -4.001953125, -3.86474609375, -3.7275390625, -3.59033203125, -3.453125, -3.31591796875, -3.1787109375, -3.04150390625, -2.904296875, -2.76708984375, -2.6298828125, -2.49267578125, -2.35546875, -2.21826171875, -2.0810546875, -1.94384765625, -1.806640625, -1.66943359375, -1.5322265625, -1.39501953125, -1.2578125, -1.12060546875, -0.9833984375, -0.84619140625, -0.708984375, -0.57177734375, -0.4345703125, -0.29736328125, -0.16015625, -0.02294921875, 0.1142578125, 0.25146484375, 0.388671875, 0.52587890625, 0.6630859375, 0.80029296875, 0.9375, 1.07470703125, 1.2119140625, 1.34912109375, 1.486328125, 1.62353515625, 1.7607421875, 1.89794921875, 2.03515625, 2.17236328125, 2.3095703125, 2.44677734375, 2.583984375, 2.72119140625, 2.8583984375, 2.99560546875, 3.1328125, 3.27001953125, 3.4072265625, 3.54443359375, 3.681640625, 3.81884765625, 3.9560546875, 4.09326171875, 4.23046875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 3.0, 9.0, 18.0, 19.0, 19.0, 21.0, 31.0, 30.0, 49.0, 56.0, 62.0, 56.0, 126.0, 389.0, 1583.0, 168.0, 80.0, 67.0, 49.0, 49.0, 40.0, 32.0, 28.0, 15.0, 11.0, 18.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.392333984375, -7.07373046875, -6.755126953125, -6.4365234375, -6.117919921875, -5.79931640625, -5.480712890625, -5.162109375, -4.843505859375, -4.52490234375, -4.206298828125, -3.8876953125, -3.569091796875, -3.25048828125, -2.931884765625, -2.61328125, -2.294677734375, -1.97607421875, -1.657470703125, -1.3388671875, -1.020263671875, -0.70166015625, -0.383056640625, -0.064453125, 0.254150390625, 0.57275390625, 0.891357421875, 1.2099609375, 1.528564453125, 1.84716796875, 2.165771484375, 2.484375, 2.802978515625, 3.12158203125, 3.440185546875, 3.7587890625, 4.077392578125, 4.39599609375, 4.714599609375, 5.033203125, 5.351806640625, 5.67041015625, 5.989013671875, 6.3076171875, 6.626220703125, 6.94482421875, 7.263427734375, 7.58203125, 7.900634765625, 8.21923828125, 8.537841796875, 8.8564453125, 9.175048828125, 9.49365234375, 9.812255859375, 10.130859375, 10.449462890625, 10.76806640625, 11.086669921875, 11.4052734375, 11.723876953125, 12.04248046875, 12.361083984375, 12.6796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 6.0, 6.0, 13.0, 12.0, 15.0, 17.0, 54.0, 68.0, 126.0, 219.0, 393.0, 1004.0, 32904.0, 3106531.0, 2945.0, 642.0, 311.0, 154.0, 100.0, 57.0, 28.0, 21.0, 18.0, 11.0, 12.0, 17.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.0625, -29.297119140625, -28.53173828125, -27.766357421875, -27.0009765625, -26.235595703125, -25.47021484375, -24.704833984375, -23.939453125, -23.174072265625, -22.40869140625, -21.643310546875, -20.8779296875, -20.112548828125, -19.34716796875, -18.581787109375, -17.81640625, -17.051025390625, -16.28564453125, -15.520263671875, -14.7548828125, -13.989501953125, -13.22412109375, -12.458740234375, -11.693359375, -10.927978515625, -10.16259765625, -9.397216796875, -8.6318359375, -7.866455078125, -7.10107421875, -6.335693359375, -5.5703125, -4.804931640625, -4.03955078125, -3.274169921875, -2.5087890625, -1.743408203125, -0.97802734375, -0.212646484375, 0.552734375, 1.318115234375, 2.08349609375, 2.848876953125, 3.6142578125, 4.379638671875, 5.14501953125, 5.910400390625, 6.67578125, 7.441162109375, 8.20654296875, 8.971923828125, 9.7373046875, 10.502685546875, 11.26806640625, 12.033447265625, 12.798828125, 13.564208984375, 14.32958984375, 15.094970703125, 15.8603515625, 16.625732421875, 17.39111328125, 18.156494140625, 18.921875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 31.0, 436.0, 487.0, 57.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.99073314666748, -6.779177188873291, -4.567621231079102, -2.356065273284912, -0.14450931549072266, 2.0670461654663086, 4.278602600097656, 6.490159034729004, 8.701714515686035, 10.913270950317383, 13.124826431274414, 15.336381912231445, 17.54793930053711, 19.75949478149414, 21.971050262451172, 24.182605743408203, 26.394161224365234, 28.605716705322266, 30.817272186279297, 33.02882766723633, 35.240386962890625, 37.451942443847656, 39.66349792480469, 41.87505340576172, 44.08660888671875, 46.29816436767578, 48.50971984863281, 50.721275329589844, 52.932830810546875, 55.144386291503906, 57.3559455871582, 59.567501068115234, 61.779052734375, 63.99060821533203, 66.20216369628906, 68.4137191772461, 70.62527465820312, 72.83683013916016, 75.04838562011719, 77.25994873046875, 79.47149658203125, 81.68305206298828, 83.89460754394531, 86.10616302490234, 88.31771850585938, 90.5292739868164, 92.74082946777344, 94.952392578125, 97.16394805908203, 99.37550354003906, 101.5870590209961, 103.79861450195312, 106.01016998291016, 108.22172546386719, 110.43328094482422, 112.64483642578125, 114.85639953613281, 117.06795501708984, 119.27951049804688, 121.4910659790039, 123.70262145996094, 125.91417694091797, 128.125732421875, 130.33729553222656, 132.54884338378906]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 4.0, 5.0, 6.0, 3.0, 10.0, 14.0, 15.0, 16.0, 12.0, 18.0, 15.0, 20.0, 26.0, 29.0, 40.0, 28.0, 30.0, 27.0, 34.0, 37.0, 45.0, 36.0, 39.0, 43.0, 23.0, 31.0, 36.0, 41.0, 28.0, 39.0, 29.0, 26.0, 25.0, 29.0, 18.0, 18.0, 17.0, 17.0, 16.0, 16.0, 13.0, 6.0, 6.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.852767944335938, -15.32209587097168, -14.791422843933105, -14.260750770568848, -13.73007869720459, -13.199405670166016, -12.668733596801758, -12.1380615234375, -11.607389450073242, -11.076717376708984, -10.54604434967041, -10.015372276306152, -9.484700202941895, -8.95402717590332, -8.423355102539062, -7.892683029174805, -7.3620100021362305, -6.8313374519348145, -6.300665378570557, -5.769992828369141, -5.239320755004883, -4.708648204803467, -4.177975654602051, -3.647303342819214, -3.116631031036377, -2.58595871925354, -2.055286407470703, -1.524613857269287, -0.9939415454864502, -0.4632692337036133, 0.06740331649780273, 0.5980756282806396, 1.1287479400634766, 1.6594202518463135, 2.1900925636291504, 2.7207651138305664, 3.2514374256134033, 3.7821097373962402, 4.312782287597656, 4.843454360961914, 5.37412691116333, 5.904799461364746, 6.435471534729004, 6.96614408493042, 7.496816635131836, 8.027488708496094, 8.558160781860352, 9.088833808898926, 9.619505882263184, 10.150177955627441, 10.680850982666016, 11.211523056030273, 11.742195129394531, 12.272867202758789, 12.803540229797363, 13.334212303161621, 13.864885330200195, 14.395557403564453, 14.926230430603027, 15.456902503967285, 15.987574577331543, 16.518247604370117, 17.048919677734375, 17.579591751098633, 18.11026382446289]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 3.0, 8.0, 13.0, 2.0, 13.0, 11.0, 10.0, 18.0, 20.0, 25.0, 31.0, 33.0, 30.0, 26.0, 45.0, 31.0, 42.0, 37.0, 33.0, 43.0, 36.0, 48.0, 35.0, 39.0, 35.0, 52.0, 33.0, 27.0, 20.0, 28.0, 26.0, 17.0, 23.0, 13.0, 17.0, 20.0, 11.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.12109375, -3.0208740234375, -2.920654296875, -2.8204345703125, -2.72021484375, -2.6199951171875, -2.519775390625, -2.4195556640625, -2.3193359375, -2.2191162109375, -2.118896484375, -2.0186767578125, -1.91845703125, -1.8182373046875, -1.718017578125, -1.6177978515625, -1.517578125, -1.4173583984375, -1.317138671875, -1.2169189453125, -1.11669921875, -1.0164794921875, -0.916259765625, -0.8160400390625, -0.7158203125, -0.6156005859375, -0.515380859375, -0.4151611328125, -0.31494140625, -0.2147216796875, -0.114501953125, -0.0142822265625, 0.0859375, 0.1861572265625, 0.286376953125, 0.3865966796875, 0.48681640625, 0.5870361328125, 0.687255859375, 0.7874755859375, 0.8876953125, 0.9879150390625, 1.088134765625, 1.1883544921875, 1.28857421875, 1.3887939453125, 1.489013671875, 1.5892333984375, 1.689453125, 1.7896728515625, 1.889892578125, 1.9901123046875, 2.09033203125, 2.1905517578125, 2.290771484375, 2.3909912109375, 2.4912109375, 2.5914306640625, 2.691650390625, 2.7918701171875, 2.89208984375, 2.9923095703125, 3.092529296875, 3.1927490234375, 3.29296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 11.0, 15.0, 17.0, 26.0, 27.0, 43.0, 51.0, 62.0, 88.0, 100.0, 164.0, 184.0, 237.0, 329.0, 480.0, 685.0, 1162.0, 2996.0, 14661.0, 156810.0, 2905548.0, 1047370.0, 51463.0, 6827.0, 1808.0, 871.0, 587.0, 381.0, 295.0, 250.0, 167.0, 135.0, 91.0, 67.0, 67.0, 49.0, 32.0, 31.0, 18.0, 22.0, 14.0, 9.0, 7.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.765625, -15.2696533203125, -14.773681640625, -14.2777099609375, -13.78173828125, -13.2857666015625, -12.789794921875, -12.2938232421875, -11.7978515625, -11.3018798828125, -10.805908203125, -10.3099365234375, -9.81396484375, -9.3179931640625, -8.822021484375, -8.3260498046875, -7.830078125, -7.3341064453125, -6.838134765625, -6.3421630859375, -5.84619140625, -5.3502197265625, -4.854248046875, -4.3582763671875, -3.8623046875, -3.3663330078125, -2.870361328125, -2.3743896484375, -1.87841796875, -1.3824462890625, -0.886474609375, -0.3905029296875, 0.10546875, 0.6014404296875, 1.097412109375, 1.5933837890625, 2.08935546875, 2.5853271484375, 3.081298828125, 3.5772705078125, 4.0732421875, 4.5692138671875, 5.065185546875, 5.5611572265625, 6.05712890625, 6.5531005859375, 7.049072265625, 7.5450439453125, 8.041015625, 8.5369873046875, 9.032958984375, 9.5289306640625, 10.02490234375, 10.5208740234375, 11.016845703125, 11.5128173828125, 12.0087890625, 12.5047607421875, 13.000732421875, 13.4967041015625, 13.99267578125, 14.4886474609375, 14.984619140625, 15.4805908203125, 15.9765625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 8.0, 8.0, 27.0, 39.0, 52.0, 72.0, 100.0, 148.0, 217.0, 280.0, 425.0, 529.0, 618.0, 463.0, 356.0, 215.0, 160.0, 113.0, 78.0, 51.0, 38.0, 19.0, 21.0, 7.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.0355224609375, -5.774169921875, -5.5128173828125, -5.25146484375, -4.9901123046875, -4.728759765625, -4.4674072265625, -4.2060546875, -3.9447021484375, -3.683349609375, -3.4219970703125, -3.16064453125, -2.8992919921875, -2.637939453125, -2.3765869140625, -2.115234375, -1.8538818359375, -1.592529296875, -1.3311767578125, -1.06982421875, -0.8084716796875, -0.547119140625, -0.2857666015625, -0.0244140625, 0.2369384765625, 0.498291015625, 0.7596435546875, 1.02099609375, 1.2823486328125, 1.543701171875, 1.8050537109375, 2.06640625, 2.3277587890625, 2.589111328125, 2.8504638671875, 3.11181640625, 3.3731689453125, 3.634521484375, 3.8958740234375, 4.1572265625, 4.4185791015625, 4.679931640625, 4.9412841796875, 5.20263671875, 5.4639892578125, 5.725341796875, 5.9866943359375, 6.248046875, 6.5093994140625, 6.770751953125, 7.0321044921875, 7.29345703125, 7.5548095703125, 7.816162109375, 8.0775146484375, 8.3388671875, 8.6002197265625, 8.861572265625, 9.1229248046875, 9.38427734375, 9.6456298828125, 9.906982421875, 10.1683349609375, 10.4296875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 12.0, 20.0, 25.0, 26.0, 45.0, 40.0, 51.0, 109.0, 157.0, 315.0, 592.0, 1681.0, 6035.0, 31417.0, 239177.0, 2276049.0, 1463771.0, 146692.0, 21119.0, 4436.0, 1252.0, 487.0, 240.0, 142.0, 115.0, 65.0, 55.0, 35.0, 33.0, 22.0, 14.0, 13.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.190673828125, -7.89697265625, -7.603271484375, -7.3095703125, -7.015869140625, -6.72216796875, -6.428466796875, -6.134765625, -5.841064453125, -5.54736328125, -5.253662109375, -4.9599609375, -4.666259765625, -4.37255859375, -4.078857421875, -3.78515625, -3.491455078125, -3.19775390625, -2.904052734375, -2.6103515625, -2.316650390625, -2.02294921875, -1.729248046875, -1.435546875, -1.141845703125, -0.84814453125, -0.554443359375, -0.2607421875, 0.032958984375, 0.32666015625, 0.620361328125, 0.9140625, 1.207763671875, 1.50146484375, 1.795166015625, 2.0888671875, 2.382568359375, 2.67626953125, 2.969970703125, 3.263671875, 3.557373046875, 3.85107421875, 4.144775390625, 4.4384765625, 4.732177734375, 5.02587890625, 5.319580078125, 5.61328125, 5.906982421875, 6.20068359375, 6.494384765625, 6.7880859375, 7.081787109375, 7.37548828125, 7.669189453125, 7.962890625, 8.256591796875, 8.55029296875, 8.843994140625, 9.1376953125, 9.431396484375, 9.72509765625, 10.018798828125, 10.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 8.0, 17.0, 19.0, 29.0, 29.0, 43.0, 49.0, 73.0, 65.0, 46.0, 88.0, 79.0, 71.0, 66.0, 61.0, 57.0, 53.0, 30.0, 29.0, 21.0, 21.0, 6.0, 5.0, 4.0, 3.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.623638153076172, -30.243188858032227, -28.86273956298828, -27.48229217529297, -26.101842880249023, -24.721393585205078, -23.340946197509766, -21.96049690246582, -20.580047607421875, -19.19959831237793, -17.819149017333984, -16.438701629638672, -15.058252334594727, -13.677803039550781, -12.297354698181152, -10.916906356811523, -9.536457061767578, -8.156007766723633, -6.775559425354004, -5.395110607147217, -4.01466178894043, -2.6342129707336426, -1.2537641525268555, 0.12668418884277344, 1.5071334838867188, 2.887582302093506, 4.268031120300293, 5.64847993850708, 7.028928756713867, 8.409378051757812, 9.789826393127441, 11.17027473449707, 12.550724029541016, 13.931173324584961, 15.31162166595459, 16.69207000732422, 18.072519302368164, 19.45296859741211, 20.833415985107422, 22.213865280151367, 23.594314575195312, 24.974763870239258, 26.355213165283203, 27.735660552978516, 29.11610984802246, 30.496559143066406, 31.87700653076172, 33.25745391845703, 34.63790512084961, 36.01835250854492, 37.3988037109375, 38.77925109863281, 40.159698486328125, 41.5401496887207, 42.920597076416016, 44.301048278808594, 45.681495666503906, 47.06194305419922, 48.4423942565918, 49.82284164428711, 51.20329284667969, 52.583740234375, 53.96418762207031, 55.344635009765625, 56.7250862121582]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 8.0, 11.0, 13.0, 14.0, 7.0, 13.0, 16.0, 18.0, 17.0, 23.0, 29.0, 28.0, 29.0, 43.0, 44.0, 46.0, 44.0, 37.0, 43.0, 42.0, 38.0, 36.0, 35.0, 42.0, 39.0, 29.0, 34.0, 26.0, 27.0, 23.0, 16.0, 17.0, 15.0, 10.0, 12.0, 11.0, 16.0, 14.0, 8.0, 5.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-30.3070011138916, -29.419960021972656, -28.53291893005371, -27.645877838134766, -26.75883674621582, -25.871795654296875, -24.984756469726562, -24.097713470458984, -23.210674285888672, -22.323633193969727, -21.43659210205078, -20.549551010131836, -19.66250991821289, -18.775468826293945, -17.888427734375, -17.001388549804688, -16.11434555053711, -15.227304458618164, -14.340263366699219, -13.453222274780273, -12.566181182861328, -11.679140090942383, -10.792099952697754, -9.905058860778809, -9.018017768859863, -8.130976676940918, -7.243935585021973, -6.3568949699401855, -5.46985387802124, -4.582812786102295, -3.695772171020508, -2.8087310791015625, -1.9216880798339844, -1.0346471071243286, -0.14760613441467285, 0.7394347190856934, 1.6264758110046387, 2.513516902923584, 3.400557518005371, 4.287598609924316, 5.174639701843262, 6.061680793762207, 6.948721885681152, 7.8357625007629395, 8.722803115844727, 9.609844207763672, 10.496885299682617, 11.383926391601562, 12.270967483520508, 13.158008575439453, 14.045049667358398, 14.932090759277344, 15.819131851196289, 16.706172943115234, 17.593212127685547, 18.480255126953125, 19.367294311523438, 20.254335403442383, 21.141376495361328, 22.028417587280273, 22.91545867919922, 23.802499771118164, 24.68954086303711, 25.576580047607422, 26.463623046875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 11.0, 10.0, 15.0, 14.0, 13.0, 11.0, 19.0, 20.0, 23.0, 34.0, 37.0, 34.0, 51.0, 43.0, 48.0, 37.0, 49.0, 45.0, 46.0, 45.0, 43.0, 45.0, 35.0, 30.0, 29.0, 25.0, 25.0, 18.0, 23.0, 14.0, 11.0, 16.0, 13.0, 11.0, 9.0, 12.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-60.21875, -58.46728515625, -56.7158203125, -54.96435546875, -53.212890625, -51.46142578125, -49.7099609375, -47.95849609375, -46.20703125, -44.45556640625, -42.7041015625, -40.95263671875, -39.201171875, -37.44970703125, -35.6982421875, -33.94677734375, -32.1953125, -30.44384765625, -28.6923828125, -26.94091796875, -25.189453125, -23.43798828125, -21.6865234375, -19.93505859375, -18.18359375, -16.43212890625, -14.6806640625, -12.92919921875, -11.177734375, -9.42626953125, -7.6748046875, -5.92333984375, -4.171875, -2.42041015625, -0.6689453125, 1.08251953125, 2.833984375, 4.58544921875, 6.3369140625, 8.08837890625, 9.83984375, 11.59130859375, 13.3427734375, 15.09423828125, 16.845703125, 18.59716796875, 20.3486328125, 22.10009765625, 23.8515625, 25.60302734375, 27.3544921875, 29.10595703125, 30.857421875, 32.60888671875, 34.3603515625, 36.11181640625, 37.86328125, 39.61474609375, 41.3662109375, 43.11767578125, 44.869140625, 46.62060546875, 48.3720703125, 50.12353515625, 51.875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 12.0, 6.0, 13.0, 15.0, 18.0, 31.0, 55.0, 105.0, 153.0, 209.0, 280.0, 474.0, 685.0, 1058.0, 1589.0, 2379.0, 3564.0, 5329.0, 7980.0, 12144.0, 18246.0, 28914.0, 47594.0, 84932.0, 185914.0, 337393.0, 132043.0, 67286.0, 39374.0, 24134.0, 15655.0, 10247.0, 6907.0, 4601.0, 3135.0, 2008.0, 1347.0, 906.0, 620.0, 420.0, 265.0, 172.0, 111.0, 69.0, 52.0, 46.0, 31.0, 17.0, 8.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.418212890625, -0.4056587219238281, -0.39310455322265625, -0.3805503845214844, -0.3679962158203125, -0.3554420471191406, -0.34288787841796875, -0.3303337097167969, -0.317779541015625, -0.3052253723144531, -0.29267120361328125, -0.2801170349121094, -0.2675628662109375, -0.2550086975097656, -0.24245452880859375, -0.22990036010742188, -0.21734619140625, -0.20479202270507812, -0.19223785400390625, -0.17968368530273438, -0.1671295166015625, -0.15457534790039062, -0.14202117919921875, -0.12946701049804688, -0.116912841796875, -0.10435867309570312, -0.09180450439453125, -0.07925033569335938, -0.0666961669921875, -0.054141998291015625, -0.04158782958984375, -0.029033660888671875, -0.0164794921875, -0.003925323486328125, 0.00862884521484375, 0.021183013916015625, 0.0337371826171875, 0.046291351318359375, 0.05884552001953125, 0.07139968872070312, 0.083953857421875, 0.09650802612304688, 0.10906219482421875, 0.12161636352539062, 0.1341705322265625, 0.14672470092773438, 0.15927886962890625, 0.17183303833007812, 0.18438720703125, 0.19694137573242188, 0.20949554443359375, 0.22204971313476562, 0.2346038818359375, 0.24715805053710938, 0.25971221923828125, 0.2722663879394531, 0.284820556640625, 0.2973747253417969, 0.30992889404296875, 0.3224830627441406, 0.3350372314453125, 0.3475914001464844, 0.36014556884765625, 0.3726997375488281, 0.38525390625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 5.0, 12.0, 14.0, 17.0, 17.0, 17.0, 20.0, 21.0, 26.0, 40.0, 25.0, 33.0, 28.0, 38.0, 39.0, 40.0, 27.0, 48.0, 1060.0, 39.0, 37.0, 44.0, 43.0, 44.0, 41.0, 25.0, 22.0, 27.0, 26.0, 20.0, 17.0, 20.0, 19.0, 8.0, 11.0, 10.0, 7.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-36.03125, -34.976318359375, -33.92138671875, -32.866455078125, -31.8115234375, -30.756591796875, -29.70166015625, -28.646728515625, -27.591796875, -26.536865234375, -25.48193359375, -24.427001953125, -23.3720703125, -22.317138671875, -21.26220703125, -20.207275390625, -19.15234375, -18.097412109375, -17.04248046875, -15.987548828125, -14.9326171875, -13.877685546875, -12.82275390625, -11.767822265625, -10.712890625, -9.657958984375, -8.60302734375, -7.548095703125, -6.4931640625, -5.438232421875, -4.38330078125, -3.328369140625, -2.2734375, -1.218505859375, -0.16357421875, 0.891357421875, 1.9462890625, 3.001220703125, 4.05615234375, 5.111083984375, 6.166015625, 7.220947265625, 8.27587890625, 9.330810546875, 10.3857421875, 11.440673828125, 12.49560546875, 13.550537109375, 14.60546875, 15.660400390625, 16.71533203125, 17.770263671875, 18.8251953125, 19.880126953125, 20.93505859375, 21.989990234375, 23.044921875, 24.099853515625, 25.15478515625, 26.209716796875, 27.2646484375, 28.319580078125, 29.37451171875, 30.429443359375, 31.484375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 14.0, 10.0, 16.0, 24.0, 33.0, 50.0, 69.0, 137.0, 167.0, 221.0, 388.0, 600.0, 897.0, 1187.0, 1995.0, 3051.0, 4543.0, 7172.0, 11436.0, 17735.0, 28453.0, 47114.0, 81255.0, 161640.0, 1353225.0, 165386.0, 83171.0, 47526.0, 29407.0, 18021.0, 11282.0, 7386.0, 4677.0, 3035.0, 1975.0, 1297.0, 838.0, 538.0, 361.0, 283.0, 183.0, 95.0, 81.0, 56.0, 54.0, 20.0, 11.0, 6.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1943359375, -0.18796730041503906, -0.18159866333007812, -0.1752300262451172, -0.16886138916015625, -0.1624927520751953, -0.15612411499023438, -0.14975547790527344, -0.1433868408203125, -0.13701820373535156, -0.13064956665039062, -0.12428092956542969, -0.11791229248046875, -0.11154365539550781, -0.10517501831054688, -0.09880638122558594, -0.092437744140625, -0.08606910705566406, -0.07970046997070312, -0.07333183288574219, -0.06696319580078125, -0.06059455871582031, -0.054225921630859375, -0.04785728454589844, -0.0414886474609375, -0.03512001037597656, -0.028751373291015625, -0.022382736206054688, -0.01601409912109375, -0.009645462036132812, -0.003276824951171875, 0.0030918121337890625, 0.00946044921875, 0.015829086303710938, 0.022197723388671875, 0.028566360473632812, 0.03493499755859375, 0.04130363464355469, 0.047672271728515625, 0.05404090881347656, 0.0604095458984375, 0.06677818298339844, 0.07314682006835938, 0.07951545715332031, 0.08588409423828125, 0.09225273132324219, 0.09862136840820312, 0.10499000549316406, 0.111358642578125, 0.11772727966308594, 0.12409591674804688, 0.1304645538330078, 0.13683319091796875, 0.1432018280029297, 0.14957046508789062, 0.15593910217285156, 0.1623077392578125, 0.16867637634277344, 0.17504501342773438, 0.1814136505126953, 0.18778228759765625, 0.1941509246826172, 0.20051956176757812, 0.20688819885253906, 0.2132568359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 5.0, 7.0, 15.0, 14.0, 12.0, 7.0, 16.0, 29.0, 21.0, 30.0, 52.0, 39.0, 24.0, 32.0, 43.0, 28.0, 41.0, 42.0, 35.0, 54.0, 43.0, 47.0, 37.0, 35.0, 33.0, 28.0, 35.0, 29.0, 23.0, 21.0, 28.0, 17.0, 9.0, 10.0, 14.0, 7.0, 7.0, 5.0, 6.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.5138800740242004e-06, -3.3918768167495728e-06, -3.269873559474945e-06, -3.1478703022003174e-06, -3.0258670449256897e-06, -2.903863787651062e-06, -2.7818605303764343e-06, -2.6598572731018066e-06, -2.537854015827179e-06, -2.4158507585525513e-06, -2.2938475012779236e-06, -2.171844244003296e-06, -2.0498409867286682e-06, -1.9278377294540405e-06, -1.8058344721794128e-06, -1.6838312149047852e-06, -1.5618279576301575e-06, -1.4398247003555298e-06, -1.317821443080902e-06, -1.1958181858062744e-06, -1.0738149285316467e-06, -9.51811671257019e-07, -8.298084139823914e-07, -7.078051567077637e-07, -5.85801899433136e-07, -4.637986421585083e-07, -3.417953848838806e-07, -2.1979212760925293e-07, -9.778887033462524e-08, 2.421438694000244e-08, 1.4621764421463013e-07, 2.682209014892578e-07, 3.902241587638855e-07, 5.122274160385132e-07, 6.342306733131409e-07, 7.562339305877686e-07, 8.782371878623962e-07, 1.000240445137024e-06, 1.1222437024116516e-06, 1.2442469596862793e-06, 1.366250216960907e-06, 1.4882534742355347e-06, 1.6102567315101624e-06, 1.73225998878479e-06, 1.8542632460594177e-06, 1.9762665033340454e-06, 2.098269760608673e-06, 2.2202730178833008e-06, 2.3422762751579285e-06, 2.464279532432556e-06, 2.586282789707184e-06, 2.7082860469818115e-06, 2.830289304256439e-06, 2.952292561531067e-06, 3.0742958188056946e-06, 3.1962990760803223e-06, 3.31830233335495e-06, 3.4403055906295776e-06, 3.5623088479042053e-06, 3.684312105178833e-06, 3.8063153624534607e-06, 3.928318619728088e-06, 4.050321877002716e-06, 4.172325134277344e-06]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 5.0, 6.0, 2.0, 15.0, 17.0, 32.0, 29.0, 56.0, 86.0, 107.0, 167.0, 241.0, 416.0, 783.0, 1357.0, 2637.0, 5792.0, 13435.0, 36698.0, 79836.0, 159044.0, 236346.0, 231018.0, 149760.0, 73429.0, 31910.0, 13394.0, 5853.0, 2768.0, 1329.0, 709.0, 493.0, 244.0, 159.0, 122.0, 76.0, 58.0, 54.0, 23.0, 16.0, 10.0, 8.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7404556274414062e-05, -1.680385321378708e-05, -1.6203150153160095e-05, -1.560244709253311e-05, -1.5001744031906128e-05, -1.4401040971279144e-05, -1.380033791065216e-05, -1.3199634850025177e-05, -1.2598931789398193e-05, -1.199822872877121e-05, -1.1397525668144226e-05, -1.0796822607517242e-05, -1.0196119546890259e-05, -9.595416486263275e-06, -8.994713425636292e-06, -8.394010365009308e-06, -7.793307304382324e-06, -7.1926042437553406e-06, -6.591901183128357e-06, -5.991198122501373e-06, -5.39049506187439e-06, -4.789792001247406e-06, -4.189088940620422e-06, -3.5883858799934387e-06, -2.987682819366455e-06, -2.3869797587394714e-06, -1.7862766981124878e-06, -1.1855736374855042e-06, -5.848705768585205e-07, 1.5832483768463135e-08, 6.165355443954468e-07, 1.2172386050224304e-06, 1.817941665649414e-06, 2.4186447262763977e-06, 3.0193477869033813e-06, 3.620050847530365e-06, 4.220753908157349e-06, 4.821456968784332e-06, 5.422160029411316e-06, 6.0228630900382996e-06, 6.623566150665283e-06, 7.224269211292267e-06, 7.82497227191925e-06, 8.425675332546234e-06, 9.026378393173218e-06, 9.627081453800201e-06, 1.0227784514427185e-05, 1.0828487575054169e-05, 1.1429190635681152e-05, 1.2029893696308136e-05, 1.263059675693512e-05, 1.3231299817562103e-05, 1.3832002878189087e-05, 1.443270593881607e-05, 1.5033408999443054e-05, 1.5634112060070038e-05, 1.623481512069702e-05, 1.6835518181324005e-05, 1.743622124195099e-05, 1.8036924302577972e-05, 1.8637627363204956e-05, 1.923833042383194e-05, 1.9839033484458923e-05, 2.0439736545085907e-05, 2.104043960571289e-05]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 16.0, 19.0, 16.0, 29.0, 26.0, 46.0, 31.0, 40.0, 58.0, 73.0, 77.0, 75.0, 70.0, 63.0, 60.0, 65.0, 47.0, 45.0, 41.0, 24.0, 17.0, 12.0, 17.0, 15.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05051878260565e-06, -3.9237920645973645e-06, -3.7970648918417282e-06, -3.6703379464597674e-06, -3.5436110010778066e-06, -3.416884283069521e-06, -3.2901573376875604e-06, -3.1634303923055995e-06, -3.0367034469236387e-06, -2.909976501541678e-06, -2.783249556159717e-06, -2.656522610777756e-06, -2.529795892769471e-06, -2.4030687200138345e-06, -2.276342002005549e-06, -2.1496150566235883e-06, -2.0228881112416275e-06, -1.8961611658596667e-06, -1.7694342204777058e-06, -1.6427073887825827e-06, -1.5159804434006219e-06, -1.389253498018661e-06, -1.262526666323538e-06, -1.1357997209415771e-06, -1.0090727755596163e-06, -8.823458301776554e-07, -7.556189416391135e-07, -6.288920531005715e-07, -5.021651077186107e-07, -3.7543816233664984e-07, -2.4871127379810787e-07, -1.219843852595659e-07, 4.742560122394934e-09, 1.3146947708264634e-07, 2.5819639404289774e-07, 3.8492331100314914e-07, 5.116502279634005e-07, 6.383771733453614e-07, 7.651040618839033e-07, 8.918309504224453e-07, 1.0185578958044061e-06, 1.145284841186367e-06, 1.2720117865683278e-06, 1.398738618263451e-06, 1.5254655636454117e-06, 1.6521925090273726e-06, 1.7789193407224957e-06, 1.9056462861044565e-06, 2.0323732314864174e-06, 2.159100176868378e-06, 2.285827122250339e-06, 2.4125540676323e-06, 2.5392810130142607e-06, 2.666007731022546e-06, 2.792734676404507e-06, 2.9194616217864677e-06, 3.0461885671684286e-06, 3.1729155125503894e-06, 3.2996424579323502e-06, 3.426369403314311e-06, 3.5530961213225964e-06, 3.6798232940782327e-06, 3.806550012086518e-06, 3.933277184842154e-06, 4.06000390285044e-06]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 4.0, 1.0, 9.0, 1.0, 8.0, 12.0, 6.0, 27.0, 13.0, 21.0, 14.0, 18.0, 57.0, 22.0, 44.0, 25.0, 28.0, 59.0, 34.0, 64.0, 24.0, 38.0, 52.0, 25.0, 56.0, 26.0, 62.0, 24.0, 26.0, 38.0, 17.0, 43.0, 13.0, 16.0, 24.0, 9.0, 9.0, 2.0, 4.0, 12.0, 2.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.5387853384017944e-06, -2.4549663066864014e-06, -2.3711472749710083e-06, -2.2873282432556152e-06, -2.203509211540222e-06, -2.119690179824829e-06, -2.035871148109436e-06, -1.952052116394043e-06, -1.86823308467865e-06, -1.7844140529632568e-06, -1.7005950212478638e-06, -1.6167759895324707e-06, -1.5329569578170776e-06, -1.4491379261016846e-06, -1.3653188943862915e-06, -1.2814998626708984e-06, -1.1976808309555054e-06, -1.1138617992401123e-06, -1.0300427675247192e-06, -9.462237358093262e-07, -8.624047040939331e-07, -7.7858567237854e-07, -6.94766640663147e-07, -6.109476089477539e-07, -5.271285772323608e-07, -4.4330954551696777e-07, -3.594905138015747e-07, -2.7567148208618164e-07, -1.9185245037078857e-07, -1.0803341865539551e-07, -2.421438694000244e-08, 5.960464477539063e-08, 1.434236764907837e-07, 2.2724270820617676e-07, 3.110617399215698e-07, 3.948807716369629e-07, 4.78699803352356e-07, 5.62518835067749e-07, 6.463378667831421e-07, 7.301568984985352e-07, 8.139759302139282e-07, 8.977949619293213e-07, 9.816139936447144e-07, 1.0654330253601074e-06, 1.1492520570755005e-06, 1.2330710887908936e-06, 1.3168901205062866e-06, 1.4007091522216797e-06, 1.4845281839370728e-06, 1.5683472156524658e-06, 1.6521662473678589e-06, 1.735985279083252e-06, 1.819804310798645e-06, 1.903623342514038e-06, 1.987442374229431e-06, 2.0712614059448242e-06, 2.1550804376602173e-06, 2.2388994693756104e-06, 2.3227185010910034e-06, 2.4065375328063965e-06, 2.4903565645217896e-06, 2.5741755962371826e-06, 2.6579946279525757e-06, 2.7418136596679688e-06]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 11.0, 10.0, 15.0, 14.0, 13.0, 11.0, 19.0, 20.0, 23.0, 34.0, 37.0, 34.0, 51.0, 43.0, 48.0, 37.0, 49.0, 45.0, 46.0, 45.0, 43.0, 45.0, 35.0, 30.0, 29.0, 25.0, 25.0, 18.0, 23.0, 14.0, 11.0, 16.0, 13.0, 11.0, 9.0, 12.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-60.21875, -58.46728515625, -56.7158203125, -54.96435546875, -53.212890625, -51.46142578125, -49.7099609375, -47.95849609375, -46.20703125, -44.45556640625, -42.7041015625, -40.95263671875, -39.201171875, -37.44970703125, -35.6982421875, -33.94677734375, -32.1953125, -30.44384765625, -28.6923828125, -26.94091796875, -25.189453125, -23.43798828125, -21.6865234375, -19.93505859375, -18.18359375, -16.43212890625, -14.6806640625, -12.92919921875, -11.177734375, -9.42626953125, -7.6748046875, -5.92333984375, -4.171875, -2.42041015625, -0.6689453125, 1.08251953125, 2.833984375, 4.58544921875, 6.3369140625, 8.08837890625, 9.83984375, 11.59130859375, 13.3427734375, 15.09423828125, 16.845703125, 18.59716796875, 20.3486328125, 22.10009765625, 23.8515625, 25.60302734375, 27.3544921875, 29.10595703125, 30.857421875, 32.60888671875, 34.3603515625, 36.11181640625, 37.86328125, 39.61474609375, 41.3662109375, 43.11767578125, 44.869140625, 46.62060546875, 48.3720703125, 50.12353515625, 51.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 4.0, 10.0, 11.0, 16.0, 15.0, 20.0, 27.0, 34.0, 35.0, 61.0, 89.0, 158.0, 194.0, 372.0, 653.0, 1731.0, 5349.0, 22181.0, 109695.0, 433628.0, 367119.0, 82693.0, 17141.0, 4397.0, 1388.0, 588.0, 303.0, 170.0, 121.0, 71.0, 64.0, 54.0, 20.0, 30.0, 26.0, 18.0, 19.0, 14.0, 9.0, 7.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.4140625, -9.136474609375, -8.85888671875, -8.581298828125, -8.3037109375, -8.026123046875, -7.74853515625, -7.470947265625, -7.193359375, -6.915771484375, -6.63818359375, -6.360595703125, -6.0830078125, -5.805419921875, -5.52783203125, -5.250244140625, -4.97265625, -4.695068359375, -4.41748046875, -4.139892578125, -3.8623046875, -3.584716796875, -3.30712890625, -3.029541015625, -2.751953125, -2.474365234375, -2.19677734375, -1.919189453125, -1.6416015625, -1.364013671875, -1.08642578125, -0.808837890625, -0.53125, -0.253662109375, 0.02392578125, 0.301513671875, 0.5791015625, 0.856689453125, 1.13427734375, 1.411865234375, 1.689453125, 1.967041015625, 2.24462890625, 2.522216796875, 2.7998046875, 3.077392578125, 3.35498046875, 3.632568359375, 3.91015625, 4.187744140625, 4.46533203125, 4.742919921875, 5.0205078125, 5.298095703125, 5.57568359375, 5.853271484375, 6.130859375, 6.408447265625, 6.68603515625, 6.963623046875, 7.2412109375, 7.518798828125, 7.79638671875, 8.073974609375, 8.3515625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 13.0, 15.0, 28.0, 36.0, 46.0, 63.0, 62.0, 64.0, 91.0, 2142.0, 86.0, 86.0, 74.0, 52.0, 57.0, 33.0, 19.0, 32.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.875, -149.5517578125, -145.228515625, -140.9052734375, -136.58203125, -132.2587890625, -127.935546875, -123.6123046875, -119.2890625, -114.9658203125, -110.642578125, -106.3193359375, -101.99609375, -97.6728515625, -93.349609375, -89.0263671875, -84.703125, -80.3798828125, -76.056640625, -71.7333984375, -67.41015625, -63.0869140625, -58.763671875, -54.4404296875, -50.1171875, -45.7939453125, -41.470703125, -37.1474609375, -32.82421875, -28.5009765625, -24.177734375, -19.8544921875, -15.53125, -11.2080078125, -6.884765625, -2.5615234375, 1.76171875, 6.0849609375, 10.408203125, 14.7314453125, 19.0546875, 23.3779296875, 27.701171875, 32.0244140625, 36.34765625, 40.6708984375, 44.994140625, 49.3173828125, 53.640625, 57.9638671875, 62.287109375, 66.6103515625, 70.93359375, 75.2568359375, 79.580078125, 83.9033203125, 88.2265625, 92.5498046875, 96.873046875, 101.1962890625, 105.51953125, 109.8427734375, 114.166015625, 118.4892578125, 122.8125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 16.0, 21.0, 22.0, 34.0, 45.0, 75.0, 112.0, 140.0, 231.0, 328.0, 606.0, 1361.0, 4914.0, 68310.0, 2915417.0, 143219.0, 7353.0, 1562.0, 739.0, 426.0, 248.0, 158.0, 106.0, 78.0, 40.0, 41.0, 23.0, 20.0, 17.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6640625, -14.1849365234375, -13.705810546875, -13.2266845703125, -12.74755859375, -12.2684326171875, -11.789306640625, -11.3101806640625, -10.8310546875, -10.3519287109375, -9.872802734375, -9.3936767578125, -8.91455078125, -8.4354248046875, -7.956298828125, -7.4771728515625, -6.998046875, -6.5189208984375, -6.039794921875, -5.5606689453125, -5.08154296875, -4.6024169921875, -4.123291015625, -3.6441650390625, -3.1650390625, -2.6859130859375, -2.206787109375, -1.7276611328125, -1.24853515625, -0.7694091796875, -0.290283203125, 0.1888427734375, 0.66796875, 1.1470947265625, 1.626220703125, 2.1053466796875, 2.58447265625, 3.0635986328125, 3.542724609375, 4.0218505859375, 4.5009765625, 4.9801025390625, 5.459228515625, 5.9383544921875, 6.41748046875, 6.8966064453125, 7.375732421875, 7.8548583984375, 8.333984375, 8.8131103515625, 9.292236328125, 9.7713623046875, 10.25048828125, 10.7296142578125, 11.208740234375, 11.6878662109375, 12.1669921875, 12.6461181640625, 13.125244140625, 13.6043701171875, 14.08349609375, 14.5626220703125, 15.041748046875, 15.5208740234375, 16.0]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 28.0, 96.0, 313.0, 319.0, 148.0, 44.0, 20.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.9063720703125, -93.5420150756836, -84.17765808105469, -74.81330108642578, -65.44894409179688, -56.08458709716797, -46.72023010253906, -37.355873107910156, -27.99151611328125, -18.627159118652344, -9.262802124023438, 0.10155487060546875, 9.465911865234375, 18.83026885986328, 28.194625854492188, 37.558982849121094, 46.92333984375, 56.287696838378906, 65.65205383300781, 75.01641082763672, 84.38076782226562, 93.74512481689453, 103.10948181152344, 112.47383880615234, 121.83819580078125, 131.20254516601562, 140.56690979003906, 149.9312744140625, 159.29562377929688, 168.65997314453125, 178.0243377685547, 187.38870239257812, 196.7530517578125, 206.11740112304688, 215.4817657470703, 224.84613037109375, 234.21047973632812, 243.5748291015625, 252.93919372558594, 262.3035583496094, 271.66790771484375, 281.0322570800781, 290.3966064453125, 299.760986328125, 309.1253356933594, 318.48968505859375, 327.85406494140625, 337.2184143066406, 346.582763671875, 355.9471130371094, 365.31146240234375, 374.67584228515625, 384.0401916503906, 393.404541015625, 402.7689208984375, 412.1332702636719, 421.49761962890625, 430.8619689941406, 440.226318359375, 449.5906982421875, 458.9550476074219, 468.31939697265625, 477.68377685546875, 487.0481262207031, 496.4124755859375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 10.0, 7.0, 11.0, 10.0, 18.0, 11.0, 20.0, 28.0, 15.0, 36.0, 40.0, 38.0, 41.0, 41.0, 46.0, 45.0, 53.0, 43.0, 57.0, 50.0, 44.0, 41.0, 42.0, 28.0, 39.0, 20.0, 28.0, 26.0, 19.0, 20.0, 15.0, 8.0, 13.0, 11.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.92298889160156, -126.03353118896484, -122.14407348632812, -118.25460815429688, -114.36515045166016, -110.47569274902344, -106.58622741699219, -102.69676971435547, -98.80731201171875, -94.91785430908203, -91.02839660644531, -87.13893127441406, -83.24947357177734, -79.36001586914062, -75.47055053710938, -71.58109283447266, -67.69163513183594, -63.80217742919922, -59.912715911865234, -56.02325439453125, -52.13379669189453, -48.24433898925781, -44.35487747192383, -40.465415954589844, -36.575958251953125, -32.686500549316406, -28.797039031982422, -24.90757942199707, -21.01811981201172, -17.128660202026367, -13.239200592041016, -9.349740982055664, -5.4602813720703125, -1.570821762084961, 2.3186378479003906, 6.208097457885742, 10.097557067871094, 13.987016677856445, 17.876476287841797, 21.76593589782715, 25.6553955078125, 29.54485511779785, 33.4343147277832, 37.32377624511719, 41.213233947753906, 45.102691650390625, 48.99215316772461, 52.881614685058594, 56.77107238769531, 60.66053009033203, 64.54998779296875, 68.439453125, 72.32891082763672, 76.21836853027344, 80.10783386230469, 83.9972915649414, 87.88674926757812, 91.77620697021484, 95.66566467285156, 99.55513000488281, 103.44458770751953, 107.33404541015625, 111.2235107421875, 115.11296844482422, 119.00242614746094]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 11.0, 13.0, 22.0, 26.0, 28.0, 47.0, 50.0, 54.0, 95.0, 110.0, 155.0, 167.0, 229.0, 311.0, 412.0, 473.0, 521.0, 763.0, 1471.0, 1040028.0, 771.0, 579.0, 447.0, 347.0, 322.0, 245.0, 196.0, 154.0, 116.0, 76.0, 72.0, 47.0, 55.0, 31.0, 22.0, 18.0, 9.0, 9.0, 7.0, 11.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-30.341537475585938, -29.36426544189453, -28.386991500854492, -27.409719467163086, -26.432445526123047, -25.45517349243164, -24.477901458740234, -23.500627517700195, -22.523353576660156, -21.54608154296875, -20.56880760192871, -19.591535568237305, -18.614261627197266, -17.63698959350586, -16.659717559814453, -15.682443618774414, -14.705171585083008, -13.727898597717285, -12.750625610351562, -11.773353576660156, -10.796079635620117, -9.818807601928711, -8.841534614562988, -7.864261627197266, -6.886988639831543, -5.90971565246582, -4.932442665100098, -3.955170154571533, -2.9778971672058105, -2.000624179840088, -1.0233516693115234, -0.04607868194580078, 0.9311943054199219, 1.908467173576355, 2.885740041732788, 3.8630127906799316, 4.840285778045654, 5.817558765411377, 6.794831275939941, 7.772104263305664, 8.749377250671387, 9.72665023803711, 10.703923225402832, 11.681196212768555, 12.658468246459961, 13.6357421875, 14.613014221191406, 15.590287208557129, 16.56756019592285, 17.544832229614258, 18.522106170654297, 19.499378204345703, 20.476652145385742, 21.45392417907715, 22.431198120117188, 23.408470153808594, 24.3857421875, 25.363014221191406, 26.340288162231445, 27.31756019592285, 28.29483413696289, 29.272106170654297, 30.249378204345703, 31.226652145385742, 32.20392608642578]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 12.0, 26.0, 25.0, 37.0, 82.0, 234.0, 120112.0, 51342560.0, 259.0, 57.0, 25.0, 19.0, 11.0, 7.0, 5.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1996.619873046875, -1946.710693359375, -1896.8016357421875, -1846.8924560546875, -1796.9833984375, -1747.07421875, -1697.1650390625, -1647.2559814453125, -1597.3468017578125, -1547.4376220703125, -1497.528564453125, -1447.619384765625, -1397.7103271484375, -1347.8011474609375, -1297.89208984375, -1247.98291015625, -1198.07373046875, -1148.16455078125, -1098.2554931640625, -1048.3463134765625, -998.4371948242188, -948.528076171875, -898.6189575195312, -848.7098388671875, -798.80078125, -748.8916625976562, -698.9825439453125, -649.0733642578125, -599.1642456054688, -549.255126953125, -499.34600830078125, -449.4368591308594, -399.5277099609375, -349.61859130859375, -299.7094421386719, -249.80032348632812, -199.8911895751953, -149.9820556640625, -100.07293701171875, -50.163787841796875, -0.254669189453125, 49.65446090698242, 99.56359100341797, 149.47271728515625, 199.38185119628906, 249.29098510742188, 299.2001037597656, 349.1092529296875, 399.01837158203125, 448.927490234375, 498.8366394042969, 548.7457275390625, 598.6549072265625, 648.5640258789062, 698.47314453125, 748.38232421875, 798.2913818359375, 848.2005004882812, 898.109619140625, 948.018798828125, 997.9279174804688, 1047.8370361328125, 1097.74609375, 1147.6552734375, 1197.564453125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 13.0, 14.0, 27.0, 41.0, 50.0, 61.0, 90.0, 139.0, 189.0, 324.0, 483.0, 746.0, 1079.0, 1743.0, 2764.0, 4256.0, 6813.0, 11148.0, 18251.0, 29892.0, 49717.0, 83167.0, 142782.0, 266478.0, 591608.0, 4075678.0, 472707.0, 222321.0, 123369.0, 72456.0, 43701.0, 26404.0, 16049.0, 10146.0, 6020.0, 3774.0, 2436.0, 1587.0, 958.0, 678.0, 438.0, 271.0, 183.0, 128.0, 80.0, 62.0, 35.0, 23.0, 17.0, 13.0, 8.0, 11.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.101318359375, -0.09818840026855469, -0.09505844116210938, -0.09192848205566406, -0.08879852294921875, -0.08566856384277344, -0.08253860473632812, -0.07940864562988281, -0.0762786865234375, -0.07314872741699219, -0.07001876831054688, -0.06688880920410156, -0.06375885009765625, -0.06062889099121094, -0.057498931884765625, -0.05436897277832031, -0.051239013671875, -0.04810905456542969, -0.044979095458984375, -0.04184913635253906, -0.03871917724609375, -0.03558921813964844, -0.032459259033203125, -0.029329299926757812, -0.0261993408203125, -0.023069381713867188, -0.019939422607421875, -0.016809463500976562, -0.01367950439453125, -0.010549545288085938, -0.007419586181640625, -0.0042896270751953125, -0.00115966796875, 0.0019702911376953125, 0.005100250244140625, 0.008230209350585938, 0.01136016845703125, 0.014490127563476562, 0.017620086669921875, 0.020750045776367188, 0.0238800048828125, 0.027009963989257812, 0.030139923095703125, 0.03326988220214844, 0.03639984130859375, 0.03952980041503906, 0.042659759521484375, 0.04578971862792969, 0.048919677734375, 0.05204963684082031, 0.055179595947265625, 0.05830955505371094, 0.06143951416015625, 0.06456947326660156, 0.06769943237304688, 0.07082939147949219, 0.0739593505859375, 0.07708930969238281, 0.08021926879882812, 0.08334922790527344, 0.08647918701171875, 0.08960914611816406, 0.09273910522460938, 0.09586906433105469, 0.0989990234375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 4.0, 8.0, 11.0, 13.0, 8.0, 11.0, 19.0, 25.0, 22.0, 37.0, 26.0, 23.0, 34.0, 41.0, 33.0, 30.0, 40.0, 39.0, 1069.0, 33.0, 54.0, 55.0, 44.0, 39.0, 31.0, 38.0, 28.0, 36.0, 26.0, 26.0, 22.0, 14.0, 18.0, 12.0, 21.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.296875, -13.817626953125, -13.33837890625, -12.859130859375, -12.3798828125, -11.900634765625, -11.42138671875, -10.942138671875, -10.462890625, -9.983642578125, -9.50439453125, -9.025146484375, -8.5458984375, -8.066650390625, -7.58740234375, -7.108154296875, -6.62890625, -6.149658203125, -5.67041015625, -5.191162109375, -4.7119140625, -4.232666015625, -3.75341796875, -3.274169921875, -2.794921875, -2.315673828125, -1.83642578125, -1.357177734375, -0.8779296875, -0.398681640625, 0.08056640625, 0.559814453125, 1.0390625, 1.518310546875, 1.99755859375, 2.476806640625, 2.9560546875, 3.435302734375, 3.91455078125, 4.393798828125, 4.873046875, 5.352294921875, 5.83154296875, 6.310791015625, 6.7900390625, 7.269287109375, 7.74853515625, 8.227783203125, 8.70703125, 9.186279296875, 9.66552734375, 10.144775390625, 10.6240234375, 11.103271484375, 11.58251953125, 12.061767578125, 12.541015625, 13.020263671875, 13.49951171875, 13.978759765625, 14.4580078125, 14.937255859375, 15.41650390625, 15.895751953125, 16.375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 5.0, 5.0, 4.0, 7.0, 19.0, 28.0, 45.0, 42.0, 69.0, 116.0, 184.0, 210.0, 330.0, 478.0, 695.0, 915.0, 1404.0, 2115.0, 2982.0, 4445.0, 6577.0, 10065.0, 15507.0, 23893.0, 38134.0, 60700.0, 100150.0, 169191.0, 310873.0, 624007.0, 3924688.0, 434143.0, 222109.0, 127098.0, 77113.0, 47436.0, 29689.0, 19003.0, 12203.0, 8152.0, 5412.0, 3561.0, 2329.0, 1622.0, 1130.0, 774.0, 473.0, 369.0, 304.0, 193.0, 137.0, 104.0, 70.0, 43.0, 31.0, 22.0, 19.0, 12.0, 5.0, 7.0, 2.0, 4.0, 2.0], "bins": [-0.07647705078125, -0.07402896881103516, -0.07158088684082031, -0.06913280487060547, -0.06668472290039062, -0.06423664093017578, -0.06178855895996094, -0.059340476989746094, -0.05689239501953125, -0.054444313049316406, -0.05199623107910156, -0.04954814910888672, -0.047100067138671875, -0.04465198516845703, -0.04220390319824219, -0.039755821228027344, -0.0373077392578125, -0.034859657287597656, -0.03241157531738281, -0.02996349334716797, -0.027515411376953125, -0.02506732940673828, -0.022619247436523438, -0.020171165466308594, -0.01772308349609375, -0.015275001525878906, -0.012826919555664062, -0.010378837585449219, -0.007930755615234375, -0.005482673645019531, -0.0030345916748046875, -0.0005865097045898438, 0.001861572265625, 0.004309654235839844, 0.0067577362060546875, 0.009205818176269531, 0.011653900146484375, 0.014101982116699219, 0.016550064086914062, 0.018998146057128906, 0.02144622802734375, 0.023894309997558594, 0.026342391967773438, 0.02879047393798828, 0.031238555908203125, 0.03368663787841797, 0.03613471984863281, 0.038582801818847656, 0.0410308837890625, 0.043478965759277344, 0.04592704772949219, 0.04837512969970703, 0.050823211669921875, 0.05327129364013672, 0.05571937561035156, 0.058167457580566406, 0.06061553955078125, 0.0630636215209961, 0.06551170349121094, 0.06795978546142578, 0.07040786743164062, 0.07285594940185547, 0.07530403137207031, 0.07775211334228516, 0.0802001953125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 0.0, 6.0, 0.0, 14.0, 8.0, 13.0, 18.0, 15.0, 25.0, 25.0, 24.0, 30.0, 28.0, 32.0, 37.0, 48.0, 38.0, 50.0, 41.0, 1070.0, 45.0, 49.0, 38.0, 47.0, 44.0, 36.0, 29.0, 31.0, 30.0, 24.0, 19.0, 19.0, 19.0, 19.0, 11.0, 8.0, 7.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.609375, -12.2337646484375, -11.858154296875, -11.4825439453125, -11.10693359375, -10.7313232421875, -10.355712890625, -9.9801025390625, -9.6044921875, -9.2288818359375, -8.853271484375, -8.4776611328125, -8.10205078125, -7.7264404296875, -7.350830078125, -6.9752197265625, -6.599609375, -6.2239990234375, -5.848388671875, -5.4727783203125, -5.09716796875, -4.7215576171875, -4.345947265625, -3.9703369140625, -3.5947265625, -3.2191162109375, -2.843505859375, -2.4678955078125, -2.09228515625, -1.7166748046875, -1.341064453125, -0.9654541015625, -0.58984375, -0.2142333984375, 0.161376953125, 0.5369873046875, 0.91259765625, 1.2882080078125, 1.663818359375, 2.0394287109375, 2.4150390625, 2.7906494140625, 3.166259765625, 3.5418701171875, 3.91748046875, 4.2930908203125, 4.668701171875, 5.0443115234375, 5.419921875, 5.7955322265625, 6.171142578125, 6.5467529296875, 6.92236328125, 7.2979736328125, 7.673583984375, 8.0491943359375, 8.4248046875, 8.8004150390625, 9.176025390625, 9.5516357421875, 9.92724609375, 10.3028564453125, 10.678466796875, 11.0540771484375, 11.4296875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 5.0, 9.0, 5.0, 7.0, 6.0, 9.0, 6.0, 12.0, 24.0, 34.0, 48.0, 46.0, 47.0, 59.0, 86.0, 108.0, 125.0, 141.0, 216.0, 272.0, 326.0, 504.0, 723.0, 1282.0, 3934.0, 19601.0, 158735.0, 6034468.0, 55662.0, 9478.0, 2250.0, 933.0, 556.0, 376.0, 263.0, 198.0, 168.0, 141.0, 93.0, 97.0, 56.0, 73.0, 52.0, 47.0, 40.0, 21.0, 32.0, 21.0, 5.0, 15.0, 15.0, 2.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.44140625, -0.4272918701171875, -0.413177490234375, -0.3990631103515625, -0.38494873046875, -0.3708343505859375, -0.356719970703125, -0.3426055908203125, -0.3284912109375, -0.3143768310546875, -0.300262451171875, -0.2861480712890625, -0.27203369140625, -0.2579193115234375, -0.243804931640625, -0.2296905517578125, -0.215576171875, -0.2014617919921875, -0.187347412109375, -0.1732330322265625, -0.15911865234375, -0.1450042724609375, -0.130889892578125, -0.1167755126953125, -0.1026611328125, -0.0885467529296875, -0.074432373046875, -0.0603179931640625, -0.04620361328125, -0.0320892333984375, -0.017974853515625, -0.0038604736328125, 0.01025390625, 0.0243682861328125, 0.038482666015625, 0.0525970458984375, 0.06671142578125, 0.0808258056640625, 0.094940185546875, 0.1090545654296875, 0.1231689453125, 0.1372833251953125, 0.151397705078125, 0.1655120849609375, 0.17962646484375, 0.1937408447265625, 0.207855224609375, 0.2219696044921875, 0.236083984375, 0.2501983642578125, 0.264312744140625, 0.2784271240234375, 0.29254150390625, 0.3066558837890625, 0.320770263671875, 0.3348846435546875, 0.3489990234375, 0.3631134033203125, 0.377227783203125, 0.3913421630859375, 0.40545654296875, 0.4195709228515625, 0.433685302734375, 0.4477996826171875, 0.4619140625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 10.0, 11.0, 16.0, 11.0, 14.0, 11.0, 26.0, 23.0, 19.0, 24.0, 24.0, 40.0, 36.0, 36.0, 36.0, 34.0, 37.0, 37.0, 39.0, 1050.0, 49.0, 35.0, 42.0, 40.0, 34.0, 32.0, 32.0, 27.0, 25.0, 24.0, 19.0, 14.0, 19.0, 19.0, 10.0, 15.0, 14.0, 6.0, 8.0, 9.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.7578125, -7.510986328125, -7.26416015625, -7.017333984375, -6.7705078125, -6.523681640625, -6.27685546875, -6.030029296875, -5.783203125, -5.536376953125, -5.28955078125, -5.042724609375, -4.7958984375, -4.549072265625, -4.30224609375, -4.055419921875, -3.80859375, -3.561767578125, -3.31494140625, -3.068115234375, -2.8212890625, -2.574462890625, -2.32763671875, -2.080810546875, -1.833984375, -1.587158203125, -1.34033203125, -1.093505859375, -0.8466796875, -0.599853515625, -0.35302734375, -0.106201171875, 0.140625, 0.387451171875, 0.63427734375, 0.881103515625, 1.1279296875, 1.374755859375, 1.62158203125, 1.868408203125, 2.115234375, 2.362060546875, 2.60888671875, 2.855712890625, 3.1025390625, 3.349365234375, 3.59619140625, 3.843017578125, 4.08984375, 4.336669921875, 4.58349609375, 4.830322265625, 5.0771484375, 5.323974609375, 5.57080078125, 5.817626953125, 6.064453125, 6.311279296875, 6.55810546875, 6.804931640625, 7.0517578125, 7.298583984375, 7.54541015625, 7.792236328125, 8.0390625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 650.0, 356.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.42967224121094, -31.19765853881836, -28.96564292907715, -26.73362922668457, -24.50161361694336, -22.26959991455078, -20.037586212158203, -17.805572509765625, -15.573556900024414, -13.34154224395752, -11.109527587890625, -8.877513885498047, -6.645499229431152, -4.413484573364258, -2.1814708709716797, 0.050543785095214844, 2.2825584411621094, 4.514573097229004, 6.74658727645874, 8.978601455688477, 11.210616111755371, 13.442630767822266, 15.674644470214844, 17.906658172607422, 20.138673782348633, 22.37068748474121, 24.602703094482422, 26.834716796875, 29.066730499267578, 31.29874610900879, 33.53076171875, 35.76277542114258, 37.994789123535156, 40.226802825927734, 42.45881652832031, 44.690834045410156, 46.922847747802734, 49.15486145019531, 51.38687515258789, 53.61888885498047, 55.85090637207031, 58.08292007446289, 60.31493377685547, 62.54695129394531, 64.77896118164062, 67.01097869873047, 69.24299621582031, 71.47500610351562, 73.70701599121094, 75.93903350830078, 78.1710433959961, 80.40306091308594, 82.63507080078125, 84.8670883178711, 87.09910583496094, 89.33111572265625, 91.5631332397461, 93.79515075683594, 96.02716064453125, 98.2591781616211, 100.4911880493164, 102.72320556640625, 104.95521545410156, 107.1872329711914, 109.41925048828125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 12.0, 6.0, 7.0, 10.0, 15.0, 16.0, 11.0, 14.0, 18.0, 21.0, 29.0, 18.0, 17.0, 25.0, 35.0, 31.0, 31.0, 43.0, 33.0, 47.0, 37.0, 33.0, 44.0, 53.0, 49.0, 34.0, 19.0, 24.0, 29.0, 28.0, 24.0, 20.0, 22.0, 17.0, 14.0, 17.0, 21.0, 13.0, 9.0, 8.0, 7.0, 8.0, 9.0, 10.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-16.5479736328125, -16.06859588623047, -15.589218139648438, -15.109840393066406, -14.630461692810059, -14.151083946228027, -13.671706199645996, -13.192328453063965, -12.712950706481934, -12.233572959899902, -11.754195213317871, -11.274816513061523, -10.795438766479492, -10.316061019897461, -9.83668327331543, -9.357305526733398, -8.877927780151367, -8.398550033569336, -7.9191718101501465, -7.439794063568115, -6.960416316986084, -6.4810380935668945, -6.001660346984863, -5.522282600402832, -5.042903900146484, -4.563526153564453, -4.084147930145264, -3.6047701835632324, -3.125392436981201, -2.646014451980591, -2.1666364669799805, -1.6872587203979492, -1.207880973815918, -0.7285031080245972, -0.2491251826286316, 0.23025274276733398, 0.7096306085586548, 1.1890084743499756, 1.668386459350586, 2.147764205932617, 2.6271421909332275, 3.106520175933838, 3.585897922515869, 4.065276145935059, 4.54465389251709, 5.024031639099121, 5.503409385681152, 5.982787132263184, 6.462165355682373, 6.941543102264404, 7.420921325683594, 7.900299072265625, 8.379676818847656, 8.859054565429688, 9.338432312011719, 9.81781005859375, 10.297188758850098, 10.776566505432129, 11.25594425201416, 11.735322952270508, 12.214700698852539, 12.69407844543457, 13.173456192016602, 13.652833938598633, 14.132211685180664]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 7.0, 4.0, 9.0, 9.0, 3.0, 11.0, 11.0, 12.0, 21.0, 33.0, 28.0, 33.0, 64.0, 82.0, 65.0, 102.0, 151.0, 195.0, 294.0, 419.0, 770.0, 3967.0, 17672.0, 3853001.0, 300593.0, 10316.0, 3324.0, 841.0, 522.0, 375.0, 296.0, 232.0, 164.0, 114.0, 122.0, 76.0, 81.0, 56.0, 39.0, 31.0, 20.0, 18.0, 25.0, 9.0, 13.0, 16.0, 4.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.036346435546875, -0.03517293930053711, -0.03399944305419922, -0.03282594680786133, -0.03165245056152344, -0.030478954315185547, -0.029305458068847656, -0.028131961822509766, -0.026958465576171875, -0.025784969329833984, -0.024611473083496094, -0.023437976837158203, -0.022264480590820312, -0.021090984344482422, -0.01991748809814453, -0.01874399185180664, -0.01757049560546875, -0.01639699935913086, -0.015223503112792969, -0.014050006866455078, -0.012876510620117188, -0.011703014373779297, -0.010529518127441406, -0.009356021881103516, -0.008182525634765625, -0.007009029388427734, -0.005835533142089844, -0.004662036895751953, -0.0034885406494140625, -0.002315044403076172, -0.0011415481567382812, 3.1948089599609375e-05, 0.0012054443359375, 0.0023789405822753906, 0.0035524368286132812, 0.004725933074951172, 0.0058994293212890625, 0.007072925567626953, 0.008246421813964844, 0.009419918060302734, 0.010593414306640625, 0.011766910552978516, 0.012940406799316406, 0.014113903045654297, 0.015287399291992188, 0.016460895538330078, 0.01763439178466797, 0.01880788803100586, 0.01998138427734375, 0.02115488052368164, 0.02232837677001953, 0.023501873016357422, 0.024675369262695312, 0.025848865509033203, 0.027022361755371094, 0.028195858001708984, 0.029369354248046875, 0.030542850494384766, 0.031716346740722656, 0.03288984298706055, 0.03406333923339844, 0.03523683547973633, 0.03641033172607422, 0.03758382797241211, 0.03875732421875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 0.0, 5.0, 7.0, 5.0, 6.0, 14.0, 7.0, 14.0, 22.0, 781.0, 36.0, 11.0, 12.0, 14.0, 10.0, 5.0, 5.0, 6.0, 5.0, 1.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0189361572265625, -0.0183258056640625, -0.0177154541015625, -0.0171051025390625, -0.0164947509765625, -0.0158843994140625, -0.0152740478515625, -0.0146636962890625, -0.0140533447265625, -0.0134429931640625, -0.0128326416015625, -0.0122222900390625, -0.0116119384765625, -0.0110015869140625, -0.0103912353515625, -0.0097808837890625, -0.0091705322265625, -0.0085601806640625, -0.0079498291015625, -0.0073394775390625, -0.0067291259765625, -0.0061187744140625, -0.0055084228515625, -0.0048980712890625, -0.0042877197265625, -0.0036773681640625, -0.0030670166015625, -0.0024566650390625, -0.0018463134765625, -0.0012359619140625, -0.0006256103515625, -1.52587890625e-05, 0.0005950927734375, 0.0012054443359375, 0.0018157958984375, 0.0024261474609375, 0.0030364990234375, 0.0036468505859375, 0.0042572021484375, 0.0048675537109375, 0.0054779052734375, 0.0060882568359375, 0.0066986083984375, 0.0073089599609375, 0.0079193115234375, 0.0085296630859375, 0.0091400146484375, 0.0097503662109375, 0.0103607177734375, 0.0109710693359375, 0.0115814208984375, 0.0121917724609375, 0.0128021240234375, 0.0134124755859375, 0.0140228271484375, 0.0146331787109375, 0.0152435302734375, 0.0158538818359375, 0.0164642333984375, 0.0170745849609375, 0.0176849365234375, 0.0182952880859375, 0.0189056396484375, 0.0195159912109375, 0.0201263427734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 8.0, 15.0, 10.0, 14.0, 17.0, 24.0, 37.0, 49.0, 96.0, 243.0, 992.0, 6034.0, 569871.0, 3608951.0, 5860.0, 1334.0, 324.0, 141.0, 72.0, 52.0, 29.0, 14.0, 12.0, 11.0, 11.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.10882568359375, -0.10552978515625, -0.10223388671875, -0.09893798828125, -0.09564208984375, -0.09234619140625, -0.08905029296875, -0.08575439453125, -0.08245849609375, -0.07916259765625, -0.07586669921875, -0.07257080078125, -0.06927490234375, -0.06597900390625, -0.06268310546875, -0.05938720703125, -0.05609130859375, -0.05279541015625, -0.04949951171875, -0.04620361328125, -0.04290771484375, -0.03961181640625, -0.03631591796875, -0.03302001953125, -0.02972412109375, -0.02642822265625, -0.02313232421875, -0.01983642578125, -0.01654052734375, -0.01324462890625, -0.00994873046875, -0.00665283203125, -0.00335693359375, -6.103515625e-05, 0.00323486328125, 0.00653076171875, 0.00982666015625, 0.01312255859375, 0.01641845703125, 0.01971435546875, 0.02301025390625, 0.02630615234375, 0.02960205078125, 0.03289794921875, 0.03619384765625, 0.03948974609375, 0.04278564453125, 0.04608154296875, 0.04937744140625, 0.05267333984375, 0.05596923828125, 0.05926513671875, 0.06256103515625, 0.06585693359375, 0.06915283203125, 0.07244873046875, 0.07574462890625, 0.07904052734375, 0.08233642578125, 0.08563232421875, 0.08892822265625, 0.09222412109375, 0.09552001953125, 0.09881591796875, 0.10211181640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 5.0, 4.0, 7.0, 8.0, 5.0, 13.0, 7.0, 49.0, 208.0, 1669.0, 1761.0, 190.0, 53.0, 19.0, 9.0, 4.0, 6.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.036468505859375, -0.03529214859008789, -0.03411579132080078, -0.03293943405151367, -0.03176307678222656, -0.030586719512939453, -0.029410362243652344, -0.028234004974365234, -0.027057647705078125, -0.025881290435791016, -0.024704933166503906, -0.023528575897216797, -0.022352218627929688, -0.021175861358642578, -0.01999950408935547, -0.01882314682006836, -0.01764678955078125, -0.01647043228149414, -0.015294075012207031, -0.014117717742919922, -0.012941360473632812, -0.011765003204345703, -0.010588645935058594, -0.009412288665771484, -0.008235931396484375, -0.007059574127197266, -0.005883216857910156, -0.004706859588623047, -0.0035305023193359375, -0.002354145050048828, -0.0011777877807617188, -1.430511474609375e-06, 0.0011749267578125, 0.0023512840270996094, 0.0035276412963867188, 0.004703998565673828, 0.0058803558349609375, 0.007056713104248047, 0.008233070373535156, 0.009409427642822266, 0.010585784912109375, 0.011762142181396484, 0.012938499450683594, 0.014114856719970703, 0.015291213989257812, 0.016467571258544922, 0.01764392852783203, 0.01882028579711914, 0.01999664306640625, 0.02117300033569336, 0.02234935760498047, 0.023525714874267578, 0.024702072143554688, 0.025878429412841797, 0.027054786682128906, 0.028231143951416016, 0.029407501220703125, 0.030583858489990234, 0.031760215759277344, 0.03293657302856445, 0.03411293029785156, 0.03528928756713867, 0.03646564483642578, 0.03764200210571289, 0.038818359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1016.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2939869165420532, -0.2597557604312897, -0.22552458941936493, -0.19129341840744019, -0.15706226229667664, -0.12283110618591309, -0.08859993517398834, -0.0543687641620636, -0.02013760805130005, 0.014093555510044098, 0.048324719071388245, 0.08255588263273239, 0.11678704619407654, 0.1510182023048401, 0.18524937331676483, 0.21948054432868958, 0.2537117004394531, 0.2879428565502167, 0.3221740126609802, 0.35640519857406616, 0.3906363546848297, 0.42486751079559326, 0.4590986967086792, 0.49332985281944275, 0.5275610089302063, 0.5617921948432922, 0.5960233211517334, 0.6302545070648193, 0.6644856929779053, 0.6987168192863464, 0.7329480051994324, 0.7671791315078735, 0.8014103174209595, 0.8356415033340454, 0.8698726296424866, 0.9041038155555725, 0.9383349418640137, 0.9725661277770996, 1.0067973136901855, 1.0410284996032715, 1.0752596855163574, 1.1094908714294434, 1.1437220573425293, 1.1779531240463257, 1.2121843099594116, 1.2464154958724976, 1.2806466817855835, 1.3148778676986694, 1.3491089344024658, 1.3833401203155518, 1.4175713062286377, 1.451802372932434, 1.48603355884552, 1.520264744758606, 1.554495930671692, 1.5887271165847778, 1.6229581832885742, 1.6571893692016602, 1.691420555114746, 1.7256516218185425, 1.7598828077316284, 1.7941139936447144, 1.8283451795578003, 1.8625763654708862, 1.8968075513839722]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 7.0, 8.0, 11.0, 17.0, 22.0, 24.0, 42.0, 50.0, 68.0, 76.0, 94.0, 112.0, 90.0, 82.0, 63.0, 40.0, 39.0, 29.0, 20.0, 10.0, 10.0, 8.0, 6.0, 3.0, 5.0, 9.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11265707015991211, -0.10868007689714432, -0.10470308363437653, -0.10072609037160873, -0.09674909710884094, -0.09277210384607315, -0.08879511058330536, -0.08481811732053757, -0.08084112405776978, -0.07686413079500198, -0.07288713753223419, -0.0689101442694664, -0.06493315100669861, -0.06095615774393082, -0.056979164481163025, -0.05300217121839523, -0.04902517795562744, -0.04504818469285965, -0.04107119143009186, -0.037094198167324066, -0.033117204904556274, -0.029140211641788483, -0.02516321837902069, -0.0211862251162529, -0.017209231853485107, -0.013232238590717316, -0.009255245327949524, -0.005278252065181732, -0.0013012588024139404, 0.0026757344603538513, 0.006652727723121643, 0.010629720985889435, 0.014606714248657227, 0.01858370751142502, 0.02256070077419281, 0.026537694036960602, 0.030514687299728394, 0.034491680562496185, 0.03846867382526398, 0.04244566708803177, 0.04642266035079956, 0.05039965361356735, 0.054376646876335144, 0.058353640139102936, 0.06233063340187073, 0.06630762666463852, 0.07028461992740631, 0.0742616131901741, 0.0782386064529419, 0.08221559971570969, 0.08619259297847748, 0.09016958624124527, 0.09414657950401306, 0.09812357276678085, 0.10210056602954865, 0.10607755929231644, 0.11005455255508423, 0.11403154581785202, 0.11800853908061981, 0.1219855323433876, 0.1259625256061554, 0.12993952631950378, 0.13391651213169098, 0.13789349794387817, 0.14187049865722656]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 6.0, 6.0, 14.0, 20.0, 28.0, 37.0, 62.0, 76.0, 109.0, 147.0, 213.0, 279.0, 374.0, 493.0, 743.0, 1064.0, 1574.0, 2263.0, 3521.0, 5967.0, 10781.0, 25431.0, 903992.0, 53916.0, 16257.0, 7750.0, 4448.0, 2725.0, 1816.0, 1286.0, 883.0, 613.0, 457.0, 333.0, 237.0, 176.0, 133.0, 101.0, 79.0, 47.0, 28.0, 21.0, 18.0, 10.0, 6.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0206298828125, -0.019959211349487305, -0.01928853988647461, -0.018617868423461914, -0.01794719696044922, -0.017276525497436523, -0.016605854034423828, -0.015935182571411133, -0.015264511108398438, -0.014593839645385742, -0.013923168182373047, -0.013252496719360352, -0.012581825256347656, -0.011911153793334961, -0.011240482330322266, -0.01056981086730957, -0.009899139404296875, -0.00922846794128418, -0.008557796478271484, -0.007887125015258789, -0.007216453552246094, -0.0065457820892333984, -0.005875110626220703, -0.005204439163208008, -0.0045337677001953125, -0.003863096237182617, -0.003192424774169922, -0.0025217533111572266, -0.0018510818481445312, -0.001180410385131836, -0.0005097389221191406, 0.0001609325408935547, 0.00083160400390625, 0.0015022754669189453, 0.0021729469299316406, 0.002843618392944336, 0.0035142898559570312, 0.0041849613189697266, 0.004855632781982422, 0.005526304244995117, 0.0061969757080078125, 0.006867647171020508, 0.007538318634033203, 0.008208990097045898, 0.008879661560058594, 0.009550333023071289, 0.010221004486083984, 0.01089167594909668, 0.011562347412109375, 0.01223301887512207, 0.012903690338134766, 0.013574361801147461, 0.014245033264160156, 0.014915704727172852, 0.015586376190185547, 0.016257047653198242, 0.016927719116210938, 0.017598390579223633, 0.018269062042236328, 0.018939733505249023, 0.01961040496826172, 0.020281076431274414, 0.02095174789428711, 0.021622419357299805, 0.0222930908203125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 3.0, 6.0, 12.0, 8.0, 9.0, 17.0, 27.0, 777.0, 34.0, 10.0, 14.0, 9.0, 12.0, 2.0, 8.0, 5.0, 4.0, 2.0, 5.0, 1.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0182342529296875, -0.017642498016357422, -0.017050743103027344, -0.016458988189697266, -0.015867233276367188, -0.01527547836303711, -0.014683723449707031, -0.014091968536376953, -0.013500213623046875, -0.012908458709716797, -0.012316703796386719, -0.01172494888305664, -0.011133193969726562, -0.010541439056396484, -0.009949684143066406, -0.009357929229736328, -0.00876617431640625, -0.008174419403076172, -0.007582664489746094, -0.006990909576416016, -0.0063991546630859375, -0.005807399749755859, -0.005215644836425781, -0.004623889923095703, -0.004032135009765625, -0.003440380096435547, -0.0028486251831054688, -0.0022568702697753906, -0.0016651153564453125, -0.0010733604431152344, -0.00048160552978515625, 0.00011014938354492188, 0.000701904296875, 0.0012936592102050781, 0.0018854141235351562, 0.0024771690368652344, 0.0030689239501953125, 0.0036606788635253906, 0.004252433776855469, 0.004844188690185547, 0.005435943603515625, 0.006027698516845703, 0.006619453430175781, 0.007211208343505859, 0.0078029632568359375, 0.008394718170166016, 0.008986473083496094, 0.009578227996826172, 0.01016998291015625, 0.010761737823486328, 0.011353492736816406, 0.011945247650146484, 0.012537002563476562, 0.01312875747680664, 0.013720512390136719, 0.014312267303466797, 0.014904022216796875, 0.015495777130126953, 0.01608753204345703, 0.01667928695678711, 0.017271041870117188, 0.017862796783447266, 0.018454551696777344, 0.019046306610107422, 0.0196380615234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 11.0, 6.0, 16.0, 19.0, 8.0, 21.0, 25.0, 29.0, 49.0, 38.0, 69.0, 77.0, 118.0, 133.0, 197.0, 348.0, 860.0, 3310.0, 31131.0, 879679.0, 122150.0, 7400.0, 1420.0, 491.0, 254.0, 141.0, 97.0, 83.0, 63.0, 59.0, 44.0, 36.0, 31.0, 21.0, 25.0, 24.0, 9.0, 8.0, 11.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.07452392578125, -0.07224559783935547, -0.06996726989746094, -0.0676889419555664, -0.06541061401367188, -0.06313228607177734, -0.06085395812988281, -0.05857563018798828, -0.05629730224609375, -0.05401897430419922, -0.05174064636230469, -0.049462318420410156, -0.047183990478515625, -0.044905662536621094, -0.04262733459472656, -0.04034900665283203, -0.0380706787109375, -0.03579235076904297, -0.03351402282714844, -0.031235694885253906, -0.028957366943359375, -0.026679039001464844, -0.024400711059570312, -0.02212238311767578, -0.01984405517578125, -0.01756572723388672, -0.015287399291992188, -0.013009071350097656, -0.010730743408203125, -0.008452415466308594, -0.0061740875244140625, -0.0038957595825195312, -0.001617431640625, 0.0006608963012695312, 0.0029392242431640625, 0.005217552185058594, 0.007495880126953125, 0.009774208068847656, 0.012052536010742188, 0.014330863952636719, 0.01660919189453125, 0.01888751983642578, 0.021165847778320312, 0.023444175720214844, 0.025722503662109375, 0.028000831604003906, 0.030279159545898438, 0.03255748748779297, 0.0348358154296875, 0.03711414337158203, 0.03939247131347656, 0.041670799255371094, 0.043949127197265625, 0.046227455139160156, 0.04850578308105469, 0.05078411102294922, 0.05306243896484375, 0.05534076690673828, 0.05761909484863281, 0.059897422790527344, 0.062175750732421875, 0.0644540786743164, 0.06673240661621094, 0.06901073455810547, 0.0712890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 9.0, 11.0, 6.0, 15.0, 13.0, 6.0, 15.0, 17.0, 15.0, 29.0, 18.0, 25.0, 28.0, 40.0, 31.0, 34.0, 39.0, 36.0, 39.0, 41.0, 45.0, 33.0, 44.0, 34.0, 31.0, 37.0, 33.0, 24.0, 27.0, 20.0, 29.0, 25.0, 16.0, 26.0, 13.0, 18.0, 23.0, 7.0, 6.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.06732177734375, -0.0652627944946289, -0.06320381164550781, -0.06114482879638672, -0.059085845947265625, -0.05702686309814453, -0.05496788024902344, -0.052908897399902344, -0.05084991455078125, -0.048790931701660156, -0.04673194885253906, -0.04467296600341797, -0.042613983154296875, -0.04055500030517578, -0.03849601745605469, -0.036437034606933594, -0.0343780517578125, -0.032319068908691406, -0.030260086059570312, -0.02820110321044922, -0.026142120361328125, -0.02408313751220703, -0.022024154663085938, -0.019965171813964844, -0.01790618896484375, -0.015847206115722656, -0.013788223266601562, -0.011729240417480469, -0.009670257568359375, -0.007611274719238281, -0.0055522918701171875, -0.0034933090209960938, -0.001434326171875, 0.0006246566772460938, 0.0026836395263671875, 0.004742622375488281, 0.006801605224609375, 0.008860588073730469, 0.010919570922851562, 0.012978553771972656, 0.01503753662109375, 0.017096519470214844, 0.019155502319335938, 0.02121448516845703, 0.023273468017578125, 0.02533245086669922, 0.027391433715820312, 0.029450416564941406, 0.0315093994140625, 0.033568382263183594, 0.03562736511230469, 0.03768634796142578, 0.039745330810546875, 0.04180431365966797, 0.04386329650878906, 0.045922279357910156, 0.04798126220703125, 0.050040245056152344, 0.05209922790527344, 0.05415821075439453, 0.056217193603515625, 0.05827617645263672, 0.06033515930175781, 0.062394142150878906, 0.064453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 11.0, 9.0, 13.0, 26.0, 28.0, 29.0, 50.0, 69.0, 85.0, 158.0, 237.0, 447.0, 784.0, 1823.0, 6740.0, 45448.0, 937093.0, 45165.0, 6293.0, 2084.0, 795.0, 461.0, 181.0, 140.0, 117.0, 71.0, 45.0, 34.0, 17.0, 16.0, 19.0, 8.0, 6.0, 14.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.6226043701171875e-05, -2.54875048995018e-05, -2.4748966097831726e-05, -2.401042729616165e-05, -2.3271888494491577e-05, -2.2533349692821503e-05, -2.1794810891151428e-05, -2.1056272089481354e-05, -2.031773328781128e-05, -1.9579194486141205e-05, -1.884065568447113e-05, -1.8102116882801056e-05, -1.736357808113098e-05, -1.6625039279460907e-05, -1.5886500477790833e-05, -1.5147961676120758e-05, -1.4409422874450684e-05, -1.3670884072780609e-05, -1.2932345271110535e-05, -1.219380646944046e-05, -1.1455267667770386e-05, -1.0716728866100311e-05, -9.978190064430237e-06, -9.239651262760162e-06, -8.501112461090088e-06, -7.762573659420013e-06, -7.024034857749939e-06, -6.2854960560798645e-06, -5.54695725440979e-06, -4.8084184527397156e-06, -4.069879651069641e-06, -3.3313408493995667e-06, -2.592802047729492e-06, -1.8542632460594177e-06, -1.1157244443893433e-06, -3.771856427192688e-07, 3.6135315895080566e-07, 1.0998919606208801e-06, 1.8384307622909546e-06, 2.576969563961029e-06, 3.3155083656311035e-06, 4.054047167301178e-06, 4.7925859689712524e-06, 5.531124770641327e-06, 6.269663572311401e-06, 7.008202373981476e-06, 7.74674117565155e-06, 8.485279977321625e-06, 9.2238187789917e-06, 9.962357580661774e-06, 1.0700896382331848e-05, 1.1439435184001923e-05, 1.2177973985671997e-05, 1.2916512787342072e-05, 1.3655051589012146e-05, 1.439359039068222e-05, 1.5132129192352295e-05, 1.587066799402237e-05, 1.6609206795692444e-05, 1.734774559736252e-05, 1.8086284399032593e-05, 1.8824823200702667e-05, 1.9563362002372742e-05, 2.0301900804042816e-05, 2.104043960571289e-05]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 1.0, 11.0, 9.0, 20.0, 13.0, 20.0, 35.0, 15.0, 32.0, 28.0, 41.0, 55.0, 51.0, 48.0, 53.0, 55.0, 61.0, 34.0, 45.0, 71.0, 60.0, 40.0, 34.0, 27.0, 32.0, 25.0, 14.0, 18.0, 2.0, 13.0, 11.0, 8.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3974647521972656e-06, -3.2838433980941772e-06, -3.170222043991089e-06, -3.0566006898880005e-06, -2.942979335784912e-06, -2.8293579816818237e-06, -2.7157366275787354e-06, -2.602115273475647e-06, -2.4884939193725586e-06, -2.3748725652694702e-06, -2.261251211166382e-06, -2.1476298570632935e-06, -2.034008502960205e-06, -1.9203871488571167e-06, -1.8067657947540283e-06, -1.69314444065094e-06, -1.5795230865478516e-06, -1.4659017324447632e-06, -1.3522803783416748e-06, -1.2386590242385864e-06, -1.125037670135498e-06, -1.0114163160324097e-06, -8.977949619293213e-07, -7.841736078262329e-07, -6.705522537231445e-07, -5.569308996200562e-07, -4.4330954551696777e-07, -3.296881914138794e-07, -2.1606683731079102e-07, -1.0244548320770264e-07, 1.1175870895385742e-08, 1.2479722499847412e-07, 2.384185791015625e-07, 3.520399332046509e-07, 4.6566128730773926e-07, 5.792826414108276e-07, 6.92903995513916e-07, 8.065253496170044e-07, 9.201467037200928e-07, 1.0337680578231812e-06, 1.1473894119262695e-06, 1.261010766029358e-06, 1.3746321201324463e-06, 1.4882534742355347e-06, 1.601874828338623e-06, 1.7154961824417114e-06, 1.8291175365447998e-06, 1.942738890647888e-06, 2.0563602447509766e-06, 2.169981598854065e-06, 2.2836029529571533e-06, 2.3972243070602417e-06, 2.51084566116333e-06, 2.6244670152664185e-06, 2.738088369369507e-06, 2.8517097234725952e-06, 2.9653310775756836e-06, 3.078952431678772e-06, 3.1925737857818604e-06, 3.3061951398849487e-06, 3.419816493988037e-06, 3.5334378480911255e-06, 3.647059202194214e-06, 3.7606805562973022e-06, 3.874301910400391e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 2.0, 5.0, 4.0, 9.0, 12.0, 18.0, 24.0, 21.0, 28.0, 49.0, 57.0, 89.0, 91.0, 164.0, 335.0, 1073.0, 6464.0, 329889.0, 700357.0, 7728.0, 1115.0, 380.0, 184.0, 137.0, 76.0, 59.0, 44.0, 26.0, 20.0, 19.0, 18.0, 13.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.7179718017578125e-05, -2.640392631292343e-05, -2.5628134608268738e-05, -2.4852342903614044e-05, -2.407655119895935e-05, -2.3300759494304657e-05, -2.2524967789649963e-05, -2.174917608499527e-05, -2.0973384380340576e-05, -2.0197592675685883e-05, -1.942180097103119e-05, -1.8646009266376495e-05, -1.7870217561721802e-05, -1.7094425857067108e-05, -1.6318634152412415e-05, -1.554284244775772e-05, -1.4767050743103027e-05, -1.3991259038448334e-05, -1.321546733379364e-05, -1.2439675629138947e-05, -1.1663883924484253e-05, -1.088809221982956e-05, -1.0112300515174866e-05, -9.336508810520172e-06, -8.560717105865479e-06, -7.784925401210785e-06, -7.009133696556091e-06, -6.233341991901398e-06, -5.457550287246704e-06, -4.6817585825920105e-06, -3.905966877937317e-06, -3.1301751732826233e-06, -2.3543834686279297e-06, -1.578591763973236e-06, -8.028000593185425e-07, -2.7008354663848877e-08, 7.487833499908447e-07, 1.5245750546455383e-06, 2.300366759300232e-06, 3.0761584639549255e-06, 3.851950168609619e-06, 4.627741873264313e-06, 5.403533577919006e-06, 6.1793252825737e-06, 6.9551169872283936e-06, 7.730908691883087e-06, 8.50670039653778e-06, 9.282492101192474e-06, 1.0058283805847168e-05, 1.0834075510501862e-05, 1.1609867215156555e-05, 1.2385658919811249e-05, 1.3161450624465942e-05, 1.3937242329120636e-05, 1.471303403377533e-05, 1.5488825738430023e-05, 1.6264617443084717e-05, 1.704040914773941e-05, 1.7816200852394104e-05, 1.8591992557048798e-05, 1.936778426170349e-05, 2.0143575966358185e-05, 2.091936767101288e-05, 2.1695159375667572e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 13.0, 19.0, 13.0, 15.0, 25.0, 30.0, 37.0, 20.0, 35.0, 37.0, 69.0, 69.0, 63.0, 71.0, 62.0, 69.0, 49.0, 57.0, 45.0, 27.0, 27.0, 24.0, 14.0, 15.0, 10.0, 12.0, 11.0, 10.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.4557113647460938e-05, -2.3855827748775482e-05, -2.3154541850090027e-05, -2.245325595140457e-05, -2.1751970052719116e-05, -2.105068415403366e-05, -2.0349398255348206e-05, -1.964811235666275e-05, -1.8946826457977295e-05, -1.824554055929184e-05, -1.7544254660606384e-05, -1.684296876192093e-05, -1.6141682863235474e-05, -1.544039696455002e-05, -1.4739111065864563e-05, -1.4037825167179108e-05, -1.3336539268493652e-05, -1.2635253369808197e-05, -1.1933967471122742e-05, -1.1232681572437286e-05, -1.0531395673751831e-05, -9.830109775066376e-06, -9.12882387638092e-06, -8.427537977695465e-06, -7.72625207901001e-06, -7.0249661803245544e-06, -6.323680281639099e-06, -5.622394382953644e-06, -4.9211084842681885e-06, -4.219822585582733e-06, -3.518536686897278e-06, -2.8172507882118225e-06, -2.115964889526367e-06, -1.4146789908409119e-06, -7.133930921554565e-07, -1.210719347000122e-08, 6.891787052154541e-07, 1.3904646039009094e-06, 2.0917505025863647e-06, 2.79303640127182e-06, 3.4943222999572754e-06, 4.195608198642731e-06, 4.896894097328186e-06, 5.598179996013641e-06, 6.299465894699097e-06, 7.000751793384552e-06, 7.702037692070007e-06, 8.403323590755463e-06, 9.104609489440918e-06, 9.805895388126373e-06, 1.0507181286811829e-05, 1.1208467185497284e-05, 1.190975308418274e-05, 1.2611038982868195e-05, 1.331232488155365e-05, 1.4013610780239105e-05, 1.471489667892456e-05, 1.5416182577610016e-05, 1.611746847629547e-05, 1.6818754374980927e-05, 1.7520040273666382e-05, 1.8221326172351837e-05, 1.8922612071037292e-05, 1.9623897969722748e-05, 2.0325183868408203e-05]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 875.0, 136.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.669297218322754, -4.587241172790527, -4.505185127258301, -4.423129081726074, -4.341073036193848, -4.259017467498779, -4.176961421966553, -4.094905376434326, -4.0128493309021, -3.930793285369873, -3.8487372398376465, -3.766681432723999, -3.6846253871917725, -3.602569341659546, -3.5205135345458984, -3.438457489013672, -3.3564014434814453, -3.2743453979492188, -3.192289352416992, -3.1102335453033447, -3.028177499771118, -2.9461214542388916, -2.864065647125244, -2.7820096015930176, -2.699953556060791, -2.6178975105285645, -2.535841464996338, -2.4537856578826904, -2.371729612350464, -2.2896735668182373, -2.20761775970459, -2.1255617141723633, -2.0435056686401367, -1.9614496231079102, -1.8793936967849731, -1.7973377704620361, -1.7152817249298096, -1.633225679397583, -1.551169753074646, -1.469113826751709, -1.3870577812194824, -1.3050017356872559, -1.2229458093643188, -1.1408898830413818, -1.0588338375091553, -0.9767778515815735, -0.8947218656539917, -0.8126658797264099, -0.7306098341941833, -0.6485538482666016, -0.5664978623390198, -0.484441876411438, -0.4023858904838562, -0.3203299045562744, -0.23827391862869263, -0.15621793270111084, -0.07416194677352905, 0.007894039154052734, 0.08995002508163452, 0.1720060110092163, 0.2540619969367981, 0.3361179828643799, 0.41817396879196167, 0.5002299547195435, 0.5822859406471252]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 6.0, 5.0, 11.0, 14.0, 16.0, 18.0, 26.0, 49.0, 112.0, 144.0, 178.0, 141.0, 104.0, 59.0, 35.0, 16.0, 11.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.386279821395874, -1.339289665222168, -1.2922996282577515, -1.2453094720840454, -1.198319435119629, -1.1513292789459229, -1.1043391227722168, -1.0573489665985107, -1.0103589296340942, -0.963368833065033, -0.9163787364959717, -0.8693885803222656, -0.8223984837532043, -0.7754083871841431, -0.728418231010437, -0.6814281344413757, -0.6344380378723145, -0.5874479413032532, -0.5404578447341919, -0.49346768856048584, -0.44647759199142456, -0.3994874954223633, -0.3524973690509796, -0.30550724267959595, -0.25851714611053467, -0.2115270346403122, -0.16453692317008972, -0.11754681169986725, -0.07055670022964478, -0.023566588759422302, 0.02342352271080017, 0.07041364908218384, 0.11740386486053467, 0.16439397633075714, 0.21138408780097961, 0.2583742141723633, 0.30536431074142456, 0.35235440731048584, 0.3993445336818695, 0.4463346600532532, 0.49332475662231445, 0.5403148531913757, 0.587304949760437, 0.6342951059341431, 0.6812852025032043, 0.7282752990722656, 0.7752654552459717, 0.822255551815033, 0.8692456483840942, 0.9162357449531555, 0.9632258415222168, 1.0102159976959229, 1.057206153869629, 1.1041961908340454, 1.1511863470077515, 1.198176383972168, 1.245166540145874, 1.29215669631958, 1.3391467332839966, 1.3861368894577026, 1.4331269264221191, 1.4801170825958252, 1.5271072387695312, 1.5740973949432373, 1.6210874319076538]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 10.0, 9.0, 7.0, 23.0, 33.0, 52.0, 105.0, 198.0, 500.0, 1144.0, 3897.0, 52441.0, 4125752.0, 6156.0, 2087.0, 877.0, 449.0, 213.0, 123.0, 63.0, 36.0, 17.0, 24.0, 10.0, 8.0, 8.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1973876953125, -0.19035911560058594, -0.18333053588867188, -0.1763019561767578, -0.16927337646484375, -0.1622447967529297, -0.15521621704101562, -0.14818763732910156, -0.1411590576171875, -0.13413047790527344, -0.12710189819335938, -0.12007331848144531, -0.11304473876953125, -0.10601615905761719, -0.09898757934570312, -0.09195899963378906, -0.084930419921875, -0.07790184020996094, -0.07087326049804688, -0.06384468078613281, -0.05681610107421875, -0.04978752136230469, -0.042758941650390625, -0.03573036193847656, -0.0287017822265625, -0.021673202514648438, -0.014644622802734375, -0.0076160430908203125, -0.00058746337890625, 0.0064411163330078125, 0.013469696044921875, 0.020498275756835938, 0.02752685546875, 0.03455543518066406, 0.041584014892578125, 0.04861259460449219, 0.05564117431640625, 0.06266975402832031, 0.06969833374023438, 0.07672691345214844, 0.0837554931640625, 0.09078407287597656, 0.09781265258789062, 0.10484123229980469, 0.11186981201171875, 0.11889839172363281, 0.12592697143554688, 0.13295555114746094, 0.139984130859375, 0.14701271057128906, 0.15404129028320312, 0.1610698699951172, 0.16809844970703125, 0.1751270294189453, 0.18215560913085938, 0.18918418884277344, 0.1962127685546875, 0.20324134826660156, 0.21026992797851562, 0.2172985076904297, 0.22432708740234375, 0.2313556671142578, 0.23838424682617188, 0.24541282653808594, 0.25244140625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 10.0, 9.0, 4.0, 8.0, 4.0, 13.0, 15.0, 24.0, 613.0, 175.0, 17.0, 13.0, 10.0, 7.0, 8.0, 8.0, 6.0, 6.0, 4.0, 7.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01276397705078125, -0.012310385704040527, -0.011856794357299805, -0.011403203010559082, -0.01094961166381836, -0.010496020317077637, -0.010042428970336914, -0.009588837623596191, -0.009135246276855469, -0.008681654930114746, -0.008228063583374023, -0.007774472236633301, -0.007320880889892578, -0.0068672895431518555, -0.006413698196411133, -0.00596010684967041, -0.0055065155029296875, -0.005052924156188965, -0.004599332809448242, -0.0041457414627075195, -0.003692150115966797, -0.0032385587692260742, -0.0027849674224853516, -0.002331376075744629, -0.0018777847290039062, -0.0014241933822631836, -0.0009706020355224609, -0.0005170106887817383, -6.341934204101562e-05, 0.00039017200469970703, 0.0008437633514404297, 0.0012973546981811523, 0.001750946044921875, 0.0022045373916625977, 0.0026581287384033203, 0.003111720085144043, 0.0035653114318847656, 0.004018902778625488, 0.004472494125366211, 0.004926085472106934, 0.005379676818847656, 0.005833268165588379, 0.0062868595123291016, 0.006740450859069824, 0.007194042205810547, 0.0076476335525512695, 0.008101224899291992, 0.008554816246032715, 0.009008407592773438, 0.00946199893951416, 0.009915590286254883, 0.010369181632995605, 0.010822772979736328, 0.01127636432647705, 0.011729955673217773, 0.012183547019958496, 0.012637138366699219, 0.013090729713439941, 0.013544321060180664, 0.013997912406921387, 0.01445150375366211, 0.014905095100402832, 0.015358686447143555, 0.015812277793884277, 0.016265869140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 3.0, 6.0, 9.0, 6.0, 12.0, 17.0, 19.0, 12.0, 28.0, 31.0, 49.0, 62.0, 113.0, 174.0, 394.0, 1131.0, 5581.0, 58051.0, 4104599.0, 19744.0, 2783.0, 719.0, 272.0, 135.0, 64.0, 58.0, 40.0, 28.0, 19.0, 24.0, 10.0, 15.0, 10.0, 8.0, 12.0, 5.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1766357421875, -0.17148590087890625, -0.1663360595703125, -0.16118621826171875, -0.156036376953125, -0.15088653564453125, -0.1457366943359375, -0.14058685302734375, -0.13543701171875, -0.13028717041015625, -0.1251373291015625, -0.11998748779296875, -0.114837646484375, -0.10968780517578125, -0.1045379638671875, -0.09938812255859375, -0.09423828125, -0.08908843994140625, -0.0839385986328125, -0.07878875732421875, -0.073638916015625, -0.06848907470703125, -0.0633392333984375, -0.05818939208984375, -0.05303955078125, -0.04788970947265625, -0.0427398681640625, -0.03759002685546875, -0.032440185546875, -0.02729034423828125, -0.0221405029296875, -0.01699066162109375, -0.0118408203125, -0.00669097900390625, -0.0015411376953125, 0.00360870361328125, 0.008758544921875, 0.01390838623046875, 0.0190582275390625, 0.02420806884765625, 0.02935791015625, 0.03450775146484375, 0.0396575927734375, 0.04480743408203125, 0.049957275390625, 0.05510711669921875, 0.0602569580078125, 0.06540679931640625, 0.070556640625, 0.07570648193359375, 0.0808563232421875, 0.08600616455078125, 0.091156005859375, 0.09630584716796875, 0.1014556884765625, 0.10660552978515625, 0.11175537109375, 0.11690521240234375, 0.1220550537109375, 0.12720489501953125, 0.132354736328125, 0.13750457763671875, 0.1426544189453125, 0.14780426025390625, 0.1529541015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 9.0, 5.0, 8.0, 12.0, 19.0, 6.0, 19.0, 13.0, 21.0, 22.0, 36.0, 59.0, 3597.0, 30.0, 24.0, 22.0, 17.0, 14.0, 11.0, 13.0, 11.0, 15.0, 4.0, 14.0, 7.0, 7.0, 6.0, 5.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.025299072265625, -0.024561405181884766, -0.02382373809814453, -0.023086071014404297, -0.022348403930664062, -0.021610736846923828, -0.020873069763183594, -0.02013540267944336, -0.019397735595703125, -0.01866006851196289, -0.017922401428222656, -0.017184734344482422, -0.016447067260742188, -0.015709400177001953, -0.014971733093261719, -0.014234066009521484, -0.01349639892578125, -0.012758731842041016, -0.012021064758300781, -0.011283397674560547, -0.010545730590820312, -0.009808063507080078, -0.009070396423339844, -0.00833272933959961, -0.007595062255859375, -0.006857395172119141, -0.006119728088378906, -0.005382061004638672, -0.0046443939208984375, -0.003906726837158203, -0.0031690597534179688, -0.0024313926696777344, -0.0016937255859375, -0.0009560585021972656, -0.00021839141845703125, 0.0005192756652832031, 0.0012569427490234375, 0.001994609832763672, 0.0027322769165039062, 0.0034699440002441406, 0.004207611083984375, 0.004945278167724609, 0.005682945251464844, 0.006420612335205078, 0.0071582794189453125, 0.007895946502685547, 0.008633613586425781, 0.009371280670166016, 0.01010894775390625, 0.010846614837646484, 0.011584281921386719, 0.012321949005126953, 0.013059616088867188, 0.013797283172607422, 0.014534950256347656, 0.01527261734008789, 0.016010284423828125, 0.01674795150756836, 0.017485618591308594, 0.018223285675048828, 0.018960952758789062, 0.019698619842529297, 0.02043628692626953, 0.021173954010009766, 0.02191162109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1016.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.814591646194458, -1.782610297203064, -1.75062894821167, -1.7186474800109863, -1.6866661310195923, -1.6546847820281982, -1.6227034330368042, -1.5907220840454102, -1.5587407350540161, -1.526759386062622, -1.494778037071228, -1.462796688079834, -1.4308152198791504, -1.3988338708877563, -1.3668525218963623, -1.3348711729049683, -1.3028898239135742, -1.2709084749221802, -1.2389271259307861, -1.2069456577301025, -1.1749643087387085, -1.1429829597473145, -1.1110016107559204, -1.0790202617645264, -1.0470387935638428, -1.0150574445724487, -0.9830760359764099, -0.9510946869850159, -0.9191133379936218, -0.887131929397583, -0.855150580406189, -0.8231692314147949, -0.7911879420280457, -0.7592065930366516, -0.7272251844406128, -0.6952438354492188, -0.6632624864578247, -0.6312811374664307, -0.5992997288703918, -0.5673183798789978, -0.5353370308876038, -0.5033556818962097, -0.4713743031024933, -0.43939292430877686, -0.4074115753173828, -0.3754301965236664, -0.34344881772994995, -0.3114674687385559, -0.2794860601425171, -0.24750469624996185, -0.21552333235740662, -0.18354195356369019, -0.15156058967113495, -0.11957922577857971, -0.08759784698486328, -0.055616483092308044, -0.023635134100914, 0.008346233516931534, 0.04032760113477707, 0.0723089724779129, 0.10429033637046814, 0.13627170026302338, 0.1682530790567398, 0.20023444294929504, 0.23221580684185028]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 10.0, 6.0, 18.0, 22.0, 42.0, 67.0, 109.0, 138.0, 171.0, 112.0, 95.0, 73.0, 32.0, 15.0, 12.0, 13.0, 10.0, 5.0, 10.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13524079322814941, -0.13109557330608368, -0.12695035338401794, -0.1228051483631134, -0.11865992844104767, -0.11451470851898193, -0.1103694960474968, -0.10622428357601166, -0.10207906365394592, -0.09793384373188019, -0.09378863126039505, -0.08964341878890991, -0.08549819886684418, -0.08135297894477844, -0.0772077664732933, -0.07306255400180817, -0.06891733407974243, -0.0647721141576767, -0.06062690168619156, -0.05648168548941612, -0.052336469292640686, -0.04819125309586525, -0.04404603689908981, -0.03990082070231438, -0.03575560450553894, -0.031610388308763504, -0.027465172111988068, -0.02331995591521263, -0.019174739718437195, -0.015029523521661758, -0.010884307324886322, -0.006739091128110886, -0.0025938749313354492, 0.0015513412654399872, 0.005696557462215424, 0.00984177365899086, 0.013986989855766296, 0.018132206052541733, 0.02227742224931717, 0.026422638446092606, 0.030567854642868042, 0.03471307083964348, 0.038858287036418915, 0.04300350323319435, 0.04714871942996979, 0.051293935626745224, 0.05543915182352066, 0.0595843680202961, 0.06372958421707153, 0.06787480413913727, 0.0720200166106224, 0.07616522908210754, 0.08031044900417328, 0.08445566892623901, 0.08860088139772415, 0.09274609386920929, 0.09689131379127502, 0.10103653371334076, 0.1051817461848259, 0.10932695865631104, 0.11347217857837677, 0.1176173985004425, 0.12176261097192764, 0.12590782344341278, 0.13005304336547852]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 7.0, 10.0, 13.0, 21.0, 17.0, 29.0, 38.0, 38.0, 69.0, 91.0, 121.0, 152.0, 262.0, 322.0, 430.0, 607.0, 945.0, 1301.0, 2051.0, 2925.0, 4724.0, 7996.0, 13771.0, 29600.0, 866889.0, 70211.0, 18750.0, 10110.0, 5828.0, 3669.0, 2255.0, 1568.0, 1073.0, 747.0, 557.0, 372.0, 274.0, 214.0, 135.0, 101.0, 71.0, 58.0, 34.0, 22.0, 17.0, 17.0, 7.0, 10.0, 4.0, 6.0, 2.0, 5.0, 3.0, 1.0, 3.0], "bins": [-0.043182373046875, -0.04190206527709961, -0.04062175750732422, -0.03934144973754883, -0.03806114196777344, -0.03678083419799805, -0.035500526428222656, -0.034220218658447266, -0.032939910888671875, -0.031659603118896484, -0.030379295349121094, -0.029098987579345703, -0.027818679809570312, -0.026538372039794922, -0.02525806427001953, -0.02397775650024414, -0.02269744873046875, -0.02141714096069336, -0.02013683319091797, -0.018856525421142578, -0.017576217651367188, -0.016295909881591797, -0.015015602111816406, -0.013735294342041016, -0.012454986572265625, -0.011174678802490234, -0.009894371032714844, -0.008614063262939453, -0.0073337554931640625, -0.006053447723388672, -0.004773139953613281, -0.0034928321838378906, -0.0022125244140625, -0.0009322166442871094, 0.00034809112548828125, 0.0016283988952636719, 0.0029087066650390625, 0.004189014434814453, 0.005469322204589844, 0.006749629974365234, 0.008029937744140625, 0.009310245513916016, 0.010590553283691406, 0.011870861053466797, 0.013151168823242188, 0.014431476593017578, 0.01571178436279297, 0.01699209213256836, 0.01827239990234375, 0.01955270767211914, 0.02083301544189453, 0.022113323211669922, 0.023393630981445312, 0.024673938751220703, 0.025954246520996094, 0.027234554290771484, 0.028514862060546875, 0.029795169830322266, 0.031075477600097656, 0.03235578536987305, 0.03363609313964844, 0.03491640090942383, 0.03619670867919922, 0.03747701644897461, 0.03875732421875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 10.0, 4.0, 8.0, 9.0, 11.0, 15.0, 25.0, 482.0, 297.0, 24.0, 5.0, 12.0, 7.0, 9.0, 6.0, 8.0, 9.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01279449462890625, -0.01237177848815918, -0.01194906234741211, -0.011526346206665039, -0.011103630065917969, -0.010680913925170898, -0.010258197784423828, -0.009835481643676758, -0.009412765502929688, -0.008990049362182617, -0.008567333221435547, -0.008144617080688477, -0.007721900939941406, -0.007299184799194336, -0.006876468658447266, -0.006453752517700195, -0.006031036376953125, -0.005608320236206055, -0.005185604095458984, -0.004762887954711914, -0.004340171813964844, -0.0039174556732177734, -0.003494739532470703, -0.003072023391723633, -0.0026493072509765625, -0.002226591110229492, -0.0018038749694824219, -0.0013811588287353516, -0.0009584426879882812, -0.0005357265472412109, -0.00011301040649414062, 0.0003097057342529297, 0.000732421875, 0.0011551380157470703, 0.0015778541564941406, 0.002000570297241211, 0.0024232864379882812, 0.0028460025787353516, 0.003268718719482422, 0.003691434860229492, 0.0041141510009765625, 0.004536867141723633, 0.004959583282470703, 0.0053822994232177734, 0.005805015563964844, 0.006227731704711914, 0.006650447845458984, 0.007073163986206055, 0.007495880126953125, 0.007918596267700195, 0.008341312408447266, 0.008764028549194336, 0.009186744689941406, 0.009609460830688477, 0.010032176971435547, 0.010454893112182617, 0.010877609252929688, 0.011300325393676758, 0.011723041534423828, 0.012145757675170898, 0.012568473815917969, 0.012991189956665039, 0.01341390609741211, 0.01383662223815918, 0.01425933837890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 6.0, 8.0, 6.0, 9.0, 16.0, 10.0, 19.0, 13.0, 24.0, 39.0, 49.0, 53.0, 50.0, 58.0, 88.0, 116.0, 102.0, 169.0, 198.0, 366.0, 704.0, 3680.0, 90265.0, 927741.0, 21300.0, 1710.0, 523.0, 272.0, 191.0, 124.0, 111.0, 119.0, 76.0, 62.0, 53.0, 48.0, 37.0, 35.0, 21.0, 21.0, 17.0, 14.0, 10.0, 4.0, 7.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.0791482925415039, -0.07644844055175781, -0.07374858856201172, -0.07104873657226562, -0.06834888458251953, -0.06564903259277344, -0.06294918060302734, -0.06024932861328125, -0.057549476623535156, -0.05484962463378906, -0.05214977264404297, -0.049449920654296875, -0.04675006866455078, -0.04405021667480469, -0.041350364685058594, -0.0386505126953125, -0.035950660705566406, -0.03325080871582031, -0.03055095672607422, -0.027851104736328125, -0.02515125274658203, -0.022451400756835938, -0.019751548767089844, -0.01705169677734375, -0.014351844787597656, -0.011651992797851562, -0.008952140808105469, -0.006252288818359375, -0.0035524368286132812, -0.0008525848388671875, 0.0018472671508789062, 0.004547119140625, 0.007246971130371094, 0.009946823120117188, 0.012646675109863281, 0.015346527099609375, 0.01804637908935547, 0.020746231079101562, 0.023446083068847656, 0.02614593505859375, 0.028845787048339844, 0.03154563903808594, 0.03424549102783203, 0.036945343017578125, 0.03964519500732422, 0.04234504699707031, 0.045044898986816406, 0.0477447509765625, 0.050444602966308594, 0.05314445495605469, 0.05584430694580078, 0.058544158935546875, 0.06124401092529297, 0.06394386291503906, 0.06664371490478516, 0.06934356689453125, 0.07204341888427734, 0.07474327087402344, 0.07744312286376953, 0.08014297485351562, 0.08284282684326172, 0.08554267883300781, 0.0882425308227539, 0.0909423828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 7.0, 5.0, 8.0, 13.0, 6.0, 10.0, 4.0, 11.0, 15.0, 24.0, 21.0, 19.0, 25.0, 22.0, 30.0, 30.0, 41.0, 32.0, 40.0, 44.0, 36.0, 38.0, 44.0, 37.0, 38.0, 44.0, 37.0, 37.0, 38.0, 25.0, 39.0, 15.0, 18.0, 26.0, 24.0, 16.0, 12.0, 14.0, 9.0, 8.0, 10.0, 9.0, 3.0, 4.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03826904296875, -0.03700685501098633, -0.035744667053222656, -0.034482479095458984, -0.03322029113769531, -0.03195810317993164, -0.03069591522216797, -0.029433727264404297, -0.028171539306640625, -0.026909351348876953, -0.02564716339111328, -0.02438497543334961, -0.023122787475585938, -0.021860599517822266, -0.020598411560058594, -0.019336223602294922, -0.01807403564453125, -0.016811847686767578, -0.015549659729003906, -0.014287471771240234, -0.013025283813476562, -0.01176309585571289, -0.010500907897949219, -0.009238719940185547, -0.007976531982421875, -0.006714344024658203, -0.005452156066894531, -0.004189968109130859, -0.0029277801513671875, -0.0016655921936035156, -0.00040340423583984375, 0.0008587837219238281, 0.0021209716796875, 0.003383159637451172, 0.004645347595214844, 0.005907535552978516, 0.0071697235107421875, 0.00843191146850586, 0.009694099426269531, 0.010956287384033203, 0.012218475341796875, 0.013480663299560547, 0.014742851257324219, 0.01600503921508789, 0.017267227172851562, 0.018529415130615234, 0.019791603088378906, 0.021053791046142578, 0.02231597900390625, 0.023578166961669922, 0.024840354919433594, 0.026102542877197266, 0.027364730834960938, 0.02862691879272461, 0.02988910675048828, 0.031151294708251953, 0.032413482666015625, 0.0336756706237793, 0.03493785858154297, 0.03620004653930664, 0.03746223449707031, 0.038724422454833984, 0.039986610412597656, 0.04124879837036133, 0.042510986328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 14.0, 23.0, 47.0, 64.0, 165.0, 391.0, 1362.0, 9701.0, 1005077.0, 28689.0, 2099.0, 531.0, 185.0, 73.0, 42.0, 27.0, 12.0, 12.0, 9.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001360177993774414, -0.00013185106217861176, -0.0001276843249797821, -0.00012351758778095245, -0.0001193508505821228, -0.00011518411338329315, -0.0001110173761844635, -0.00010685063898563385, -0.0001026839017868042, -9.851716458797455e-05, -9.43504273891449e-05, -9.018369019031525e-05, -8.60169529914856e-05, -8.185021579265594e-05, -7.76834785938263e-05, -7.351674139499664e-05, -6.935000419616699e-05, -6.518326699733734e-05, -6.101652979850769e-05, -5.684979259967804e-05, -5.268305540084839e-05, -4.851631820201874e-05, -4.434958100318909e-05, -4.0182843804359436e-05, -3.6016106605529785e-05, -3.1849369406700134e-05, -2.7682632207870483e-05, -2.3515895009040833e-05, -1.934915781021118e-05, -1.518242061138153e-05, -1.101568341255188e-05, -6.848946213722229e-06, -2.682209014892578e-06, 1.4845281839370728e-06, 5.651265382766724e-06, 9.818002581596375e-06, 1.3984739780426025e-05, 1.8151476979255676e-05, 2.2318214178085327e-05, 2.6484951376914978e-05, 3.065168857574463e-05, 3.481842577457428e-05, 3.898516297340393e-05, 4.315190017223358e-05, 4.731863737106323e-05, 5.148537456989288e-05, 5.5652111768722534e-05, 5.9818848967552185e-05, 6.398558616638184e-05, 6.815232336521149e-05, 7.231906056404114e-05, 7.648579776287079e-05, 8.065253496170044e-05, 8.481927216053009e-05, 8.898600935935974e-05, 9.315274655818939e-05, 9.731948375701904e-05, 0.0001014862209558487, 0.00010565295815467834, 0.000109819695353508, 0.00011398643255233765, 0.0001181531697511673, 0.00012231990694999695, 0.0001264866441488266, 0.00013065338134765625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 5.0, 11.0, 15.0, 12.0, 24.0, 51.0, 65.0, 74.0, 90.0, 138.0, 98.0, 96.0, 80.0, 84.0, 52.0, 24.0, 20.0, 14.0, 18.0, 7.0, 7.0, 0.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0848045349121094e-05, -1.0595656931400299e-05, -1.0343268513679504e-05, -1.009088009595871e-05, -9.838491678237915e-06, -9.58610326051712e-06, -9.333714842796326e-06, -9.081326425075531e-06, -8.828938007354736e-06, -8.576549589633942e-06, -8.324161171913147e-06, -8.071772754192352e-06, -7.819384336471558e-06, -7.566995918750763e-06, -7.314607501029968e-06, -7.062219083309174e-06, -6.809830665588379e-06, -6.557442247867584e-06, -6.3050538301467896e-06, -6.052665412425995e-06, -5.8002769947052e-06, -5.5478885769844055e-06, -5.295500159263611e-06, -5.043111741542816e-06, -4.7907233238220215e-06, -4.538334906101227e-06, -4.285946488380432e-06, -4.0335580706596375e-06, -3.7811696529388428e-06, -3.528781235218048e-06, -3.2763928174972534e-06, -3.0240043997764587e-06, -2.771615982055664e-06, -2.5192275643348694e-06, -2.2668391466140747e-06, -2.01445072889328e-06, -1.7620623111724854e-06, -1.5096738934516907e-06, -1.257285475730896e-06, -1.0048970580101013e-06, -7.525086402893066e-07, -5.00120222568512e-07, -2.477318048477173e-07, 4.6566128730773926e-09, 2.5704503059387207e-07, 5.094334483146667e-07, 7.618218660354614e-07, 1.014210283756256e-06, 1.2665987014770508e-06, 1.5189871191978455e-06, 1.7713755369186401e-06, 2.023763954639435e-06, 2.2761523723602295e-06, 2.528540790081024e-06, 2.780929207801819e-06, 3.0333176255226135e-06, 3.285706043243408e-06, 3.538094460964203e-06, 3.7904828786849976e-06, 4.042871296405792e-06, 4.295259714126587e-06, 4.547648131847382e-06, 4.800036549568176e-06, 5.052424967288971e-06, 5.304813385009766e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 14.0, 16.0, 11.0, 31.0, 33.0, 45.0, 51.0, 76.0, 101.0, 143.0, 225.0, 321.0, 915.0, 7959.0, 966429.0, 68347.0, 2316.0, 552.0, 267.0, 175.0, 126.0, 81.0, 57.0, 57.0, 34.0, 31.0, 27.0, 18.0, 16.0, 7.0, 7.0, 9.0, 10.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.328655242919922e-05, -5.13661652803421e-05, -4.9445778131484985e-05, -4.752539098262787e-05, -4.560500383377075e-05, -4.3684616684913635e-05, -4.176422953605652e-05, -3.98438423871994e-05, -3.7923455238342285e-05, -3.600306808948517e-05, -3.408268094062805e-05, -3.2162293791770935e-05, -3.024190664291382e-05, -2.83215194940567e-05, -2.6401132345199585e-05, -2.4480745196342468e-05, -2.256035804748535e-05, -2.0639970898628235e-05, -1.8719583749771118e-05, -1.6799196600914e-05, -1.4878809452056885e-05, -1.2958422303199768e-05, -1.1038035154342651e-05, -9.117648005485535e-06, -7.197260856628418e-06, -5.276873707771301e-06, -3.3564865589141846e-06, -1.4360994100570679e-06, 4.842877388000488e-07, 2.4046748876571655e-06, 4.325062036514282e-06, 6.245449185371399e-06, 8.165836334228516e-06, 1.0086223483085632e-05, 1.2006610631942749e-05, 1.3926997780799866e-05, 1.5847384929656982e-05, 1.77677720785141e-05, 1.9688159227371216e-05, 2.1608546376228333e-05, 2.352893352508545e-05, 2.5449320673942566e-05, 2.7369707822799683e-05, 2.92900949716568e-05, 3.1210482120513916e-05, 3.313086926937103e-05, 3.505125641822815e-05, 3.6971643567085266e-05, 3.889203071594238e-05, 4.08124178647995e-05, 4.2732805013656616e-05, 4.465319216251373e-05, 4.657357931137085e-05, 4.8493966460227966e-05, 5.041435360908508e-05, 5.23347407579422e-05, 5.4255127906799316e-05, 5.617551505565643e-05, 5.809590220451355e-05, 6.0016289353370667e-05, 6.193667650222778e-05, 6.38570636510849e-05, 6.577745079994202e-05, 6.769783794879913e-05, 6.961822509765625e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 10.0, 6.0, 5.0, 5.0, 18.0, 12.0, 16.0, 19.0, 23.0, 40.0, 42.0, 41.0, 49.0, 62.0, 65.0, 87.0, 79.0, 64.0, 56.0, 47.0, 44.0, 44.0, 30.0, 20.0, 19.0, 18.0, 9.0, 16.0, 12.0, 9.0, 7.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.491474151611328e-05, -2.401694655418396e-05, -2.311915159225464e-05, -2.2221356630325317e-05, -2.1323561668395996e-05, -2.0425766706466675e-05, -1.9527971744537354e-05, -1.8630176782608032e-05, -1.773238182067871e-05, -1.683458685874939e-05, -1.593679189682007e-05, -1.5038996934890747e-05, -1.4141201972961426e-05, -1.3243407011032104e-05, -1.2345612049102783e-05, -1.1447817087173462e-05, -1.055002212524414e-05, -9.65222716331482e-06, -8.754432201385498e-06, -7.856637239456177e-06, -6.9588422775268555e-06, -6.061047315597534e-06, -5.163252353668213e-06, -4.265457391738892e-06, -3.3676624298095703e-06, -2.469867467880249e-06, -1.5720725059509277e-06, -6.742775440216064e-07, 2.2351741790771484e-07, 1.1213123798370361e-06, 2.0191073417663574e-06, 2.9169023036956787e-06, 3.814697265625e-06, 4.712492227554321e-06, 5.610287189483643e-06, 6.508082151412964e-06, 7.405877113342285e-06, 8.303672075271606e-06, 9.201467037200928e-06, 1.0099261999130249e-05, 1.099705696105957e-05, 1.1894851922988892e-05, 1.2792646884918213e-05, 1.3690441846847534e-05, 1.4588236808776855e-05, 1.5486031770706177e-05, 1.6383826732635498e-05, 1.728162169456482e-05, 1.817941665649414e-05, 1.9077211618423462e-05, 1.9975006580352783e-05, 2.0872801542282104e-05, 2.1770596504211426e-05, 2.2668391466140747e-05, 2.356618642807007e-05, 2.446398138999939e-05, 2.536177635192871e-05, 2.6259571313858032e-05, 2.7157366275787354e-05, 2.8055161237716675e-05, 2.8952956199645996e-05, 2.9850751161575317e-05, 3.074854612350464e-05, 3.164634108543396e-05, 3.254413604736328e-05]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 965.0, 37.0, 6.0, 0.0, 1.0], "bins": [-2.155596971511841, -2.1194586753845215, -2.083320379257202, -2.0471818447113037, -2.0110435485839844, -1.974905252456665, -1.9387669563293457, -1.9026286602020264, -1.8664902448654175, -1.8303519487380981, -1.7942135334014893, -1.75807523727417, -1.7219369411468506, -1.6857985258102417, -1.6496602296829224, -1.6135218143463135, -1.5773835182189941, -1.5412452220916748, -1.505106806755066, -1.4689685106277466, -1.4328300952911377, -1.3966917991638184, -1.360553503036499, -1.3244152069091797, -1.2882767915725708, -1.2521384954452515, -1.2160000801086426, -1.1798617839813232, -1.143723487854004, -1.107585072517395, -1.0714467763900757, -1.0353083610534668, -0.9991700053215027, -0.9630316495895386, -0.9268933534622192, -0.8907549977302551, -0.854616641998291, -0.8184782862663269, -0.7823399305343628, -0.7462016344070435, -0.7100632786750793, -0.6739249229431152, -0.6377866268157959, -0.6016482710838318, -0.5655099153518677, -0.5293715596199036, -0.49323323369026184, -0.4570949077606201, -0.420956552028656, -0.3848181962966919, -0.34867987036705017, -0.31254154443740845, -0.27640318870544434, -0.24026484787464142, -0.2041265070438385, -0.16798818111419678, -0.13184982538223267, -0.09571148455142975, -0.05957314372062683, -0.023434802889823914, 0.012703537940979004, 0.04884187877178192, 0.08498021960258484, 0.12111854553222656, 0.15725690126419067]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 13.0, 12.0, 15.0, 21.0, 28.0, 40.0, 50.0, 72.0, 79.0, 107.0, 96.0, 96.0, 82.0, 71.0, 38.0, 45.0, 29.0, 22.0, 13.0, 12.0, 8.0, 6.0, 1.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48047685623168945, -0.4644232988357544, -0.44836974143981934, -0.4323161840438843, -0.4162626266479492, -0.40020906925201416, -0.3841554820537567, -0.36810192465782166, -0.3520483672618866, -0.33599480986595154, -0.3199412524700165, -0.3038876950740814, -0.287834107875824, -0.2717805504798889, -0.25572699308395386, -0.2396734356880188, -0.22361987829208374, -0.20756632089614868, -0.19151276350021362, -0.17545919120311737, -0.1594056338071823, -0.14335207641124725, -0.127298504114151, -0.11124494671821594, -0.09519138932228088, -0.07913783192634583, -0.06308426707983017, -0.04703070595860481, -0.030977144837379456, -0.014923587441444397, 0.0011299774050712585, 0.017183542251586914, 0.0332370400428772, 0.049290601164102554, 0.06534416228532791, 0.08139772713184357, 0.09745128452777863, 0.11350484192371368, 0.12955841422080994, 0.145611971616745, 0.16166552901268005, 0.1777190864086151, 0.19377264380455017, 0.20982621610164642, 0.22587977349758148, 0.24193333089351654, 0.2579869031906128, 0.27404046058654785, 0.2900940179824829, 0.30614757537841797, 0.322201132774353, 0.3382546901702881, 0.35430824756622314, 0.3703618049621582, 0.38641539216041565, 0.4024689495563507, 0.41852250695228577, 0.4345760643482208, 0.4506296217441559, 0.46668317914009094, 0.4827367663383484, 0.49879032373428345, 0.5148438811302185, 0.5308974385261536, 0.5469509959220886]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 6.0, 15.0, 12.0, 27.0, 32.0, 51.0, 110.0, 171.0, 312.0, 607.0, 1264.0, 3046.0, 9516.0, 4055298.0, 105873.0, 10079.0, 3851.0, 1783.0, 940.0, 529.0, 278.0, 165.0, 101.0, 62.0, 42.0, 24.0, 23.0, 15.0, 10.0, 9.0, 3.0, 3.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134521484375, -0.1301727294921875, -0.125823974609375, -0.1214752197265625, -0.11712646484375, -0.1127777099609375, -0.108428955078125, -0.1040802001953125, -0.0997314453125, -0.0953826904296875, -0.091033935546875, -0.0866851806640625, -0.08233642578125, -0.0779876708984375, -0.073638916015625, -0.0692901611328125, -0.06494140625, -0.0605926513671875, -0.056243896484375, -0.0518951416015625, -0.04754638671875, -0.0431976318359375, -0.038848876953125, -0.0345001220703125, -0.0301513671875, -0.0258026123046875, -0.021453857421875, -0.0171051025390625, -0.01275634765625, -0.0084075927734375, -0.004058837890625, 0.0002899169921875, 0.004638671875, 0.0089874267578125, 0.013336181640625, 0.0176849365234375, 0.02203369140625, 0.0263824462890625, 0.030731201171875, 0.0350799560546875, 0.0394287109375, 0.0437774658203125, 0.048126220703125, 0.0524749755859375, 0.05682373046875, 0.0611724853515625, 0.065521240234375, 0.0698699951171875, 0.07421875, 0.0785675048828125, 0.082916259765625, 0.0872650146484375, 0.09161376953125, 0.0959625244140625, 0.100311279296875, 0.1046600341796875, 0.1090087890625, 0.1133575439453125, 0.117706298828125, 0.1220550537109375, 0.12640380859375, 0.1307525634765625, 0.135101318359375, 0.1394500732421875, 0.143798828125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 8.0, 8.0, 5.0, 12.0, 14.0, 13.0, 61.0, 586.0, 163.0, 17.0, 9.0, 9.0, 11.0, 11.0, 5.0, 8.0, 4.0, 5.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01287078857421875, -0.012455344200134277, -0.012039899826049805, -0.011624455451965332, -0.01120901107788086, -0.010793566703796387, -0.010378122329711914, -0.009962677955627441, -0.009547233581542969, -0.009131789207458496, -0.008716344833374023, -0.00830090045928955, -0.007885456085205078, -0.0074700117111206055, -0.007054567337036133, -0.00663912296295166, -0.0062236785888671875, -0.005808234214782715, -0.005392789840698242, -0.0049773454666137695, -0.004561901092529297, -0.004146456718444824, -0.0037310123443603516, -0.003315567970275879, -0.0029001235961914062, -0.0024846792221069336, -0.002069234848022461, -0.0016537904739379883, -0.0012383460998535156, -0.000822901725769043, -0.0004074573516845703, 7.987022399902344e-06, 0.000423431396484375, 0.0008388757705688477, 0.0012543201446533203, 0.001669764518737793, 0.0020852088928222656, 0.0025006532669067383, 0.002916097640991211, 0.0033315420150756836, 0.0037469863891601562, 0.004162430763244629, 0.0045778751373291016, 0.004993319511413574, 0.005408763885498047, 0.0058242082595825195, 0.006239652633666992, 0.006655097007751465, 0.0070705413818359375, 0.00748598575592041, 0.007901430130004883, 0.008316874504089355, 0.008732318878173828, 0.0091477632522583, 0.009563207626342773, 0.009978652000427246, 0.010394096374511719, 0.010809540748596191, 0.011224985122680664, 0.011640429496765137, 0.01205587387084961, 0.012471318244934082, 0.012886762619018555, 0.013302206993103027, 0.0137176513671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 8.0, 15.0, 22.0, 17.0, 35.0, 34.0, 54.0, 80.0, 124.0, 188.0, 349.0, 933.0, 6635.0, 4133695.0, 48788.0, 2022.0, 522.0, 241.0, 146.0, 102.0, 64.0, 50.0, 29.0, 22.0, 14.0, 23.0, 11.0, 9.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.254638671875, -0.24686241149902344, -0.23908615112304688, -0.2313098907470703, -0.22353363037109375, -0.2157573699951172, -0.20798110961914062, -0.20020484924316406, -0.1924285888671875, -0.18465232849121094, -0.17687606811523438, -0.1690998077392578, -0.16132354736328125, -0.1535472869873047, -0.14577102661132812, -0.13799476623535156, -0.130218505859375, -0.12244224548339844, -0.11466598510742188, -0.10688972473144531, -0.09911346435546875, -0.09133720397949219, -0.08356094360351562, -0.07578468322753906, -0.0680084228515625, -0.06023216247558594, -0.052455902099609375, -0.04467964172363281, -0.03690338134765625, -0.029127120971679688, -0.021350860595703125, -0.013574600219726562, -0.00579833984375, 0.0019779205322265625, 0.009754180908203125, 0.017530441284179688, 0.02530670166015625, 0.03308296203613281, 0.040859222412109375, 0.04863548278808594, 0.0564117431640625, 0.06418800354003906, 0.07196426391601562, 0.07974052429199219, 0.08751678466796875, 0.09529304504394531, 0.10306930541992188, 0.11084556579589844, 0.118621826171875, 0.12639808654785156, 0.13417434692382812, 0.1419506072998047, 0.14972686767578125, 0.1575031280517578, 0.16527938842773438, 0.17305564880371094, 0.1808319091796875, 0.18860816955566406, 0.19638442993164062, 0.2041606903076172, 0.21193695068359375, 0.2197132110595703, 0.22748947143554688, 0.23526573181152344, 0.2430419921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 8.0, 4.0, 9.0, 16.0, 18.0, 20.0, 30.0, 32.0, 56.0, 54.0, 71.0, 135.0, 2481.0, 701.0, 117.0, 89.0, 54.0, 36.0, 32.0, 25.0, 18.0, 7.0, 10.0, 10.0, 8.0, 12.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.036457061767578125, -0.03531646728515625, -0.034175872802734375, -0.0330352783203125, -0.031894683837890625, -0.03075408935546875, -0.029613494873046875, -0.028472900390625, -0.027332305908203125, -0.02619171142578125, -0.025051116943359375, -0.0239105224609375, -0.022769927978515625, -0.02162933349609375, -0.020488739013671875, -0.01934814453125, -0.018207550048828125, -0.01706695556640625, -0.015926361083984375, -0.0147857666015625, -0.013645172119140625, -0.01250457763671875, -0.011363983154296875, -0.010223388671875, -0.009082794189453125, -0.00794219970703125, -0.006801605224609375, -0.0056610107421875, -0.004520416259765625, -0.00337982177734375, -0.002239227294921875, -0.0010986328125, 4.1961669921875e-05, 0.00118255615234375, 0.002323150634765625, 0.0034637451171875, 0.004604339599609375, 0.00574493408203125, 0.006885528564453125, 0.008026123046875, 0.009166717529296875, 0.01030731201171875, 0.011447906494140625, 0.0125885009765625, 0.013729095458984375, 0.01486968994140625, 0.016010284423828125, 0.01715087890625, 0.018291473388671875, 0.01943206787109375, 0.020572662353515625, 0.0217132568359375, 0.022853851318359375, 0.02399444580078125, 0.025135040283203125, 0.026275634765625, 0.027416229248046875, 0.02855682373046875, 0.029697418212890625, 0.0308380126953125, 0.031978607177734375, 0.03311920166015625, 0.034259796142578125, 0.035400390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 7.0, 98.0, 855.0, 38.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.262847900390625, -0.2575269937515259, -0.25220605731010437, -0.24688513576984406, -0.24156421422958374, -0.23624329268932343, -0.2309223711490631, -0.225601464509964, -0.22028052806854248, -0.21495960652828217, -0.20963868498802185, -0.20431776344776154, -0.19899684190750122, -0.1936759203672409, -0.1883549988269806, -0.18303409218788147, -0.17771317064762115, -0.17239224910736084, -0.16707132756710052, -0.1617504060268402, -0.1564294844865799, -0.15110856294631958, -0.14578765630722046, -0.14046671986579895, -0.13514581322669983, -0.12982489168643951, -0.1245039701461792, -0.11918304860591888, -0.11386212706565857, -0.10854120552539825, -0.10322029143571854, -0.09789936989545822, -0.09257844090461731, -0.087257519364357, -0.08193659782409668, -0.07661567628383636, -0.07129475474357605, -0.06597383320331573, -0.06065291911363602, -0.0553319975733757, -0.05001107603311539, -0.04469015449285507, -0.03936923295259476, -0.03404831513762474, -0.028727393597364426, -0.02340647205710411, -0.018085554242134094, -0.01276463270187378, -0.007443711161613464, -0.002122790552675724, 0.0031981300562620163, 0.008519049733877182, 0.013839971274137497, 0.019160892814397812, 0.02448181062936783, 0.029802732169628143, 0.03512365370988846, 0.04044457525014877, 0.04576549679040909, 0.051086414605379105, 0.05640733614563942, 0.061728257685899734, 0.06704917550086975, 0.07237009704113007, 0.07769101858139038]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 7.0, 2.0, 8.0, 11.0, 8.0, 11.0, 20.0, 25.0, 42.0, 54.0, 65.0, 99.0, 85.0, 92.0, 99.0, 94.0, 62.0, 53.0, 41.0, 37.0, 19.0, 17.0, 9.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1677730679512024, -0.1625528782606125, -0.15733268857002258, -0.15211249887943268, -0.14689230918884277, -0.14167211949825287, -0.13645192980766296, -0.13123172521591187, -0.12601155042648315, -0.12079136073589325, -0.11557117104530334, -0.11035098135471344, -0.10513079166412354, -0.09991060197353363, -0.09469040483236313, -0.08947021514177322, -0.08425001800060272, -0.07902982831001282, -0.07380963861942291, -0.06858944892883301, -0.0633692592382431, -0.0581490658223629, -0.0529288724064827, -0.04770868271589279, -0.04248849302530289, -0.03726830333471298, -0.03204811364412308, -0.026827920228242874, -0.02160773053765297, -0.016387540847063065, -0.011167347431182861, -0.0059471577405929565, -0.0007269680500030518, 0.004493222571909428, 0.009713413193821907, 0.014933604747056961, 0.020153794437646866, 0.02537398412823677, 0.030594177544116974, 0.03581436723470688, 0.04103455692529678, 0.04625474661588669, 0.05147493630647659, 0.056695129722356796, 0.0619153194129467, 0.0671355128288269, 0.07235570251941681, 0.07757589221000671, 0.08279608190059662, 0.08801627159118652, 0.09323646128177643, 0.09845665097236633, 0.10367684066295624, 0.10889703035354614, 0.11411722749471664, 0.11933741718530655, 0.12455760687589645, 0.12977780401706696, 0.13499799370765686, 0.14021818339824677, 0.14543837308883667, 0.15065856277942657, 0.15587875247001648, 0.16109894216060638, 0.1663191318511963]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 9.0, 9.0, 11.0, 12.0, 30.0, 33.0, 52.0, 63.0, 96.0, 143.0, 166.0, 251.0, 397.0, 527.0, 846.0, 1283.0, 2041.0, 3472.0, 6262.0, 13193.0, 42240.0, 904518.0, 43173.0, 13474.0, 6511.0, 3510.0, 2046.0, 1334.0, 842.0, 585.0, 401.0, 290.0, 201.0, 134.0, 111.0, 80.0, 57.0, 47.0, 28.0, 23.0, 13.0, 16.0, 7.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039581298828125, -0.0382843017578125, -0.0369873046875, -0.0356903076171875, -0.034393310546875, -0.0330963134765625, -0.03179931640625, -0.0305023193359375, -0.029205322265625, -0.0279083251953125, -0.026611328125, -0.0253143310546875, -0.024017333984375, -0.0227203369140625, -0.02142333984375, -0.0201263427734375, -0.018829345703125, -0.0175323486328125, -0.0162353515625, -0.0149383544921875, -0.013641357421875, -0.0123443603515625, -0.01104736328125, -0.0097503662109375, -0.008453369140625, -0.0071563720703125, -0.005859375, -0.0045623779296875, -0.003265380859375, -0.0019683837890625, -0.00067138671875, 0.0006256103515625, 0.001922607421875, 0.0032196044921875, 0.0045166015625, 0.0058135986328125, 0.007110595703125, 0.0084075927734375, 0.00970458984375, 0.0110015869140625, 0.012298583984375, 0.0135955810546875, 0.014892578125, 0.0161895751953125, 0.017486572265625, 0.0187835693359375, 0.02008056640625, 0.0213775634765625, 0.022674560546875, 0.0239715576171875, 0.0252685546875, 0.0265655517578125, 0.027862548828125, 0.0291595458984375, 0.03045654296875, 0.0317535400390625, 0.033050537109375, 0.0343475341796875, 0.03564453125, 0.0369415283203125, 0.038238525390625, 0.0395355224609375, 0.04083251953125, 0.0421295166015625, 0.043426513671875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 5.0, 4.0, 1.0, 7.0, 4.0, 4.0, 10.0, 11.0, 6.0, 13.0, 10.0, 38.0, 259.0, 438.0, 84.0, 14.0, 13.0, 8.0, 9.0, 11.0, 7.0, 6.0, 4.0, 6.0, 4.0, 3.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01080322265625, -0.010449647903442383, -0.010096073150634766, -0.009742498397827148, -0.009388923645019531, -0.009035348892211914, -0.008681774139404297, -0.00832819938659668, -0.007974624633789062, -0.007621049880981445, -0.007267475128173828, -0.006913900375366211, -0.006560325622558594, -0.0062067508697509766, -0.005853176116943359, -0.005499601364135742, -0.005146026611328125, -0.004792451858520508, -0.004438877105712891, -0.0040853023529052734, -0.0037317276000976562, -0.003378152847290039, -0.003024578094482422, -0.0026710033416748047, -0.0023174285888671875, -0.0019638538360595703, -0.0016102790832519531, -0.001256704330444336, -0.0009031295776367188, -0.0005495548248291016, -0.00019598007202148438, 0.0001575946807861328, 0.00051116943359375, 0.0008647441864013672, 0.0012183189392089844, 0.0015718936920166016, 0.0019254684448242188, 0.002279043197631836, 0.002632617950439453, 0.0029861927032470703, 0.0033397674560546875, 0.0036933422088623047, 0.004046916961669922, 0.004400491714477539, 0.004754066467285156, 0.0051076412200927734, 0.005461215972900391, 0.005814790725708008, 0.006168365478515625, 0.006521940231323242, 0.006875514984130859, 0.0072290897369384766, 0.007582664489746094, 0.007936239242553711, 0.008289813995361328, 0.008643388748168945, 0.008996963500976562, 0.00935053825378418, 0.009704113006591797, 0.010057687759399414, 0.010411262512207031, 0.010764837265014648, 0.011118412017822266, 0.011471986770629883, 0.0118255615234375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 11.0, 13.0, 21.0, 24.0, 36.0, 34.0, 42.0, 46.0, 66.0, 70.0, 87.0, 97.0, 125.0, 175.0, 254.0, 539.0, 2198.0, 49141.0, 979576.0, 13276.0, 1228.0, 407.0, 223.0, 163.0, 134.0, 110.0, 81.0, 59.0, 57.0, 47.0, 31.0, 31.0, 25.0, 21.0, 19.0, 15.0, 11.0, 13.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0966796875, -0.093780517578125, -0.09088134765625, -0.087982177734375, -0.0850830078125, -0.082183837890625, -0.07928466796875, -0.076385498046875, -0.073486328125, -0.070587158203125, -0.06768798828125, -0.064788818359375, -0.0618896484375, -0.058990478515625, -0.05609130859375, -0.053192138671875, -0.05029296875, -0.047393798828125, -0.04449462890625, -0.041595458984375, -0.0386962890625, -0.035797119140625, -0.03289794921875, -0.029998779296875, -0.027099609375, -0.024200439453125, -0.02130126953125, -0.018402099609375, -0.0155029296875, -0.012603759765625, -0.00970458984375, -0.006805419921875, -0.00390625, -0.001007080078125, 0.00189208984375, 0.004791259765625, 0.0076904296875, 0.010589599609375, 0.01348876953125, 0.016387939453125, 0.019287109375, 0.022186279296875, 0.02508544921875, 0.027984619140625, 0.0308837890625, 0.033782958984375, 0.03668212890625, 0.039581298828125, 0.04248046875, 0.045379638671875, 0.04827880859375, 0.051177978515625, 0.0540771484375, 0.056976318359375, 0.05987548828125, 0.062774658203125, 0.065673828125, 0.068572998046875, 0.07147216796875, 0.074371337890625, 0.0772705078125, 0.080169677734375, 0.08306884765625, 0.085968017578125, 0.0888671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 8.0, 5.0, 6.0, 9.0, 12.0, 17.0, 14.0, 24.0, 17.0, 27.0, 28.0, 28.0, 23.0, 27.0, 36.0, 44.0, 48.0, 50.0, 39.0, 56.0, 54.0, 38.0, 41.0, 35.0, 43.0, 44.0, 47.0, 21.0, 23.0, 15.0, 22.0, 14.0, 11.0, 9.0, 8.0, 9.0, 8.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0308074951171875, -0.029883384704589844, -0.028959274291992188, -0.02803516387939453, -0.027111053466796875, -0.02618694305419922, -0.025262832641601562, -0.024338722229003906, -0.02341461181640625, -0.022490501403808594, -0.021566390991210938, -0.02064228057861328, -0.019718170166015625, -0.01879405975341797, -0.017869949340820312, -0.016945838928222656, -0.016021728515625, -0.015097618103027344, -0.014173507690429688, -0.013249397277832031, -0.012325286865234375, -0.011401176452636719, -0.010477066040039062, -0.009552955627441406, -0.00862884521484375, -0.007704734802246094, -0.0067806243896484375, -0.005856513977050781, -0.004932403564453125, -0.004008293151855469, -0.0030841827392578125, -0.0021600723266601562, -0.0012359619140625, -0.00031185150146484375, 0.0006122589111328125, 0.0015363693237304688, 0.002460479736328125, 0.0033845901489257812, 0.0043087005615234375, 0.005232810974121094, 0.00615692138671875, 0.007081031799316406, 0.008005142211914062, 0.008929252624511719, 0.009853363037109375, 0.010777473449707031, 0.011701583862304688, 0.012625694274902344, 0.0135498046875, 0.014473915100097656, 0.015398025512695312, 0.01632213592529297, 0.017246246337890625, 0.01817035675048828, 0.019094467163085938, 0.020018577575683594, 0.02094268798828125, 0.021866798400878906, 0.022790908813476562, 0.02371501922607422, 0.024639129638671875, 0.02556324005126953, 0.026487350463867188, 0.027411460876464844, 0.0283355712890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 14.0, 23.0, 42.0, 42.0, 57.0, 85.0, 153.0, 200.0, 368.0, 828.0, 2850.0, 51927.0, 981696.0, 7426.0, 1506.0, 490.0, 271.0, 170.0, 107.0, 69.0, 53.0, 39.0, 31.0, 14.0, 14.0, 13.0, 11.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019669532775878906, -0.00019059516489505768, -0.0001844950020313263, -0.0001783948391675949, -0.00017229467630386353, -0.00016619451344013214, -0.00016009435057640076, -0.00015399418771266937, -0.000147894024848938, -0.0001417938619852066, -0.00013569369912147522, -0.00012959353625774384, -0.00012349337339401245, -0.00011739321053028107, -0.00011129304766654968, -0.0001051928848028183, -9.909272193908691e-05, -9.299255907535553e-05, -8.689239621162415e-05, -8.079223334789276e-05, -7.469207048416138e-05, -6.859190762042999e-05, -6.249174475669861e-05, -5.6391581892967224e-05, -5.029141902923584e-05, -4.4191256165504456e-05, -3.809109330177307e-05, -3.199093043804169e-05, -2.5890767574310303e-05, -1.979060471057892e-05, -1.3690441846847534e-05, -7.59027898311615e-06, -1.4901161193847656e-06, 4.610046744346619e-06, 1.0710209608078003e-05, 1.6810372471809387e-05, 2.291053533554077e-05, 2.9010698199272156e-05, 3.511086106300354e-05, 4.1211023926734924e-05, 4.731118679046631e-05, 5.341134965419769e-05, 5.951151251792908e-05, 6.561167538166046e-05, 7.171183824539185e-05, 7.781200110912323e-05, 8.391216397285461e-05, 9.0012326836586e-05, 9.611248970031738e-05, 0.00010221265256404877, 0.00010831281542778015, 0.00011441297829151154, 0.00012051314115524292, 0.0001266133040189743, 0.0001327134668827057, 0.00013881362974643707, 0.00014491379261016846, 0.00015101395547389984, 0.00015711411833763123, 0.0001632142812013626, 0.000169314444065094, 0.00017541460692882538, 0.00018151476979255676, 0.00018761493265628815, 0.00019371509552001953]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 10.0, 14.0, 20.0, 33.0, 40.0, 65.0, 85.0, 61.0, 108.0, 81.0, 101.0, 76.0, 79.0, 43.0, 57.0, 23.0, 29.0, 19.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.185604095458984e-06, -4.974193871021271e-06, -4.762783646583557e-06, -4.5513734221458435e-06, -4.33996319770813e-06, -4.128552973270416e-06, -3.917142748832703e-06, -3.705732524394989e-06, -3.4943222999572754e-06, -3.2829120755195618e-06, -3.071501851081848e-06, -2.8600916266441345e-06, -2.648681402206421e-06, -2.4372711777687073e-06, -2.2258609533309937e-06, -2.01445072889328e-06, -1.8030405044555664e-06, -1.5916302800178528e-06, -1.3802200555801392e-06, -1.1688098311424255e-06, -9.57399606704712e-07, -7.459893822669983e-07, -5.345791578292847e-07, -3.2316893339157104e-07, -1.1175870895385742e-07, 9.96515154838562e-08, 3.110617399215698e-07, 5.224719643592834e-07, 7.338821887969971e-07, 9.452924132347107e-07, 1.1567026376724243e-06, 1.368112862110138e-06, 1.5795230865478516e-06, 1.7909333109855652e-06, 2.002343535423279e-06, 2.2137537598609924e-06, 2.425163984298706e-06, 2.6365742087364197e-06, 2.8479844331741333e-06, 3.059394657611847e-06, 3.2708048820495605e-06, 3.482215106487274e-06, 3.693625330924988e-06, 3.905035555362701e-06, 4.116445779800415e-06, 4.327856004238129e-06, 4.539266228675842e-06, 4.750676453113556e-06, 4.9620866775512695e-06, 5.173496901988983e-06, 5.384907126426697e-06, 5.59631735086441e-06, 5.807727575302124e-06, 6.019137799739838e-06, 6.230548024177551e-06, 6.441958248615265e-06, 6.6533684730529785e-06, 6.864778697490692e-06, 7.076188921928406e-06, 7.287599146366119e-06, 7.499009370803833e-06, 7.710419595241547e-06, 7.92182981967926e-06, 8.133240044116974e-06, 8.344650268554688e-06]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 13.0, 19.0, 28.0, 27.0, 52.0, 94.0, 158.0, 367.0, 1885.0, 1031367.0, 13345.0, 654.0, 238.0, 107.0, 57.0, 43.0, 31.0, 26.0, 5.0, 9.0, 11.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002770423889160156, -0.0002666749060153961, -0.0002563074231147766, -0.0002459399402141571, -0.0002355724573135376, -0.0002252049744129181, -0.00021483749151229858, -0.00020447000861167908, -0.00019410252571105957, -0.00018373504281044006, -0.00017336755990982056, -0.00016300007700920105, -0.00015263259410858154, -0.00014226511120796204, -0.00013189762830734253, -0.00012153014540672302, -0.00011116266250610352, -0.00010079517960548401, -9.04276967048645e-05, -8.0060213804245e-05, -6.969273090362549e-05, -5.932524800300598e-05, -4.8957765102386475e-05, -3.859028220176697e-05, -2.822279930114746e-05, -1.7855316400527954e-05, -7.487833499908447e-06, 2.8796494007110596e-06, 1.3247132301330566e-05, 2.3614615201950073e-05, 3.398209810256958e-05, 4.434958100318909e-05, 5.4717063903808594e-05, 6.50845468044281e-05, 7.545202970504761e-05, 8.581951260566711e-05, 9.618699550628662e-05, 0.00010655447840690613, 0.00011692196130752563, 0.00012728944420814514, 0.00013765692710876465, 0.00014802441000938416, 0.00015839189291000366, 0.00016875937581062317, 0.00017912685871124268, 0.00018949434161186218, 0.0001998618245124817, 0.0002102293074131012, 0.0002205967903137207, 0.0002309642732143402, 0.00024133175611495972, 0.0002516992390155792, 0.00026206672191619873, 0.00027243420481681824, 0.00028280168771743774, 0.00029316917061805725, 0.00030353665351867676, 0.00031390413641929626, 0.00032427161931991577, 0.0003346391022205353, 0.0003450065851211548, 0.0003553740680217743, 0.0003657415509223938, 0.0003761090338230133, 0.0003864765167236328]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 11.0, 3.0, 11.0, 11.0, 12.0, 36.0, 35.0, 62.0, 106.0, 131.0, 165.0, 153.0, 94.0, 54.0, 40.0, 22.0, 18.0, 9.0, 11.0, 5.0, 4.0, 5.0, 7.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.641315460205078e-05, -7.329508662223816e-05, -7.017701864242554e-05, -6.705895066261292e-05, -6.394088268280029e-05, -6.082281470298767e-05, -5.770474672317505e-05, -5.458667874336243e-05, -5.1468610763549805e-05, -4.835054278373718e-05, -4.523247480392456e-05, -4.211440682411194e-05, -3.8996338844299316e-05, -3.5878270864486694e-05, -3.276020288467407e-05, -2.964213490486145e-05, -2.6524066925048828e-05, -2.3405998945236206e-05, -2.0287930965423584e-05, -1.7169862985610962e-05, -1.405179500579834e-05, -1.0933727025985718e-05, -7.815659046173096e-06, -4.697591066360474e-06, -1.5795230865478516e-06, 1.5385448932647705e-06, 4.656612873077393e-06, 7.774680852890015e-06, 1.0892748832702637e-05, 1.4010816812515259e-05, 1.712888479232788e-05, 2.0246952772140503e-05, 2.3365020751953125e-05, 2.6483088731765747e-05, 2.960115671157837e-05, 3.271922469139099e-05, 3.583729267120361e-05, 3.8955360651016235e-05, 4.207342863082886e-05, 4.519149661064148e-05, 4.83095645904541e-05, 5.1427632570266724e-05, 5.4545700550079346e-05, 5.766376852989197e-05, 6.078183650970459e-05, 6.389990448951721e-05, 6.701797246932983e-05, 7.013604044914246e-05, 7.325410842895508e-05, 7.63721764087677e-05, 7.949024438858032e-05, 8.260831236839294e-05, 8.572638034820557e-05, 8.884444832801819e-05, 9.196251630783081e-05, 9.508058428764343e-05, 9.819865226745605e-05, 0.00010131672024726868, 0.0001044347882270813, 0.00010755285620689392, 0.00011067092418670654, 0.00011378899216651917, 0.00011690706014633179, 0.00012002512812614441, 0.00012314319610595703]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 977.0, 35.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.464580774307251, -1.4350593090057373, -1.4055379629135132, -1.3760164976119995, -1.3464950323104858, -1.3169736862182617, -1.287452220916748, -1.2579307556152344, -1.2284094095230103, -1.1988879442214966, -1.1693665981292725, -1.1398451328277588, -1.1103236675262451, -1.080802321434021, -1.0512808561325073, -1.0217595100402832, -0.9922380447387695, -0.9627166390419006, -0.933195173740387, -0.9036737680435181, -0.8741523623466492, -0.8446309566497803, -0.8151094913482666, -0.7855880856513977, -0.756066620349884, -0.7265452146530151, -0.6970237493515015, -0.6675023436546326, -0.6379809379577637, -0.60845947265625, -0.5789380669593811, -0.5494166612625122, -0.5198952555656433, -0.490373820066452, -0.46085241436958313, -0.43133097887039185, -0.40180957317352295, -0.37228813767433167, -0.3427667021751404, -0.3132452964782715, -0.2837238907814026, -0.2542024552822113, -0.2246810495853424, -0.19515961408615112, -0.16563820838928223, -0.13611677289009094, -0.10659535229206085, -0.07707393169403076, -0.04755249619483948, -0.018031073734164238, 0.011490348726511002, 0.04101177304983139, 0.07053319364786148, 0.10005462169647217, 0.12957604229450226, 0.15909746289253235, 0.18861888349056244, 0.21814030408859253, 0.24766172468662262, 0.2771831452846527, 0.306704580783844, 0.3362259864807129, 0.3657474219799042, 0.39526885747909546, 0.42479026317596436]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 4.0, 11.0, 11.0, 17.0, 19.0, 35.0, 31.0, 48.0, 44.0, 60.0, 69.0, 69.0, 67.0, 59.0, 77.0, 66.0, 65.0, 51.0, 43.0, 25.0, 37.0, 20.0, 17.0, 21.0, 10.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.42555153369903564, -0.4158328175544739, -0.4061141014099121, -0.39639535546302795, -0.3866766393184662, -0.3769579231739044, -0.36723917722702026, -0.3575204610824585, -0.34780174493789673, -0.33808302879333496, -0.3283643126487732, -0.31864556670188904, -0.30892685055732727, -0.2992081344127655, -0.28948938846588135, -0.2797706723213196, -0.2700519561767578, -0.26033324003219604, -0.2506145238876343, -0.24089577794075012, -0.23117706179618835, -0.2214583456516266, -0.21173961460590363, -0.20202088356018066, -0.1923021674156189, -0.18258345127105713, -0.17286472022533417, -0.1631459891796112, -0.15342727303504944, -0.14370855689048767, -0.1339898258447647, -0.12427110224962234, -0.11455237865447998, -0.10483365505933762, -0.09511493146419525, -0.08539620786905289, -0.07567748427391052, -0.06595876067876816, -0.05624003708362579, -0.04652131348848343, -0.036802589893341064, -0.0270838662981987, -0.017365142703056335, -0.007646419107913971, 0.0020723044872283936, 0.011791028082370758, 0.021509751677513123, 0.031228475272655487, 0.04094719886779785, 0.050665922462940216, 0.06038464605808258, 0.07010336965322495, 0.07982209324836731, 0.08954081684350967, 0.09925954043865204, 0.1089782640337944, 0.11869698762893677, 0.12841570377349854, 0.1381344348192215, 0.14785316586494446, 0.15757188200950623, 0.167290598154068, 0.17700932919979095, 0.18672806024551392, 0.19644677639007568]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 11.0, 8.0, 8.0, 23.0, 31.0, 59.0, 109.0, 273.0, 839.0, 4639.0, 4180180.0, 5912.0, 1271.0, 457.0, 189.0, 95.0, 52.0, 28.0, 18.0, 9.0, 13.0, 6.0, 9.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.156494140625, -0.1513671875, -0.146240234375, -0.14111328125, -0.135986328125, -0.130859375, -0.125732421875, -0.12060546875, -0.115478515625, -0.1103515625, -0.105224609375, -0.10009765625, -0.094970703125, -0.08984375, -0.084716796875, -0.07958984375, -0.074462890625, -0.0693359375, -0.064208984375, -0.05908203125, -0.053955078125, -0.048828125, -0.043701171875, -0.03857421875, -0.033447265625, -0.0283203125, -0.023193359375, -0.01806640625, -0.012939453125, -0.0078125, -0.002685546875, 0.00244140625, 0.007568359375, 0.0126953125, 0.017822265625, 0.02294921875, 0.028076171875, 0.033203125, 0.038330078125, 0.04345703125, 0.048583984375, 0.0537109375, 0.058837890625, 0.06396484375, 0.069091796875, 0.07421875, 0.079345703125, 0.08447265625, 0.089599609375, 0.0947265625, 0.099853515625, 0.10498046875, 0.110107421875, 0.115234375, 0.120361328125, 0.12548828125, 0.130615234375, 0.1357421875, 0.140869140625, 0.14599609375, 0.151123046875, 0.15625, 0.161376953125, 0.16650390625, 0.171630859375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 9.0, 4.0, 3.0, 13.0, 9.0, 7.0, 10.0, 11.0, 50.0, 282.0, 383.0, 98.0, 19.0, 12.0, 8.0, 10.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 5.0, 2.0, 3.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01043701171875, -0.01009523868560791, -0.00975346565246582, -0.00941169261932373, -0.00906991958618164, -0.00872814655303955, -0.008386373519897461, -0.008044600486755371, -0.007702827453613281, -0.007361054420471191, -0.0070192813873291016, -0.006677508354187012, -0.006335735321044922, -0.005993962287902832, -0.005652189254760742, -0.005310416221618652, -0.0049686431884765625, -0.004626870155334473, -0.004285097122192383, -0.003943324089050293, -0.003601551055908203, -0.0032597780227661133, -0.0029180049896240234, -0.0025762319564819336, -0.0022344589233398438, -0.001892685890197754, -0.001550912857055664, -0.0012091398239135742, -0.0008673667907714844, -0.0005255937576293945, -0.0001838207244873047, 0.00015795230865478516, 0.000499725341796875, 0.0008414983749389648, 0.0011832714080810547, 0.0015250444412231445, 0.0018668174743652344, 0.0022085905075073242, 0.002550363540649414, 0.002892136573791504, 0.0032339096069335938, 0.0035756826400756836, 0.0039174556732177734, 0.004259228706359863, 0.004601001739501953, 0.004942774772644043, 0.005284547805786133, 0.005626320838928223, 0.0059680938720703125, 0.006309866905212402, 0.006651639938354492, 0.006993412971496582, 0.007335186004638672, 0.007676959037780762, 0.008018732070922852, 0.008360505104064941, 0.008702278137207031, 0.009044051170349121, 0.009385824203491211, 0.0097275972366333, 0.01006937026977539, 0.01041114330291748, 0.01075291633605957, 0.01109468936920166, 0.01143646240234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 13.0, 8.0, 11.0, 6.0, 18.0, 21.0, 23.0, 43.0, 51.0, 71.0, 96.0, 152.0, 421.0, 2049.0, 4070474.0, 118211.0, 1677.0, 421.0, 149.0, 102.0, 63.0, 47.0, 34.0, 26.0, 18.0, 15.0, 8.0, 13.0, 9.0, 8.0, 4.0, 2.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.121826171875, -0.11730384826660156, -0.11278152465820312, -0.10825920104980469, -0.10373687744140625, -0.09921455383300781, -0.09469223022460938, -0.09016990661621094, -0.0856475830078125, -0.08112525939941406, -0.07660293579101562, -0.07208061218261719, -0.06755828857421875, -0.06303596496582031, -0.058513641357421875, -0.05399131774902344, -0.049468994140625, -0.04494667053222656, -0.040424346923828125, -0.03590202331542969, -0.03137969970703125, -0.026857376098632812, -0.022335052490234375, -0.017812728881835938, -0.0132904052734375, -0.008768081665039062, -0.004245758056640625, 0.0002765655517578125, 0.00479888916015625, 0.009321212768554688, 0.013843536376953125, 0.018365859985351562, 0.02288818359375, 0.027410507202148438, 0.031932830810546875, 0.03645515441894531, 0.04097747802734375, 0.04549980163574219, 0.050022125244140625, 0.05454444885253906, 0.0590667724609375, 0.06358909606933594, 0.06811141967773438, 0.07263374328613281, 0.07715606689453125, 0.08167839050292969, 0.08620071411132812, 0.09072303771972656, 0.095245361328125, 0.09976768493652344, 0.10429000854492188, 0.10881233215332031, 0.11333465576171875, 0.11785697937011719, 0.12237930297851562, 0.12690162658691406, 0.1314239501953125, 0.13594627380371094, 0.14046859741210938, 0.1449909210205078, 0.14951324462890625, 0.1540355682373047, 0.15855789184570312, 0.16308021545410156, 0.1676025390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 9.0, 9.0, 10.0, 14.0, 21.0, 14.0, 14.0, 36.0, 58.0, 132.0, 3195.0, 327.0, 65.0, 39.0, 21.0, 19.0, 16.0, 12.0, 7.0, 8.0, 6.0, 4.0, 5.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.017974853515625, -0.017302513122558594, -0.016630172729492188, -0.01595783233642578, -0.015285491943359375, -0.014613151550292969, -0.013940811157226562, -0.013268470764160156, -0.01259613037109375, -0.011923789978027344, -0.011251449584960938, -0.010579109191894531, -0.009906768798828125, -0.009234428405761719, -0.008562088012695312, -0.007889747619628906, -0.0072174072265625, -0.006545066833496094, -0.0058727264404296875, -0.005200386047363281, -0.004528045654296875, -0.0038557052612304688, -0.0031833648681640625, -0.0025110244750976562, -0.00183868408203125, -0.0011663436889648438, -0.0004940032958984375, 0.00017833709716796875, 0.000850677490234375, 0.0015230178833007812, 0.0021953582763671875, 0.0028676986694335938, 0.0035400390625, 0.004212379455566406, 0.0048847198486328125, 0.005557060241699219, 0.006229400634765625, 0.006901741027832031, 0.0075740814208984375, 0.008246421813964844, 0.00891876220703125, 0.009591102600097656, 0.010263442993164062, 0.010935783386230469, 0.011608123779296875, 0.012280464172363281, 0.012952804565429688, 0.013625144958496094, 0.0142974853515625, 0.014969825744628906, 0.015642166137695312, 0.01631450653076172, 0.016986846923828125, 0.01765918731689453, 0.018331527709960938, 0.019003868103027344, 0.01967620849609375, 0.020348548889160156, 0.021020889282226562, 0.02169322967529297, 0.022365570068359375, 0.02303791046142578, 0.023710250854492188, 0.024382591247558594, 0.025054931640625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 996.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16822035610675812, -0.15810665488243103, -0.14799295365810394, -0.13787925243377686, -0.12776553630828857, -0.11765184253454208, -0.1075381338596344, -0.09742443263530731, -0.08731073141098022, -0.07719703018665314, -0.06708332896232605, -0.056969620287418365, -0.04685591906309128, -0.03674221783876419, -0.026628512889146805, -0.01651480793952942, -0.0064011067152023315, 0.003712596371769905, 0.013826299458742142, 0.02394000254571438, 0.034053705632686615, 0.0441674068570137, 0.05428111180663109, 0.06439481675624847, 0.07450851798057556, 0.08462221920490265, 0.09473592042922974, 0.10484962910413742, 0.11496333032846451, 0.1250770390033722, 0.13519074022769928, 0.14530444145202637, 0.15541812777519226, 0.16553182899951935, 0.17564553022384644, 0.18575923144817352, 0.1958729326725006, 0.2059866487979889, 0.21610035002231598, 0.22621405124664307, 0.23632775247097015, 0.24644145369529724, 0.2565551698207855, 0.2666688561439514, 0.2767825722694397, 0.2868962585926056, 0.29700997471809387, 0.30712366104125977, 0.31723737716674805, 0.32735109329223633, 0.3374647796154022, 0.3475784957408905, 0.3576921820640564, 0.3678058981895447, 0.37791958451271057, 0.38803330063819885, 0.39814698696136475, 0.408260703086853, 0.4183743894100189, 0.4284881055355072, 0.4386017918586731, 0.4487155079841614, 0.45882919430732727, 0.46894291043281555, 0.47905662655830383]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 10.0, 16.0, 26.0, 27.0, 19.0, 35.0, 46.0, 50.0, 68.0, 45.0, 60.0, 67.0, 54.0, 59.0, 55.0, 61.0, 52.0, 29.0, 37.0, 27.0, 27.0, 29.0, 10.0, 14.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0648425817489624, -0.06285306811332703, -0.06086354702711105, -0.05887402966618538, -0.056884512305259705, -0.05489499494433403, -0.052905477583408356, -0.05091596022248268, -0.04892644286155701, -0.04693692550063133, -0.04494740813970566, -0.042957890778779984, -0.04096837341785431, -0.038978856056928635, -0.03698933869600296, -0.034999821335077286, -0.03301030397415161, -0.031020786613225937, -0.029031269252300262, -0.027041751891374588, -0.025052234530448914, -0.02306271716952324, -0.021073199808597565, -0.01908368244767189, -0.017094165086746216, -0.015104647725820541, -0.013115130364894867, -0.011125613003969193, -0.009136095643043518, -0.007146578282117844, -0.005157060921192169, -0.0031675435602664948, -0.0011780261993408203, 0.0008114911615848541, 0.0028010085225105286, 0.004790525883436203, 0.0067800432443618774, 0.008769560605287552, 0.010759077966213226, 0.0127485953271389, 0.014738112688064575, 0.01672763004899025, 0.018717147409915924, 0.0207066647708416, 0.022696182131767273, 0.024685699492692947, 0.026675216853618622, 0.028664734214544296, 0.03065425157546997, 0.032643768936395645, 0.03463328629732132, 0.036622803658246994, 0.03861232101917267, 0.04060183838009834, 0.04259135574102402, 0.04458087310194969, 0.046570390462875366, 0.04855990782380104, 0.050549425184726715, 0.05253894254565239, 0.054528459906578064, 0.05651797726750374, 0.05850749462842941, 0.06049701198935509, 0.06248652935028076]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 12.0, 13.0, 28.0, 41.0, 45.0, 86.0, 100.0, 183.0, 251.0, 384.0, 633.0, 1037.0, 1693.0, 2928.0, 5493.0, 11463.0, 30096.0, 875360.0, 83938.0, 17357.0, 7603.0, 4057.0, 2208.0, 1287.0, 787.0, 506.0, 315.0, 224.0, 134.0, 93.0, 61.0, 40.0, 27.0, 20.0, 11.0, 9.0, 7.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03668212890625, -0.035594940185546875, -0.03450775146484375, -0.033420562744140625, -0.0323333740234375, -0.031246185302734375, -0.03015899658203125, -0.029071807861328125, -0.027984619140625, -0.026897430419921875, -0.02581024169921875, -0.024723052978515625, -0.0236358642578125, -0.022548675537109375, -0.02146148681640625, -0.020374298095703125, -0.019287109375, -0.018199920654296875, -0.01711273193359375, -0.016025543212890625, -0.0149383544921875, -0.013851165771484375, -0.01276397705078125, -0.011676788330078125, -0.010589599609375, -0.009502410888671875, -0.00841522216796875, -0.007328033447265625, -0.0062408447265625, -0.005153656005859375, -0.00406646728515625, -0.002979278564453125, -0.00189208984375, -0.000804901123046875, 0.00028228759765625, 0.001369476318359375, 0.0024566650390625, 0.003543853759765625, 0.00463104248046875, 0.005718231201171875, 0.006805419921875, 0.007892608642578125, 0.00897979736328125, 0.010066986083984375, 0.0111541748046875, 0.012241363525390625, 0.01332855224609375, 0.014415740966796875, 0.0155029296875, 0.016590118408203125, 0.01767730712890625, 0.018764495849609375, 0.0198516845703125, 0.020938873291015625, 0.02202606201171875, 0.023113250732421875, 0.024200439453125, 0.025287628173828125, 0.02637481689453125, 0.027462005615234375, 0.0285491943359375, 0.029636383056640625, 0.03072357177734375, 0.031810760498046875, 0.03289794921875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 7.0, 3.0, 8.0, 8.0, 12.0, 9.0, 8.0, 18.0, 92.0, 354.0, 295.0, 67.0, 18.0, 7.0, 7.0, 15.0, 10.0, 5.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 3.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0098876953125, -0.00956106185913086, -0.009234428405761719, -0.008907794952392578, -0.008581161499023438, -0.008254528045654297, -0.007927894592285156, -0.007601261138916016, -0.007274627685546875, -0.006947994232177734, -0.006621360778808594, -0.006294727325439453, -0.0059680938720703125, -0.005641460418701172, -0.005314826965332031, -0.004988193511962891, -0.00466156005859375, -0.004334926605224609, -0.004008293151855469, -0.003681659698486328, -0.0033550262451171875, -0.003028392791748047, -0.0027017593383789062, -0.0023751258850097656, -0.002048492431640625, -0.0017218589782714844, -0.0013952255249023438, -0.0010685920715332031, -0.0007419586181640625, -0.0004153251647949219, -8.869171142578125e-05, 0.00023794174194335938, 0.0005645751953125, 0.0008912086486816406, 0.0012178421020507812, 0.0015444755554199219, 0.0018711090087890625, 0.002197742462158203, 0.0025243759155273438, 0.0028510093688964844, 0.003177642822265625, 0.0035042762756347656, 0.0038309097290039062, 0.004157543182373047, 0.0044841766357421875, 0.004810810089111328, 0.005137443542480469, 0.005464076995849609, 0.00579071044921875, 0.006117343902587891, 0.006443977355957031, 0.006770610809326172, 0.0070972442626953125, 0.007423877716064453, 0.007750511169433594, 0.008077144622802734, 0.008403778076171875, 0.008730411529541016, 0.009057044982910156, 0.009383678436279297, 0.009710311889648438, 0.010036945343017578, 0.010363578796386719, 0.01069021224975586, 0.011016845703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 11.0, 7.0, 11.0, 14.0, 21.0, 27.0, 25.0, 33.0, 37.0, 39.0, 55.0, 69.0, 69.0, 98.0, 104.0, 121.0, 190.0, 288.0, 488.0, 1301.0, 9873.0, 942326.0, 88509.0, 2662.0, 732.0, 357.0, 220.0, 160.0, 127.0, 103.0, 70.0, 76.0, 52.0, 59.0, 50.0, 41.0, 29.0, 22.0, 19.0, 10.0, 12.0, 15.0, 8.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0859375, -0.08339118957519531, -0.08084487915039062, -0.07829856872558594, -0.07575225830078125, -0.07320594787597656, -0.07065963745117188, -0.06811332702636719, -0.0655670166015625, -0.06302070617675781, -0.060474395751953125, -0.05792808532714844, -0.05538177490234375, -0.05283546447753906, -0.050289154052734375, -0.04774284362792969, -0.045196533203125, -0.04265022277832031, -0.040103912353515625, -0.03755760192871094, -0.03501129150390625, -0.03246498107910156, -0.029918670654296875, -0.027372360229492188, -0.0248260498046875, -0.022279739379882812, -0.019733428955078125, -0.017187118530273438, -0.01464080810546875, -0.012094497680664062, -0.009548187255859375, -0.0070018768310546875, -0.00445556640625, -0.0019092559814453125, 0.000637054443359375, 0.0031833648681640625, 0.00572967529296875, 0.008275985717773438, 0.010822296142578125, 0.013368606567382812, 0.0159149169921875, 0.018461227416992188, 0.021007537841796875, 0.023553848266601562, 0.02610015869140625, 0.028646469116210938, 0.031192779541015625, 0.03373908996582031, 0.036285400390625, 0.03883171081542969, 0.041378021240234375, 0.04392433166503906, 0.04647064208984375, 0.04901695251464844, 0.051563262939453125, 0.05410957336425781, 0.0566558837890625, 0.05920219421386719, 0.061748504638671875, 0.06429481506347656, 0.06684112548828125, 0.06938743591308594, 0.07193374633789062, 0.07448005676269531, 0.0770263671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 1.0, 5.0, 4.0, 10.0, 8.0, 8.0, 12.0, 14.0, 9.0, 15.0, 17.0, 15.0, 35.0, 23.0, 31.0, 26.0, 31.0, 33.0, 38.0, 46.0, 27.0, 61.0, 48.0, 57.0, 47.0, 45.0, 39.0, 41.0, 42.0, 30.0, 28.0, 20.0, 24.0, 18.0, 17.0, 20.0, 17.0, 8.0, 6.0, 5.0, 7.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.03399658203125, -0.03305482864379883, -0.032113075256347656, -0.031171321868896484, -0.030229568481445312, -0.02928781509399414, -0.02834606170654297, -0.027404308319091797, -0.026462554931640625, -0.025520801544189453, -0.02457904815673828, -0.02363729476928711, -0.022695541381835938, -0.021753787994384766, -0.020812034606933594, -0.019870281219482422, -0.01892852783203125, -0.017986774444580078, -0.017045021057128906, -0.016103267669677734, -0.015161514282226562, -0.01421976089477539, -0.013278007507324219, -0.012336254119873047, -0.011394500732421875, -0.010452747344970703, -0.009510993957519531, -0.00856924057006836, -0.0076274871826171875, -0.006685733795166016, -0.005743980407714844, -0.004802227020263672, -0.0038604736328125, -0.002918720245361328, -0.0019769668579101562, -0.0010352134704589844, -9.34600830078125e-05, 0.0008482933044433594, 0.0017900466918945312, 0.002731800079345703, 0.003673553466796875, 0.004615306854248047, 0.005557060241699219, 0.006498813629150391, 0.0074405670166015625, 0.008382320404052734, 0.009324073791503906, 0.010265827178955078, 0.01120758056640625, 0.012149333953857422, 0.013091087341308594, 0.014032840728759766, 0.014974594116210938, 0.01591634750366211, 0.01685810089111328, 0.017799854278564453, 0.018741607666015625, 0.019683361053466797, 0.02062511444091797, 0.02156686782836914, 0.022508621215820312, 0.023450374603271484, 0.024392127990722656, 0.025333881378173828, 0.026275634765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 2.0, 3.0, 3.0, 16.0, 17.0, 22.0, 33.0, 39.0, 78.0, 106.0, 204.0, 460.0, 1008.0, 3883.0, 218102.0, 817524.0, 4806.0, 1170.0, 462.0, 226.0, 130.0, 88.0, 43.0, 35.0, 23.0, 26.0, 9.0, 13.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00015401840209960938, -0.00014974642544984818, -0.00014547444880008698, -0.00014120247215032578, -0.00013693049550056458, -0.00013265851885080338, -0.00012838654220104218, -0.00012411456555128098, -0.00011984258890151978, -0.00011557061225175858, -0.00011129863560199738, -0.00010702665895223618, -0.00010275468230247498, -9.848270565271378e-05, -9.421072900295258e-05, -8.993875235319138e-05, -8.566677570343018e-05, -8.139479905366898e-05, -7.712282240390778e-05, -7.285084575414658e-05, -6.857886910438538e-05, -6.430689245462418e-05, -6.0034915804862976e-05, -5.5762939155101776e-05, -5.1490962505340576e-05, -4.7218985855579376e-05, -4.2947009205818176e-05, -3.8675032556056976e-05, -3.4403055906295776e-05, -3.0131079256534576e-05, -2.5859102606773376e-05, -2.1587125957012177e-05, -1.7315149307250977e-05, -1.3043172657489777e-05, -8.771196007728577e-06, -4.499219357967377e-06, -2.2724270820617676e-07, 4.044733941555023e-06, 8.316710591316223e-06, 1.2588687241077423e-05, 1.6860663890838623e-05, 2.1132640540599823e-05, 2.5404617190361023e-05, 2.9676593840122223e-05, 3.394857048988342e-05, 3.822054713964462e-05, 4.249252378940582e-05, 4.676450043916702e-05, 5.103647708892822e-05, 5.530845373868942e-05, 5.958043038845062e-05, 6.385240703821182e-05, 6.812438368797302e-05, 7.239636033773422e-05, 7.666833698749542e-05, 8.094031363725662e-05, 8.521229028701782e-05, 8.948426693677902e-05, 9.375624358654022e-05, 9.802822023630142e-05, 0.00010230019688606262, 0.00010657217353582382, 0.00011084415018558502, 0.00011511612683534622, 0.00011938810348510742]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 5.0, 11.0, 11.0, 29.0, 22.0, 21.0, 35.0, 41.0, 43.0, 42.0, 68.0, 63.0, 67.0, 74.0, 80.0, 75.0, 54.0, 47.0, 22.0, 36.0, 29.0, 18.0, 21.0, 14.0, 11.0, 10.0, 12.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.874301910400391e-06, -3.702007234096527e-06, -3.5297125577926636e-06, -3.3574178814888e-06, -3.1851232051849365e-06, -3.012828528881073e-06, -2.8405338525772095e-06, -2.668239176273346e-06, -2.4959444999694824e-06, -2.323649823665619e-06, -2.1513551473617554e-06, -1.979060471057892e-06, -1.8067657947540283e-06, -1.6344711184501648e-06, -1.4621764421463013e-06, -1.2898817658424377e-06, -1.1175870895385742e-06, -9.452924132347107e-07, -7.729977369308472e-07, -6.007030606269836e-07, -4.284083843231201e-07, -2.561137080192566e-07, -8.381903171539307e-08, 8.847564458847046e-08, 2.60770320892334e-07, 4.330649971961975e-07, 6.05359673500061e-07, 7.776543498039246e-07, 9.499490261077881e-07, 1.1222437024116516e-06, 1.2945383787155151e-06, 1.4668330550193787e-06, 1.6391277313232422e-06, 1.8114224076271057e-06, 1.9837170839309692e-06, 2.1560117602348328e-06, 2.3283064365386963e-06, 2.50060111284256e-06, 2.6728957891464233e-06, 2.845190465450287e-06, 3.0174851417541504e-06, 3.189779818058014e-06, 3.3620744943618774e-06, 3.534369170665741e-06, 3.7066638469696045e-06, 3.878958523273468e-06, 4.0512531995773315e-06, 4.223547875881195e-06, 4.395842552185059e-06, 4.568137228488922e-06, 4.740431904792786e-06, 4.912726581096649e-06, 5.085021257400513e-06, 5.257315933704376e-06, 5.42961061000824e-06, 5.601905286312103e-06, 5.774199962615967e-06, 5.94649463891983e-06, 6.118789315223694e-06, 6.291083991527557e-06, 6.463378667831421e-06, 6.6356733441352844e-06, 6.807968020439148e-06, 6.9802626967430115e-06, 7.152557373046875e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 4.0, 12.0, 22.0, 26.0, 37.0, 62.0, 127.0, 203.0, 441.0, 2022.0, 1026259.0, 17815.0, 820.0, 285.0, 152.0, 92.0, 64.0, 32.0, 29.0, 11.0, 4.0, 5.0, 3.0, 4.0, 5.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00019228458404541016, -0.0001865886151790619, -0.00018089264631271362, -0.00017519667744636536, -0.0001695007085800171, -0.00016380473971366882, -0.00015810877084732056, -0.0001524128019809723, -0.00014671683311462402, -0.00014102086424827576, -0.0001353248953819275, -0.00012962892651557922, -0.00012393295764923096, -0.00011823698878288269, -0.00011254101991653442, -0.00010684505105018616, -0.00010114908218383789, -9.545311331748962e-05, -8.975714445114136e-05, -8.406117558479309e-05, -7.836520671844482e-05, -7.266923785209656e-05, -6.697326898574829e-05, -6.127730011940002e-05, -5.558133125305176e-05, -4.988536238670349e-05, -4.4189393520355225e-05, -3.849342465400696e-05, -3.279745578765869e-05, -2.7101486921310425e-05, -2.1405518054962158e-05, -1.570954918861389e-05, -1.0013580322265625e-05, -4.317611455917358e-06, 1.3783574104309082e-06, 7.074326276779175e-06, 1.2770295143127441e-05, 1.8466264009475708e-05, 2.4162232875823975e-05, 2.985820174217224e-05, 3.555417060852051e-05, 4.1250139474868774e-05, 4.694610834121704e-05, 5.264207720756531e-05, 5.8338046073913574e-05, 6.403401494026184e-05, 6.972998380661011e-05, 7.542595267295837e-05, 8.112192153930664e-05, 8.681789040565491e-05, 9.251385927200317e-05, 9.820982813835144e-05, 0.00010390579700469971, 0.00010960176587104797, 0.00011529773473739624, 0.00012099370360374451, 0.00012668967247009277, 0.00013238564133644104, 0.0001380816102027893, 0.00014377757906913757, 0.00014947354793548584, 0.0001551695168018341, 0.00016086548566818237, 0.00016656145453453064, 0.0001722574234008789]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 8.0, 10.0, 10.0, 19.0, 41.0, 56.0, 96.0, 142.0, 167.0, 160.0, 97.0, 72.0, 36.0, 32.0, 22.0, 11.0, 10.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.617473602294922e-05, -7.397308945655823e-05, -7.177144289016724e-05, -6.956979632377625e-05, -6.736814975738525e-05, -6.516650319099426e-05, -6.296485662460327e-05, -6.076321005821228e-05, -5.856156349182129e-05, -5.63599169254303e-05, -5.415827035903931e-05, -5.1956623792648315e-05, -4.9754977226257324e-05, -4.755333065986633e-05, -4.535168409347534e-05, -4.315003752708435e-05, -4.094839096069336e-05, -3.874674439430237e-05, -3.654509782791138e-05, -3.4343451261520386e-05, -3.2141804695129395e-05, -2.9940158128738403e-05, -2.7738511562347412e-05, -2.553686499595642e-05, -2.333521842956543e-05, -2.113357186317444e-05, -1.8931925296783447e-05, -1.6730278730392456e-05, -1.4528632164001465e-05, -1.2326985597610474e-05, -1.0125339031219482e-05, -7.923692464828491e-06, -5.7220458984375e-06, -3.520399332046509e-06, -1.3187527656555176e-06, 8.828938007354736e-07, 3.084540367126465e-06, 5.286186933517456e-06, 7.487833499908447e-06, 9.689480066299438e-06, 1.189112663269043e-05, 1.4092773199081421e-05, 1.6294419765472412e-05, 1.8496066331863403e-05, 2.0697712898254395e-05, 2.2899359464645386e-05, 2.5101006031036377e-05, 2.7302652597427368e-05, 2.950429916381836e-05, 3.170594573020935e-05, 3.390759229660034e-05, 3.610923886299133e-05, 3.8310885429382324e-05, 4.0512531995773315e-05, 4.271417856216431e-05, 4.49158251285553e-05, 4.711747169494629e-05, 4.931911826133728e-05, 5.152076482772827e-05, 5.372241139411926e-05, 5.5924057960510254e-05, 5.8125704526901245e-05, 6.0327351093292236e-05, 6.252899765968323e-05, 6.473064422607422e-05]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 6.0, 27.0, 774.0, 193.0, 14.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04335526376962662, -0.031961411237716675, -0.020567556843161583, -0.009173702448606491, 0.0022201500833034515, 0.013614002615213394, 0.025007858872413635, 0.03640171140432358, 0.04779556393623352, 0.05918941646814346, 0.0705832690000534, 0.08197712898254395, 0.09337097406387329, 0.10476483404636383, 0.11615868657827377, 0.12755253911018372, 0.13894638419151306, 0.1503402441740036, 0.16173408925533295, 0.1731279492378235, 0.18452179431915283, 0.19591565430164337, 0.2073095142841339, 0.21870335936546326, 0.2300972193479538, 0.24149107933044434, 0.2528849244117737, 0.264278769493103, 0.27567264437675476, 0.2870664894580841, 0.29846033453941345, 0.3098542094230652, 0.32124802470207214, 0.3326418697834015, 0.3440357446670532, 0.35542958974838257, 0.3668234348297119, 0.37821727991104126, 0.389611154794693, 0.40100499987602234, 0.4123988449573517, 0.42379269003868103, 0.43518656492233276, 0.4465804100036621, 0.45797425508499146, 0.4693681001663208, 0.48076197504997253, 0.4921558201313019, 0.5035496950149536, 0.514943540096283, 0.5263373851776123, 0.5377312302589417, 0.5491251349449158, 0.5605189800262451, 0.5719128251075745, 0.5833066701889038, 0.5947005152702332, 0.6060943603515625, 0.6174882054328918, 0.6288820505142212, 0.6402759552001953, 0.6516698002815247, 0.663063645362854, 0.6744574904441833, 0.6858513355255127]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 7.0, 11.0, 13.0, 8.0, 20.0, 23.0, 33.0, 27.0, 35.0, 27.0, 45.0, 54.0, 49.0, 47.0, 44.0, 58.0, 42.0, 52.0, 60.0, 53.0, 47.0, 40.0, 43.0, 35.0, 28.0, 24.0, 15.0, 9.0, 14.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2533220052719116, -0.24554792046546936, -0.2377738356590271, -0.22999975085258484, -0.22222565114498138, -0.21445156633853912, -0.20667748153209686, -0.1989033967256546, -0.19112929701805115, -0.1833552122116089, -0.17558112740516663, -0.16780704259872437, -0.1600329428911209, -0.15225885808467865, -0.1444847732782364, -0.13671068847179413, -0.12893660366535187, -0.1211625188589096, -0.11338842660188675, -0.10561434179544449, -0.09784024953842163, -0.09006616473197937, -0.08229207992553711, -0.07451799511909485, -0.06674390286207199, -0.05896981433033943, -0.05119572579860687, -0.04342164099216461, -0.03564755246043205, -0.027873463928699493, -0.020099379122257233, -0.012325290590524673, -0.004551202058792114, 0.0032228855416178703, 0.010996973142027855, 0.018771059811115265, 0.026545148342847824, 0.03431923687458038, 0.042093321681022644, 0.0498674102127552, 0.05764149874448776, 0.06541558355093002, 0.07318967580795288, 0.08096376061439514, 0.0887378454208374, 0.09651193767786026, 0.10428602248430252, 0.11206011474132538, 0.11983419954776764, 0.1276082843542099, 0.13538236916065216, 0.14315646886825562, 0.15093055367469788, 0.15870463848114014, 0.1664787232875824, 0.17425280809402466, 0.18202689290046692, 0.18980097770690918, 0.19757506251335144, 0.2053491473197937, 0.21312324702739716, 0.22089733183383942, 0.22867141664028168, 0.23644550144672394, 0.2442196011543274]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 6.0, 14.0, 12.0, 33.0, 28.0, 52.0, 66.0, 115.0, 128.0, 219.0, 325.0, 624.0, 1298.0, 18874.0, 4156866.0, 11910.0, 1524.0, 690.0, 401.0, 305.0, 207.0, 153.0, 107.0, 74.0, 60.0, 44.0, 35.0, 17.0, 21.0, 10.0, 19.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.037506103515625, -0.03627634048461914, -0.03504657745361328, -0.03381681442260742, -0.03258705139160156, -0.0313572883605957, -0.030127525329589844, -0.028897762298583984, -0.027667999267578125, -0.026438236236572266, -0.025208473205566406, -0.023978710174560547, -0.022748947143554688, -0.021519184112548828, -0.02028942108154297, -0.01905965805053711, -0.01782989501953125, -0.01660013198852539, -0.015370368957519531, -0.014140605926513672, -0.012910842895507812, -0.011681079864501953, -0.010451316833496094, -0.009221553802490234, -0.007991790771484375, -0.006762027740478516, -0.005532264709472656, -0.004302501678466797, -0.0030727386474609375, -0.0018429756164550781, -0.0006132125854492188, 0.0006165504455566406, 0.0018463134765625, 0.0030760765075683594, 0.004305839538574219, 0.005535602569580078, 0.0067653656005859375, 0.007995128631591797, 0.009224891662597656, 0.010454654693603516, 0.011684417724609375, 0.012914180755615234, 0.014143943786621094, 0.015373706817626953, 0.016603469848632812, 0.017833232879638672, 0.01906299591064453, 0.02029275894165039, 0.02152252197265625, 0.02275228500366211, 0.02398204803466797, 0.025211811065673828, 0.026441574096679688, 0.027671337127685547, 0.028901100158691406, 0.030130863189697266, 0.031360626220703125, 0.032590389251708984, 0.033820152282714844, 0.0350499153137207, 0.03627967834472656, 0.03750944137573242, 0.03873920440673828, 0.03996896743774414, 0.04119873046875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 4.0, 13.0, 10.0, 6.0, 9.0, 17.0, 51.0, 243.0, 369.0, 128.0, 28.0, 14.0, 9.0, 12.0, 12.0, 8.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 9.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00970458984375, -0.009387731552124023, -0.009070873260498047, -0.00875401496887207, -0.008437156677246094, -0.008120298385620117, -0.007803440093994141, -0.007486581802368164, -0.0071697235107421875, -0.006852865219116211, -0.006536006927490234, -0.006219148635864258, -0.005902290344238281, -0.005585432052612305, -0.005268573760986328, -0.0049517154693603516, -0.004634857177734375, -0.0043179988861083984, -0.004001140594482422, -0.0036842823028564453, -0.0033674240112304688, -0.003050565719604492, -0.0027337074279785156, -0.002416849136352539, -0.0020999908447265625, -0.001783132553100586, -0.0014662742614746094, -0.0011494159698486328, -0.0008325576782226562, -0.0005156993865966797, -0.00019884109497070312, 0.00011801719665527344, 0.00043487548828125, 0.0007517337799072266, 0.0010685920715332031, 0.0013854503631591797, 0.0017023086547851562, 0.002019166946411133, 0.0023360252380371094, 0.002652883529663086, 0.0029697418212890625, 0.003286600112915039, 0.0036034584045410156, 0.003920316696166992, 0.004237174987792969, 0.004554033279418945, 0.004870891571044922, 0.0051877498626708984, 0.005504608154296875, 0.0058214664459228516, 0.006138324737548828, 0.006455183029174805, 0.006772041320800781, 0.007088899612426758, 0.007405757904052734, 0.007722616195678711, 0.008039474487304688, 0.008356332778930664, 0.00867319107055664, 0.008990049362182617, 0.009306907653808594, 0.00962376594543457, 0.009940624237060547, 0.010257482528686523, 0.0105743408203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 6.0, 10.0, 7.0, 9.0, 12.0, 7.0, 15.0, 14.0, 21.0, 37.0, 53.0, 88.0, 154.0, 463.0, 2731.0, 4061645.0, 126088.0, 2112.0, 356.0, 174.0, 59.0, 39.0, 42.0, 24.0, 16.0, 19.0, 12.0, 15.0, 3.0, 10.0, 5.0, 3.0, 3.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.0799713134765625, -0.077301025390625, -0.0746307373046875, -0.07196044921875, -0.0692901611328125, -0.066619873046875, -0.0639495849609375, -0.061279296875, -0.0586090087890625, -0.055938720703125, -0.0532684326171875, -0.05059814453125, -0.0479278564453125, -0.045257568359375, -0.0425872802734375, -0.0399169921875, -0.0372467041015625, -0.034576416015625, -0.0319061279296875, -0.02923583984375, -0.0265655517578125, -0.023895263671875, -0.0212249755859375, -0.0185546875, -0.0158843994140625, -0.013214111328125, -0.0105438232421875, -0.00787353515625, -0.0052032470703125, -0.002532958984375, 0.0001373291015625, 0.0028076171875, 0.0054779052734375, 0.008148193359375, 0.0108184814453125, 0.01348876953125, 0.0161590576171875, 0.018829345703125, 0.0214996337890625, 0.024169921875, 0.0268402099609375, 0.029510498046875, 0.0321807861328125, 0.03485107421875, 0.0375213623046875, 0.040191650390625, 0.0428619384765625, 0.0455322265625, 0.0482025146484375, 0.050872802734375, 0.0535430908203125, 0.05621337890625, 0.0588836669921875, 0.061553955078125, 0.0642242431640625, 0.06689453125, 0.0695648193359375, 0.072235107421875, 0.0749053955078125, 0.07757568359375, 0.0802459716796875, 0.082916259765625, 0.0855865478515625, 0.0882568359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 13.0, 11.0, 7.0, 21.0, 50.0, 73.0, 457.0, 3149.0, 135.0, 58.0, 20.0, 12.0, 5.0, 5.0, 6.0, 7.0, 5.0, 1.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.016998291015625, -0.01648545265197754, -0.015972614288330078, -0.015459775924682617, -0.014946937561035156, -0.014434099197387695, -0.013921260833740234, -0.013408422470092773, -0.012895584106445312, -0.012382745742797852, -0.01186990737915039, -0.01135706901550293, -0.010844230651855469, -0.010331392288208008, -0.009818553924560547, -0.009305715560913086, -0.008792877197265625, -0.008280038833618164, -0.007767200469970703, -0.007254362106323242, -0.006741523742675781, -0.00622868537902832, -0.005715847015380859, -0.0052030086517333984, -0.0046901702880859375, -0.0041773319244384766, -0.0036644935607910156, -0.0031516551971435547, -0.0026388168334960938, -0.002125978469848633, -0.0016131401062011719, -0.001100301742553711, -0.00058746337890625, -7.462501525878906e-05, 0.0004382133483886719, 0.0009510517120361328, 0.0014638900756835938, 0.0019767284393310547, 0.0024895668029785156, 0.0030024051666259766, 0.0035152435302734375, 0.0040280818939208984, 0.004540920257568359, 0.00505375862121582, 0.005566596984863281, 0.006079435348510742, 0.006592273712158203, 0.007105112075805664, 0.007617950439453125, 0.008130788803100586, 0.008643627166748047, 0.009156465530395508, 0.009669303894042969, 0.01018214225769043, 0.01069498062133789, 0.011207818984985352, 0.011720657348632812, 0.012233495712280273, 0.012746334075927734, 0.013259172439575195, 0.013772010803222656, 0.014284849166870117, 0.014797687530517578, 0.015310525894165039, 0.0158233642578125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 960.0, 50.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26537030935287476, -0.2606084942817688, -0.25584667921066284, -0.2510848939418793, -0.24632307887077332, -0.24156126379966736, -0.2367994636297226, -0.23203766345977783, -0.22727584838867188, -0.22251403331756592, -0.21775223314762115, -0.2129904329776764, -0.20822861790657043, -0.20346680283546448, -0.19870500266551971, -0.19394320249557495, -0.189181387424469, -0.18441957235336304, -0.17965777218341827, -0.1748959720134735, -0.17013415694236755, -0.1653723418712616, -0.16061054170131683, -0.15584874153137207, -0.1510869264602661, -0.14632511138916016, -0.1415633112192154, -0.13680151104927063, -0.13203969597816467, -0.12727788090705872, -0.12251608073711395, -0.11775427311658859, -0.11299246549606323, -0.10823065787553787, -0.10346885025501251, -0.09870704263448715, -0.09394523501396179, -0.08918342739343643, -0.08442161977291107, -0.07965981215238571, -0.07489800453186035, -0.07013619691133499, -0.06537438929080963, -0.06061258167028427, -0.05585077404975891, -0.05108896642923355, -0.04632715880870819, -0.04156535118818283, -0.03680354356765747, -0.03204173594713211, -0.02727992832660675, -0.02251812070608139, -0.01775631308555603, -0.01299450546503067, -0.00823269784450531, -0.00347089022397995, 0.0012909173965454102, 0.00605272501707077, 0.01081453263759613, 0.01557634025812149, 0.02033814787864685, 0.02509995549917221, 0.02986176311969757, 0.03462357074022293, 0.03938537836074829]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 9.0, 5.0, 12.0, 12.0, 18.0, 21.0, 24.0, 25.0, 36.0, 37.0, 39.0, 41.0, 50.0, 56.0, 64.0, 54.0, 70.0, 67.0, 57.0, 45.0, 37.0, 38.0, 44.0, 30.0, 24.0, 23.0, 12.0, 13.0, 18.0, 8.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0466805100440979, -0.04540916532278061, -0.04413782060146332, -0.042866479605436325, -0.041595134884119034, -0.04032379016280174, -0.03905244916677475, -0.03778110444545746, -0.03650975972414017, -0.035238415002822876, -0.033967070281505585, -0.03269572928547859, -0.0314243845641613, -0.03015303984284401, -0.028881696984171867, -0.027610354125499725, -0.026339009404182434, -0.025067664682865143, -0.023796321824193, -0.02252497896552086, -0.021253634244203568, -0.019982289522886276, -0.018710946664214134, -0.017439603805541992, -0.0161682590842247, -0.014896915294229984, -0.013625571504235268, -0.012354227714240551, -0.011082883924245834, -0.009811540134251118, -0.008540196344256401, -0.007268852554261684, -0.005997508764266968, -0.004726164974272251, -0.0034548211842775345, -0.002183477394282818, -0.0009121336042881012, 0.00035921018570661545, 0.001630553975701332, 0.0029018977656960487, 0.004173241555690765, 0.005444585345685482, 0.006715929135680199, 0.007987272925674915, 0.009258616715669632, 0.010529960505664349, 0.011801304295659065, 0.013072648085653782, 0.014343991875648499, 0.015615335665643215, 0.016886679455637932, 0.018158022314310074, 0.019429367035627365, 0.020700711756944656, 0.0219720546156168, 0.02324339747428894, 0.02451474219560623, 0.025786086916923523, 0.027057429775595665, 0.028328772634267807, 0.0296001173555851, 0.03087146207690239, 0.03214280307292938, 0.033414147794246674, 0.034685492515563965]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 8.0, 12.0, 16.0, 20.0, 32.0, 37.0, 54.0, 64.0, 109.0, 135.0, 172.0, 275.0, 382.0, 546.0, 817.0, 1203.0, 1854.0, 3010.0, 5184.0, 9521.0, 21327.0, 190503.0, 759489.0, 27116.0, 11110.0, 5805.0, 3389.0, 2099.0, 1396.0, 862.0, 580.0, 422.0, 272.0, 205.0, 153.0, 95.0, 71.0, 53.0, 43.0, 27.0, 19.0, 15.0, 13.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0216217041015625, -0.020926713943481445, -0.02023172378540039, -0.019536733627319336, -0.01884174346923828, -0.018146753311157227, -0.017451763153076172, -0.016756772994995117, -0.016061782836914062, -0.015366792678833008, -0.014671802520751953, -0.013976812362670898, -0.013281822204589844, -0.012586832046508789, -0.011891841888427734, -0.01119685173034668, -0.010501861572265625, -0.00980687141418457, -0.009111881256103516, -0.008416891098022461, -0.007721900939941406, -0.0070269107818603516, -0.006331920623779297, -0.005636930465698242, -0.0049419403076171875, -0.004246950149536133, -0.003551959991455078, -0.0028569698333740234, -0.0021619796752929688, -0.001466989517211914, -0.0007719993591308594, -7.700920104980469e-05, 0.00061798095703125, 0.0013129711151123047, 0.0020079612731933594, 0.002702951431274414, 0.0033979415893554688, 0.0040929317474365234, 0.004787921905517578, 0.005482912063598633, 0.0061779022216796875, 0.006872892379760742, 0.007567882537841797, 0.008262872695922852, 0.008957862854003906, 0.009652853012084961, 0.010347843170166016, 0.01104283332824707, 0.011737823486328125, 0.01243281364440918, 0.013127803802490234, 0.013822793960571289, 0.014517784118652344, 0.015212774276733398, 0.015907764434814453, 0.016602754592895508, 0.017297744750976562, 0.017992734909057617, 0.018687725067138672, 0.019382715225219727, 0.02007770538330078, 0.020772695541381836, 0.02146768569946289, 0.022162675857543945, 0.022857666015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 7.0, 5.0, 4.0, 5.0, 14.0, 6.0, 8.0, 9.0, 20.0, 61.0, 253.0, 357.0, 117.0, 27.0, 14.0, 9.0, 9.0, 14.0, 8.0, 6.0, 2.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 9.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00946807861328125, -0.009158492088317871, -0.008848905563354492, -0.008539319038391113, -0.008229732513427734, -0.007920145988464355, -0.0076105594635009766, -0.007300972938537598, -0.006991386413574219, -0.00668179988861084, -0.006372213363647461, -0.006062626838684082, -0.005753040313720703, -0.005443453788757324, -0.005133867263793945, -0.004824280738830566, -0.0045146942138671875, -0.004205107688903809, -0.0038955211639404297, -0.0035859346389770508, -0.003276348114013672, -0.002966761589050293, -0.002657175064086914, -0.002347588539123535, -0.0020380020141601562, -0.0017284154891967773, -0.0014188289642333984, -0.0011092424392700195, -0.0007996559143066406, -0.0004900693893432617, -0.0001804828643798828, 0.0001291036605834961, 0.000438690185546875, 0.0007482767105102539, 0.0010578632354736328, 0.0013674497604370117, 0.0016770362854003906, 0.0019866228103637695, 0.0022962093353271484, 0.0026057958602905273, 0.0029153823852539062, 0.003224968910217285, 0.003534555435180664, 0.003844141960144043, 0.004153728485107422, 0.004463315010070801, 0.00477290153503418, 0.005082488059997559, 0.0053920745849609375, 0.005701661109924316, 0.006011247634887695, 0.006320834159851074, 0.006630420684814453, 0.006940007209777832, 0.007249593734741211, 0.00755918025970459, 0.007868766784667969, 0.008178353309631348, 0.008487939834594727, 0.008797526359558105, 0.009107112884521484, 0.009416699409484863, 0.009726285934448242, 0.010035872459411621, 0.010345458984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 2.0, 6.0, 5.0, 7.0, 14.0, 12.0, 15.0, 25.0, 25.0, 21.0, 28.0, 46.0, 40.0, 64.0, 73.0, 92.0, 92.0, 146.0, 191.0, 254.0, 362.0, 668.0, 1702.0, 11452.0, 927394.0, 99224.0, 3734.0, 1054.0, 499.0, 295.0, 207.0, 155.0, 119.0, 91.0, 90.0, 61.0, 54.0, 54.0, 30.0, 23.0, 27.0, 23.0, 18.0, 15.0, 14.0, 8.0, 4.0, 9.0, 3.0, 8.0, 1.0, 2.0, 0.0, 0.0, 5.0], "bins": [-0.0621337890625, -0.06029367446899414, -0.05845355987548828, -0.05661344528198242, -0.05477333068847656, -0.0529332160949707, -0.051093101501464844, -0.049252986907958984, -0.047412872314453125, -0.045572757720947266, -0.043732643127441406, -0.04189252853393555, -0.04005241394042969, -0.03821229934692383, -0.03637218475341797, -0.03453207015991211, -0.03269195556640625, -0.03085184097290039, -0.02901172637939453, -0.027171611785888672, -0.025331497192382812, -0.023491382598876953, -0.021651268005371094, -0.019811153411865234, -0.017971038818359375, -0.016130924224853516, -0.014290809631347656, -0.012450695037841797, -0.010610580444335938, -0.008770465850830078, -0.006930351257324219, -0.005090236663818359, -0.0032501220703125, -0.0014100074768066406, 0.00043010711669921875, 0.002270221710205078, 0.0041103363037109375, 0.005950450897216797, 0.007790565490722656, 0.009630680084228516, 0.011470794677734375, 0.013310909271240234, 0.015151023864746094, 0.016991138458251953, 0.018831253051757812, 0.020671367645263672, 0.02251148223876953, 0.02435159683227539, 0.02619171142578125, 0.02803182601928711, 0.02987194061279297, 0.03171205520629883, 0.03355216979980469, 0.03539228439331055, 0.037232398986816406, 0.039072513580322266, 0.040912628173828125, 0.042752742767333984, 0.044592857360839844, 0.0464329719543457, 0.04827308654785156, 0.05011320114135742, 0.05195331573486328, 0.05379343032836914, 0.055633544921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 7.0, 5.0, 8.0, 9.0, 9.0, 9.0, 18.0, 11.0, 24.0, 20.0, 22.0, 37.0, 38.0, 36.0, 54.0, 31.0, 38.0, 57.0, 45.0, 47.0, 30.0, 43.0, 35.0, 48.0, 27.0, 40.0, 28.0, 36.0, 24.0, 21.0, 21.0, 22.0, 17.0, 15.0, 9.0, 13.0, 3.0, 6.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.030426025390625, -0.029525041580200195, -0.02862405776977539, -0.027723073959350586, -0.02682209014892578, -0.025921106338500977, -0.025020122528076172, -0.024119138717651367, -0.023218154907226562, -0.022317171096801758, -0.021416187286376953, -0.02051520347595215, -0.019614219665527344, -0.01871323585510254, -0.017812252044677734, -0.01691126823425293, -0.016010284423828125, -0.01510930061340332, -0.014208316802978516, -0.013307332992553711, -0.012406349182128906, -0.011505365371704102, -0.010604381561279297, -0.009703397750854492, -0.008802413940429688, -0.007901430130004883, -0.007000446319580078, -0.0060994625091552734, -0.005198478698730469, -0.004297494888305664, -0.0033965110778808594, -0.0024955272674560547, -0.00159454345703125, -0.0006935596466064453, 0.00020742416381835938, 0.001108407974243164, 0.0020093917846679688, 0.0029103755950927734, 0.003811359405517578, 0.004712343215942383, 0.0056133270263671875, 0.006514310836791992, 0.007415294647216797, 0.008316278457641602, 0.009217262268066406, 0.010118246078491211, 0.011019229888916016, 0.01192021369934082, 0.012821197509765625, 0.01372218132019043, 0.014623165130615234, 0.015524148941040039, 0.016425132751464844, 0.01732611656188965, 0.018227100372314453, 0.019128084182739258, 0.020029067993164062, 0.020930051803588867, 0.021831035614013672, 0.022732019424438477, 0.02363300323486328, 0.024533987045288086, 0.02543497085571289, 0.026335954666137695, 0.0272369384765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 2.0, 6.0, 9.0, 2.0, 12.0, 10.0, 18.0, 29.0, 37.0, 52.0, 69.0, 130.0, 157.0, 258.0, 462.0, 897.0, 2644.0, 13507.0, 881742.0, 137882.0, 6927.0, 1820.0, 779.0, 401.0, 219.0, 146.0, 95.0, 73.0, 45.0, 24.0, 24.0, 11.0, 23.0, 9.0, 9.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0471553802490234e-05, -3.9159320294857025e-05, -3.7847086787223816e-05, -3.653485327959061e-05, -3.52226197719574e-05, -3.391038626432419e-05, -3.259815275669098e-05, -3.128591924905777e-05, -2.997368574142456e-05, -2.866145223379135e-05, -2.7349218726158142e-05, -2.6036985218524933e-05, -2.4724751710891724e-05, -2.3412518203258514e-05, -2.2100284695625305e-05, -2.0788051187992096e-05, -1.9475817680358887e-05, -1.8163584172725677e-05, -1.6851350665092468e-05, -1.553911715745926e-05, -1.422688364982605e-05, -1.291465014219284e-05, -1.1602416634559631e-05, -1.0290183126926422e-05, -8.977949619293213e-06, -7.665716111660004e-06, -6.3534826040267944e-06, -5.041249096393585e-06, -3.729015588760376e-06, -2.4167820811271667e-06, -1.1045485734939575e-06, 2.076849341392517e-07, 1.519918441772461e-06, 2.83215194940567e-06, 4.144385457038879e-06, 5.456618964672089e-06, 6.768852472305298e-06, 8.081085979938507e-06, 9.393319487571716e-06, 1.0705552995204926e-05, 1.2017786502838135e-05, 1.3330020010471344e-05, 1.4642253518104553e-05, 1.5954487025737762e-05, 1.726672053337097e-05, 1.857895404100418e-05, 1.989118754863739e-05, 2.12034210562706e-05, 2.251565456390381e-05, 2.3827888071537018e-05, 2.5140121579170227e-05, 2.6452355086803436e-05, 2.7764588594436646e-05, 2.9076822102069855e-05, 3.0389055609703064e-05, 3.170128911733627e-05, 3.301352262496948e-05, 3.432575613260269e-05, 3.56379896402359e-05, 3.695022314786911e-05, 3.826245665550232e-05, 3.957469016313553e-05, 4.088692367076874e-05, 4.219915717840195e-05, 4.3511390686035156e-05]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 8.0, 9.0, 15.0, 13.0, 10.0, 26.0, 35.0, 36.0, 31.0, 46.0, 47.0, 73.0, 60.0, 50.0, 76.0, 76.0, 59.0, 34.0, 45.0, 51.0, 46.0, 38.0, 23.0, 21.0, 16.0, 11.0, 5.0, 11.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.649162292480469e-06, -4.4833868741989136e-06, -4.317611455917358e-06, -4.151836037635803e-06, -3.986060619354248e-06, -3.820285201072693e-06, -3.6545097827911377e-06, -3.4887343645095825e-06, -3.3229589462280273e-06, -3.157183527946472e-06, -2.991408109664917e-06, -2.825632691383362e-06, -2.6598572731018066e-06, -2.4940818548202515e-06, -2.3283064365386963e-06, -2.162531018257141e-06, -1.996755599975586e-06, -1.8309801816940308e-06, -1.6652047634124756e-06, -1.4994293451309204e-06, -1.3336539268493652e-06, -1.16787850856781e-06, -1.0021030902862549e-06, -8.363276720046997e-07, -6.705522537231445e-07, -5.047768354415894e-07, -3.390014171600342e-07, -1.73225998878479e-07, -7.450580596923828e-09, 1.5832483768463135e-07, 3.241002559661865e-07, 4.898756742477417e-07, 6.556510925292969e-07, 8.21426510810852e-07, 9.872019290924072e-07, 1.1529773473739624e-06, 1.3187527656555176e-06, 1.4845281839370728e-06, 1.650303602218628e-06, 1.816079020500183e-06, 1.9818544387817383e-06, 2.1476298570632935e-06, 2.3134052753448486e-06, 2.479180693626404e-06, 2.644956111907959e-06, 2.810731530189514e-06, 2.9765069484710693e-06, 3.1422823667526245e-06, 3.3080577850341797e-06, 3.473833203315735e-06, 3.63960862159729e-06, 3.8053840398788452e-06, 3.9711594581604e-06, 4.1369348764419556e-06, 4.302710294723511e-06, 4.468485713005066e-06, 4.634261131286621e-06, 4.800036549568176e-06, 4.9658119678497314e-06, 5.131587386131287e-06, 5.297362804412842e-06, 5.463138222694397e-06, 5.628913640975952e-06, 5.794689059257507e-06, 5.9604644775390625e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 10.0, 15.0, 13.0, 26.0, 18.0, 41.0, 55.0, 105.0, 151.0, 252.0, 427.0, 1531.0, 65986.0, 975765.0, 2771.0, 577.0, 288.0, 169.0, 112.0, 72.0, 34.0, 33.0, 21.0, 18.0, 10.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.927417755126953e-05, -7.695145905017853e-05, -7.462874054908752e-05, -7.230602204799652e-05, -6.998330354690552e-05, -6.766058504581451e-05, -6.533786654472351e-05, -6.301514804363251e-05, -6.0692429542541504e-05, -5.83697110414505e-05, -5.60469925403595e-05, -5.3724274039268494e-05, -5.140155553817749e-05, -4.907883703708649e-05, -4.6756118535995483e-05, -4.443340003490448e-05, -4.2110681533813477e-05, -3.978796303272247e-05, -3.746524453163147e-05, -3.5142526030540466e-05, -3.281980752944946e-05, -3.049708902835846e-05, -2.8174370527267456e-05, -2.5851652026176453e-05, -2.352893352508545e-05, -2.1206215023994446e-05, -1.8883496522903442e-05, -1.656077802181244e-05, -1.4238059520721436e-05, -1.1915341019630432e-05, -9.592622518539429e-06, -7.269904017448425e-06, -4.947185516357422e-06, -2.6244670152664185e-06, -3.0174851417541504e-07, 2.0209699869155884e-06, 4.343688488006592e-06, 6.666406989097595e-06, 8.989125490188599e-06, 1.1311843991279602e-05, 1.3634562492370605e-05, 1.595728099346161e-05, 1.8279999494552612e-05, 2.0602717995643616e-05, 2.292543649673462e-05, 2.5248154997825623e-05, 2.7570873498916626e-05, 2.989359200000763e-05, 3.221631050109863e-05, 3.4539029002189636e-05, 3.686174750328064e-05, 3.918446600437164e-05, 4.1507184505462646e-05, 4.382990300655365e-05, 4.615262150764465e-05, 4.847534000873566e-05, 5.079805850982666e-05, 5.3120777010917664e-05, 5.544349551200867e-05, 5.776621401309967e-05, 6.0088932514190674e-05, 6.241165101528168e-05, 6.473436951637268e-05, 6.705708801746368e-05, 6.937980651855469e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 5.0, 11.0, 4.0, 13.0, 22.0, 27.0, 41.0, 46.0, 52.0, 96.0, 118.0, 148.0, 114.0, 74.0, 48.0, 51.0, 40.0, 18.0, 21.0, 12.0, 8.0, 5.0, 6.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8743019104003906e-05, -3.764685243368149e-05, -3.655068576335907e-05, -3.545451909303665e-05, -3.4358352422714233e-05, -3.3262185752391815e-05, -3.21660190820694e-05, -3.106985241174698e-05, -2.997368574142456e-05, -2.8877519071102142e-05, -2.7781352400779724e-05, -2.6685185730457306e-05, -2.5589019060134888e-05, -2.449285238981247e-05, -2.339668571949005e-05, -2.2300519049167633e-05, -2.1204352378845215e-05, -2.0108185708522797e-05, -1.901201903820038e-05, -1.791585236787796e-05, -1.6819685697555542e-05, -1.5723519027233124e-05, -1.4627352356910706e-05, -1.3531185686588287e-05, -1.2435019016265869e-05, -1.1338852345943451e-05, -1.0242685675621033e-05, -9.146519005298615e-06, -8.050352334976196e-06, -6.954185664653778e-06, -5.85801899433136e-06, -4.761852324008942e-06, -3.6656856536865234e-06, -2.5695189833641052e-06, -1.473352313041687e-06, -3.771856427192688e-07, 7.189810276031494e-07, 1.8151476979255676e-06, 2.911314368247986e-06, 4.007481038570404e-06, 5.103647708892822e-06, 6.1998143792152405e-06, 7.295981049537659e-06, 8.392147719860077e-06, 9.488314390182495e-06, 1.0584481060504913e-05, 1.1680647730827332e-05, 1.277681440114975e-05, 1.3872981071472168e-05, 1.4969147741794586e-05, 1.6065314412117004e-05, 1.7161481082439423e-05, 1.825764775276184e-05, 1.935381442308426e-05, 2.0449981093406677e-05, 2.1546147763729095e-05, 2.2642314434051514e-05, 2.3738481104373932e-05, 2.483464777469635e-05, 2.593081444501877e-05, 2.7026981115341187e-05, 2.8123147785663605e-05, 2.9219314455986023e-05, 3.031548112630844e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [12.0, 938.0, 64.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03425495699048042, -0.014300649985671043, 0.005653657019138336, 0.025607962161302567, 0.045562271028757095, 0.06551657617092133, 0.08547088503837585, 0.10542519390583038, 0.1253795027732849, 0.14533381164073944, 0.16528812050819397, 0.1852424144744873, 0.20519673824310303, 0.22515103220939636, 0.2451053410768509, 0.2650596499443054, 0.28501394391059875, 0.3049682378768921, 0.3249225616455078, 0.34487685561180115, 0.36483117938041687, 0.3847854733467102, 0.4047397971153259, 0.42469409108161926, 0.444648414850235, 0.4646027088165283, 0.48455703258514404, 0.5045113563537598, 0.5244656205177307, 0.5444199442863464, 0.5643742680549622, 0.5843285322189331, 0.6042829155921936, 0.6242372393608093, 0.6441915035247803, 0.664145827293396, 0.6841001510620117, 0.7040544748306274, 0.7240087389945984, 0.7439630627632141, 0.7639173865318298, 0.7838717103004456, 0.8038259744644165, 0.8237802982330322, 0.843734622001648, 0.8636889457702637, 0.8836432099342346, 0.9035975337028503, 0.9235517978668213, 0.943506121635437, 0.963460385799408, 0.9834147095680237, 1.0033689737319946, 1.0233232975006104, 1.043277621269226, 1.0632319450378418, 1.0831862688064575, 1.1031405925750732, 1.123094916343689, 1.1430492401123047, 1.1630034446716309, 1.1829577684402466, 1.2029120922088623, 1.222866415977478, 1.2428207397460938]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 9.0, 12.0, 11.0, 14.0, 26.0, 31.0, 35.0, 50.0, 54.0, 42.0, 65.0, 76.0, 64.0, 77.0, 60.0, 67.0, 60.0, 55.0, 52.0, 36.0, 23.0, 20.0, 17.0, 16.0, 10.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2950636148452759, -0.2866082191467285, -0.27815282344818115, -0.2696973979473114, -0.26124200224876404, -0.2527866065502167, -0.24433119595050812, -0.23587578535079956, -0.2274203896522522, -0.21896499395370483, -0.21050958335399628, -0.20205417275428772, -0.19359877705574036, -0.185143381357193, -0.17668797075748444, -0.16823256015777588, -0.15977716445922852, -0.15132176876068115, -0.1428663581609726, -0.13441094756126404, -0.12595555186271667, -0.11750014871358871, -0.10904474556446075, -0.1005893424153328, -0.09213393926620483, -0.08367853611707687, -0.07522313296794891, -0.06676772981882095, -0.05831232666969299, -0.04985692352056503, -0.04140152037143707, -0.03294611722230911, -0.024490714073181152, -0.016035310924053192, -0.007579907774925232, 0.0008754953742027283, 0.009330898523330688, 0.01778630167245865, 0.02624170482158661, 0.03469710797071457, 0.04315251111984253, 0.05160791426897049, 0.06006331741809845, 0.06851872056722641, 0.07697412371635437, 0.08542952686548233, 0.09388493001461029, 0.10234033316373825, 0.11079573631286621, 0.11925113946199417, 0.12770654261112213, 0.1361619532108307, 0.14461734890937805, 0.15307274460792542, 0.16152815520763397, 0.16998356580734253, 0.1784389615058899, 0.18689435720443726, 0.1953497678041458, 0.20380517840385437, 0.21226057410240173, 0.2207159698009491, 0.22917138040065765, 0.2376267910003662, 0.24608218669891357]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 5.0, 11.0, 10.0, 15.0, 15.0, 25.0, 26.0, 35.0, 52.0, 64.0, 84.0, 138.0, 220.0, 644.0, 11736.0, 4171602.0, 8169.0, 492.0, 257.0, 159.0, 98.0, 80.0, 64.0, 39.0, 39.0, 23.0, 29.0, 23.0, 20.0, 15.0, 13.0, 15.0, 10.0, 4.0, 9.0, 2.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031219482421875, -0.03016185760498047, -0.029104232788085938, -0.028046607971191406, -0.026988983154296875, -0.025931358337402344, -0.024873733520507812, -0.02381610870361328, -0.02275848388671875, -0.02170085906982422, -0.020643234252929688, -0.019585609436035156, -0.018527984619140625, -0.017470359802246094, -0.016412734985351562, -0.015355110168457031, -0.0142974853515625, -0.013239860534667969, -0.012182235717773438, -0.011124610900878906, -0.010066986083984375, -0.009009361267089844, -0.007951736450195312, -0.006894111633300781, -0.00583648681640625, -0.004778861999511719, -0.0037212371826171875, -0.0026636123657226562, -0.001605987548828125, -0.0005483627319335938, 0.0005092620849609375, 0.0015668869018554688, 0.00262451171875, 0.0036821365356445312, 0.0047397613525390625, 0.005797386169433594, 0.006855010986328125, 0.007912635803222656, 0.008970260620117188, 0.010027885437011719, 0.01108551025390625, 0.012143135070800781, 0.013200759887695312, 0.014258384704589844, 0.015316009521484375, 0.016373634338378906, 0.017431259155273438, 0.01848888397216797, 0.0195465087890625, 0.02060413360595703, 0.021661758422851562, 0.022719383239746094, 0.023777008056640625, 0.024834632873535156, 0.025892257690429688, 0.02694988250732422, 0.02800750732421875, 0.02906513214111328, 0.030122756958007812, 0.031180381774902344, 0.032238006591796875, 0.033295631408691406, 0.03435325622558594, 0.03541088104248047, 0.036468505859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 4.0, 7.0, 10.0, 10.0, 7.0, 14.0, 15.0, 69.0, 238.0, 326.0, 139.0, 44.0, 9.0, 12.0, 9.0, 11.0, 10.0, 7.0, 2.0, 3.0, 6.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0087127685546875, -0.008418679237365723, -0.008124589920043945, -0.007830500602722168, -0.007536411285400391, -0.007242321968078613, -0.006948232650756836, -0.006654143333435059, -0.006360054016113281, -0.006065964698791504, -0.0057718753814697266, -0.005477786064147949, -0.005183696746826172, -0.0048896074295043945, -0.004595518112182617, -0.00430142879486084, -0.0040073394775390625, -0.003713250160217285, -0.003419160842895508, -0.0031250715255737305, -0.002830982208251953, -0.0025368928909301758, -0.0022428035736083984, -0.001948714256286621, -0.0016546249389648438, -0.0013605356216430664, -0.001066446304321289, -0.0007723569869995117, -0.0004782676696777344, -0.00018417835235595703, 0.00010991096496582031, 0.00040400028228759766, 0.000698089599609375, 0.0009921789169311523, 0.0012862682342529297, 0.001580357551574707, 0.0018744468688964844, 0.0021685361862182617, 0.002462625503540039, 0.0027567148208618164, 0.0030508041381835938, 0.003344893455505371, 0.0036389827728271484, 0.003933072090148926, 0.004227161407470703, 0.0045212507247924805, 0.004815340042114258, 0.005109429359436035, 0.0054035186767578125, 0.00569760799407959, 0.005991697311401367, 0.0062857866287231445, 0.006579875946044922, 0.006873965263366699, 0.0071680545806884766, 0.007462143898010254, 0.007756233215332031, 0.008050322532653809, 0.008344411849975586, 0.008638501167297363, 0.00893259048461914, 0.009226679801940918, 0.009520769119262695, 0.009814858436584473, 0.01010894775390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 8.0, 6.0, 14.0, 12.0, 21.0, 42.0, 98.0, 376.0, 3730.0, 4184109.0, 5113.0, 494.0, 116.0, 55.0, 22.0, 31.0, 6.0, 14.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0845947265625, -0.08234071731567383, -0.08008670806884766, -0.07783269882202148, -0.07557868957519531, -0.07332468032836914, -0.07107067108154297, -0.0688166618347168, -0.06656265258789062, -0.06430864334106445, -0.06205463409423828, -0.05980062484741211, -0.05754661560058594, -0.055292606353759766, -0.053038597106933594, -0.05078458786010742, -0.04853057861328125, -0.04627656936645508, -0.044022560119628906, -0.041768550872802734, -0.03951454162597656, -0.03726053237915039, -0.03500652313232422, -0.03275251388549805, -0.030498504638671875, -0.028244495391845703, -0.02599048614501953, -0.02373647689819336, -0.021482467651367188, -0.019228458404541016, -0.016974449157714844, -0.014720439910888672, -0.0124664306640625, -0.010212421417236328, -0.007958412170410156, -0.005704402923583984, -0.0034503936767578125, -0.0011963844299316406, 0.0010576248168945312, 0.003311634063720703, 0.005565643310546875, 0.007819652557373047, 0.010073661804199219, 0.01232767105102539, 0.014581680297851562, 0.016835689544677734, 0.019089698791503906, 0.021343708038330078, 0.02359771728515625, 0.025851726531982422, 0.028105735778808594, 0.030359745025634766, 0.03261375427246094, 0.03486776351928711, 0.03712177276611328, 0.03937578201293945, 0.041629791259765625, 0.0438838005065918, 0.04613780975341797, 0.04839181900024414, 0.05064582824707031, 0.052899837493896484, 0.055153846740722656, 0.05740785598754883, 0.059661865234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 5.0, 5.0, 6.0, 19.0, 47.0, 163.0, 3591.0, 150.0, 41.0, 14.0, 8.0, 5.0, 6.0, 4.0, 2.0, 8.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01169586181640625, -0.011237263679504395, -0.010778665542602539, -0.010320067405700684, -0.009861469268798828, -0.009402871131896973, -0.008944272994995117, -0.008485674858093262, -0.008027076721191406, -0.007568478584289551, -0.007109880447387695, -0.00665128231048584, -0.006192684173583984, -0.005734086036682129, -0.0052754878997802734, -0.004816889762878418, -0.0043582916259765625, -0.003899693489074707, -0.0034410953521728516, -0.002982497215270996, -0.0025238990783691406, -0.002065300941467285, -0.0016067028045654297, -0.0011481046676635742, -0.0006895065307617188, -0.00023090839385986328, 0.0002276897430419922, 0.0006862878799438477, 0.0011448860168457031, 0.0016034841537475586, 0.002062082290649414, 0.0025206804275512695, 0.002979278564453125, 0.0034378767013549805, 0.003896474838256836, 0.004355072975158691, 0.004813671112060547, 0.005272269248962402, 0.005730867385864258, 0.006189465522766113, 0.006648063659667969, 0.007106661796569824, 0.00756525993347168, 0.008023858070373535, 0.00848245620727539, 0.008941054344177246, 0.009399652481079102, 0.009858250617980957, 0.010316848754882812, 0.010775446891784668, 0.011234045028686523, 0.011692643165588379, 0.012151241302490234, 0.01260983943939209, 0.013068437576293945, 0.0135270357131958, 0.013985633850097656, 0.014444231986999512, 0.014902830123901367, 0.015361428260803223, 0.015820026397705078, 0.016278624534606934, 0.01673722267150879, 0.017195820808410645, 0.0176544189453125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 1001.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21490637958049774, -0.2060028314590454, -0.19709926843643188, -0.18819572031497955, -0.17929217219352722, -0.1703886240720749, -0.16148507595062256, -0.15258151292800903, -0.1436779648065567, -0.13477441668510437, -0.12587085366249084, -0.11696730554103851, -0.10806375741958618, -0.09916020929813385, -0.09025665372610092, -0.081353098154068, -0.07244955003261566, -0.06354600191116333, -0.0546424463391304, -0.04573889449238777, -0.03683534264564514, -0.02793179079890251, -0.01902823895215988, -0.010124687105417252, -0.0012211352586746216, 0.007682416588068008, 0.01658596843481064, 0.02548952028155327, 0.0343930721282959, 0.04329662397503853, 0.05220017582178116, 0.06110372766852379, 0.07000729441642761, 0.07891084253787994, 0.08781439810991287, 0.0967179536819458, 0.10562150180339813, 0.11452504992485046, 0.12342860549688339, 0.13233216106891632, 0.14123570919036865, 0.15013925731182098, 0.15904280543327332, 0.16794636845588684, 0.17684991657733917, 0.1857534646987915, 0.19465702772140503, 0.20356057584285736, 0.2124641239643097, 0.22136767208576202, 0.23027122020721436, 0.23917478322982788, 0.2480783313512802, 0.25698187947273254, 0.26588544249534607, 0.2747889757156372, 0.28369253873825073, 0.29259610176086426, 0.3014996349811554, 0.3104031980037689, 0.31930673122406006, 0.3282102942466736, 0.3371138572692871, 0.34601739048957825, 0.3549209535121918]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 8.0, 17.0, 17.0, 14.0, 24.0, 29.0, 37.0, 40.0, 46.0, 56.0, 72.0, 59.0, 43.0, 58.0, 54.0, 64.0, 60.0, 45.0, 44.0, 35.0, 28.0, 31.0, 25.0, 31.0, 19.0, 6.0, 8.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.025498926639556885, -0.02464284375309944, -0.023786762729287148, -0.022930681705474854, -0.02207459881901741, -0.021218515932559967, -0.020362434908747673, -0.01950635388493538, -0.018650270998477936, -0.017794188112020493, -0.0169381070882082, -0.016082026064395905, -0.015225943177938461, -0.014369861222803593, -0.013513779267668724, -0.012657697312533855, -0.011801615357398987, -0.010945533402264118, -0.01008945144712925, -0.009233369491994381, -0.008377287536859512, -0.007521205581724644, -0.006665123626589775, -0.0058090416714549065, -0.004952959716320038, -0.004096877761185169, -0.0032407958060503006, -0.002384713850915432, -0.0015286318957805634, -0.0006725499406456947, 0.0001835320144891739, 0.0010396139696240425, 0.0018956959247589111, 0.0027517778798937798, 0.0036078598350286484, 0.004463941790163517, 0.005320023745298386, 0.006176105700433254, 0.007032187655568123, 0.007888269610702991, 0.00874435156583786, 0.009600433520972729, 0.010456515476107597, 0.011312597431242466, 0.012168679386377335, 0.013024761341512203, 0.013880843296647072, 0.01473692525178194, 0.015593007206916809, 0.016449090093374252, 0.017305171117186546, 0.01816125214099884, 0.019017335027456284, 0.019873417913913727, 0.02072949893772602, 0.021585579961538315, 0.022441662847995758, 0.0232977457344532, 0.024153826758265495, 0.02500990778207779, 0.025865990668535233, 0.026722073554992676, 0.02757815457880497, 0.028434235602617264, 0.029290318489074707]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 4.0, 15.0, 18.0, 20.0, 25.0, 37.0, 52.0, 60.0, 98.0, 108.0, 180.0, 203.0, 284.0, 367.0, 553.0, 767.0, 1087.0, 1496.0, 2229.0, 3269.0, 5013.0, 8655.0, 16295.0, 54671.0, 839653.0, 70187.0, 17540.0, 9166.0, 5302.0, 3383.0, 2296.0, 1520.0, 1087.0, 749.0, 545.0, 411.0, 294.0, 231.0, 180.0, 129.0, 90.0, 60.0, 44.0, 45.0, 26.0, 19.0, 22.0, 15.0, 10.0, 11.0, 8.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.01184844970703125, -0.011460661888122559, -0.011072874069213867, -0.010685086250305176, -0.010297298431396484, -0.009909510612487793, -0.009521722793579102, -0.00913393497467041, -0.008746147155761719, -0.008358359336853027, -0.007970571517944336, -0.0075827836990356445, -0.007194995880126953, -0.006807208061218262, -0.00641942024230957, -0.006031632423400879, -0.0056438446044921875, -0.005256056785583496, -0.004868268966674805, -0.004480481147766113, -0.004092693328857422, -0.0037049055099487305, -0.003317117691040039, -0.0029293298721313477, -0.0025415420532226562, -0.002153754234313965, -0.0017659664154052734, -0.001378178596496582, -0.0009903907775878906, -0.0006026029586791992, -0.0002148151397705078, 0.0001729726791381836, 0.000560760498046875, 0.0009485483169555664, 0.0013363361358642578, 0.0017241239547729492, 0.0021119117736816406, 0.002499699592590332, 0.0028874874114990234, 0.003275275230407715, 0.0036630630493164062, 0.004050850868225098, 0.004438638687133789, 0.0048264265060424805, 0.005214214324951172, 0.005602002143859863, 0.005989789962768555, 0.006377577781677246, 0.0067653656005859375, 0.007153153419494629, 0.00754094123840332, 0.007928729057312012, 0.008316516876220703, 0.008704304695129395, 0.009092092514038086, 0.009479880332946777, 0.009867668151855469, 0.01025545597076416, 0.010643243789672852, 0.011031031608581543, 0.011418819427490234, 0.011806607246398926, 0.012194395065307617, 0.012582182884216309, 0.012969970703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 4.0, 4.0, 13.0, 8.0, 9.0, 8.0, 20.0, 57.0, 215.0, 331.0, 162.0, 49.0, 12.0, 12.0, 8.0, 11.0, 11.0, 6.0, 3.0, 3.0, 6.0, 4.0, 1.0, 3.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0087432861328125, -0.008449196815490723, -0.008155107498168945, -0.007861018180847168, -0.007566928863525391, -0.007272839546203613, -0.006978750228881836, -0.006684660911560059, -0.006390571594238281, -0.006096482276916504, -0.0058023929595947266, -0.005508303642272949, -0.005214214324951172, -0.0049201250076293945, -0.004626035690307617, -0.00433194637298584, -0.0040378570556640625, -0.003743767738342285, -0.003449678421020508, -0.0031555891036987305, -0.002861499786376953, -0.0025674104690551758, -0.0022733211517333984, -0.001979231834411621, -0.0016851425170898438, -0.0013910531997680664, -0.001096963882446289, -0.0008028745651245117, -0.0005087852478027344, -0.00021469593048095703, 7.939338684082031e-05, 0.00037348270416259766, 0.000667572021484375, 0.0009616613388061523, 0.0012557506561279297, 0.001549839973449707, 0.0018439292907714844, 0.0021380186080932617, 0.002432107925415039, 0.0027261972427368164, 0.0030202865600585938, 0.003314375877380371, 0.0036084651947021484, 0.0039025545120239258, 0.004196643829345703, 0.0044907331466674805, 0.004784822463989258, 0.005078911781311035, 0.0053730010986328125, 0.00566709041595459, 0.005961179733276367, 0.0062552690505981445, 0.006549358367919922, 0.006843447685241699, 0.0071375370025634766, 0.007431626319885254, 0.007725715637207031, 0.008019804954528809, 0.008313894271850586, 0.008607983589172363, 0.00890207290649414, 0.009196162223815918, 0.009490251541137695, 0.009784340858459473, 0.01007843017578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 6.0, 14.0, 9.0, 10.0, 16.0, 22.0, 31.0, 36.0, 49.0, 50.0, 58.0, 73.0, 78.0, 116.0, 164.0, 213.0, 343.0, 583.0, 1034.0, 2825.0, 31626.0, 967953.0, 37388.0, 2842.0, 1105.0, 579.0, 315.0, 236.0, 167.0, 136.0, 100.0, 70.0, 55.0, 42.0, 42.0, 35.0, 23.0, 20.0, 17.0, 16.0, 9.0, 8.0, 4.0, 2.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0408935546875, -0.03950834274291992, -0.038123130798339844, -0.036737918853759766, -0.03535270690917969, -0.03396749496459961, -0.03258228302001953, -0.031197071075439453, -0.029811859130859375, -0.028426647186279297, -0.02704143524169922, -0.02565622329711914, -0.024271011352539062, -0.022885799407958984, -0.021500587463378906, -0.020115375518798828, -0.01873016357421875, -0.017344951629638672, -0.015959739685058594, -0.014574527740478516, -0.013189315795898438, -0.01180410385131836, -0.010418891906738281, -0.009033679962158203, -0.007648468017578125, -0.006263256072998047, -0.004878044128417969, -0.0034928321838378906, -0.0021076202392578125, -0.0007224082946777344, 0.0006628036499023438, 0.002048015594482422, 0.0034332275390625, 0.004818439483642578, 0.006203651428222656, 0.007588863372802734, 0.008974075317382812, 0.01035928726196289, 0.011744499206542969, 0.013129711151123047, 0.014514923095703125, 0.015900135040283203, 0.01728534698486328, 0.01867055892944336, 0.020055770874023438, 0.021440982818603516, 0.022826194763183594, 0.024211406707763672, 0.02559661865234375, 0.026981830596923828, 0.028367042541503906, 0.029752254486083984, 0.031137466430664062, 0.03252267837524414, 0.03390789031982422, 0.0352931022644043, 0.036678314208984375, 0.03806352615356445, 0.03944873809814453, 0.04083395004272461, 0.04221916198730469, 0.043604373931884766, 0.044989585876464844, 0.04637479782104492, 0.047760009765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 9.0, 14.0, 21.0, 20.0, 20.0, 31.0, 26.0, 29.0, 28.0, 36.0, 32.0, 35.0, 46.0, 26.0, 48.0, 55.0, 32.0, 43.0, 31.0, 35.0, 41.0, 39.0, 32.0, 31.0, 30.0, 28.0, 22.0, 10.0, 13.0, 16.0, 18.0, 14.0, 9.0, 12.0, 11.0, 6.0, 4.0, 4.0, 2.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0235137939453125, -0.022716522216796875, -0.02191925048828125, -0.021121978759765625, -0.02032470703125, -0.019527435302734375, -0.01873016357421875, -0.017932891845703125, -0.0171356201171875, -0.016338348388671875, -0.01554107666015625, -0.014743804931640625, -0.013946533203125, -0.013149261474609375, -0.01235198974609375, -0.011554718017578125, -0.0107574462890625, -0.009960174560546875, -0.00916290283203125, -0.008365631103515625, -0.007568359375, -0.006771087646484375, -0.00597381591796875, -0.005176544189453125, -0.0043792724609375, -0.003582000732421875, -0.00278472900390625, -0.001987457275390625, -0.001190185546875, -0.000392913818359375, 0.00040435791015625, 0.001201629638671875, 0.0019989013671875, 0.002796173095703125, 0.00359344482421875, 0.004390716552734375, 0.00518798828125, 0.005985260009765625, 0.00678253173828125, 0.007579803466796875, 0.0083770751953125, 0.009174346923828125, 0.00997161865234375, 0.010768890380859375, 0.011566162109375, 0.012363433837890625, 0.01316070556640625, 0.013957977294921875, 0.0147552490234375, 0.015552520751953125, 0.01634979248046875, 0.017147064208984375, 0.0179443359375, 0.018741607666015625, 0.01953887939453125, 0.020336151123046875, 0.0211334228515625, 0.021930694580078125, 0.02272796630859375, 0.023525238037109375, 0.024322509765625, 0.025119781494140625, 0.02591705322265625, 0.026714324951171875, 0.0275115966796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 7.0, 10.0, 14.0, 15.0, 24.0, 32.0, 58.0, 82.0, 125.0, 248.0, 524.0, 1407.0, 7119.0, 875579.0, 157216.0, 4158.0, 1008.0, 386.0, 179.0, 111.0, 68.0, 36.0, 34.0, 22.0, 10.0, 16.0, 6.0, 8.0, 8.0, 8.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.445148468017578e-05, -3.311969339847565e-05, -3.178790211677551e-05, -3.045611083507538e-05, -2.9124319553375244e-05, -2.779252827167511e-05, -2.6460736989974976e-05, -2.512894570827484e-05, -2.3797154426574707e-05, -2.2465363144874573e-05, -2.113357186317444e-05, -1.9801780581474304e-05, -1.846998929977417e-05, -1.7138198018074036e-05, -1.58064067363739e-05, -1.4474615454673767e-05, -1.3142824172973633e-05, -1.1811032891273499e-05, -1.0479241609573364e-05, -9.14745032787323e-06, -7.815659046173096e-06, -6.4838677644729614e-06, -5.152076482772827e-06, -3.820285201072693e-06, -2.4884939193725586e-06, -1.1567026376724243e-06, 1.7508864402770996e-07, 1.5068799257278442e-06, 2.8386712074279785e-06, 4.170462489128113e-06, 5.502253770828247e-06, 6.834045052528381e-06, 8.165836334228516e-06, 9.49762761592865e-06, 1.0829418897628784e-05, 1.2161210179328918e-05, 1.3493001461029053e-05, 1.4824792742729187e-05, 1.615658402442932e-05, 1.7488375306129456e-05, 1.882016658782959e-05, 2.0151957869529724e-05, 2.148374915122986e-05, 2.2815540432929993e-05, 2.4147331714630127e-05, 2.547912299633026e-05, 2.6810914278030396e-05, 2.814270555973053e-05, 2.9474496841430664e-05, 3.08062881231308e-05, 3.213807940483093e-05, 3.346987068653107e-05, 3.48016619682312e-05, 3.6133453249931335e-05, 3.746524453163147e-05, 3.8797035813331604e-05, 4.012882709503174e-05, 4.146061837673187e-05, 4.279240965843201e-05, 4.412420094013214e-05, 4.5455992221832275e-05, 4.678778350353241e-05, 4.8119574785232544e-05, 4.945136606693268e-05, 5.078315734863281e-05]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 6.0, 12.0, 6.0, 17.0, 8.0, 17.0, 33.0, 22.0, 39.0, 25.0, 74.0, 67.0, 63.0, 88.0, 73.0, 93.0, 58.0, 43.0, 52.0, 19.0, 52.0, 19.0, 19.0, 18.0, 11.0, 13.0, 13.0, 9.0, 7.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.602836608886719e-06, -5.448237061500549e-06, -5.29363751411438e-06, -5.1390379667282104e-06, -4.984438419342041e-06, -4.829838871955872e-06, -4.675239324569702e-06, -4.520639777183533e-06, -4.366040229797363e-06, -4.211440682411194e-06, -4.056841135025024e-06, -3.902241587638855e-06, -3.7476420402526855e-06, -3.593042492866516e-06, -3.4384429454803467e-06, -3.2838433980941772e-06, -3.129243850708008e-06, -2.9746443033218384e-06, -2.820044755935669e-06, -2.6654452085494995e-06, -2.51084566116333e-06, -2.3562461137771606e-06, -2.201646566390991e-06, -2.0470470190048218e-06, -1.8924474716186523e-06, -1.737847924232483e-06, -1.5832483768463135e-06, -1.428648829460144e-06, -1.2740492820739746e-06, -1.1194497346878052e-06, -9.648501873016357e-07, -8.102506399154663e-07, -6.556510925292969e-07, -5.010515451431274e-07, -3.46451997756958e-07, -1.9185245037078857e-07, -3.725290298461914e-08, 1.1734664440155029e-07, 2.7194619178771973e-07, 4.2654573917388916e-07, 5.811452865600586e-07, 7.35744833946228e-07, 8.903443813323975e-07, 1.044943928718567e-06, 1.1995434761047363e-06, 1.3541430234909058e-06, 1.5087425708770752e-06, 1.6633421182632446e-06, 1.817941665649414e-06, 1.9725412130355835e-06, 2.127140760421753e-06, 2.2817403078079224e-06, 2.436339855194092e-06, 2.5909394025802612e-06, 2.7455389499664307e-06, 2.9001384973526e-06, 3.0547380447387695e-06, 3.209337592124939e-06, 3.3639371395111084e-06, 3.518536686897278e-06, 3.6731362342834473e-06, 3.827735781669617e-06, 3.982335329055786e-06, 4.1369348764419556e-06, 4.291534423828125e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 10.0, 8.0, 8.0, 22.0, 27.0, 36.0, 89.0, 121.0, 229.0, 711.0, 4777.0, 1033941.0, 7206.0, 748.0, 266.0, 141.0, 79.0, 41.0, 29.0, 18.0, 10.0, 12.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16908073425293e-05, -5.960371345281601e-05, -5.751661956310272e-05, -5.5429525673389435e-05, -5.334243178367615e-05, -5.125533789396286e-05, -4.916824400424957e-05, -4.7081150114536285e-05, -4.4994056224823e-05, -4.290696233510971e-05, -4.081986844539642e-05, -3.8732774555683136e-05, -3.664568066596985e-05, -3.455858677625656e-05, -3.2471492886543274e-05, -3.0384398996829987e-05, -2.82973051071167e-05, -2.6210211217403412e-05, -2.4123117327690125e-05, -2.2036023437976837e-05, -1.994892954826355e-05, -1.7861835658550262e-05, -1.5774741768836975e-05, -1.3687647879123688e-05, -1.16005539894104e-05, -9.513460099697113e-06, -7.426366209983826e-06, -5.339272320270538e-06, -3.252178430557251e-06, -1.1650845408439636e-06, 9.220093488693237e-07, 3.009103238582611e-06, 5.0961971282958984e-06, 7.183291018009186e-06, 9.270384907722473e-06, 1.135747879743576e-05, 1.3444572687149048e-05, 1.5531666576862335e-05, 1.7618760466575623e-05, 1.970585435628891e-05, 2.1792948246002197e-05, 2.3880042135715485e-05, 2.5967136025428772e-05, 2.805422991514206e-05, 3.0141323804855347e-05, 3.2228417694568634e-05, 3.431551158428192e-05, 3.640260547399521e-05, 3.8489699363708496e-05, 4.0576793253421783e-05, 4.266388714313507e-05, 4.475098103284836e-05, 4.6838074922561646e-05, 4.892516881227493e-05, 5.101226270198822e-05, 5.309935659170151e-05, 5.5186450481414795e-05, 5.727354437112808e-05, 5.936063826084137e-05, 6.144773215055466e-05, 6.353482604026794e-05, 6.562191992998123e-05, 6.770901381969452e-05, 6.97961077094078e-05, 7.18832015991211e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 8.0, 26.0, 26.0, 20.0, 44.0, 78.0, 118.0, 207.0, 153.0, 102.0, 58.0, 39.0, 37.0, 20.0, 12.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.759695053100586e-05, -2.6520341634750366e-05, -2.5443732738494873e-05, -2.436712384223938e-05, -2.3290514945983887e-05, -2.2213906049728394e-05, -2.11372971534729e-05, -2.0060688257217407e-05, -1.8984079360961914e-05, -1.790747046470642e-05, -1.6830861568450928e-05, -1.5754252672195435e-05, -1.4677643775939941e-05, -1.3601034879684448e-05, -1.2524425983428955e-05, -1.1447817087173462e-05, -1.0371208190917969e-05, -9.294599294662476e-06, -8.217990398406982e-06, -7.141381502151489e-06, -6.064772605895996e-06, -4.988163709640503e-06, -3.91155481338501e-06, -2.8349459171295166e-06, -1.7583370208740234e-06, -6.817281246185303e-07, 3.948807716369629e-07, 1.471489667892456e-06, 2.5480985641479492e-06, 3.6247074604034424e-06, 4.7013163566589355e-06, 5.777925252914429e-06, 6.854534149169922e-06, 7.931143045425415e-06, 9.007751941680908e-06, 1.0084360837936401e-05, 1.1160969734191895e-05, 1.2237578630447388e-05, 1.3314187526702881e-05, 1.4390796422958374e-05, 1.5467405319213867e-05, 1.654401421546936e-05, 1.7620623111724854e-05, 1.8697232007980347e-05, 1.977384090423584e-05, 2.0850449800491333e-05, 2.1927058696746826e-05, 2.300366759300232e-05, 2.4080276489257812e-05, 2.5156885385513306e-05, 2.62334942817688e-05, 2.7310103178024292e-05, 2.8386712074279785e-05, 2.946332097053528e-05, 3.053992986679077e-05, 3.1616538763046265e-05, 3.269314765930176e-05, 3.376975655555725e-05, 3.4846365451812744e-05, 3.592297434806824e-05, 3.699958324432373e-05, 3.8076192140579224e-05, 3.915280103683472e-05, 4.022940993309021e-05, 4.13060188293457e-05]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 23.0, 79.0, 574.0, 241.0, 59.0, 17.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12260283529758453, -0.11834025382995605, -0.11407766491174698, -0.1098150759935379, -0.10555249452590942, -0.10128991305828094, -0.09702732414007187, -0.09276473522186279, -0.08850215375423431, -0.08423957228660583, -0.07997698336839676, -0.07571439445018768, -0.0714518129825592, -0.06718923151493073, -0.06292664259672165, -0.05866405740380287, -0.054401472210884094, -0.05013888701796532, -0.04587630182504654, -0.04161371663212776, -0.037351131439208984, -0.03308854624629021, -0.02882596105337143, -0.024563375860452652, -0.020300790667533875, -0.016038205474615097, -0.01177562028169632, -0.007513035088777542, -0.0032504498958587646, 0.0010121352970600128, 0.00527472048997879, 0.009537305682897568, 0.013799875974655151, 0.01806246116757393, 0.022325046360492706, 0.026587631553411484, 0.03085021674633026, 0.03511280193924904, 0.039375387132167816, 0.043637972325086594, 0.04790055751800537, 0.05216314271092415, 0.056425727903842926, 0.060688313096761703, 0.06495089828968048, 0.06921347975730896, 0.07347606867551804, 0.07773865759372711, 0.08200123906135559, 0.08626382052898407, 0.09052640944719315, 0.09478899836540222, 0.0990515798330307, 0.10331416130065918, 0.10757675021886826, 0.11183933913707733, 0.11610192060470581, 0.12036450207233429, 0.12462709099054337, 0.12888967990875244, 0.13315226137638092, 0.1374148428440094, 0.14167743921279907, 0.14594002068042755, 0.15020260214805603]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 10.0, 14.0, 17.0, 13.0, 21.0, 35.0, 36.0, 57.0, 58.0, 76.0, 86.0, 85.0, 80.0, 101.0, 47.0, 53.0, 49.0, 39.0, 31.0, 24.0, 17.0, 19.0, 10.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3054198622703552, -0.2963999807834625, -0.28738006949424744, -0.27836018800735474, -0.26934030652046204, -0.26032042503356934, -0.25130051374435425, -0.24228063225746155, -0.23326073586940765, -0.22424083948135376, -0.21522095799446106, -0.20620106160640717, -0.19718116521835327, -0.18816128373146057, -0.17914138734340668, -0.17012149095535278, -0.16110160946846008, -0.1520817130804062, -0.1430618315935135, -0.1340419352054596, -0.1250220537185669, -0.116002157330513, -0.1069822609424591, -0.09796237200498581, -0.08894248306751251, -0.07992259413003922, -0.07090270519256592, -0.061882808804512024, -0.05286291986703873, -0.04384303092956543, -0.034823138266801834, -0.02580324560403824, -0.01678335666656494, -0.007763465866446495, 0.0012564249336719513, 0.010276315733790398, 0.019296206533908844, 0.02831609547138214, 0.03733598813414574, 0.04635588079690933, 0.05537576973438263, 0.06439565867185593, 0.07341554760932922, 0.08243544399738312, 0.09145533293485641, 0.10047522187232971, 0.1094951182603836, 0.1185150071978569, 0.1275348961353302, 0.1365547925233841, 0.1455746740102768, 0.1545945703983307, 0.1636144518852234, 0.17263434827327728, 0.18165424466133118, 0.19067412614822388, 0.19969402253627777, 0.20871391892433167, 0.21773380041122437, 0.22675369679927826, 0.23577359318733215, 0.24479347467422485, 0.25381335616111755, 0.26283326745033264, 0.27185314893722534]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 12.0, 7.0, 12.0, 23.0, 27.0, 31.0, 41.0, 70.0, 93.0, 131.0, 203.0, 371.0, 1133.0, 18583.0, 3843278.0, 320433.0, 7921.0, 607.0, 381.0, 248.0, 176.0, 122.0, 83.0, 70.0, 50.0, 41.0, 29.0, 19.0, 18.0, 9.0, 11.0, 10.0, 10.0, 4.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211639404296875, -0.020406246185302734, -0.01964855194091797, -0.018890857696533203, -0.018133163452148438, -0.017375469207763672, -0.016617774963378906, -0.01586008071899414, -0.015102386474609375, -0.01434469223022461, -0.013586997985839844, -0.012829303741455078, -0.012071609497070312, -0.011313915252685547, -0.010556221008300781, -0.009798526763916016, -0.00904083251953125, -0.008283138275146484, -0.007525444030761719, -0.006767749786376953, -0.0060100555419921875, -0.005252361297607422, -0.004494667053222656, -0.0037369728088378906, -0.002979278564453125, -0.0022215843200683594, -0.0014638900756835938, -0.0007061958312988281, 5.14984130859375e-05, 0.0008091926574707031, 0.0015668869018554688, 0.0023245811462402344, 0.003082275390625, 0.0038399696350097656, 0.004597663879394531, 0.005355358123779297, 0.0061130523681640625, 0.006870746612548828, 0.007628440856933594, 0.00838613510131836, 0.009143829345703125, 0.00990152359008789, 0.010659217834472656, 0.011416912078857422, 0.012174606323242188, 0.012932300567626953, 0.013689994812011719, 0.014447689056396484, 0.01520538330078125, 0.015963077545166016, 0.01672077178955078, 0.017478466033935547, 0.018236160278320312, 0.018993854522705078, 0.019751548767089844, 0.02050924301147461, 0.021266937255859375, 0.02202463150024414, 0.022782325744628906, 0.023540019989013672, 0.024297714233398438, 0.025055408477783203, 0.02581310272216797, 0.026570796966552734, 0.0273284912109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 5.0, 2.0, 6.0, 11.0, 11.0, 7.0, 5.0, 17.0, 51.0, 147.0, 307.0, 216.0, 90.0, 20.0, 7.0, 10.0, 10.0, 8.0, 10.0, 5.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00777435302734375, -0.007497429847717285, -0.00722050666809082, -0.0069435834884643555, -0.006666660308837891, -0.006389737129211426, -0.006112813949584961, -0.005835890769958496, -0.005558967590332031, -0.005282044410705566, -0.0050051212310791016, -0.004728198051452637, -0.004451274871826172, -0.004174351692199707, -0.003897428512573242, -0.0036205053329467773, -0.0033435821533203125, -0.0030666589736938477, -0.002789735794067383, -0.002512812614440918, -0.002235889434814453, -0.0019589662551879883, -0.0016820430755615234, -0.0014051198959350586, -0.0011281967163085938, -0.0008512735366821289, -0.0005743503570556641, -0.0002974271774291992, -2.0503997802734375e-05, 0.00025641918182373047, 0.0005333423614501953, 0.0008102655410766602, 0.001087188720703125, 0.0013641119003295898, 0.0016410350799560547, 0.0019179582595825195, 0.0021948814392089844, 0.0024718046188354492, 0.002748727798461914, 0.003025650978088379, 0.0033025741577148438, 0.0035794973373413086, 0.0038564205169677734, 0.004133343696594238, 0.004410266876220703, 0.004687190055847168, 0.004964113235473633, 0.005241036415100098, 0.0055179595947265625, 0.005794882774353027, 0.006071805953979492, 0.006348729133605957, 0.006625652313232422, 0.006902575492858887, 0.0071794986724853516, 0.007456421852111816, 0.007733345031738281, 0.008010268211364746, 0.008287191390991211, 0.008564114570617676, 0.00884103775024414, 0.009117960929870605, 0.00939488410949707, 0.009671807289123535, 0.00994873046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 12.0, 15.0, 31.0, 29.0, 75.0, 150.0, 411.0, 1848.0, 37173.0, 4148994.0, 4413.0, 662.0, 188.0, 102.0, 38.0, 35.0, 17.0, 11.0, 4.0, 10.0, 12.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043914794921875, -0.04246091842651367, -0.041007041931152344, -0.039553165435791016, -0.03809928894042969, -0.03664541244506836, -0.03519153594970703, -0.0337376594543457, -0.032283782958984375, -0.030829906463623047, -0.02937602996826172, -0.02792215347290039, -0.026468276977539062, -0.025014400482177734, -0.023560523986816406, -0.022106647491455078, -0.02065277099609375, -0.019198894500732422, -0.017745018005371094, -0.016291141510009766, -0.014837265014648438, -0.01338338851928711, -0.011929512023925781, -0.010475635528564453, -0.009021759033203125, -0.007567882537841797, -0.006114006042480469, -0.004660129547119141, -0.0032062530517578125, -0.0017523765563964844, -0.00029850006103515625, 0.0011553764343261719, 0.0026092529296875, 0.004063129425048828, 0.005517005920410156, 0.006970882415771484, 0.008424758911132812, 0.00987863540649414, 0.011332511901855469, 0.012786388397216797, 0.014240264892578125, 0.015694141387939453, 0.01714801788330078, 0.01860189437866211, 0.020055770874023438, 0.021509647369384766, 0.022963523864746094, 0.024417400360107422, 0.02587127685546875, 0.027325153350830078, 0.028779029846191406, 0.030232906341552734, 0.03168678283691406, 0.03314065933227539, 0.03459453582763672, 0.03604841232299805, 0.037502288818359375, 0.0389561653137207, 0.04041004180908203, 0.04186391830444336, 0.04331779479980469, 0.044771671295166016, 0.046225547790527344, 0.04767942428588867, 0.04913330078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 21.0, 49.0, 101.0, 293.0, 1532.0, 1495.0, 319.0, 115.0, 61.0, 21.0, 11.0, 7.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.016082763671875, -0.015659451484680176, -0.015236139297485352, -0.014812827110290527, -0.014389514923095703, -0.013966202735900879, -0.013542890548706055, -0.01311957836151123, -0.012696266174316406, -0.012272953987121582, -0.011849641799926758, -0.011426329612731934, -0.01100301742553711, -0.010579705238342285, -0.010156393051147461, -0.009733080863952637, -0.009309768676757812, -0.008886456489562988, -0.008463144302368164, -0.00803983211517334, -0.007616519927978516, -0.007193207740783691, -0.006769895553588867, -0.006346583366394043, -0.005923271179199219, -0.0054999589920043945, -0.00507664680480957, -0.004653334617614746, -0.004230022430419922, -0.0038067102432250977, -0.0033833980560302734, -0.0029600858688354492, -0.002536773681640625, -0.0021134614944458008, -0.0016901493072509766, -0.0012668371200561523, -0.0008435249328613281, -0.0004202127456665039, 3.0994415283203125e-06, 0.00042641162872314453, 0.0008497238159179688, 0.001273036003112793, 0.0016963481903076172, 0.0021196603775024414, 0.0025429725646972656, 0.00296628475189209, 0.003389596939086914, 0.0038129091262817383, 0.0042362213134765625, 0.004659533500671387, 0.005082845687866211, 0.005506157875061035, 0.005929470062255859, 0.006352782249450684, 0.006776094436645508, 0.007199406623840332, 0.007622718811035156, 0.00804603099822998, 0.008469343185424805, 0.008892655372619629, 0.009315967559814453, 0.009739279747009277, 0.010162591934204102, 0.010585904121398926, 0.01100921630859375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 970.0, 34.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15761198103427887, -0.153827503323555, -0.15004302561283112, -0.14625854790210724, -0.14247405529022217, -0.1386895775794983, -0.13490509986877441, -0.13112062215805054, -0.12733614444732666, -0.12355166673660278, -0.1197671890258789, -0.11598270386457443, -0.11219822615385056, -0.10841374844312668, -0.1046292632818222, -0.10084478557109833, -0.09706030786037445, -0.09327583014965057, -0.0894913524389267, -0.08570686727762222, -0.08192238956689835, -0.07813791185617447, -0.07435342669487, -0.07056894898414612, -0.06678447127342224, -0.06299999356269836, -0.05921551212668419, -0.05543103069067001, -0.051646552979946136, -0.04786207526922226, -0.044077593833208084, -0.04029311239719391, -0.03650863468647003, -0.032724156975746155, -0.02893967553973198, -0.025155195966362953, -0.021370716392993927, -0.0175862368196249, -0.013801757246255875, -0.010017277672886848, -0.006232798099517822, -0.002448318526148796, 0.00133616104722023, 0.005120640620589256, 0.008905120193958282, 0.012689599767327309, 0.016474079340696335, 0.02025855891406536, 0.024043038487434387, 0.027827518060803413, 0.03161199763417244, 0.035396479070186615, 0.03918095678091049, 0.04296543449163437, 0.046749915927648544, 0.05053439736366272, 0.0543188750743866, 0.058103352785110474, 0.06188783422112465, 0.06567231565713882, 0.0694567933678627, 0.07324127107858658, 0.07702575623989105, 0.08081023395061493, 0.0845947116613388]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 10.0, 12.0, 20.0, 20.0, 23.0, 30.0, 40.0, 51.0, 43.0, 48.0, 57.0, 41.0, 61.0, 56.0, 45.0, 39.0, 41.0, 46.0, 33.0, 44.0, 27.0, 23.0, 28.0, 33.0, 22.0, 17.0, 12.0, 12.0, 10.0, 9.0, 11.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.03274601697921753, -0.03188027814030647, -0.031014541164040565, -0.030148804187774658, -0.0292830653488636, -0.028417326509952545, -0.027551589533686638, -0.02668585255742073, -0.025820113718509674, -0.024954374879598618, -0.02408863790333271, -0.023222900927066803, -0.022357162088155746, -0.02149142324924469, -0.020625686272978783, -0.019759949296712875, -0.01889421045780182, -0.018028471618890762, -0.017162734642624855, -0.016296997666358948, -0.015431258827447891, -0.01456552091985941, -0.013699783012270927, -0.012834045104682446, -0.011968307197093964, -0.011102569289505482, -0.010236831381917, -0.009371093474328518, -0.008505355566740036, -0.007639617659151554, -0.006773879751563072, -0.00590814184397459, -0.005042403936386108, -0.0041766660287976265, -0.0033109281212091446, -0.0024451902136206627, -0.0015794523060321808, -0.0007137143984436989, 0.00015202350914478302, 0.001017761416733265, 0.0018834993243217468, 0.0027492372319102287, 0.0036149751394987106, 0.0044807130470871925, 0.0053464509546756744, 0.006212188862264156, 0.007077926769852638, 0.00794366467744112, 0.008809402585029602, 0.009675140492618084, 0.010540878400206566, 0.011406616307795048, 0.01227235421538353, 0.013138092122972012, 0.014003830030560493, 0.014869567938148975, 0.015735305845737457, 0.016601044684648514, 0.01746678166091442, 0.01833251863718033, 0.019198257476091385, 0.02006399631500244, 0.02092973329126835, 0.021795470267534256, 0.022661209106445312]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 5.0, 9.0, 10.0, 11.0, 21.0, 19.0, 34.0, 42.0, 70.0, 100.0, 129.0, 173.0, 232.0, 356.0, 519.0, 810.0, 1174.0, 1791.0, 2821.0, 4616.0, 8240.0, 17087.0, 68515.0, 858691.0, 48504.0, 14967.0, 7562.0, 4177.0, 2668.0, 1672.0, 1153.0, 743.0, 491.0, 344.0, 245.0, 143.0, 125.0, 81.0, 55.0, 40.0, 28.0, 24.0, 11.0, 5.0, 12.0, 5.0, 8.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.01500701904296875, -0.014571070671081543, -0.014135122299194336, -0.013699173927307129, -0.013263225555419922, -0.012827277183532715, -0.012391328811645508, -0.0119553804397583, -0.011519432067871094, -0.011083483695983887, -0.01064753532409668, -0.010211586952209473, -0.009775638580322266, -0.009339690208435059, -0.008903741836547852, -0.008467793464660645, -0.008031845092773438, -0.0075958967208862305, -0.0071599483489990234, -0.006723999977111816, -0.006288051605224609, -0.005852103233337402, -0.005416154861450195, -0.004980206489562988, -0.004544258117675781, -0.004108309745788574, -0.003672361373901367, -0.00323641300201416, -0.002800464630126953, -0.002364516258239746, -0.001928567886352539, -0.001492619514465332, -0.001056671142578125, -0.000620722770690918, -0.00018477439880371094, 0.0002511739730834961, 0.0006871223449707031, 0.0011230707168579102, 0.0015590190887451172, 0.0019949674606323242, 0.0024309158325195312, 0.0028668642044067383, 0.0033028125762939453, 0.0037387609481811523, 0.004174709320068359, 0.004610657691955566, 0.0050466060638427734, 0.0054825544357299805, 0.0059185028076171875, 0.0063544511795043945, 0.0067903995513916016, 0.007226347923278809, 0.007662296295166016, 0.008098244667053223, 0.00853419303894043, 0.008970141410827637, 0.009406089782714844, 0.00984203815460205, 0.010277986526489258, 0.010713934898376465, 0.011149883270263672, 0.011585831642150879, 0.012021780014038086, 0.012457728385925293, 0.0128936767578125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 6.0, 1.0, 4.0, 13.0, 11.0, 8.0, 4.0, 16.0, 48.0, 146.0, 309.0, 219.0, 85.0, 25.0, 6.0, 10.0, 11.0, 8.0, 9.0, 6.0, 2.0, 4.0, 5.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0077667236328125, -0.0074901580810546875, -0.007213592529296875, -0.0069370269775390625, -0.00666046142578125, -0.0063838958740234375, -0.006107330322265625, -0.0058307647705078125, -0.00555419921875, -0.0052776336669921875, -0.005001068115234375, -0.0047245025634765625, -0.00444793701171875, -0.0041713714599609375, -0.003894805908203125, -0.0036182403564453125, -0.0033416748046875, -0.0030651092529296875, -0.002788543701171875, -0.0025119781494140625, -0.00223541259765625, -0.0019588470458984375, -0.001682281494140625, -0.0014057159423828125, -0.001129150390625, -0.0008525848388671875, -0.000576019287109375, -0.0002994537353515625, -2.288818359375e-05, 0.0002536773681640625, 0.000530242919921875, 0.0008068084716796875, 0.0010833740234375, 0.0013599395751953125, 0.001636505126953125, 0.0019130706787109375, 0.00218963623046875, 0.0024662017822265625, 0.002742767333984375, 0.0030193328857421875, 0.0032958984375, 0.0035724639892578125, 0.003849029541015625, 0.0041255950927734375, 0.00440216064453125, 0.0046787261962890625, 0.004955291748046875, 0.0052318572998046875, 0.0055084228515625, 0.0057849884033203125, 0.006061553955078125, 0.0063381195068359375, 0.00661468505859375, 0.0068912506103515625, 0.007167816162109375, 0.0074443817138671875, 0.007720947265625, 0.007997512817382812, 0.008274078369140625, 0.008550643920898438, 0.00882720947265625, 0.009103775024414062, 0.009380340576171875, 0.009656906127929688, 0.0099334716796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 5.0, 11.0, 14.0, 14.0, 14.0, 19.0, 28.0, 31.0, 37.0, 46.0, 63.0, 67.0, 66.0, 118.0, 142.0, 191.0, 250.0, 437.0, 661.0, 1510.0, 8531.0, 821542.0, 206649.0, 4836.0, 1209.0, 634.0, 348.0, 260.0, 162.0, 116.0, 96.0, 100.0, 56.0, 34.0, 43.0, 37.0, 28.0, 36.0, 22.0, 16.0, 20.0, 10.0, 4.0, 7.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.03973388671875, -0.03852558135986328, -0.03731727600097656, -0.036108970642089844, -0.034900665283203125, -0.033692359924316406, -0.03248405456542969, -0.03127574920654297, -0.03006744384765625, -0.02885913848876953, -0.027650833129882812, -0.026442527770996094, -0.025234222412109375, -0.024025917053222656, -0.022817611694335938, -0.02160930633544922, -0.0204010009765625, -0.01919269561767578, -0.017984390258789062, -0.016776084899902344, -0.015567779541015625, -0.014359474182128906, -0.013151168823242188, -0.011942863464355469, -0.01073455810546875, -0.009526252746582031, -0.008317947387695312, -0.007109642028808594, -0.005901336669921875, -0.004693031311035156, -0.0034847259521484375, -0.0022764205932617188, -0.001068115234375, 0.00014019012451171875, 0.0013484954833984375, 0.0025568008422851562, 0.003765106201171875, 0.004973411560058594, 0.0061817169189453125, 0.007390022277832031, 0.00859832763671875, 0.009806632995605469, 0.011014938354492188, 0.012223243713378906, 0.013431549072265625, 0.014639854431152344, 0.015848159790039062, 0.01705646514892578, 0.0182647705078125, 0.01947307586669922, 0.020681381225585938, 0.021889686584472656, 0.023097991943359375, 0.024306297302246094, 0.025514602661132812, 0.02672290802001953, 0.02793121337890625, 0.02913951873779297, 0.030347824096679688, 0.031556129455566406, 0.032764434814453125, 0.033972740173339844, 0.03518104553222656, 0.03638935089111328, 0.03759765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 9.0, 7.0, 10.0, 13.0, 14.0, 12.0, 21.0, 28.0, 21.0, 23.0, 24.0, 33.0, 33.0, 27.0, 52.0, 39.0, 30.0, 45.0, 38.0, 32.0, 32.0, 33.0, 32.0, 31.0, 24.0, 33.0, 30.0, 33.0, 36.0, 26.0, 10.0, 28.0, 20.0, 14.0, 20.0, 13.0, 11.0, 13.0, 7.0, 4.0, 5.0, 4.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0235443115234375, -0.02282881736755371, -0.022113323211669922, -0.021397829055786133, -0.020682334899902344, -0.019966840744018555, -0.019251346588134766, -0.018535852432250977, -0.017820358276367188, -0.0171048641204834, -0.01638936996459961, -0.01567387580871582, -0.014958381652832031, -0.014242887496948242, -0.013527393341064453, -0.012811899185180664, -0.012096405029296875, -0.011380910873413086, -0.010665416717529297, -0.009949922561645508, -0.009234428405761719, -0.00851893424987793, -0.007803440093994141, -0.0070879459381103516, -0.0063724517822265625, -0.0056569576263427734, -0.004941463470458984, -0.004225969314575195, -0.0035104751586914062, -0.002794981002807617, -0.002079486846923828, -0.001363992691040039, -0.00064849853515625, 6.699562072753906e-05, 0.0007824897766113281, 0.0014979839324951172, 0.0022134780883789062, 0.0029289722442626953, 0.0036444664001464844, 0.0043599605560302734, 0.0050754547119140625, 0.0057909488677978516, 0.006506443023681641, 0.00722193717956543, 0.007937431335449219, 0.008652925491333008, 0.009368419647216797, 0.010083913803100586, 0.010799407958984375, 0.011514902114868164, 0.012230396270751953, 0.012945890426635742, 0.013661384582519531, 0.01437687873840332, 0.01509237289428711, 0.0158078670501709, 0.016523361206054688, 0.017238855361938477, 0.017954349517822266, 0.018669843673706055, 0.019385337829589844, 0.020100831985473633, 0.020816326141357422, 0.02153182029724121, 0.022247314453125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 8.0, 15.0, 15.0, 23.0, 28.0, 45.0, 57.0, 91.0, 179.0, 306.0, 711.0, 2035.0, 9988.0, 169467.0, 844383.0, 16650.0, 2806.0, 839.0, 348.0, 238.0, 120.0, 69.0, 41.0, 30.0, 22.0, 5.0, 9.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-05, -1.5014782547950745e-05, -1.4532357454299927e-05, -1.4049932360649109e-05, -1.3567507266998291e-05, -1.3085082173347473e-05, -1.2602657079696655e-05, -1.2120231986045837e-05, -1.163780689239502e-05, -1.1155381798744202e-05, -1.0672956705093384e-05, -1.0190531611442566e-05, -9.708106517791748e-06, -9.22568142414093e-06, -8.743256330490112e-06, -8.260831236839294e-06, -7.778406143188477e-06, -7.295981049537659e-06, -6.813555955886841e-06, -6.331130862236023e-06, -5.848705768585205e-06, -5.366280674934387e-06, -4.883855581283569e-06, -4.4014304876327515e-06, -3.919005393981934e-06, -3.4365803003311157e-06, -2.954155206680298e-06, -2.47173011302948e-06, -1.989305019378662e-06, -1.5068799257278442e-06, -1.0244548320770264e-06, -5.420297384262085e-07, -5.960464477539063e-08, 4.2282044887542725e-07, 9.052455425262451e-07, 1.387670636177063e-06, 1.8700957298278809e-06, 2.3525208234786987e-06, 2.8349459171295166e-06, 3.3173710107803345e-06, 3.7997961044311523e-06, 4.28222119808197e-06, 4.764646291732788e-06, 5.247071385383606e-06, 5.729496479034424e-06, 6.211921572685242e-06, 6.6943466663360596e-06, 7.1767717599868774e-06, 7.659196853637695e-06, 8.141621947288513e-06, 8.624047040939331e-06, 9.106472134590149e-06, 9.588897228240967e-06, 1.0071322321891785e-05, 1.0553747415542603e-05, 1.103617250919342e-05, 1.1518597602844238e-05, 1.2001022696495056e-05, 1.2483447790145874e-05, 1.2965872883796692e-05, 1.344829797744751e-05, 1.3930723071098328e-05, 1.4413148164749146e-05, 1.4895573258399963e-05, 1.537799835205078e-05]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 12.0, 19.0, 26.0, 24.0, 44.0, 40.0, 86.0, 63.0, 65.0, 124.0, 76.0, 87.0, 91.0, 44.0, 49.0, 29.0, 25.0, 13.0, 22.0, 13.0, 5.0, 10.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.066394805908203e-06, -4.852190613746643e-06, -4.637986421585083e-06, -4.423782229423523e-06, -4.209578037261963e-06, -3.995373845100403e-06, -3.7811696529388428e-06, -3.5669654607772827e-06, -3.3527612686157227e-06, -3.1385570764541626e-06, -2.9243528842926025e-06, -2.7101486921310425e-06, -2.4959444999694824e-06, -2.2817403078079224e-06, -2.0675361156463623e-06, -1.8533319234848022e-06, -1.6391277313232422e-06, -1.4249235391616821e-06, -1.210719347000122e-06, -9.96515154838562e-07, -7.82310962677002e-07, -5.681067705154419e-07, -3.5390257835388184e-07, -1.3969838619232178e-07, 7.450580596923828e-08, 2.8870999813079834e-07, 5.029141902923584e-07, 7.171183824539185e-07, 9.313225746154785e-07, 1.1455267667770386e-06, 1.3597309589385986e-06, 1.5739351511001587e-06, 1.7881393432617188e-06, 2.002343535423279e-06, 2.216547727584839e-06, 2.430751919746399e-06, 2.644956111907959e-06, 2.859160304069519e-06, 3.073364496231079e-06, 3.287568688392639e-06, 3.5017728805541992e-06, 3.7159770727157593e-06, 3.930181264877319e-06, 4.144385457038879e-06, 4.3585896492004395e-06, 4.5727938413619995e-06, 4.7869980335235596e-06, 5.00120222568512e-06, 5.21540641784668e-06, 5.42961061000824e-06, 5.6438148021698e-06, 5.85801899433136e-06, 6.07222318649292e-06, 6.28642737865448e-06, 6.50063157081604e-06, 6.7148357629776e-06, 6.92903995513916e-06, 7.14324414730072e-06, 7.35744833946228e-06, 7.57165253162384e-06, 7.7858567237854e-06, 8.00006091594696e-06, 8.21426510810852e-06, 8.42846930027008e-06, 8.64267349243164e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 9.0, 9.0, 12.0, 11.0, 18.0, 29.0, 47.0, 109.0, 308.0, 1712.0, 1036926.0, 8449.0, 568.0, 164.0, 84.0, 31.0, 19.0, 15.0, 10.0, 7.0, 4.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.039308547973633e-05, -6.836559623479843e-05, -6.633810698986053e-05, -6.431061774492264e-05, -6.228312849998474e-05, -6.0255639255046844e-05, -5.822815001010895e-05, -5.620066076517105e-05, -5.4173171520233154e-05, -5.214568227529526e-05, -5.011819303035736e-05, -4.8090703785419464e-05, -4.606321454048157e-05, -4.403572529554367e-05, -4.2008236050605774e-05, -3.998074680566788e-05, -3.795325756072998e-05, -3.5925768315792084e-05, -3.389827907085419e-05, -3.187078982591629e-05, -2.9843300580978394e-05, -2.7815811336040497e-05, -2.57883220911026e-05, -2.3760832846164703e-05, -2.1733343601226807e-05, -1.970585435628891e-05, -1.7678365111351013e-05, -1.5650875866413116e-05, -1.362338662147522e-05, -1.1595897376537323e-05, -9.568408131599426e-06, -7.5409188866615295e-06, -5.513429641723633e-06, -3.485940396785736e-06, -1.4584511518478394e-06, 5.690380930900574e-07, 2.596527338027954e-06, 4.624016582965851e-06, 6.6515058279037476e-06, 8.678995072841644e-06, 1.0706484317779541e-05, 1.2733973562717438e-05, 1.4761462807655334e-05, 1.678895205259323e-05, 1.8816441297531128e-05, 2.0843930542469025e-05, 2.287141978740692e-05, 2.4898909032344818e-05, 2.6926398277282715e-05, 2.895388752222061e-05, 3.098137676715851e-05, 3.3008866012096405e-05, 3.50363552570343e-05, 3.70638445019722e-05, 3.9091333746910095e-05, 4.111882299184799e-05, 4.314631223678589e-05, 4.5173801481723785e-05, 4.720129072666168e-05, 4.922877997159958e-05, 5.1256269216537476e-05, 5.328375846147537e-05, 5.531124770641327e-05, 5.7338736951351166e-05, 5.936622619628906e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 6.0, 6.0, 2.0, 5.0, 16.0, 15.0, 42.0, 75.0, 144.0, 306.0, 177.0, 106.0, 48.0, 17.0, 14.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-05, -4.0617771446704865e-05, -3.951229155063629e-05, -3.840681165456772e-05, -3.7301331758499146e-05, -3.619585186243057e-05, -3.5090371966362e-05, -3.3984892070293427e-05, -3.2879412174224854e-05, -3.177393227815628e-05, -3.066845238208771e-05, -2.9562972486019135e-05, -2.845749258995056e-05, -2.735201269388199e-05, -2.6246532797813416e-05, -2.5141052901744843e-05, -2.403557300567627e-05, -2.2930093109607697e-05, -2.1824613213539124e-05, -2.071913331747055e-05, -1.9613653421401978e-05, -1.8508173525333405e-05, -1.740269362926483e-05, -1.629721373319626e-05, -1.5191733837127686e-05, -1.4086253941059113e-05, -1.298077404499054e-05, -1.1875294148921967e-05, -1.0769814252853394e-05, -9.66433435678482e-06, -8.558854460716248e-06, -7.4533745646476746e-06, -6.3478946685791016e-06, -5.2424147725105286e-06, -4.1369348764419556e-06, -3.0314549803733826e-06, -1.9259750843048096e-06, -8.204951882362366e-07, 2.849847078323364e-07, 1.3904646039009094e-06, 2.4959444999694824e-06, 3.6014243960380554e-06, 4.706904292106628e-06, 5.812384188175201e-06, 6.917864084243774e-06, 8.023343980312347e-06, 9.12882387638092e-06, 1.0234303772449493e-05, 1.1339783668518066e-05, 1.244526356458664e-05, 1.3550743460655212e-05, 1.4656223356723785e-05, 1.576170325279236e-05, 1.686718314886093e-05, 1.7972663044929504e-05, 1.9078142940998077e-05, 2.018362283706665e-05, 2.1289102733135223e-05, 2.2394582629203796e-05, 2.350006252527237e-05, 2.4605542421340942e-05, 2.5711022317409515e-05, 2.681650221347809e-05, 2.792198210954666e-05, 2.9027462005615234e-05]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 10.0, 21.0, 34.0, 137.0, 496.0, 199.0, 68.0, 16.0, 10.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06408916413784027, -0.06138811260461807, -0.058687061071395874, -0.055986013263463974, -0.053284961730241776, -0.05058391019701958, -0.04788286238908768, -0.04518181085586548, -0.04248075932264328, -0.03977970778942108, -0.03707865625619888, -0.03437760844826698, -0.031676556915044785, -0.028975505381822586, -0.026274455711245537, -0.023573406040668488, -0.02087235450744629, -0.01817130297422409, -0.015470253303647041, -0.012769202701747417, -0.010068152099847794, -0.00736710149794817, -0.004666050896048546, -0.0019650012254714966, 0.0007360503077507019, 0.0034371009096503258, 0.00613815151154995, 0.008839202113449574, 0.011540252715349197, 0.014241303317248821, 0.016942353919148445, 0.019643403589725494, 0.022344455122947693, 0.02504550665616989, 0.02774655632674694, 0.03044760599732399, 0.03314865753054619, 0.03584970906376839, 0.03855075687170029, 0.041251808404922485, 0.043952859938144684, 0.04665391147136688, 0.04935496300458908, 0.05205601081252098, 0.05475706234574318, 0.05745811387896538, 0.06015916168689728, 0.06286021322011948, 0.06556126475334167, 0.06826231628656387, 0.07096336781978607, 0.07366441935300827, 0.07636547088623047, 0.07906651496887207, 0.08176756650209427, 0.08446861803531647, 0.08716966956853867, 0.08987072110176086, 0.09257177263498306, 0.09527282416820526, 0.09797386825084686, 0.10067491978406906, 0.10337597131729126, 0.10607702285051346, 0.10877807438373566]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 6.0, 11.0, 8.0, 14.0, 15.0, 12.0, 16.0, 15.0, 24.0, 34.0, 20.0, 22.0, 44.0, 33.0, 46.0, 45.0, 45.0, 43.0, 52.0, 43.0, 55.0, 42.0, 38.0, 35.0, 42.0, 28.0, 29.0, 18.0, 20.0, 16.0, 17.0, 18.0, 16.0, 11.0, 14.0, 4.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.15168660879135132, -0.14716698229312897, -0.14264734089374542, -0.13812771439552307, -0.13360807299613953, -0.12908844649791718, -0.12456881999969482, -0.12004918605089188, -0.11552955210208893, -0.11100991815328598, -0.10649028420448303, -0.10197065770626068, -0.09745102375745773, -0.09293138980865479, -0.08841176331043243, -0.08389212936162949, -0.07937249541282654, -0.07485286146402359, -0.07033322751522064, -0.06581360101699829, -0.06129396706819534, -0.056774333119392395, -0.052254702895879745, -0.047735072672367096, -0.04321543872356415, -0.0386958047747612, -0.03417617455124855, -0.02965654246509075, -0.025136910378932953, -0.020617278292775154, -0.016097646206617355, -0.011578015983104706, -0.007058382034301758, -0.002538749948143959, 0.0019808821380138397, 0.0065005142241716385, 0.011020146310329437, 0.015539778396487236, 0.020059410482645035, 0.024579040706157684, 0.029098674654960632, 0.03361830860376358, 0.03813793882727623, 0.04265756905078888, 0.04717720299959183, 0.051696836948394775, 0.056216467171907425, 0.060736097395420074, 0.06525573134422302, 0.06977536529302597, 0.07429499924182892, 0.07881462574005127, 0.08333425968885422, 0.08785389363765717, 0.09237352013587952, 0.09689315408468246, 0.10141278803348541, 0.10593242198228836, 0.11045205593109131, 0.11497168242931366, 0.11949131637811661, 0.12401095032691956, 0.1285305768251419, 0.13305020332336426, 0.1375698447227478]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 7.0, 18.0, 20.0, 27.0, 23.0, 32.0, 68.0, 556.0, 4603.0, 4161182.0, 25990.0, 1408.0, 80.0, 38.0, 38.0, 41.0, 35.0, 16.0, 15.0, 12.0, 6.0, 10.0, 4.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0185394287109375, -0.017873287200927734, -0.01720714569091797, -0.016541004180908203, -0.015874862670898438, -0.015208721160888672, -0.014542579650878906, -0.01387643814086914, -0.013210296630859375, -0.01254415512084961, -0.011878013610839844, -0.011211872100830078, -0.010545730590820312, -0.009879589080810547, -0.009213447570800781, -0.008547306060791016, -0.00788116455078125, -0.007215023040771484, -0.006548881530761719, -0.005882740020751953, -0.0052165985107421875, -0.004550457000732422, -0.0038843154907226562, -0.0032181739807128906, -0.002552032470703125, -0.0018858909606933594, -0.0012197494506835938, -0.0005536079406738281, 0.0001125335693359375, 0.0007786750793457031, 0.0014448165893554688, 0.0021109580993652344, 0.002777099609375, 0.0034432411193847656, 0.004109382629394531, 0.004775524139404297, 0.0054416656494140625, 0.006107807159423828, 0.006773948669433594, 0.007440090179443359, 0.008106231689453125, 0.00877237319946289, 0.009438514709472656, 0.010104656219482422, 0.010770797729492188, 0.011436939239501953, 0.012103080749511719, 0.012769222259521484, 0.01343536376953125, 0.014101505279541016, 0.014767646789550781, 0.015433788299560547, 0.016099929809570312, 0.016766071319580078, 0.017432212829589844, 0.01809835433959961, 0.018764495849609375, 0.01943063735961914, 0.020096778869628906, 0.020762920379638672, 0.021429061889648438, 0.022095203399658203, 0.02276134490966797, 0.023427486419677734, 0.0240936279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 5.0, 13.0, 10.0, 6.0, 6.0, 15.0, 64.0, 139.0, 278.0, 228.0, 95.0, 26.0, 9.0, 8.0, 12.0, 9.0, 9.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00760650634765625, -0.007335662841796875, -0.0070648193359375, -0.006793975830078125, -0.00652313232421875, -0.006252288818359375, -0.0059814453125, -0.005710601806640625, -0.00543975830078125, -0.005168914794921875, -0.0048980712890625, -0.004627227783203125, -0.00435638427734375, -0.004085540771484375, -0.003814697265625, -0.003543853759765625, -0.00327301025390625, -0.003002166748046875, -0.0027313232421875, -0.002460479736328125, -0.00218963623046875, -0.001918792724609375, -0.00164794921875, -0.001377105712890625, -0.00110626220703125, -0.000835418701171875, -0.0005645751953125, -0.000293731689453125, -2.288818359375e-05, 0.000247955322265625, 0.000518798828125, 0.000789642333984375, 0.00106048583984375, 0.001331329345703125, 0.0016021728515625, 0.001873016357421875, 0.00214385986328125, 0.002414703369140625, 0.002685546875, 0.002956390380859375, 0.00322723388671875, 0.003498077392578125, 0.0037689208984375, 0.004039764404296875, 0.00431060791015625, 0.004581451416015625, 0.004852294921875, 0.005123138427734375, 0.00539398193359375, 0.005664825439453125, 0.0059356689453125, 0.006206512451171875, 0.00647735595703125, 0.006748199462890625, 0.00701904296875, 0.007289886474609375, 0.00756072998046875, 0.007831573486328125, 0.0081024169921875, 0.008373260498046875, 0.00864410400390625, 0.008914947509765625, 0.009185791015625, 0.009456634521484375, 0.00972747802734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 14.0, 9.0, 22.0, 38.0, 109.0, 313.0, 1561.0, 70134.0, 4118719.0, 2561.0, 496.0, 159.0, 62.0, 22.0, 15.0, 12.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02703857421875, -0.02628946304321289, -0.02554035186767578, -0.024791240692138672, -0.024042129516601562, -0.023293018341064453, -0.022543907165527344, -0.021794795989990234, -0.021045684814453125, -0.020296573638916016, -0.019547462463378906, -0.018798351287841797, -0.018049240112304688, -0.017300128936767578, -0.01655101776123047, -0.01580190658569336, -0.01505279541015625, -0.01430368423461914, -0.013554573059082031, -0.012805461883544922, -0.012056350708007812, -0.011307239532470703, -0.010558128356933594, -0.009809017181396484, -0.009059906005859375, -0.008310794830322266, -0.007561683654785156, -0.006812572479248047, -0.0060634613037109375, -0.005314350128173828, -0.004565238952636719, -0.0038161277770996094, -0.0030670166015625, -0.0023179054260253906, -0.0015687942504882812, -0.0008196830749511719, -7.05718994140625e-05, 0.0006785392761230469, 0.0014276504516601562, 0.0021767616271972656, 0.002925872802734375, 0.0036749839782714844, 0.004424095153808594, 0.005173206329345703, 0.0059223175048828125, 0.006671428680419922, 0.007420539855957031, 0.00816965103149414, 0.00891876220703125, 0.00966787338256836, 0.010416984558105469, 0.011166095733642578, 0.011915206909179688, 0.012664318084716797, 0.013413429260253906, 0.014162540435791016, 0.014911651611328125, 0.015660762786865234, 0.016409873962402344, 0.017158985137939453, 0.017908096313476562, 0.018657207489013672, 0.01940631866455078, 0.02015542984008789, 0.020904541015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 27.0, 42.0, 108.0, 3207.0, 506.0, 86.0, 40.0, 18.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005298614501953125, -0.005076348781585693, -0.004854083061218262, -0.00463181734085083, -0.0044095516204833984, -0.004187285900115967, -0.003965020179748535, -0.0037427544593811035, -0.003520488739013672, -0.0032982230186462402, -0.0030759572982788086, -0.002853691577911377, -0.0026314258575439453, -0.0024091601371765137, -0.002186894416809082, -0.0019646286964416504, -0.0017423629760742188, -0.0015200972557067871, -0.0012978315353393555, -0.0010755658149719238, -0.0008533000946044922, -0.0006310343742370605, -0.0004087686538696289, -0.00018650293350219727, 3.5762786865234375e-05, 0.000258028507232666, 0.00048029422760009766, 0.0007025599479675293, 0.0009248256683349609, 0.0011470913887023926, 0.0013693571090698242, 0.0015916228294372559, 0.0018138885498046875, 0.002036154270172119, 0.0022584199905395508, 0.0024806857109069824, 0.002702951431274414, 0.0029252171516418457, 0.0031474828720092773, 0.003369748592376709, 0.0035920143127441406, 0.0038142800331115723, 0.004036545753479004, 0.0042588114738464355, 0.004481077194213867, 0.004703342914581299, 0.0049256086349487305, 0.005147874355316162, 0.005370140075683594, 0.005592405796051025, 0.005814671516418457, 0.006036937236785889, 0.00625920295715332, 0.006481468677520752, 0.006703734397888184, 0.006926000118255615, 0.007148265838623047, 0.0073705315589904785, 0.00759279727935791, 0.007815062999725342, 0.008037328720092773, 0.008259594440460205, 0.008481860160827637, 0.008704125881195068, 0.0089263916015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 724.0, 287.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012417360208928585, -0.01033632643520832, -0.008255291730165482, -0.006174257956445217, -0.004093224182724953, -0.0020121904090046883, 6.884429603815079e-05, 0.0021498780697584152, 0.00423091184347868, 0.006311945617198944, 0.008392980322241783, 0.010474014095962048, 0.012555047869682312, 0.014636081643402576, 0.01671711727976799, 0.01879815012216568, 0.02087918296456337, 0.02296021766960621, 0.0250412505120039, 0.027122285217046738, 0.029203318059444427, 0.031284354627132416, 0.033365387469530106, 0.035446420311927795, 0.037527456879615784, 0.039608489722013474, 0.04168952628970146, 0.04377055913209915, 0.04585159197449684, 0.04793262481689453, 0.05001366138458252, 0.05209469422698021, 0.054175734519958496, 0.056256767362356186, 0.058337803930044174, 0.060418836772441864, 0.062499869614839554, 0.06458090245723724, 0.06666193902492523, 0.06874297559261322, 0.07082400470972061, 0.0729050412774086, 0.07498607039451599, 0.07706710696220398, 0.07914814352989197, 0.08122917264699936, 0.08331020921468735, 0.08539124578237534, 0.08747227489948273, 0.08955331146717072, 0.0916343405842781, 0.0937153771519661, 0.09579641371965408, 0.09787744283676147, 0.09995847940444946, 0.10203951597213745, 0.10412055253982544, 0.10620158910751343, 0.10828261822462082, 0.11036365479230881, 0.1124446913599968, 0.11452572047710419, 0.11660675704479218, 0.11868779361248016, 0.12076882272958755]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 13.0, 18.0, 26.0, 29.0, 41.0, 66.0, 66.0, 82.0, 74.0, 75.0, 90.0, 63.0, 68.0, 70.0, 66.0, 35.0, 37.0, 31.0, 21.0, 9.0, 6.0, 9.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019170522689819336, -0.018626732751727104, -0.018082942813634872, -0.01753915287554264, -0.01699536293745041, -0.016451572999358177, -0.015907783061265945, -0.015363993123173714, -0.014820203185081482, -0.01427641324698925, -0.013732623308897018, -0.013188833370804787, -0.012645043432712555, -0.012101253494620323, -0.011557463556528091, -0.01101367361843586, -0.010469883680343628, -0.009926093742251396, -0.009382303804159164, -0.008838513866066933, -0.008294723927974701, -0.007750933989882469, -0.007207144051790237, -0.006663354113698006, -0.006119564175605774, -0.005575774237513542, -0.00503198429942131, -0.004488194361329079, -0.003944404423236847, -0.003400614485144615, -0.0028568245470523834, -0.0023130346089601517, -0.00176924467086792, -0.0012254547327756882, -0.0006816647946834564, -0.00013787485659122467, 0.0004059150815010071, 0.0009497050195932388, 0.0014934949576854706, 0.0020372848957777023, 0.002581074833869934, 0.003124864771962166, 0.0036686547100543976, 0.004212444648146629, 0.004756234586238861, 0.005300024524331093, 0.005843814462423325, 0.006387604400515556, 0.006931394338607788, 0.00747518427670002, 0.008018974214792252, 0.008562764152884483, 0.009106554090976715, 0.009650344029068947, 0.010194133967161179, 0.01073792390525341, 0.011281713843345642, 0.011825503781437874, 0.012369293719530106, 0.012913083657622337, 0.013456873595714569, 0.0140006635338068, 0.014544453471899033, 0.015088243409991264, 0.015632033348083496]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 8.0, 12.0, 15.0, 17.0, 14.0, 24.0, 24.0, 41.0, 46.0, 62.0, 81.0, 91.0, 147.0, 174.0, 277.0, 482.0, 905.0, 1729.0, 3570.0, 7843.0, 21900.0, 704514.0, 273239.0, 19255.0, 6944.0, 3187.0, 1637.0, 867.0, 458.0, 276.0, 188.0, 114.0, 75.0, 69.0, 43.0, 42.0, 42.0, 28.0, 27.0, 16.0, 16.0, 14.0, 5.0, 3.0, 6.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.015716552734375, -0.015191793441772461, -0.014667034149169922, -0.014142274856567383, -0.013617515563964844, -0.013092756271362305, -0.012567996978759766, -0.012043237686157227, -0.011518478393554688, -0.010993719100952148, -0.01046895980834961, -0.00994420051574707, -0.009419441223144531, -0.008894681930541992, -0.008369922637939453, -0.007845163345336914, -0.007320404052734375, -0.006795644760131836, -0.006270885467529297, -0.005746126174926758, -0.005221366882324219, -0.00469660758972168, -0.004171848297119141, -0.0036470890045166016, -0.0031223297119140625, -0.0025975704193115234, -0.0020728111267089844, -0.0015480518341064453, -0.0010232925415039062, -0.0004985332489013672, 2.6226043701171875e-05, 0.0005509853363037109, 0.00107574462890625, 0.001600503921508789, 0.002125263214111328, 0.002650022506713867, 0.0031747817993164062, 0.0036995410919189453, 0.004224300384521484, 0.0047490596771240234, 0.0052738189697265625, 0.0057985782623291016, 0.006323337554931641, 0.00684809684753418, 0.007372856140136719, 0.007897615432739258, 0.008422374725341797, 0.008947134017944336, 0.009471893310546875, 0.009996652603149414, 0.010521411895751953, 0.011046171188354492, 0.011570930480957031, 0.01209568977355957, 0.01262044906616211, 0.013145208358764648, 0.013669967651367188, 0.014194726943969727, 0.014719486236572266, 0.015244245529174805, 0.015769004821777344, 0.016293764114379883, 0.016818523406982422, 0.01734328269958496, 0.0178680419921875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 5.0, 15.0, 9.0, 6.0, 6.0, 18.0, 67.0, 156.0, 287.0, 209.0, 84.0, 23.0, 10.0, 7.0, 14.0, 8.0, 8.0, 4.0, 5.0, 2.0, 6.0, 2.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0075836181640625, -0.007312655448913574, -0.0070416927337646484, -0.006770730018615723, -0.006499767303466797, -0.006228804588317871, -0.005957841873168945, -0.0056868791580200195, -0.005415916442871094, -0.005144953727722168, -0.004873991012573242, -0.004603028297424316, -0.004332065582275391, -0.004061102867126465, -0.003790140151977539, -0.0035191774368286133, -0.0032482147216796875, -0.0029772520065307617, -0.002706289291381836, -0.00243532657623291, -0.0021643638610839844, -0.0018934011459350586, -0.0016224384307861328, -0.001351475715637207, -0.0010805130004882812, -0.0008095502853393555, -0.0005385875701904297, -0.0002676248550415039, 3.337860107421875e-06, 0.00027430057525634766, 0.0005452632904052734, 0.0008162260055541992, 0.001087188720703125, 0.0013581514358520508, 0.0016291141510009766, 0.0019000768661499023, 0.002171039581298828, 0.002442002296447754, 0.0027129650115966797, 0.0029839277267456055, 0.0032548904418945312, 0.003525853157043457, 0.003796815872192383, 0.004067778587341309, 0.004338741302490234, 0.00460970401763916, 0.004880666732788086, 0.005151629447937012, 0.0054225921630859375, 0.005693554878234863, 0.005964517593383789, 0.006235480308532715, 0.006506443023681641, 0.006777405738830566, 0.007048368453979492, 0.007319331169128418, 0.007590293884277344, 0.00786125659942627, 0.008132219314575195, 0.008403182029724121, 0.008674144744873047, 0.008945107460021973, 0.009216070175170898, 0.009487032890319824, 0.00975799560546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 2.0, 13.0, 14.0, 17.0, 13.0, 20.0, 23.0, 24.0, 43.0, 58.0, 46.0, 62.0, 78.0, 110.0, 135.0, 180.0, 274.0, 450.0, 787.0, 1824.0, 11462.0, 990311.0, 37465.0, 2469.0, 919.0, 517.0, 311.0, 212.0, 159.0, 110.0, 82.0, 65.0, 52.0, 39.0, 40.0, 32.0, 35.0, 17.0, 24.0, 13.0, 8.0, 10.0, 7.0, 11.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0352783203125, -0.03412675857543945, -0.032975196838378906, -0.03182363510131836, -0.030672073364257812, -0.029520511627197266, -0.02836894989013672, -0.027217388153076172, -0.026065826416015625, -0.024914264678955078, -0.02376270294189453, -0.022611141204833984, -0.021459579467773438, -0.02030801773071289, -0.019156455993652344, -0.018004894256591797, -0.01685333251953125, -0.015701770782470703, -0.014550209045410156, -0.01339864730834961, -0.012247085571289062, -0.011095523834228516, -0.009943962097167969, -0.008792400360107422, -0.007640838623046875, -0.006489276885986328, -0.005337715148925781, -0.004186153411865234, -0.0030345916748046875, -0.0018830299377441406, -0.0007314682006835938, 0.0004200935363769531, 0.0015716552734375, 0.002723217010498047, 0.0038747787475585938, 0.005026340484619141, 0.0061779022216796875, 0.007329463958740234, 0.008481025695800781, 0.009632587432861328, 0.010784149169921875, 0.011935710906982422, 0.013087272644042969, 0.014238834381103516, 0.015390396118164062, 0.01654195785522461, 0.017693519592285156, 0.018845081329345703, 0.01999664306640625, 0.021148204803466797, 0.022299766540527344, 0.02345132827758789, 0.024602890014648438, 0.025754451751708984, 0.02690601348876953, 0.028057575225830078, 0.029209136962890625, 0.030360698699951172, 0.03151226043701172, 0.032663822174072266, 0.03381538391113281, 0.03496694564819336, 0.036118507385253906, 0.03727006912231445, 0.038421630859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 7.0, 5.0, 13.0, 7.0, 10.0, 14.0, 12.0, 15.0, 30.0, 17.0, 23.0, 30.0, 40.0, 37.0, 37.0, 35.0, 26.0, 44.0, 38.0, 46.0, 31.0, 44.0, 33.0, 24.0, 48.0, 37.0, 33.0, 37.0, 38.0, 25.0, 21.0, 15.0, 19.0, 16.0, 15.0, 24.0, 3.0, 14.0, 10.0, 5.0, 6.0, 4.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0212554931640625, -0.020560741424560547, -0.019865989685058594, -0.01917123794555664, -0.018476486206054688, -0.017781734466552734, -0.01708698272705078, -0.016392230987548828, -0.015697479248046875, -0.015002727508544922, -0.014307975769042969, -0.013613224029541016, -0.012918472290039062, -0.01222372055053711, -0.011528968811035156, -0.010834217071533203, -0.01013946533203125, -0.009444713592529297, -0.008749961853027344, -0.00805521011352539, -0.0073604583740234375, -0.006665706634521484, -0.005970954895019531, -0.005276203155517578, -0.004581451416015625, -0.003886699676513672, -0.0031919479370117188, -0.0024971961975097656, -0.0018024444580078125, -0.0011076927185058594, -0.00041294097900390625, 0.0002818107604980469, 0.0009765625, 0.0016713142395019531, 0.0023660659790039062, 0.0030608177185058594, 0.0037555694580078125, 0.004450321197509766, 0.005145072937011719, 0.005839824676513672, 0.006534576416015625, 0.007229328155517578, 0.007924079895019531, 0.008618831634521484, 0.009313583374023438, 0.01000833511352539, 0.010703086853027344, 0.011397838592529297, 0.01209259033203125, 0.012787342071533203, 0.013482093811035156, 0.01417684555053711, 0.014871597290039062, 0.015566349029541016, 0.01626110076904297, 0.016955852508544922, 0.017650604248046875, 0.018345355987548828, 0.01904010772705078, 0.019734859466552734, 0.020429611206054688, 0.02112436294555664, 0.021819114685058594, 0.022513866424560547, 0.0232086181640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 4.0, 8.0, 10.0, 9.0, 17.0, 20.0, 25.0, 43.0, 46.0, 62.0, 139.0, 244.0, 427.0, 753.0, 2751.0, 13727.0, 133467.0, 860111.0, 29893.0, 4464.0, 1067.0, 534.0, 273.0, 125.0, 119.0, 58.0, 38.0, 25.0, 33.0, 18.0, 3.0, 8.0, 6.0, 2.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.1622905731201172e-05, -1.1282972991466522e-05, -1.0943040251731873e-05, -1.0603107511997223e-05, -1.0263174772262573e-05, -9.923242032527924e-06, -9.583309292793274e-06, -9.243376553058624e-06, -8.903443813323975e-06, -8.563511073589325e-06, -8.223578333854675e-06, -7.883645594120026e-06, -7.543712854385376e-06, -7.203780114650726e-06, -6.863847374916077e-06, -6.523914635181427e-06, -6.183981895446777e-06, -5.844049155712128e-06, -5.504116415977478e-06, -5.164183676242828e-06, -4.824250936508179e-06, -4.484318196773529e-06, -4.144385457038879e-06, -3.8044527173042297e-06, -3.46451997756958e-06, -3.1245872378349304e-06, -2.7846544981002808e-06, -2.444721758365631e-06, -2.1047890186309814e-06, -1.7648562788963318e-06, -1.4249235391616821e-06, -1.0849907994270325e-06, -7.450580596923828e-07, -4.0512531995773315e-07, -6.51925802230835e-08, 2.7474015951156616e-07, 6.146728992462158e-07, 9.546056389808655e-07, 1.2945383787155151e-06, 1.6344711184501648e-06, 1.9744038581848145e-06, 2.314336597919464e-06, 2.6542693376541138e-06, 2.9942020773887634e-06, 3.334134817123413e-06, 3.6740675568580627e-06, 4.014000296592712e-06, 4.353933036327362e-06, 4.693865776062012e-06, 5.033798515796661e-06, 5.373731255531311e-06, 5.713663995265961e-06, 6.05359673500061e-06, 6.39352947473526e-06, 6.73346221446991e-06, 7.073394954204559e-06, 7.413327693939209e-06, 7.753260433673859e-06, 8.093193173408508e-06, 8.433125913143158e-06, 8.773058652877808e-06, 9.112991392612457e-06, 9.452924132347107e-06, 9.792856872081757e-06, 1.0132789611816406e-05]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 11.0, 9.0, 13.0, 14.0, 46.0, 31.0, 37.0, 82.0, 68.0, 99.0, 105.0, 117.0, 62.0, 69.0, 73.0, 39.0, 47.0, 18.0, 10.0, 12.0, 11.0, 6.0, 4.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.271766662597656e-06, -7.068738341331482e-06, -6.865710020065308e-06, -6.662681698799133e-06, -6.459653377532959e-06, -6.256625056266785e-06, -6.05359673500061e-06, -5.850568413734436e-06, -5.647540092468262e-06, -5.444511771202087e-06, -5.241483449935913e-06, -5.038455128669739e-06, -4.8354268074035645e-06, -4.63239848613739e-06, -4.429370164871216e-06, -4.2263418436050415e-06, -4.023313522338867e-06, -3.820285201072693e-06, -3.6172568798065186e-06, -3.4142285585403442e-06, -3.21120023727417e-06, -3.0081719160079956e-06, -2.8051435947418213e-06, -2.602115273475647e-06, -2.3990869522094727e-06, -2.1960586309432983e-06, -1.993030309677124e-06, -1.7900019884109497e-06, -1.5869736671447754e-06, -1.383945345878601e-06, -1.1809170246124268e-06, -9.778887033462524e-07, -7.748603820800781e-07, -5.718320608139038e-07, -3.688037395477295e-07, -1.6577541828155518e-07, 3.725290298461914e-08, 2.4028122425079346e-07, 4.4330954551696777e-07, 6.463378667831421e-07, 8.493661880493164e-07, 1.0523945093154907e-06, 1.255422830581665e-06, 1.4584511518478394e-06, 1.6614794731140137e-06, 1.864507794380188e-06, 2.0675361156463623e-06, 2.2705644369125366e-06, 2.473592758178711e-06, 2.6766210794448853e-06, 2.8796494007110596e-06, 3.082677721977234e-06, 3.285706043243408e-06, 3.4887343645095825e-06, 3.691762685775757e-06, 3.894791007041931e-06, 4.0978193283081055e-06, 4.30084764957428e-06, 4.503875970840454e-06, 4.706904292106628e-06, 4.909932613372803e-06, 5.112960934638977e-06, 5.315989255905151e-06, 5.519017577171326e-06, 5.7220458984375e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 21.0, 19.0, 43.0, 57.0, 94.0, 184.0, 594.0, 3890.0, 1039782.0, 2927.0, 484.0, 193.0, 102.0, 46.0, 27.0, 36.0, 13.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6835670471191406e-05, -3.5585835576057434e-05, -3.433600068092346e-05, -3.308616578578949e-05, -3.183633089065552e-05, -3.0586495995521545e-05, -2.9336661100387573e-05, -2.80868262052536e-05, -2.683699131011963e-05, -2.5587156414985657e-05, -2.4337321519851685e-05, -2.3087486624717712e-05, -2.183765172958374e-05, -2.0587816834449768e-05, -1.9337981939315796e-05, -1.8088147044181824e-05, -1.683831214904785e-05, -1.558847725391388e-05, -1.4338642358779907e-05, -1.3088807463645935e-05, -1.1838972568511963e-05, -1.058913767337799e-05, -9.339302778244019e-06, -8.089467883110046e-06, -6.839632987976074e-06, -5.589798092842102e-06, -4.33996319770813e-06, -3.0901283025741577e-06, -1.8402934074401855e-06, -5.904585123062134e-07, 6.593763828277588e-07, 1.909211277961731e-06, 3.159046173095703e-06, 4.408881068229675e-06, 5.6587159633636475e-06, 6.90855085849762e-06, 8.158385753631592e-06, 9.408220648765564e-06, 1.0658055543899536e-05, 1.1907890439033508e-05, 1.315772533416748e-05, 1.4407560229301453e-05, 1.5657395124435425e-05, 1.6907230019569397e-05, 1.815706491470337e-05, 1.940689980983734e-05, 2.0656734704971313e-05, 2.1906569600105286e-05, 2.3156404495239258e-05, 2.440623939037323e-05, 2.5656074285507202e-05, 2.6905909180641174e-05, 2.8155744075775146e-05, 2.940557897090912e-05, 3.065541386604309e-05, 3.190524876117706e-05, 3.3155083656311035e-05, 3.440491855144501e-05, 3.565475344657898e-05, 3.690458834171295e-05, 3.8154423236846924e-05, 3.9404258131980896e-05, 4.065409302711487e-05, 4.190392792224884e-05, 4.315376281738281e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 11.0, 7.0, 9.0, 18.0, 31.0, 31.0, 58.0, 124.0, 138.0, 267.0, 118.0, 71.0, 41.0, 21.0, 14.0, 13.0, 15.0, 4.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0384788513183594e-05, -1.965835690498352e-05, -1.8931925296783447e-05, -1.8205493688583374e-05, -1.74790620803833e-05, -1.6752630472183228e-05, -1.6026198863983154e-05, -1.529976725578308e-05, -1.4573335647583008e-05, -1.3846904039382935e-05, -1.3120472431182861e-05, -1.2394040822982788e-05, -1.1667609214782715e-05, -1.0941177606582642e-05, -1.0214745998382568e-05, -9.488314390182495e-06, -8.761882781982422e-06, -8.035451173782349e-06, -7.309019565582275e-06, -6.582587957382202e-06, -5.856156349182129e-06, -5.129724740982056e-06, -4.403293132781982e-06, -3.676861524581909e-06, -2.950429916381836e-06, -2.2239983081817627e-06, -1.4975666999816895e-06, -7.711350917816162e-07, -4.470348358154297e-08, 6.817281246185303e-07, 1.4081597328186035e-06, 2.1345913410186768e-06, 2.86102294921875e-06, 3.5874545574188232e-06, 4.3138861656188965e-06, 5.04031777381897e-06, 5.766749382019043e-06, 6.493180990219116e-06, 7.2196125984191895e-06, 7.946044206619263e-06, 8.672475814819336e-06, 9.39890742301941e-06, 1.0125339031219482e-05, 1.0851770639419556e-05, 1.1578202247619629e-05, 1.2304633855819702e-05, 1.3031065464019775e-05, 1.3757497072219849e-05, 1.4483928680419922e-05, 1.5210360288619995e-05, 1.593679189682007e-05, 1.666322350502014e-05, 1.7389655113220215e-05, 1.8116086721420288e-05, 1.884251832962036e-05, 1.9568949937820435e-05, 2.0295381546020508e-05, 2.102181315422058e-05, 2.1748244762420654e-05, 2.2474676370620728e-05, 2.32011079788208e-05, 2.3927539587020874e-05, 2.4653971195220947e-05, 2.538040280342102e-05, 2.6106834411621094e-05]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 48.0, 735.0, 200.0, 20.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27395039796829224, -0.2670600414276123, -0.26016965508461, -0.25327929854393005, -0.24638892710208893, -0.2394985556602478, -0.23260819911956787, -0.22571782767772675, -0.21882745623588562, -0.2119370847940445, -0.20504672825336456, -0.19815635681152344, -0.1912659853696823, -0.1843756139278412, -0.17748525738716125, -0.17059488594532013, -0.163704514503479, -0.15681414306163788, -0.14992378652095795, -0.14303341507911682, -0.1361430436372757, -0.12925267219543457, -0.12236231565475464, -0.11547194421291351, -0.10858158767223358, -0.10169122368097305, -0.09480085223913193, -0.0879104882478714, -0.08102011680603027, -0.07412975281476974, -0.06723938882350922, -0.06034901738166809, -0.053458645939826965, -0.04656827822327614, -0.03967791050672531, -0.03278754651546478, -0.025897176936268806, -0.01900681108236313, -0.012116443365812302, -0.005226075649261475, 0.0016642920672893524, 0.00855465978384018, 0.015445026569068432, 0.022335393354296684, 0.02922576107084751, 0.03611612692475319, 0.043006494641304016, 0.04989686235785484, 0.05678723007440567, 0.0636775940656662, 0.07056796550750732, 0.07745832949876785, 0.08434870094060898, 0.0912390649318695, 0.09812943637371063, 0.10501980036497116, 0.11191016435623169, 0.11880052834749222, 0.12569089233875275, 0.13258126378059387, 0.139471635222435, 0.14636200666427612, 0.15325236320495605, 0.16014273464679718, 0.1670331060886383]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 8.0, 6.0, 5.0, 11.0, 10.0, 13.0, 14.0, 19.0, 28.0, 29.0, 37.0, 42.0, 45.0, 50.0, 57.0, 56.0, 62.0, 51.0, 43.0, 48.0, 40.0, 46.0, 35.0, 41.0, 33.0, 38.0, 23.0, 19.0, 20.0, 15.0, 14.0, 8.0, 6.0, 5.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16866850852966309, -0.1637195497751236, -0.1587705910205841, -0.15382163226604462, -0.14887267351150513, -0.14392371475696564, -0.13897475600242615, -0.13402581214904785, -0.12907683849334717, -0.12412787973880768, -0.11917892098426819, -0.1142299622297287, -0.10928100347518921, -0.10433204472064972, -0.09938309341669083, -0.09443413466215134, -0.08948518335819244, -0.08453622460365295, -0.07958726584911346, -0.07463830709457397, -0.06968934834003448, -0.064740389585495, -0.0597914382815361, -0.05484247952699661, -0.04989352077245712, -0.04494456201791763, -0.03999560326337814, -0.03504664823412895, -0.030097689479589462, -0.025148730725049973, -0.020199773833155632, -0.015250816941261292, -0.010301858186721802, -0.005352900363504887, -0.0004039425402879715, 0.004545015282928944, 0.009493973106145859, 0.014442931860685349, 0.01939188875257969, 0.02434084564447403, 0.02928980439901352, 0.03423876315355301, 0.0391877219080925, 0.04413667693734169, 0.04908563569188118, 0.05403459444642067, 0.05898354947566986, 0.06393250823020935, 0.06888146698474884, 0.07383042573928833, 0.07877938449382782, 0.08372834324836731, 0.0886773020029068, 0.09362626075744629, 0.09857521206140518, 0.10352417081594467, 0.10847312957048416, 0.11342208832502365, 0.11837104707956314, 0.12332000583410263, 0.12826895713806152, 0.133217915892601, 0.1381668746471405, 0.14311583340168, 0.14806479215621948]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 2.0, 7.0, 13.0, 7.0, 10.0, 10.0, 25.0, 84.0, 207.0, 4163852.0, 29758.0, 136.0, 42.0, 16.0, 16.0, 12.0, 11.0, 6.0, 4.0, 5.0, 1.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09820556640625, -0.09469318389892578, -0.09118080139160156, -0.08766841888427734, -0.08415603637695312, -0.0806436538696289, -0.07713127136230469, -0.07361888885498047, -0.07010650634765625, -0.06659412384033203, -0.06308174133300781, -0.059569358825683594, -0.056056976318359375, -0.052544593811035156, -0.04903221130371094, -0.04551982879638672, -0.0420074462890625, -0.03849506378173828, -0.03498268127441406, -0.031470298767089844, -0.027957916259765625, -0.024445533752441406, -0.020933151245117188, -0.01742076873779297, -0.01390838623046875, -0.010396003723144531, -0.0068836212158203125, -0.0033712387084960938, 0.000141143798828125, 0.0036535263061523438, 0.0071659088134765625, 0.010678291320800781, 0.014190673828125, 0.01770305633544922, 0.021215438842773438, 0.024727821350097656, 0.028240203857421875, 0.031752586364746094, 0.03526496887207031, 0.03877735137939453, 0.04228973388671875, 0.04580211639404297, 0.04931449890136719, 0.052826881408691406, 0.056339263916015625, 0.059851646423339844, 0.06336402893066406, 0.06687641143798828, 0.0703887939453125, 0.07390117645263672, 0.07741355895996094, 0.08092594146728516, 0.08443832397460938, 0.0879507064819336, 0.09146308898925781, 0.09497547149658203, 0.09848785400390625, 0.10200023651123047, 0.10551261901855469, 0.1090250015258789, 0.11253738403320312, 0.11604976654052734, 0.11956214904785156, 0.12307453155517578, 0.1265869140625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 5.0, 15.0, 7.0, 9.0, 8.0, 14.0, 70.0, 142.0, 281.0, 209.0, 99.0, 26.0, 8.0, 10.0, 10.0, 10.0, 9.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007396697998046875, -0.007133066654205322, -0.0068694353103637695, -0.006605803966522217, -0.006342172622680664, -0.006078541278839111, -0.005814909934997559, -0.005551278591156006, -0.005287647247314453, -0.0050240159034729, -0.004760384559631348, -0.004496753215789795, -0.004233121871948242, -0.0039694905281066895, -0.0037058591842651367, -0.003442227840423584, -0.0031785964965820312, -0.0029149651527404785, -0.0026513338088989258, -0.002387702465057373, -0.0021240711212158203, -0.0018604397773742676, -0.0015968084335327148, -0.0013331770896911621, -0.0010695457458496094, -0.0008059144020080566, -0.0005422830581665039, -0.00027865171432495117, -1.5020370483398438e-05, 0.0002486109733581543, 0.000512242317199707, 0.0007758736610412598, 0.0010395050048828125, 0.0013031363487243652, 0.001566767692565918, 0.0018303990364074707, 0.0020940303802490234, 0.002357661724090576, 0.002621293067932129, 0.0028849244117736816, 0.0031485557556152344, 0.003412187099456787, 0.00367581844329834, 0.003939449787139893, 0.004203081130981445, 0.004466712474822998, 0.004730343818664551, 0.0049939751625061035, 0.005257606506347656, 0.005521237850189209, 0.005784869194030762, 0.0060485005378723145, 0.006312131881713867, 0.00657576322555542, 0.006839394569396973, 0.007103025913238525, 0.007366657257080078, 0.007630288600921631, 0.007893919944763184, 0.008157551288604736, 0.008421182632446289, 0.008684813976287842, 0.008948445320129395, 0.009212076663970947, 0.0094757080078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 9.0, 13.0, 23.0, 75.0, 202.0, 721.0, 6143.0, 4179271.0, 6784.0, 722.0, 190.0, 62.0, 27.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018585205078125, -0.017976045608520508, -0.017366886138916016, -0.016757726669311523, -0.01614856719970703, -0.015539407730102539, -0.014930248260498047, -0.014321088790893555, -0.013711929321289062, -0.01310276985168457, -0.012493610382080078, -0.011884450912475586, -0.011275291442871094, -0.010666131973266602, -0.01005697250366211, -0.009447813034057617, -0.008838653564453125, -0.008229494094848633, -0.007620334625244141, -0.0070111751556396484, -0.006402015686035156, -0.005792856216430664, -0.005183696746826172, -0.00457453727722168, -0.0039653778076171875, -0.0033562183380126953, -0.002747058868408203, -0.002137899398803711, -0.0015287399291992188, -0.0009195804595947266, -0.0003104209899902344, 0.0002987384796142578, 0.00090789794921875, 0.0015170574188232422, 0.0021262168884277344, 0.0027353763580322266, 0.0033445358276367188, 0.003953695297241211, 0.004562854766845703, 0.005172014236450195, 0.0057811737060546875, 0.00639033317565918, 0.006999492645263672, 0.007608652114868164, 0.008217811584472656, 0.008826971054077148, 0.00943613052368164, 0.010045289993286133, 0.010654449462890625, 0.011263608932495117, 0.01187276840209961, 0.012481927871704102, 0.013091087341308594, 0.013700246810913086, 0.014309406280517578, 0.01491856575012207, 0.015527725219726562, 0.016136884689331055, 0.016746044158935547, 0.01735520362854004, 0.01796436309814453, 0.018573522567749023, 0.019182682037353516, 0.019791841506958008, 0.0204010009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 12.0, 19.0, 37.0, 90.0, 193.0, 2958.0, 528.0, 128.0, 56.0, 29.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00806427001953125, -0.007861495018005371, -0.007658720016479492, -0.007455945014953613, -0.007253170013427734, -0.0070503950119018555, -0.0068476200103759766, -0.006644845008850098, -0.006442070007324219, -0.00623929500579834, -0.006036520004272461, -0.005833745002746582, -0.005630970001220703, -0.005428194999694824, -0.005225419998168945, -0.005022644996643066, -0.0048198699951171875, -0.004617094993591309, -0.00441431999206543, -0.004211544990539551, -0.004008769989013672, -0.003805994987487793, -0.003603219985961914, -0.003400444984436035, -0.0031976699829101562, -0.0029948949813842773, -0.0027921199798583984, -0.0025893449783325195, -0.0023865699768066406, -0.0021837949752807617, -0.001981019973754883, -0.001778244972229004, -0.001575469970703125, -0.001372694969177246, -0.0011699199676513672, -0.0009671449661254883, -0.0007643699645996094, -0.0005615949630737305, -0.00035881996154785156, -0.00015604496002197266, 4.673004150390625e-05, 0.00024950504302978516, 0.00045228004455566406, 0.000655055046081543, 0.0008578300476074219, 0.0010606050491333008, 0.0012633800506591797, 0.0014661550521850586, 0.0016689300537109375, 0.0018717050552368164, 0.0020744800567626953, 0.0022772550582885742, 0.002480030059814453, 0.002682805061340332, 0.002885580062866211, 0.00308835506439209, 0.0032911300659179688, 0.0034939050674438477, 0.0036966800689697266, 0.0038994550704956055, 0.004102230072021484, 0.004305005073547363, 0.004507780075073242, 0.004710555076599121, 0.004913330078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [107.0, 909.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004444257356226444, -0.00020800484344363213, 0.00402824766933918, 0.008264499716460705, 0.012500752694904804, 0.01673700660467148, 0.02097325772047043, 0.02520950883626938, 0.029445763677358627, 0.03368201479315758, 0.037918269634246826, 0.042154520750045776, 0.04639077186584473, 0.050627026706933975, 0.054863277822732925, 0.059099532663822174, 0.06333578377962112, 0.06757203489542007, 0.07180828601121902, 0.07604454457759857, 0.08028079569339752, 0.08451704680919647, 0.08875329792499542, 0.09298954904079437, 0.09722580015659332, 0.10146205127239227, 0.10569830238819122, 0.10993455350399017, 0.11417081207036972, 0.11840706318616867, 0.12264331430196762, 0.12687957286834717, 0.13111580908298492, 0.13535206019878387, 0.13958831131458282, 0.14382456243038177, 0.14806081354618073, 0.15229707956314087, 0.15653333067893982, 0.16076958179473877, 0.16500583291053772, 0.16924208402633667, 0.17347833514213562, 0.17771458625793457, 0.18195083737373352, 0.18618708848953247, 0.19042333960533142, 0.19465960562229156, 0.19889584183692932, 0.20313209295272827, 0.20736834406852722, 0.21160459518432617, 0.21584084630012512, 0.22007709741592407, 0.22431334853172302, 0.22854961454868317, 0.23278586566448212, 0.23702211678028107, 0.24125836789608002, 0.24549461901187897, 0.24973087012767792, 0.25396713614463806, 0.258203387260437, 0.26243963837623596, 0.2666758894920349]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 6.0, 14.0, 13.0, 19.0, 17.0, 21.0, 23.0, 27.0, 40.0, 35.0, 57.0, 44.0, 65.0, 55.0, 45.0, 47.0, 54.0, 50.0, 50.0, 36.0, 37.0, 40.0, 29.0, 26.0, 33.0, 21.0, 10.0, 21.0, 11.0, 9.0, 14.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008043885231018066, -0.007724401541054249, -0.007404917851090431, -0.007085434161126614, -0.006765950471162796, -0.006446466781198978, -0.006126983091235161, -0.005807499401271343, -0.005488015711307526, -0.005168532021343708, -0.0048490483313798904, -0.004529564641416073, -0.004210080951452255, -0.0038905972614884377, -0.00357111357152462, -0.0032516298815608025, -0.002932146191596985, -0.0026126625016331673, -0.0022931788116693497, -0.001973695121705532, -0.0016542114317417145, -0.0013347277417778969, -0.0010152440518140793, -0.0006957603618502617, -0.0003762766718864441, -5.6792981922626495e-05, 0.0002626907080411911, 0.0005821743980050087, 0.0009016580879688263, 0.0012211417779326439, 0.0015406254678964615, 0.001860109157860279, 0.0021795928478240967, 0.0024990765377879143, 0.002818560227751732, 0.0031380439177155495, 0.003457527607679367, 0.0037770112976431847, 0.004096494987607002, 0.00441597867757082, 0.0047354623675346375, 0.005054946057498455, 0.005374429747462273, 0.00569391343742609, 0.006013397127389908, 0.006332880817353725, 0.006652364507317543, 0.006971848197281361, 0.007291331887245178, 0.007610815577208996, 0.007930299267172813, 0.008249782957136631, 0.008569266647100449, 0.008888750337064266, 0.009208234027028084, 0.009527717716991901, 0.009847201406955719, 0.010166685096919537, 0.010486168786883354, 0.010805652476847172, 0.01112513616681099, 0.011444619856774807, 0.011764103546738625, 0.012083587236702442, 0.01240307092666626]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 8.0, 9.0, 12.0, 18.0, 24.0, 32.0, 38.0, 42.0, 77.0, 114.0, 156.0, 217.0, 372.0, 547.0, 887.0, 1380.0, 2521.0, 4589.0, 9715.0, 27367.0, 813729.0, 151509.0, 18309.0, 7676.0, 3661.0, 2044.0, 1185.0, 752.0, 508.0, 319.0, 197.0, 176.0, 106.0, 80.0, 40.0, 28.0, 29.0, 19.0, 15.0, 14.0, 6.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.01155853271484375, -0.011236071586608887, -0.010913610458374023, -0.01059114933013916, -0.010268688201904297, -0.009946227073669434, -0.00962376594543457, -0.009301304817199707, -0.008978843688964844, -0.00865638256072998, -0.008333921432495117, -0.008011460304260254, -0.007688999176025391, -0.007366538047790527, -0.007044076919555664, -0.006721615791320801, -0.0063991546630859375, -0.006076693534851074, -0.005754232406616211, -0.005431771278381348, -0.005109310150146484, -0.004786849021911621, -0.004464387893676758, -0.0041419267654418945, -0.0038194656372070312, -0.003497004508972168, -0.0031745433807373047, -0.0028520822525024414, -0.002529621124267578, -0.002207159996032715, -0.0018846988677978516, -0.0015622377395629883, -0.001239776611328125, -0.0009173154830932617, -0.0005948543548583984, -0.00027239322662353516, 5.0067901611328125e-05, 0.0003725290298461914, 0.0006949901580810547, 0.001017451286315918, 0.0013399124145507812, 0.0016623735427856445, 0.001984834671020508, 0.002307295799255371, 0.0026297569274902344, 0.0029522180557250977, 0.003274679183959961, 0.0035971403121948242, 0.0039196014404296875, 0.004242062568664551, 0.004564523696899414, 0.004886984825134277, 0.005209445953369141, 0.005531907081604004, 0.005854368209838867, 0.0061768293380737305, 0.006499290466308594, 0.006821751594543457, 0.00714421272277832, 0.007466673851013184, 0.007789134979248047, 0.00811159610748291, 0.008434057235717773, 0.008756518363952637, 0.0090789794921875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 3.0, 6.0, 14.0, 7.0, 8.0, 9.0, 14.0, 70.0, 149.0, 278.0, 209.0, 96.0, 25.0, 8.0, 10.0, 11.0, 9.0, 9.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00738525390625, -0.0071218013763427734, -0.006858348846435547, -0.00659489631652832, -0.006331443786621094, -0.006067991256713867, -0.005804538726806641, -0.005541086196899414, -0.0052776336669921875, -0.005014181137084961, -0.004750728607177734, -0.004487276077270508, -0.004223823547363281, -0.003960371017456055, -0.003696918487548828, -0.0034334659576416016, -0.003170013427734375, -0.0029065608978271484, -0.002643108367919922, -0.0023796558380126953, -0.0021162033081054688, -0.0018527507781982422, -0.0015892982482910156, -0.001325845718383789, -0.0010623931884765625, -0.0007989406585693359, -0.0005354881286621094, -0.0002720355987548828, -8.58306884765625e-06, 0.0002548694610595703, 0.0005183219909667969, 0.0007817745208740234, 0.00104522705078125, 0.0013086795806884766, 0.0015721321105957031, 0.0018355846405029297, 0.0020990371704101562, 0.002362489700317383, 0.0026259422302246094, 0.002889394760131836, 0.0031528472900390625, 0.003416299819946289, 0.0036797523498535156, 0.003943204879760742, 0.004206657409667969, 0.004470109939575195, 0.004733562469482422, 0.0049970149993896484, 0.005260467529296875, 0.0055239200592041016, 0.005787372589111328, 0.006050825119018555, 0.006314277648925781, 0.006577730178833008, 0.006841182708740234, 0.007104635238647461, 0.0073680877685546875, 0.007631540298461914, 0.00789499282836914, 0.008158445358276367, 0.008421897888183594, 0.00868535041809082, 0.008948802947998047, 0.009212255477905273, 0.0094757080078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 10.0, 7.0, 14.0, 24.0, 17.0, 17.0, 31.0, 35.0, 32.0, 61.0, 100.0, 118.0, 137.0, 187.0, 308.0, 576.0, 1068.0, 4259.0, 799459.0, 236536.0, 3050.0, 939.0, 471.0, 309.0, 191.0, 151.0, 100.0, 95.0, 63.0, 41.0, 28.0, 29.0, 16.0, 15.0, 17.0, 10.0, 10.0, 6.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.02503371238708496, -0.024249553680419922, -0.023465394973754883, -0.022681236267089844, -0.021897077560424805, -0.021112918853759766, -0.020328760147094727, -0.019544601440429688, -0.01876044273376465, -0.01797628402709961, -0.01719212532043457, -0.01640796661376953, -0.015623807907104492, -0.014839649200439453, -0.014055490493774414, -0.013271331787109375, -0.012487173080444336, -0.011703014373779297, -0.010918855667114258, -0.010134696960449219, -0.00935053825378418, -0.00856637954711914, -0.0077822208404541016, -0.0069980621337890625, -0.0062139034271240234, -0.005429744720458984, -0.004645586013793945, -0.0038614273071289062, -0.003077268600463867, -0.002293109893798828, -0.001508951187133789, -0.00072479248046875, 5.936622619628906e-05, 0.0008435249328613281, 0.0016276836395263672, 0.0024118423461914062, 0.0031960010528564453, 0.003980159759521484, 0.0047643184661865234, 0.0055484771728515625, 0.0063326358795166016, 0.007116794586181641, 0.00790095329284668, 0.008685111999511719, 0.009469270706176758, 0.010253429412841797, 0.011037588119506836, 0.011821746826171875, 0.012605905532836914, 0.013390064239501953, 0.014174222946166992, 0.014958381652832031, 0.01574254035949707, 0.01652669906616211, 0.01731085777282715, 0.018095016479492188, 0.018879175186157227, 0.019663333892822266, 0.020447492599487305, 0.021231651306152344, 0.022015810012817383, 0.022799968719482422, 0.02358412742614746, 0.0243682861328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 10.0, 6.0, 13.0, 20.0, 13.0, 10.0, 19.0, 21.0, 19.0, 27.0, 40.0, 36.0, 37.0, 26.0, 38.0, 36.0, 44.0, 58.0, 39.0, 43.0, 34.0, 35.0, 38.0, 44.0, 40.0, 50.0, 25.0, 32.0, 24.0, 17.0, 19.0, 19.0, 10.0, 9.0, 15.0, 7.0, 8.0, 5.0, 1.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.022247314453125, -0.02157115936279297, -0.020895004272460938, -0.020218849182128906, -0.019542694091796875, -0.018866539001464844, -0.018190383911132812, -0.01751422882080078, -0.01683807373046875, -0.01616191864013672, -0.015485763549804688, -0.014809608459472656, -0.014133453369140625, -0.013457298278808594, -0.012781143188476562, -0.012104988098144531, -0.0114288330078125, -0.010752677917480469, -0.010076522827148438, -0.009400367736816406, -0.008724212646484375, -0.008048057556152344, -0.0073719024658203125, -0.006695747375488281, -0.00601959228515625, -0.005343437194824219, -0.0046672821044921875, -0.003991127014160156, -0.003314971923828125, -0.0026388168334960938, -0.0019626617431640625, -0.0012865066528320312, -0.0006103515625, 6.580352783203125e-05, 0.0007419586181640625, 0.0014181137084960938, 0.002094268798828125, 0.0027704238891601562, 0.0034465789794921875, 0.004122734069824219, 0.00479888916015625, 0.005475044250488281, 0.0061511993408203125, 0.006827354431152344, 0.007503509521484375, 0.008179664611816406, 0.008855819702148438, 0.009531974792480469, 0.0102081298828125, 0.010884284973144531, 0.011560440063476562, 0.012236595153808594, 0.012912750244140625, 0.013588905334472656, 0.014265060424804688, 0.014941215515136719, 0.01561737060546875, 0.01629352569580078, 0.016969680786132812, 0.017645835876464844, 0.018321990966796875, 0.018998146057128906, 0.019674301147460938, 0.02035045623779297, 0.021026611328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 4.0, 8.0, 11.0, 23.0, 15.0, 22.0, 42.0, 37.0, 109.0, 86.0, 112.0, 298.0, 323.0, 1054.0, 1839.0, 15046.0, 147643.0, 836544.0, 39231.0, 3178.0, 1544.0, 444.0, 371.0, 175.0, 99.0, 97.0, 46.0, 43.0, 20.0, 17.0, 24.0, 6.0, 4.0, 7.0, 5.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.50480729341507e-06, -4.36045229434967e-06, -4.216097295284271e-06, -4.071742296218872e-06, -3.927387297153473e-06, -3.7830322980880737e-06, -3.6386772990226746e-06, -3.4943222999572754e-06, -3.3499673008918762e-06, -3.205612301826477e-06, -3.061257302761078e-06, -2.9169023036956787e-06, -2.7725473046302795e-06, -2.6281923055648804e-06, -2.483837306499481e-06, -2.339482307434082e-06, -2.195127308368683e-06, -2.0507723093032837e-06, -1.9064173102378845e-06, -1.7620623111724854e-06, -1.6177073121070862e-06, -1.473352313041687e-06, -1.3289973139762878e-06, -1.1846423149108887e-06, -1.0402873158454895e-06, -8.959323167800903e-07, -7.515773177146912e-07, -6.07222318649292e-07, -4.628673195838928e-07, -3.1851232051849365e-07, -1.7415732145309448e-07, -2.9802322387695312e-08, 1.1455267667770386e-07, 2.5890767574310303e-07, 4.032626748085022e-07, 5.476176738739014e-07, 6.919726729393005e-07, 8.363276720046997e-07, 9.806826710700989e-07, 1.125037670135498e-06, 1.2693926692008972e-06, 1.4137476682662964e-06, 1.5581026673316956e-06, 1.7024576663970947e-06, 1.846812665462494e-06, 1.991167664527893e-06, 2.1355226635932922e-06, 2.2798776626586914e-06, 2.4242326617240906e-06, 2.5685876607894897e-06, 2.712942659854889e-06, 2.857297658920288e-06, 3.0016526579856873e-06, 3.1460076570510864e-06, 3.2903626561164856e-06, 3.4347176551818848e-06, 3.579072654247284e-06, 3.723427653312683e-06, 3.867782652378082e-06, 4.0121376514434814e-06, 4.156492650508881e-06, 4.30084764957428e-06, 4.445202648639679e-06, 4.589557647705078e-06]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 4.0, 3.0, 6.0, 9.0, 5.0, 17.0, 9.0, 17.0, 18.0, 28.0, 19.0, 40.0, 17.0, 39.0, 23.0, 61.0, 19.0, 64.0, 34.0, 91.0, 80.0, 38.0, 68.0, 15.0, 47.0, 29.0, 33.0, 18.0, 38.0, 17.0, 19.0, 7.0, 12.0, 6.0, 9.0, 8.0, 1.0, 2.0, 2.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.9206275939941406e-06, -2.8293579816818237e-06, -2.738088369369507e-06, -2.64681875705719e-06, -2.555549144744873e-06, -2.464279532432556e-06, -2.3730099201202393e-06, -2.2817403078079224e-06, -2.1904706954956055e-06, -2.0992010831832886e-06, -2.0079314708709717e-06, -1.9166618585586548e-06, -1.8253922462463379e-06, -1.734122633934021e-06, -1.642853021621704e-06, -1.5515834093093872e-06, -1.4603137969970703e-06, -1.3690441846847534e-06, -1.2777745723724365e-06, -1.1865049600601196e-06, -1.0952353477478027e-06, -1.0039657354354858e-06, -9.126961231231689e-07, -8.21426510810852e-07, -7.301568984985352e-07, -6.388872861862183e-07, -5.476176738739014e-07, -4.5634806156158447e-07, -3.650784492492676e-07, -2.738088369369507e-07, -1.825392246246338e-07, -9.12696123123169e-08, 0.0, 9.12696123123169e-08, 1.825392246246338e-07, 2.738088369369507e-07, 3.650784492492676e-07, 4.5634806156158447e-07, 5.476176738739014e-07, 6.388872861862183e-07, 7.301568984985352e-07, 8.21426510810852e-07, 9.126961231231689e-07, 1.0039657354354858e-06, 1.0952353477478027e-06, 1.1865049600601196e-06, 1.2777745723724365e-06, 1.3690441846847534e-06, 1.4603137969970703e-06, 1.5515834093093872e-06, 1.642853021621704e-06, 1.734122633934021e-06, 1.8253922462463379e-06, 1.9166618585586548e-06, 2.0079314708709717e-06, 2.0992010831832886e-06, 2.1904706954956055e-06, 2.2817403078079224e-06, 2.3730099201202393e-06, 2.464279532432556e-06, 2.555549144744873e-06, 2.64681875705719e-06, 2.738088369369507e-06, 2.8293579816818237e-06, 2.9206275939941406e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 15.0, 19.0, 27.0, 51.0, 78.0, 167.0, 415.0, 3803.0, 1040571.0, 2588.0, 452.0, 148.0, 84.0, 45.0, 29.0, 20.0, 7.0, 7.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5795230865478516e-05, -1.5174970030784607e-05, -1.4554709196090698e-05, -1.393444836139679e-05, -1.3314187526702881e-05, -1.2693926692008972e-05, -1.2073665857315063e-05, -1.1453405022621155e-05, -1.0833144187927246e-05, -1.0212883353233337e-05, -9.592622518539429e-06, -8.97236168384552e-06, -8.352100849151611e-06, -7.731840014457703e-06, -7.111579179763794e-06, -6.491318345069885e-06, -5.8710575103759766e-06, -5.250796675682068e-06, -4.630535840988159e-06, -4.0102750062942505e-06, -3.390014171600342e-06, -2.769753336906433e-06, -2.1494925022125244e-06, -1.5292316675186157e-06, -9.08970832824707e-07, -2.8870999813079834e-07, 3.3155083656311035e-07, 9.51811671257019e-07, 1.5720725059509277e-06, 2.1923333406448364e-06, 2.812594175338745e-06, 3.432855010032654e-06, 4.0531158447265625e-06, 4.673376679420471e-06, 5.29363751411438e-06, 5.9138983488082886e-06, 6.534159183502197e-06, 7.154420018196106e-06, 7.774680852890015e-06, 8.394941687583923e-06, 9.015202522277832e-06, 9.63546335697174e-06, 1.025572419166565e-05, 1.0875985026359558e-05, 1.1496245861053467e-05, 1.2116506695747375e-05, 1.2736767530441284e-05, 1.3357028365135193e-05, 1.3977289199829102e-05, 1.459755003452301e-05, 1.5217810869216919e-05, 1.5838071703910828e-05, 1.6458332538604736e-05, 1.7078593373298645e-05, 1.7698854207992554e-05, 1.8319115042686462e-05, 1.893937587738037e-05, 1.955963671207428e-05, 2.017989754676819e-05, 2.0800158381462097e-05, 2.1420419216156006e-05, 2.2040680050849915e-05, 2.2660940885543823e-05, 2.3281201720237732e-05, 2.390146255493164e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 8.0, 10.0, 9.0, 25.0, 30.0, 42.0, 67.0, 81.0, 481.0, 78.0, 55.0, 32.0, 23.0, 21.0, 6.0, 10.0, 5.0, 5.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.3055279850959778e-05, -1.2520700693130493e-05, -1.1986121535301208e-05, -1.1451542377471924e-05, -1.091696321964264e-05, -1.0382384061813354e-05, -9.84780490398407e-06, -9.313225746154785e-06, -8.7786465883255e-06, -8.244067430496216e-06, -7.709488272666931e-06, -7.1749091148376465e-06, -6.640329957008362e-06, -6.105750799179077e-06, -5.5711716413497925e-06, -5.036592483520508e-06, -4.502013325691223e-06, -3.9674341678619385e-06, -3.432855010032654e-06, -2.898275852203369e-06, -2.3636966943740845e-06, -1.8291175365447998e-06, -1.2945383787155151e-06, -7.599592208862305e-07, -2.253800630569458e-07, 3.0919909477233887e-07, 8.437782526016235e-07, 1.3783574104309082e-06, 1.912936568260193e-06, 2.4475157260894775e-06, 2.982094883918762e-06, 3.516674041748047e-06, 4.0512531995773315e-06, 4.585832357406616e-06, 5.120411515235901e-06, 5.6549906730651855e-06, 6.18956983089447e-06, 6.724148988723755e-06, 7.2587281465530396e-06, 7.793307304382324e-06, 8.327886462211609e-06, 8.862465620040894e-06, 9.397044777870178e-06, 9.931623935699463e-06, 1.0466203093528748e-05, 1.1000782251358032e-05, 1.1535361409187317e-05, 1.2069940567016602e-05, 1.2604519724845886e-05, 1.3139098882675171e-05, 1.3673678040504456e-05, 1.420825719833374e-05, 1.4742836356163025e-05, 1.527741551399231e-05, 1.5811994671821594e-05, 1.634657382965088e-05, 1.6881152987480164e-05, 1.7415732145309448e-05, 1.7950311303138733e-05, 1.8484890460968018e-05, 1.9019469618797302e-05, 1.9554048776626587e-05, 2.008862793445587e-05, 2.0623207092285156e-05]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 104.0, 878.0, 27.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07476025819778442, -0.06575579941272736, -0.05675134062767029, -0.04774687811732292, -0.038742419332265854, -0.029737960547208786, -0.02073349803686142, -0.011729039251804352, -0.002724580466747284, 0.0062798792496323586, 0.015284338966012001, 0.024288799613714218, 0.033293258398771286, 0.042297717183828354, 0.05130217969417572, 0.06030663847923279, 0.06931109726428986, 0.07831555604934692, 0.08732001483440399, 0.09632447361946106, 0.10532893240451813, 0.1143333911895752, 0.12333785742521286, 0.13234230875968933, 0.1413467824459076, 0.15035124123096466, 0.15935570001602173, 0.1683601588010788, 0.17736461758613586, 0.18636907637119293, 0.19537353515625, 0.20437800884246826, 0.21338245272636414, 0.2223869115114212, 0.23139137029647827, 0.24039582908153534, 0.2494002878665924, 0.25840476155281067, 0.26740920543670654, 0.2764136791229248, 0.2854181230068207, 0.29442259669303894, 0.3034270405769348, 0.3124315142631531, 0.32143595814704895, 0.3304404318332672, 0.3394448757171631, 0.34844934940338135, 0.3574538230895996, 0.36645829677581787, 0.37546274065971375, 0.384467214345932, 0.3934716582298279, 0.40247613191604614, 0.411480575799942, 0.4204850494861603, 0.42948949337005615, 0.4384939670562744, 0.4474984109401703, 0.45650288462638855, 0.4655073285102844, 0.4745118021965027, 0.48351624608039856, 0.4925207197666168, 0.5015251636505127]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 8.0, 7.0, 6.0, 9.0, 12.0, 10.0, 17.0, 15.0, 14.0, 25.0, 23.0, 31.0, 41.0, 34.0, 40.0, 37.0, 54.0, 56.0, 49.0, 44.0, 54.0, 55.0, 38.0, 41.0, 29.0, 35.0, 23.0, 28.0, 26.0, 24.0, 18.0, 24.0, 13.0, 13.0, 8.0, 9.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12279540300369263, -0.11929187923669815, -0.11578836292028427, -0.1122848391532898, -0.10878132283687592, -0.10527779906988144, -0.10177427530288696, -0.09827075898647308, -0.09476723521947861, -0.09126371145248413, -0.08776019513607025, -0.08425667136907578, -0.0807531476020813, -0.07724963128566742, -0.07374610751867294, -0.07024258375167847, -0.06673906743526459, -0.06323554366827011, -0.05973202735185623, -0.056228503584861755, -0.05272498354315758, -0.0492214635014534, -0.04571793973445892, -0.042214419692754745, -0.03871089965105057, -0.03520737960934639, -0.03170385956764221, -0.028200335800647736, -0.024696815758943558, -0.02119329571723938, -0.017689773812890053, -0.014186251908540726, -0.010682731866836548, -0.007179210893809795, -0.003675689920783043, -0.00017216894775629044, 0.003331352025270462, 0.00683487206697464, 0.010338393971323967, 0.013841915875673294, 0.017345435917377472, 0.02084895595908165, 0.024352477863430977, 0.027855999767780304, 0.03135951980948448, 0.03486303985118866, 0.038366563618183136, 0.041870083659887314, 0.04537360370159149, 0.04887712374329567, 0.05238064378499985, 0.055884167551994324, 0.0593876875936985, 0.06289120763540268, 0.06639473140239716, 0.06989824771881104, 0.07340177148580551, 0.07690529525279999, 0.08040881156921387, 0.08391233533620834, 0.08741585910320282, 0.0909193754196167, 0.09442289918661118, 0.09792642295360565, 0.10142993927001953]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 2.0, 4.0, 16.0, 5.0, 11.0, 6.0, 21.0, 88.0, 498.0, 12074.0, 4180730.0, 613.0, 76.0, 27.0, 11.0, 12.0, 12.0, 6.0, 5.0, 6.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0277099609375, -0.026724815368652344, -0.025739669799804688, -0.02475452423095703, -0.023769378662109375, -0.02278423309326172, -0.021799087524414062, -0.020813941955566406, -0.01982879638671875, -0.018843650817871094, -0.017858505249023438, -0.01687335968017578, -0.015888214111328125, -0.014903068542480469, -0.013917922973632812, -0.012932777404785156, -0.0119476318359375, -0.010962486267089844, -0.009977340698242188, -0.008992195129394531, -0.008007049560546875, -0.007021903991699219, -0.0060367584228515625, -0.005051612854003906, -0.00406646728515625, -0.0030813217163085938, -0.0020961761474609375, -0.0011110305786132812, -0.000125885009765625, 0.0008592605590820312, 0.0018444061279296875, 0.0028295516967773438, 0.003814697265625, 0.004799842834472656, 0.0057849884033203125, 0.006770133972167969, 0.007755279541015625, 0.008740425109863281, 0.009725570678710938, 0.010710716247558594, 0.01169586181640625, 0.012681007385253906, 0.013666152954101562, 0.014651298522949219, 0.015636444091796875, 0.01662158966064453, 0.017606735229492188, 0.018591880798339844, 0.0195770263671875, 0.020562171936035156, 0.021547317504882812, 0.02253246307373047, 0.023517608642578125, 0.02450275421142578, 0.025487899780273438, 0.026473045349121094, 0.02745819091796875, 0.028443336486816406, 0.029428482055664062, 0.03041362762451172, 0.031398773193359375, 0.03238391876220703, 0.03336906433105469, 0.034354209899902344, 0.03533935546875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 3.0, 16.0, 6.0, 10.0, 6.0, 15.0, 54.0, 118.0, 265.0, 233.0, 116.0, 37.0, 14.0, 7.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007404327392578125, -0.007142364978790283, -0.006880402565002441, -0.0066184401512146, -0.006356477737426758, -0.006094515323638916, -0.005832552909851074, -0.005570590496063232, -0.005308628082275391, -0.005046665668487549, -0.004784703254699707, -0.004522740840911865, -0.0042607784271240234, -0.003998816013336182, -0.00373685359954834, -0.003474891185760498, -0.0032129287719726562, -0.0029509663581848145, -0.0026890039443969727, -0.002427041530609131, -0.002165079116821289, -0.0019031167030334473, -0.0016411542892456055, -0.0013791918754577637, -0.0011172294616699219, -0.0008552670478820801, -0.0005933046340942383, -0.0003313422203063965, -6.937980651855469e-05, 0.0001925826072692871, 0.0004545450210571289, 0.0007165074348449707, 0.0009784698486328125, 0.0012404322624206543, 0.001502394676208496, 0.0017643570899963379, 0.0020263195037841797, 0.0022882819175720215, 0.0025502443313598633, 0.002812206745147705, 0.003074169158935547, 0.0033361315727233887, 0.0035980939865112305, 0.0038600564002990723, 0.004122018814086914, 0.004383981227874756, 0.004645943641662598, 0.0049079060554504395, 0.005169868469238281, 0.005431830883026123, 0.005693793296813965, 0.005955755710601807, 0.0062177181243896484, 0.00647968053817749, 0.006741642951965332, 0.007003605365753174, 0.007265567779541016, 0.007527530193328857, 0.007789492607116699, 0.008051455020904541, 0.008313417434692383, 0.008575379848480225, 0.008837342262268066, 0.009099304676055908, 0.00936126708984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 11.0, 4.0, 22.0, 22.0, 44.0, 56.0, 209.0, 646.0, 2926.0, 27620.0, 4148640.0, 11572.0, 1730.0, 454.0, 136.0, 73.0, 18.0, 22.0, 16.0, 11.0, 8.0, 3.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0074310302734375, -0.007214725017547607, -0.006998419761657715, -0.006782114505767822, -0.00656580924987793, -0.006349503993988037, -0.0061331987380981445, -0.005916893482208252, -0.005700588226318359, -0.005484282970428467, -0.005267977714538574, -0.005051672458648682, -0.004835367202758789, -0.0046190619468688965, -0.004402756690979004, -0.004186451435089111, -0.003970146179199219, -0.003753840923309326, -0.0035375356674194336, -0.003321230411529541, -0.0031049251556396484, -0.002888619899749756, -0.0026723146438598633, -0.0024560093879699707, -0.002239704132080078, -0.0020233988761901855, -0.001807093620300293, -0.0015907883644104004, -0.0013744831085205078, -0.0011581778526306152, -0.0009418725967407227, -0.0007255673408508301, -0.0005092620849609375, -0.0002929568290710449, -7.665157318115234e-05, 0.00013965368270874023, 0.0003559589385986328, 0.0005722641944885254, 0.000788569450378418, 0.0010048747062683105, 0.0012211799621582031, 0.0014374852180480957, 0.0016537904739379883, 0.0018700957298278809, 0.0020864009857177734, 0.002302706241607666, 0.0025190114974975586, 0.002735316753387451, 0.0029516220092773438, 0.0031679272651672363, 0.003384232521057129, 0.0036005377769470215, 0.003816843032836914, 0.004033148288726807, 0.004249453544616699, 0.004465758800506592, 0.004682064056396484, 0.004898369312286377, 0.0051146745681762695, 0.005330979824066162, 0.005547285079956055, 0.005763590335845947, 0.00597989559173584, 0.006196200847625732, 0.006412506103515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 4.0, 7.0, 8.0, 3.0, 7.0, 15.0, 25.0, 36.0, 162.0, 3526.0, 152.0, 43.0, 23.0, 17.0, 11.0, 10.0, 3.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002166748046875, -0.0020933449268341064, -0.002019941806793213, -0.0019465386867523193, -0.0018731355667114258, -0.0017997324466705322, -0.0017263293266296387, -0.0016529262065887451, -0.0015795230865478516, -0.001506119966506958, -0.0014327168464660645, -0.001359313726425171, -0.0012859106063842773, -0.0012125074863433838, -0.0011391043663024902, -0.0010657012462615967, -0.0009922981262207031, -0.0009188950061798096, -0.000845491886138916, -0.0007720887660980225, -0.0006986856460571289, -0.0006252825260162354, -0.0005518794059753418, -0.00047847628593444824, -0.0004050731658935547, -0.00033167004585266113, -0.0002582669258117676, -0.00018486380577087402, -0.00011146068572998047, -3.8057565689086914e-05, 3.534555435180664e-05, 0.0001087486743927002, 0.00018215179443359375, 0.0002555549144744873, 0.00032895803451538086, 0.0004023611545562744, 0.00047576427459716797, 0.0005491673946380615, 0.0006225705146789551, 0.0006959736347198486, 0.0007693767547607422, 0.0008427798748016357, 0.0009161829948425293, 0.0009895861148834229, 0.0010629892349243164, 0.00113639235496521, 0.0012097954750061035, 0.001283198595046997, 0.0013566017150878906, 0.0014300048351287842, 0.0015034079551696777, 0.0015768110752105713, 0.0016502141952514648, 0.0017236173152923584, 0.001797020435333252, 0.0018704235553741455, 0.001943826675415039, 0.0020172297954559326, 0.002090632915496826, 0.0021640360355377197, 0.0022374391555786133, 0.002310842275619507, 0.0023842453956604004, 0.002457648515701294, 0.0025310516357421875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 17.0, 918.0, 72.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020353326573967934, -0.019935347139835358, -0.01951736770570278, -0.019099388271570206, -0.01868141070008278, -0.018263431265950203, -0.017845451831817627, -0.01742747239768505, -0.017009492963552475, -0.0165915135294199, -0.016173534095287323, -0.015755556523799896, -0.015337576158344746, -0.014919597655534744, -0.014501618221402168, -0.014083638787269592, -0.013665660284459591, -0.013247680850327015, -0.012829702347517014, -0.012411722913384438, -0.011993743479251862, -0.011575764045119286, -0.011157785542309284, -0.010739806108176708, -0.010321827605366707, -0.00990384817123413, -0.00948586966842413, -0.009067890234291553, -0.008649910800158978, -0.008231932297348976, -0.0078139528632164, -0.007395973429083824, -0.006977994926273823, -0.006560015957802534, -0.006142036523669958, -0.005724057555198669, -0.0053060781210660934, -0.004888099152594805, -0.004470120184123516, -0.00405214074999094, -0.0036341617815196514, -0.003216182580217719, -0.0027982033789157867, -0.002380224410444498, -0.0019622452091425657, -0.0015442660078406334, -0.0011262870393693447, -0.0007083078380674124, -0.00029032863676548004, 0.00012765050632879138, 0.0005456296494230628, 0.0009636087343096733, 0.0013815879356116056, 0.001799567136913538, 0.0022175461053848267, 0.002635525306686759, 0.0030535045079886913, 0.0034714837092906237, 0.003889462910592556, 0.004307441879063845, 0.004725420847535133, 0.005143400281667709, 0.005561379250138998, 0.005979358218610287, 0.006397337652742863]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 16.0, 14.0, 10.0, 19.0, 22.0, 22.0, 29.0, 30.0, 38.0, 40.0, 39.0, 36.0, 36.0, 56.0, 55.0, 59.0, 51.0, 47.0, 49.0, 41.0, 46.0, 38.0, 37.0, 30.0, 37.0, 16.0, 17.0, 10.0, 12.0, 7.0, 4.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.004937589168548584, -0.0047957561910152435, -0.004653923213481903, -0.004512090235948563, -0.004370257258415222, -0.004228424280881882, -0.004086591303348541, -0.003944758325815201, -0.0038029253482818604, -0.00366109237074852, -0.0035192593932151794, -0.003377426415681839, -0.0032355934381484985, -0.003093760460615158, -0.0029519274830818176, -0.002810094505548477, -0.0026682615280151367, -0.0025264285504817963, -0.002384595572948456, -0.0022427625954151154, -0.002100929617881775, -0.0019590966403484344, -0.001817263662815094, -0.0016754306852817535, -0.001533597707748413, -0.0013917647302150726, -0.0012499317526817322, -0.0011080987751483917, -0.0009662657976150513, -0.0008244328200817108, -0.0006825998425483704, -0.0005407668650150299, -0.00039893388748168945, -0.000257100909948349, -0.00011526793241500854, 2.656504511833191e-05, 0.00016839802265167236, 0.0003102310001850128, 0.00045206397771835327, 0.0005938969552516937, 0.0007357299327850342, 0.0008775629103183746, 0.001019395887851715, 0.0011612288653850555, 0.001303061842918396, 0.0014448948204517365, 0.001586727797985077, 0.0017285607755184174, 0.0018703937530517578, 0.0020122267305850983, 0.0021540597081184387, 0.002295892685651779, 0.0024377256631851196, 0.00257955864071846, 0.0027213916182518005, 0.002863224595785141, 0.0030050575733184814, 0.003146890550851822, 0.0032887235283851624, 0.003430556505918503, 0.0035723894834518433, 0.0037142224609851837, 0.003856055438518524, 0.003997888416051865, 0.004139721393585205]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 9.0, 4.0, 14.0, 9.0, 14.0, 17.0, 37.0, 55.0, 59.0, 93.0, 142.0, 208.0, 322.0, 440.0, 622.0, 988.0, 1604.0, 2544.0, 4350.0, 8113.0, 17370.0, 81866.0, 857292.0, 42220.0, 13513.0, 6741.0, 3664.0, 2117.0, 1370.0, 887.0, 597.0, 394.0, 272.0, 174.0, 110.0, 83.0, 65.0, 54.0, 38.0, 22.0, 16.0, 17.0, 7.0, 4.0, 4.0, 6.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00897216796875, -0.008666515350341797, -0.008360862731933594, -0.00805521011352539, -0.0077495574951171875, -0.007443904876708984, -0.007138252258300781, -0.006832599639892578, -0.006526947021484375, -0.006221294403076172, -0.005915641784667969, -0.005609989166259766, -0.0053043365478515625, -0.004998683929443359, -0.004693031311035156, -0.004387378692626953, -0.00408172607421875, -0.003776073455810547, -0.0034704208374023438, -0.0031647682189941406, -0.0028591156005859375, -0.0025534629821777344, -0.0022478103637695312, -0.0019421577453613281, -0.001636505126953125, -0.0013308525085449219, -0.0010251998901367188, -0.0007195472717285156, -0.0004138946533203125, -0.00010824203491210938, 0.00019741058349609375, 0.0005030632019042969, 0.0008087158203125, 0.0011143684387207031, 0.0014200210571289062, 0.0017256736755371094, 0.0020313262939453125, 0.0023369789123535156, 0.0026426315307617188, 0.002948284149169922, 0.003253936767578125, 0.003559589385986328, 0.0038652420043945312, 0.004170894622802734, 0.0044765472412109375, 0.004782199859619141, 0.005087852478027344, 0.005393505096435547, 0.00569915771484375, 0.006004810333251953, 0.006310462951660156, 0.006616115570068359, 0.0069217681884765625, 0.007227420806884766, 0.007533073425292969, 0.007838726043701172, 0.008144378662109375, 0.008450031280517578, 0.008755683898925781, 0.009061336517333984, 0.009366989135742188, 0.00967264175415039, 0.009978294372558594, 0.010283946990966797, 0.010589599609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 4.0, 16.0, 5.0, 10.0, 6.0, 15.0, 56.0, 116.0, 271.0, 227.0, 116.0, 39.0, 12.0, 7.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007396697998046875, -0.007134854793548584, -0.006873011589050293, -0.006611168384552002, -0.006349325180053711, -0.00608748197555542, -0.005825638771057129, -0.005563795566558838, -0.005301952362060547, -0.005040109157562256, -0.004778265953063965, -0.004516422748565674, -0.004254579544067383, -0.003992736339569092, -0.0037308931350708008, -0.0034690499305725098, -0.0032072067260742188, -0.0029453635215759277, -0.0026835203170776367, -0.0024216771125793457, -0.0021598339080810547, -0.0018979907035827637, -0.0016361474990844727, -0.0013743042945861816, -0.0011124610900878906, -0.0008506178855895996, -0.0005887746810913086, -0.0003269314765930176, -6.508827209472656e-05, 0.00019675493240356445, 0.00045859813690185547, 0.0007204413414001465, 0.0009822845458984375, 0.0012441277503967285, 0.0015059709548950195, 0.0017678141593933105, 0.0020296573638916016, 0.0022915005683898926, 0.0025533437728881836, 0.0028151869773864746, 0.0030770301818847656, 0.0033388733863830566, 0.0036007165908813477, 0.0038625597953796387, 0.00412440299987793, 0.004386246204376221, 0.004648089408874512, 0.004909932613372803, 0.005171775817871094, 0.005433619022369385, 0.005695462226867676, 0.005957305431365967, 0.006219148635864258, 0.006480991840362549, 0.00674283504486084, 0.007004678249359131, 0.007266521453857422, 0.007528364658355713, 0.007790207862854004, 0.008052051067352295, 0.008313894271850586, 0.008575737476348877, 0.008837580680847168, 0.009099423885345459, 0.00936126708984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 6.0, 8.0, 11.0, 12.0, 15.0, 9.0, 27.0, 40.0, 44.0, 48.0, 78.0, 101.0, 130.0, 224.0, 338.0, 583.0, 1389.0, 11482.0, 988220.0, 41750.0, 2018.0, 747.0, 397.0, 245.0, 143.0, 110.0, 95.0, 61.0, 43.0, 36.0, 36.0, 22.0, 17.0, 12.0, 13.0, 9.0, 10.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02239990234375, -0.02158975601196289, -0.02077960968017578, -0.019969463348388672, -0.019159317016601562, -0.018349170684814453, -0.017539024353027344, -0.016728878021240234, -0.015918731689453125, -0.015108585357666016, -0.014298439025878906, -0.013488292694091797, -0.012678146362304688, -0.011868000030517578, -0.011057853698730469, -0.01024770736694336, -0.00943756103515625, -0.00862741470336914, -0.007817268371582031, -0.007007122039794922, -0.0061969757080078125, -0.005386829376220703, -0.004576683044433594, -0.0037665367126464844, -0.002956390380859375, -0.0021462440490722656, -0.0013360977172851562, -0.0005259513854980469, 0.0002841949462890625, 0.0010943412780761719, 0.0019044876098632812, 0.0027146339416503906, 0.0035247802734375, 0.004334926605224609, 0.005145072937011719, 0.005955219268798828, 0.0067653656005859375, 0.007575511932373047, 0.008385658264160156, 0.009195804595947266, 0.010005950927734375, 0.010816097259521484, 0.011626243591308594, 0.012436389923095703, 0.013246536254882812, 0.014056682586669922, 0.014866828918457031, 0.01567697525024414, 0.01648712158203125, 0.01729726791381836, 0.01810741424560547, 0.018917560577392578, 0.019727706909179688, 0.020537853240966797, 0.021347999572753906, 0.022158145904541016, 0.022968292236328125, 0.023778438568115234, 0.024588584899902344, 0.025398731231689453, 0.026208877563476562, 0.027019023895263672, 0.02782917022705078, 0.02863931655883789, 0.029449462890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 10.0, 8.0, 11.0, 5.0, 14.0, 24.0, 25.0, 21.0, 32.0, 31.0, 34.0, 53.0, 46.0, 47.0, 42.0, 47.0, 49.0, 41.0, 35.0, 34.0, 42.0, 38.0, 42.0, 41.0, 42.0, 31.0, 28.0, 16.0, 23.0, 16.0, 9.0, 11.0, 11.0, 7.0, 10.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0197296142578125, -0.01901698112487793, -0.01830434799194336, -0.01759171485900879, -0.01687908172607422, -0.01616644859313965, -0.015453815460205078, -0.014741182327270508, -0.014028549194335938, -0.013315916061401367, -0.012603282928466797, -0.011890649795532227, -0.011178016662597656, -0.010465383529663086, -0.009752750396728516, -0.009040117263793945, -0.008327484130859375, -0.007614850997924805, -0.006902217864990234, -0.006189584732055664, -0.005476951599121094, -0.0047643184661865234, -0.004051685333251953, -0.003339052200317383, -0.0026264190673828125, -0.0019137859344482422, -0.0012011528015136719, -0.0004885196685791016, 0.00022411346435546875, 0.0009367465972900391, 0.0016493797302246094, 0.0023620128631591797, 0.00307464599609375, 0.0037872791290283203, 0.004499912261962891, 0.005212545394897461, 0.005925178527832031, 0.0066378116607666016, 0.007350444793701172, 0.008063077926635742, 0.008775711059570312, 0.009488344192504883, 0.010200977325439453, 0.010913610458374023, 0.011626243591308594, 0.012338876724243164, 0.013051509857177734, 0.013764142990112305, 0.014476776123046875, 0.015189409255981445, 0.015902042388916016, 0.016614675521850586, 0.017327308654785156, 0.018039941787719727, 0.018752574920654297, 0.019465208053588867, 0.020177841186523438, 0.020890474319458008, 0.021603107452392578, 0.02231574058532715, 0.02302837371826172, 0.02374100685119629, 0.02445363998413086, 0.02516627311706543, 0.02587890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 7.0, 6.0, 14.0, 12.0, 21.0, 36.0, 32.0, 53.0, 56.0, 87.0, 166.0, 356.0, 865.0, 1357.0, 6704.0, 53288.0, 922044.0, 53612.0, 6699.0, 1347.0, 909.0, 323.0, 172.0, 113.0, 51.0, 54.0, 45.0, 22.0, 18.0, 5.0, 13.0, 8.0, 8.0, 8.0, 9.0, 1.0, 8.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.6140124797821045e-06, -5.446374416351318e-06, -5.278736352920532e-06, -5.111098289489746e-06, -4.94346022605896e-06, -4.775822162628174e-06, -4.608184099197388e-06, -4.4405460357666016e-06, -4.2729079723358154e-06, -4.105269908905029e-06, -3.937631845474243e-06, -3.769993782043457e-06, -3.602355718612671e-06, -3.4347176551818848e-06, -3.2670795917510986e-06, -3.0994415283203125e-06, -2.9318034648895264e-06, -2.7641654014587402e-06, -2.596527338027954e-06, -2.428889274597168e-06, -2.261251211166382e-06, -2.0936131477355957e-06, -1.9259750843048096e-06, -1.7583370208740234e-06, -1.5906989574432373e-06, -1.4230608940124512e-06, -1.255422830581665e-06, -1.087784767150879e-06, -9.201467037200928e-07, -7.525086402893066e-07, -5.848705768585205e-07, -4.172325134277344e-07, -2.4959444999694824e-07, -8.195638656616211e-08, 8.568167686462402e-08, 2.5331974029541016e-07, 4.209578037261963e-07, 5.885958671569824e-07, 7.562339305877686e-07, 9.238719940185547e-07, 1.0915100574493408e-06, 1.259148120880127e-06, 1.426786184310913e-06, 1.5944242477416992e-06, 1.7620623111724854e-06, 1.9297003746032715e-06, 2.0973384380340576e-06, 2.2649765014648438e-06, 2.43261456489563e-06, 2.600252628326416e-06, 2.767890691757202e-06, 2.9355287551879883e-06, 3.1031668186187744e-06, 3.2708048820495605e-06, 3.4384429454803467e-06, 3.606081008911133e-06, 3.773719072341919e-06, 3.941357135772705e-06, 4.108995199203491e-06, 4.276633262634277e-06, 4.4442713260650635e-06, 4.61190938949585e-06, 4.779547452926636e-06, 4.947185516357422e-06]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 8.0, 9.0, 16.0, 16.0, 10.0, 17.0, 34.0, 25.0, 31.0, 39.0, 79.0, 51.0, 52.0, 77.0, 95.0, 58.0, 83.0, 44.0, 37.0, 22.0, 33.0, 16.0, 32.0, 17.0, 13.0, 10.0, 8.0, 6.0, 8.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-4.947185516357422e-06, -4.81773167848587e-06, -4.688277840614319e-06, -4.558824002742767e-06, -4.429370164871216e-06, -4.299916326999664e-06, -4.170462489128113e-06, -4.041008651256561e-06, -3.91155481338501e-06, -3.7821009755134583e-06, -3.6526471376419067e-06, -3.5231932997703552e-06, -3.3937394618988037e-06, -3.264285624027252e-06, -3.1348317861557007e-06, -3.005377948284149e-06, -2.8759241104125977e-06, -2.746470272541046e-06, -2.6170164346694946e-06, -2.487562596797943e-06, -2.3581087589263916e-06, -2.22865492105484e-06, -2.0992010831832886e-06, -1.969747245311737e-06, -1.8402934074401855e-06, -1.710839569568634e-06, -1.5813857316970825e-06, -1.451931893825531e-06, -1.3224780559539795e-06, -1.193024218082428e-06, -1.0635703802108765e-06, -9.34116542339325e-07, -8.046627044677734e-07, -6.752088665962219e-07, -5.457550287246704e-07, -4.163011908531189e-07, -2.868473529815674e-07, -1.5739351511001587e-07, -2.7939677238464355e-08, 1.0151416063308716e-07, 2.3096799850463867e-07, 3.604218363761902e-07, 4.898756742477417e-07, 6.193295121192932e-07, 7.487833499908447e-07, 8.782371878623962e-07, 1.0076910257339478e-06, 1.1371448636054993e-06, 1.2665987014770508e-06, 1.3960525393486023e-06, 1.5255063772201538e-06, 1.6549602150917053e-06, 1.7844140529632568e-06, 1.9138678908348083e-06, 2.04332172870636e-06, 2.1727755665779114e-06, 2.302229404449463e-06, 2.4316832423210144e-06, 2.561137080192566e-06, 2.6905909180641174e-06, 2.820044755935669e-06, 2.9494985938072205e-06, 3.078952431678772e-06, 3.2084062695503235e-06, 3.337860107421875e-06]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 10.0, 15.0, 23.0, 28.0, 36.0, 85.0, 202.0, 820.0, 78333.0, 967444.0, 1094.0, 206.0, 100.0, 42.0, 32.0, 20.0, 12.0, 12.0, 6.0, 1.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.1517276763916016e-05, -2.0920298993587494e-05, -2.0323321223258972e-05, -1.972634345293045e-05, -1.912936568260193e-05, -1.8532387912273407e-05, -1.7935410141944885e-05, -1.7338432371616364e-05, -1.6741454601287842e-05, -1.614447683095932e-05, -1.55474990606308e-05, -1.4950521290302277e-05, -1.4353543519973755e-05, -1.3756565749645233e-05, -1.3159587979316711e-05, -1.256261020898819e-05, -1.1965632438659668e-05, -1.1368654668331146e-05, -1.0771676898002625e-05, -1.0174699127674103e-05, -9.577721357345581e-06, -8.98074358701706e-06, -8.383765816688538e-06, -7.786788046360016e-06, -7.189810276031494e-06, -6.592832505702972e-06, -5.995854735374451e-06, -5.398876965045929e-06, -4.801899194717407e-06, -4.2049214243888855e-06, -3.6079436540603638e-06, -3.010965883731842e-06, -2.4139881134033203e-06, -1.8170103430747986e-06, -1.2200325727462769e-06, -6.230548024177551e-07, -2.60770320892334e-08, 5.709007382392883e-07, 1.16787850856781e-06, 1.7648562788963318e-06, 2.3618340492248535e-06, 2.9588118195533752e-06, 3.555789589881897e-06, 4.152767360210419e-06, 4.7497451305389404e-06, 5.346722900867462e-06, 5.943700671195984e-06, 6.540678441524506e-06, 7.137656211853027e-06, 7.734633982181549e-06, 8.33161175251007e-06, 8.928589522838593e-06, 9.525567293167114e-06, 1.0122545063495636e-05, 1.0719522833824158e-05, 1.131650060415268e-05, 1.1913478374481201e-05, 1.2510456144809723e-05, 1.3107433915138245e-05, 1.3704411685466766e-05, 1.4301389455795288e-05, 1.489836722612381e-05, 1.549534499645233e-05, 1.6092322766780853e-05, 1.6689300537109375e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 3.0, 10.0, 25.0, 34.0, 55.0, 103.0, 544.0, 74.0, 47.0, 32.0, 17.0, 9.0, 5.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.901388168334961e-05, -1.848861575126648e-05, -1.796334981918335e-05, -1.743808388710022e-05, -1.691281795501709e-05, -1.638755202293396e-05, -1.586228609085083e-05, -1.53370201587677e-05, -1.481175422668457e-05, -1.428648829460144e-05, -1.376122236251831e-05, -1.323595643043518e-05, -1.271069049835205e-05, -1.2185424566268921e-05, -1.1660158634185791e-05, -1.1134892702102661e-05, -1.0609626770019531e-05, -1.0084360837936401e-05, -9.559094905853271e-06, -9.033828973770142e-06, -8.508563041687012e-06, -7.983297109603882e-06, -7.458031177520752e-06, -6.932765245437622e-06, -6.407499313354492e-06, -5.882233381271362e-06, -5.356967449188232e-06, -4.8317015171051025e-06, -4.306435585021973e-06, -3.7811696529388428e-06, -3.255903720855713e-06, -2.730637788772583e-06, -2.205371856689453e-06, -1.6801059246063232e-06, -1.1548399925231934e-06, -6.295740604400635e-07, -1.043081283569336e-07, 4.209578037261963e-07, 9.462237358093262e-07, 1.471489667892456e-06, 1.996755599975586e-06, 2.522021532058716e-06, 3.0472874641418457e-06, 3.5725533962249756e-06, 4.0978193283081055e-06, 4.623085260391235e-06, 5.148351192474365e-06, 5.673617124557495e-06, 6.198883056640625e-06, 6.724148988723755e-06, 7.249414920806885e-06, 7.774680852890015e-06, 8.299946784973145e-06, 8.825212717056274e-06, 9.350478649139404e-06, 9.875744581222534e-06, 1.0401010513305664e-05, 1.0926276445388794e-05, 1.1451542377471924e-05, 1.1976808309555054e-05, 1.2502074241638184e-05, 1.3027340173721313e-05, 1.3552606105804443e-05, 1.4077872037887573e-05, 1.4603137969970703e-05]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 35.0, 240.0, 634.0, 78.0, 12.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20908275246620178, -0.20536312460899353, -0.20164349675178528, -0.19792388379573822, -0.19420425593852997, -0.19048462808132172, -0.18676500022411346, -0.1830453723669052, -0.17932575941085815, -0.1756061315536499, -0.17188650369644165, -0.1681668907403946, -0.16444726288318634, -0.1607276350259781, -0.15700800716876984, -0.15328837931156158, -0.14956875145435333, -0.14584912359714508, -0.14212949573993683, -0.13840988278388977, -0.13469025492668152, -0.13097062706947327, -0.12725099921226501, -0.12353137880563736, -0.1198117583990097, -0.11609213054180145, -0.1123725101351738, -0.10865288227796555, -0.10493326187133789, -0.10121363401412964, -0.09749400615692139, -0.09377438575029373, -0.09005476534366608, -0.08633513748645782, -0.08261551707983017, -0.07889588922262192, -0.07517626881599426, -0.07145664095878601, -0.06773701310157776, -0.0640173926949501, -0.06029776483774185, -0.0565781407058239, -0.052858516573905945, -0.04913888871669769, -0.04541926458477974, -0.041699640452861786, -0.03798001632094383, -0.03426039218902588, -0.030540764331817627, -0.026821140199899673, -0.02310151420533657, -0.019381890073418617, -0.015662264078855515, -0.011942639946937561, -0.008223015815019608, -0.004503389820456505, -0.0007837656885385513, 0.002935859141871333, 0.006655483972281218, 0.010375108569860458, 0.014094733633100986, 0.017814358696341515, 0.021533982828259468, 0.02525360882282257, 0.028973232954740524]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 7.0, 3.0, 5.0, 8.0, 12.0, 14.0, 8.0, 17.0, 20.0, 24.0, 20.0, 37.0, 33.0, 36.0, 38.0, 42.0, 44.0, 39.0, 46.0, 48.0, 44.0, 45.0, 53.0, 35.0, 45.0, 34.0, 37.0, 32.0, 30.0, 31.0, 29.0, 17.0, 21.0, 11.0, 13.0, 5.0, 3.0, 5.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1010514497756958, -0.09765557199716568, -0.09425970166921616, -0.09086382389068604, -0.08746795356273651, -0.08407207578420639, -0.08067619800567627, -0.07728032767772675, -0.07388444989919662, -0.0704885721206665, -0.06709270179271698, -0.06369682401418686, -0.06030094996094704, -0.056905075907707214, -0.053509198129177094, -0.05011332407593727, -0.04671745002269745, -0.043321575969457626, -0.039925701916217804, -0.03652982413768768, -0.03313395008444786, -0.02973807603120804, -0.026342200115323067, -0.022946324199438095, -0.019550450146198273, -0.01615457609295845, -0.012758700177073479, -0.009362825192511082, -0.005966950207948685, -0.0025710761547088623, 0.0008247997611761093, 0.004220675677061081, 0.007616549730300903, 0.0110124247148633, 0.014408299699425697, 0.01780417561531067, 0.02120004966855049, 0.024595923721790314, 0.027991799637675285, 0.03138767555356026, 0.03478354960680008, 0.0381794236600399, 0.041575297713279724, 0.044971175491809845, 0.04836704954504967, 0.05176292359828949, 0.05515880137681961, 0.05855467543005943, 0.061950549483299255, 0.06534642726182938, 0.0687422975897789, 0.07213817536830902, 0.07553404569625854, 0.07892992347478867, 0.08232580125331879, 0.08572167158126831, 0.08911754935979843, 0.09251342713832855, 0.09590929746627808, 0.0993051752448082, 0.10270105302333832, 0.10609692335128784, 0.10949280112981796, 0.11288867890834808, 0.11628454923629761]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 3.0, 14.0, 9.0, 8.0, 9.0, 18.0, 72.0, 166.0, 1615.0, 4191893.0, 244.0, 84.0, 29.0, 15.0, 14.0, 6.0, 12.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07489013671875, -0.07224273681640625, -0.0695953369140625, -0.06694793701171875, -0.064300537109375, -0.06165313720703125, -0.0590057373046875, -0.05635833740234375, -0.0537109375, -0.05106353759765625, -0.0484161376953125, -0.04576873779296875, -0.043121337890625, -0.04047393798828125, -0.0378265380859375, -0.03517913818359375, -0.03253173828125, -0.02988433837890625, -0.0272369384765625, -0.02458953857421875, -0.021942138671875, -0.01929473876953125, -0.0166473388671875, -0.01399993896484375, -0.0113525390625, -0.00870513916015625, -0.0060577392578125, -0.00341033935546875, -0.000762939453125, 0.00188446044921875, 0.0045318603515625, 0.00717926025390625, 0.00982666015625, 0.01247406005859375, 0.0151214599609375, 0.01776885986328125, 0.020416259765625, 0.02306365966796875, 0.0257110595703125, 0.02835845947265625, 0.031005859375, 0.03365325927734375, 0.0363006591796875, 0.03894805908203125, 0.041595458984375, 0.04424285888671875, 0.0468902587890625, 0.04953765869140625, 0.05218505859375, 0.05483245849609375, 0.0574798583984375, 0.06012725830078125, 0.062774658203125, 0.06542205810546875, 0.0680694580078125, 0.07071685791015625, 0.0733642578125, 0.07601165771484375, 0.0786590576171875, 0.08130645751953125, 0.083953857421875, 0.08660125732421875, 0.0892486572265625, 0.09189605712890625, 0.09454345703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 1.0, 4.0, 12.0, 10.0, 9.0, 7.0, 15.0, 40.0, 119.0, 228.0, 256.0, 131.0, 47.0, 14.0, 8.0, 11.0, 9.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00737762451171875, -0.0071179866790771484, -0.006858348846435547, -0.006598711013793945, -0.006339073181152344, -0.006079435348510742, -0.005819797515869141, -0.005560159683227539, -0.0053005218505859375, -0.005040884017944336, -0.004781246185302734, -0.004521608352661133, -0.004261970520019531, -0.00400233268737793, -0.003742694854736328, -0.0034830570220947266, -0.003223419189453125, -0.0029637813568115234, -0.002704143524169922, -0.0024445056915283203, -0.0021848678588867188, -0.0019252300262451172, -0.0016655921936035156, -0.001405954360961914, -0.0011463165283203125, -0.0008866786956787109, -0.0006270408630371094, -0.0003674030303955078, -0.00010776519775390625, 0.0001518726348876953, 0.0004115104675292969, 0.0006711483001708984, 0.0009307861328125, 0.0011904239654541016, 0.0014500617980957031, 0.0017096996307373047, 0.0019693374633789062, 0.002228975296020508, 0.0024886131286621094, 0.002748250961303711, 0.0030078887939453125, 0.003267526626586914, 0.0035271644592285156, 0.003786802291870117, 0.004046440124511719, 0.00430607795715332, 0.004565715789794922, 0.0048253536224365234, 0.005084991455078125, 0.0053446292877197266, 0.005604267120361328, 0.00586390495300293, 0.006123542785644531, 0.006383180618286133, 0.006642818450927734, 0.006902456283569336, 0.0071620941162109375, 0.007421731948852539, 0.007681369781494141, 0.007941007614135742, 0.008200645446777344, 0.008460283279418945, 0.008719921112060547, 0.008979558944702148, 0.00923919677734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 5.0, 13.0, 38.0, 117.0, 422.0, 1267.0, 81219.0, 4109075.0, 1471.0, 421.0, 126.0, 58.0, 21.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0125732421875, -0.01220393180847168, -0.01183462142944336, -0.011465311050415039, -0.011096000671386719, -0.010726690292358398, -0.010357379913330078, -0.009988069534301758, -0.009618759155273438, -0.009249448776245117, -0.008880138397216797, -0.008510828018188477, -0.008141517639160156, -0.007772207260131836, -0.007402896881103516, -0.007033586502075195, -0.006664276123046875, -0.006294965744018555, -0.005925655364990234, -0.005556344985961914, -0.005187034606933594, -0.0048177242279052734, -0.004448413848876953, -0.004079103469848633, -0.0037097930908203125, -0.003340482711791992, -0.002971172332763672, -0.0026018619537353516, -0.0022325515747070312, -0.001863241195678711, -0.0014939308166503906, -0.0011246204376220703, -0.00075531005859375, -0.0003859996795654297, -1.6689300537109375e-05, 0.00035262107849121094, 0.0007219314575195312, 0.0010912418365478516, 0.0014605522155761719, 0.0018298625946044922, 0.0021991729736328125, 0.002568483352661133, 0.002937793731689453, 0.0033071041107177734, 0.0036764144897460938, 0.004045724868774414, 0.004415035247802734, 0.004784345626831055, 0.005153656005859375, 0.005522966384887695, 0.005892276763916016, 0.006261587142944336, 0.006630897521972656, 0.0070002079010009766, 0.007369518280029297, 0.007738828659057617, 0.008108139038085938, 0.008477449417114258, 0.008846759796142578, 0.009216070175170898, 0.009585380554199219, 0.009954690933227539, 0.01032400131225586, 0.01069331169128418, 0.0110626220703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 16.0, 36.0, 155.0, 3775.0, 51.0, 17.0, 5.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028514862060546875, -0.002742379903793335, -0.0026332736015319824, -0.00252416729927063, -0.0024150609970092773, -0.002305954694747925, -0.0021968483924865723, -0.0020877420902252197, -0.001978635787963867, -0.0018695294857025146, -0.0017604231834411621, -0.0016513168811798096, -0.001542210578918457, -0.0014331042766571045, -0.001323997974395752, -0.0012148916721343994, -0.0011057853698730469, -0.0009966790676116943, -0.0008875727653503418, -0.0007784664630889893, -0.0006693601608276367, -0.0005602538585662842, -0.00045114755630493164, -0.0003420412540435791, -0.00023293495178222656, -0.00012382864952087402, -1.4722347259521484e-05, 9.438395500183105e-05, 0.0002034902572631836, 0.00031259655952453613, 0.00042170286178588867, 0.0005308091640472412, 0.0006399154663085938, 0.0007490217685699463, 0.0008581280708312988, 0.0009672343730926514, 0.001076340675354004, 0.0011854469776153564, 0.001294553279876709, 0.0014036595821380615, 0.001512765884399414, 0.0016218721866607666, 0.0017309784889221191, 0.0018400847911834717, 0.0019491910934448242, 0.0020582973957061768, 0.0021674036979675293, 0.002276510000228882, 0.0023856163024902344, 0.002494722604751587, 0.0026038289070129395, 0.002712935209274292, 0.0028220415115356445, 0.002931147813796997, 0.0030402541160583496, 0.003149360418319702, 0.0032584667205810547, 0.0033675730228424072, 0.0034766793251037598, 0.0035857856273651123, 0.003694891929626465, 0.0038039982318878174, 0.00391310453414917, 0.0040222108364105225, 0.004131317138671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1001.0, 17.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001215107156895101, 0.0004822030896320939, 0.002179513219743967, 0.003876823466271162, 0.005574133712798357, 0.007271443959325552, 0.008968754671514034, 0.01066606491804123, 0.012363375164568424, 0.01406068541109562, 0.01575799658894539, 0.01745530590415001, 0.01915261521935463, 0.0208499263972044, 0.02254723757505417, 0.02424454689025879, 0.02594185620546341, 0.02763916552066803, 0.0293364766985178, 0.03103378787636757, 0.03273109719157219, 0.03442840650677681, 0.03612571954727173, 0.03782302886247635, 0.03952033817768097, 0.04121764749288559, 0.04291495680809021, 0.04461226984858513, 0.04630957916378975, 0.04800688847899437, 0.04970420151948929, 0.05140151083469391, 0.05309882014989853, 0.05479612946510315, 0.05649343878030777, 0.05819075182080269, 0.05988806113600731, 0.06158537045121193, 0.06328268349170685, 0.06497999280691147, 0.06667730212211609, 0.06837461143732071, 0.07007192075252533, 0.07176923006772995, 0.07346653938293457, 0.07516385614871979, 0.07686116546392441, 0.07855847477912903, 0.08025578409433365, 0.08195309340953827, 0.08365040272474289, 0.08534771203994751, 0.08704502880573273, 0.08874233812093735, 0.09043964743614197, 0.09213695675134659, 0.09383426606655121, 0.09553157538175583, 0.09722888469696045, 0.09892619401216507, 0.10062350332736969, 0.10232082009315491, 0.10401812940835953, 0.10571543872356415, 0.10741274803876877]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 10.0, 14.0, 29.0, 43.0, 63.0, 57.0, 91.0, 90.0, 112.0, 83.0, 92.0, 84.0, 73.0, 52.0, 33.0, 22.0, 19.0, 12.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006871998310089111, -0.006643389351665974, -0.006414780393242836, -0.006186171434819698, -0.005957562476396561, -0.005728953517973423, -0.005500344559550285, -0.005271735601127148, -0.00504312664270401, -0.004814517684280872, -0.004585908725857735, -0.004357299767434597, -0.004128690809011459, -0.0039000818505883217, -0.003671472892165184, -0.0034428639337420464, -0.0032142549753189087, -0.002985646016895771, -0.0027570370584726334, -0.0025284281000494957, -0.002299819141626358, -0.0020712101832032204, -0.0018426012247800827, -0.001613992266356945, -0.0013853833079338074, -0.0011567743495106697, -0.000928165391087532, -0.0006995564326643944, -0.0004709474742412567, -0.00024233851581811905, -1.3729557394981384e-05, 0.00021487940102815628, 0.00044348835945129395, 0.0006720973178744316, 0.0009007062762975693, 0.001129315234720707, 0.0013579241931438446, 0.0015865331515669823, 0.00181514210999012, 0.0020437510684132576, 0.0022723600268363953, 0.002500968985259533, 0.0027295779436826706, 0.0029581869021058083, 0.003186795860528946, 0.0034154048189520836, 0.0036440137773752213, 0.003872622735798359, 0.004101231694221497, 0.004329840652644634, 0.004558449611067772, 0.00478705856949091, 0.005015667527914047, 0.005244276486337185, 0.005472885444760323, 0.00570149440318346, 0.005930103361606598, 0.0061587123200297356, 0.006387321278452873, 0.006615930236876011, 0.0068445391952991486, 0.007073148153722286, 0.007301757112145424, 0.0075303660705685616, 0.007758975028991699]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 13.0, 14.0, 17.0, 27.0, 25.0, 54.0, 69.0, 89.0, 164.0, 229.0, 364.0, 529.0, 855.0, 1397.0, 2572.0, 4858.0, 10688.0, 37155.0, 900380.0, 62487.0, 13481.0, 5897.0, 2922.0, 1634.0, 950.0, 595.0, 356.0, 234.0, 159.0, 104.0, 74.0, 55.0, 25.0, 23.0, 19.0, 7.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0219573974609375, -0.02134084701538086, -0.02072429656982422, -0.020107746124267578, -0.019491195678710938, -0.018874645233154297, -0.018258094787597656, -0.017641544342041016, -0.017024993896484375, -0.016408443450927734, -0.015791893005371094, -0.015175342559814453, -0.014558792114257812, -0.013942241668701172, -0.013325691223144531, -0.01270914077758789, -0.01209259033203125, -0.01147603988647461, -0.010859489440917969, -0.010242938995361328, -0.009626388549804688, -0.009009838104248047, -0.008393287658691406, -0.007776737213134766, -0.007160186767578125, -0.006543636322021484, -0.005927085876464844, -0.005310535430908203, -0.0046939849853515625, -0.004077434539794922, -0.0034608840942382812, -0.0028443336486816406, -0.002227783203125, -0.0016112327575683594, -0.0009946823120117188, -0.0003781318664550781, 0.0002384185791015625, 0.0008549690246582031, 0.0014715194702148438, 0.0020880699157714844, 0.002704620361328125, 0.0033211708068847656, 0.003937721252441406, 0.004554271697998047, 0.0051708221435546875, 0.005787372589111328, 0.006403923034667969, 0.007020473480224609, 0.00763702392578125, 0.00825357437133789, 0.008870124816894531, 0.009486675262451172, 0.010103225708007812, 0.010719776153564453, 0.011336326599121094, 0.011952877044677734, 0.012569427490234375, 0.013185977935791016, 0.013802528381347656, 0.014419078826904297, 0.015035629272460938, 0.015652179718017578, 0.01626873016357422, 0.01688528060913086, 0.0175018310546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 1.0, 4.0, 12.0, 10.0, 9.0, 7.0, 15.0, 41.0, 118.0, 230.0, 255.0, 131.0, 46.0, 14.0, 8.0, 10.0, 10.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007373809814453125, -0.007114231586456299, -0.006854653358459473, -0.0065950751304626465, -0.00633549690246582, -0.006075918674468994, -0.005816340446472168, -0.005556762218475342, -0.005297183990478516, -0.0050376057624816895, -0.004778027534484863, -0.004518449306488037, -0.004258871078491211, -0.003999292850494385, -0.0037397146224975586, -0.0034801363945007324, -0.0032205581665039062, -0.00296097993850708, -0.002701401710510254, -0.0024418234825134277, -0.0021822452545166016, -0.0019226670265197754, -0.0016630887985229492, -0.001403510570526123, -0.0011439323425292969, -0.0008843541145324707, -0.0006247758865356445, -0.00036519765853881836, -0.00010561943054199219, 0.00015395879745483398, 0.00041353702545166016, 0.0006731152534484863, 0.0009326934814453125, 0.0011922717094421387, 0.0014518499374389648, 0.001711428165435791, 0.001971006393432617, 0.0022305846214294434, 0.0024901628494262695, 0.0027497410774230957, 0.003009319305419922, 0.003268897533416748, 0.0035284757614135742, 0.0037880539894104004, 0.0040476322174072266, 0.004307210445404053, 0.004566788673400879, 0.004826366901397705, 0.005085945129394531, 0.005345523357391357, 0.005605101585388184, 0.00586467981338501, 0.006124258041381836, 0.006383836269378662, 0.006643414497375488, 0.0069029927253723145, 0.007162570953369141, 0.007422149181365967, 0.007681727409362793, 0.00794130563735962, 0.008200883865356445, 0.008460462093353271, 0.008720040321350098, 0.008979618549346924, 0.00923919677734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 3.0, 4.0, 7.0, 11.0, 12.0, 17.0, 23.0, 26.0, 33.0, 27.0, 40.0, 55.0, 63.0, 90.0, 138.0, 244.0, 404.0, 768.0, 1681.0, 9253.0, 1018456.0, 13366.0, 1790.0, 783.0, 422.0, 241.0, 154.0, 104.0, 96.0, 50.0, 33.0, 34.0, 27.0, 20.0, 17.0, 12.0, 10.0, 7.0, 11.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03839111328125, -0.03721141815185547, -0.03603172302246094, -0.034852027893066406, -0.033672332763671875, -0.032492637634277344, -0.03131294250488281, -0.03013324737548828, -0.02895355224609375, -0.02777385711669922, -0.026594161987304688, -0.025414466857910156, -0.024234771728515625, -0.023055076599121094, -0.021875381469726562, -0.02069568634033203, -0.0195159912109375, -0.01833629608154297, -0.017156600952148438, -0.015976905822753906, -0.014797210693359375, -0.013617515563964844, -0.012437820434570312, -0.011258125305175781, -0.01007843017578125, -0.008898735046386719, -0.0077190399169921875, -0.006539344787597656, -0.005359649658203125, -0.004179954528808594, -0.0030002593994140625, -0.0018205642700195312, -0.000640869140625, 0.0005388259887695312, 0.0017185211181640625, 0.0028982162475585938, 0.004077911376953125, 0.005257606506347656, 0.0064373016357421875, 0.007616996765136719, 0.00879669189453125, 0.009976387023925781, 0.011156082153320312, 0.012335777282714844, 0.013515472412109375, 0.014695167541503906, 0.015874862670898438, 0.01705455780029297, 0.0182342529296875, 0.01941394805908203, 0.020593643188476562, 0.021773338317871094, 0.022953033447265625, 0.024132728576660156, 0.025312423706054688, 0.02649211883544922, 0.02767181396484375, 0.02885150909423828, 0.030031204223632812, 0.031210899353027344, 0.032390594482421875, 0.033570289611816406, 0.03474998474121094, 0.03592967987060547, 0.037109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 6.0, 3.0, 2.0, 9.0, 11.0, 11.0, 16.0, 23.0, 24.0, 27.0, 21.0, 31.0, 25.0, 34.0, 32.0, 30.0, 35.0, 37.0, 32.0, 39.0, 48.0, 45.0, 29.0, 51.0, 27.0, 41.0, 33.0, 25.0, 37.0, 41.0, 25.0, 25.0, 23.0, 19.0, 15.0, 17.0, 11.0, 8.0, 6.0, 12.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0205078125, -0.019878387451171875, -0.01924896240234375, -0.018619537353515625, -0.0179901123046875, -0.017360687255859375, -0.01673126220703125, -0.016101837158203125, -0.015472412109375, -0.014842987060546875, -0.01421356201171875, -0.013584136962890625, -0.0129547119140625, -0.012325286865234375, -0.01169586181640625, -0.011066436767578125, -0.01043701171875, -0.009807586669921875, -0.00917816162109375, -0.008548736572265625, -0.0079193115234375, -0.007289886474609375, -0.00666046142578125, -0.006031036376953125, -0.005401611328125, -0.004772186279296875, -0.00414276123046875, -0.003513336181640625, -0.0028839111328125, -0.002254486083984375, -0.00162506103515625, -0.000995635986328125, -0.0003662109375, 0.000263214111328125, 0.00089263916015625, 0.001522064208984375, 0.0021514892578125, 0.002780914306640625, 0.00341033935546875, 0.004039764404296875, 0.004669189453125, 0.005298614501953125, 0.00592803955078125, 0.006557464599609375, 0.0071868896484375, 0.007816314697265625, 0.00844573974609375, 0.009075164794921875, 0.00970458984375, 0.010334014892578125, 0.01096343994140625, 0.011592864990234375, 0.0122222900390625, 0.012851715087890625, 0.01348114013671875, 0.014110565185546875, 0.014739990234375, 0.015369415283203125, 0.01599884033203125, 0.016628265380859375, 0.0172576904296875, 0.017887115478515625, 0.01851654052734375, 0.019145965576171875, 0.019775390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 8.0, 6.0, 8.0, 17.0, 15.0, 26.0, 59.0, 70.0, 137.0, 358.0, 1287.0, 34820.0, 1002748.0, 7744.0, 759.0, 209.0, 120.0, 53.0, 40.0, 17.0, 16.0, 9.0, 10.0, 7.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1517276763916016e-05, -2.0829960703849792e-05, -2.014264464378357e-05, -1.9455328583717346e-05, -1.8768012523651123e-05, -1.80806964635849e-05, -1.7393380403518677e-05, -1.6706064343452454e-05, -1.601874828338623e-05, -1.5331432223320007e-05, -1.4644116163253784e-05, -1.3956800103187561e-05, -1.3269484043121338e-05, -1.2582167983055115e-05, -1.1894851922988892e-05, -1.1207535862922668e-05, -1.0520219802856445e-05, -9.832903742790222e-06, -9.145587682723999e-06, -8.458271622657776e-06, -7.770955562591553e-06, -7.08363950252533e-06, -6.3963234424591064e-06, -5.709007382392883e-06, -5.02169132232666e-06, -4.334375262260437e-06, -3.647059202194214e-06, -2.9597431421279907e-06, -2.2724270820617676e-06, -1.5851110219955444e-06, -8.977949619293213e-07, -2.1047890186309814e-07, 4.76837158203125e-07, 1.1641532182693481e-06, 1.8514692783355713e-06, 2.5387853384017944e-06, 3.2261013984680176e-06, 3.913417458534241e-06, 4.600733518600464e-06, 5.288049578666687e-06, 5.97536563873291e-06, 6.662681698799133e-06, 7.3499977588653564e-06, 8.03731381893158e-06, 8.724629878997803e-06, 9.411945939064026e-06, 1.0099261999130249e-05, 1.0786578059196472e-05, 1.1473894119262695e-05, 1.2161210179328918e-05, 1.2848526239395142e-05, 1.3535842299461365e-05, 1.4223158359527588e-05, 1.4910474419593811e-05, 1.5597790479660034e-05, 1.6285106539726257e-05, 1.697242259979248e-05, 1.7659738659858704e-05, 1.8347054719924927e-05, 1.903437077999115e-05, 1.9721686840057373e-05, 2.0409002900123596e-05, 2.109631896018982e-05, 2.1783635020256042e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 10.0, 11.0, 16.0, 21.0, 22.0, 30.0, 51.0, 69.0, 111.0, 116.0, 150.0, 116.0, 73.0, 57.0, 32.0, 30.0, 23.0, 15.0, 8.0, 6.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-05, -1.0973773896694183e-05, -1.0622665286064148e-05, -1.0271556675434113e-05, -9.920448064804077e-06, -9.569339454174042e-06, -9.218230843544006e-06, -8.867122232913971e-06, -8.516013622283936e-06, -8.1649050116539e-06, -7.813796401023865e-06, -7.462687790393829e-06, -7.111579179763794e-06, -6.7604705691337585e-06, -6.409361958503723e-06, -6.058253347873688e-06, -5.707144737243652e-06, -5.356036126613617e-06, -5.0049275159835815e-06, -4.653818905353546e-06, -4.302710294723511e-06, -3.951601684093475e-06, -3.60049307346344e-06, -3.2493844628334045e-06, -2.898275852203369e-06, -2.5471672415733337e-06, -2.1960586309432983e-06, -1.844950020313263e-06, -1.4938414096832275e-06, -1.1427327990531921e-06, -7.916241884231567e-07, -4.4051557779312134e-07, -8.940696716308594e-08, 2.6170164346694946e-07, 6.128102540969849e-07, 9.639188647270203e-07, 1.3150274753570557e-06, 1.666136085987091e-06, 2.0172446966171265e-06, 2.368353307247162e-06, 2.7194619178771973e-06, 3.0705705285072327e-06, 3.421679139137268e-06, 3.7727877497673035e-06, 4.123896360397339e-06, 4.475004971027374e-06, 4.82611358165741e-06, 5.177222192287445e-06, 5.5283308029174805e-06, 5.879439413547516e-06, 6.230548024177551e-06, 6.581656634807587e-06, 6.932765245437622e-06, 7.2838738560676575e-06, 7.634982466697693e-06, 7.986091077327728e-06, 8.337199687957764e-06, 8.688308298587799e-06, 9.039416909217834e-06, 9.39052551984787e-06, 9.741634130477905e-06, 1.009274274110794e-05, 1.0443851351737976e-05, 1.0794959962368011e-05, 1.1146068572998047e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 5.0, 9.0, 7.0, 13.0, 24.0, 36.0, 55.0, 118.0, 333.0, 1906.0, 1043067.0, 2321.0, 365.0, 123.0, 72.0, 34.0, 23.0, 15.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9591064453125e-05, -4.791188985109329e-05, -4.6232715249061584e-05, -4.455354064702988e-05, -4.287436604499817e-05, -4.119519144296646e-05, -3.9516016840934753e-05, -3.7836842238903046e-05, -3.615766763687134e-05, -3.447849303483963e-05, -3.279931843280792e-05, -3.1120143830776215e-05, -2.9440969228744507e-05, -2.77617946267128e-05, -2.608262002468109e-05, -2.4403445422649384e-05, -2.2724270820617676e-05, -2.1045096218585968e-05, -1.936592161655426e-05, -1.7686747014522552e-05, -1.6007572412490845e-05, -1.4328397810459137e-05, -1.264922320842743e-05, -1.0970048606395721e-05, -9.290874004364014e-06, -7.611699402332306e-06, -5.932524800300598e-06, -4.25335019826889e-06, -2.5741755962371826e-06, -8.950009942054749e-07, 7.841736078262329e-07, 2.4633482098579407e-06, 4.1425228118896484e-06, 5.821697413921356e-06, 7.500872015953064e-06, 9.180046617984772e-06, 1.085922122001648e-05, 1.2538395822048187e-05, 1.4217570424079895e-05, 1.5896745026111603e-05, 1.757591962814331e-05, 1.925509423017502e-05, 2.0934268832206726e-05, 2.2613443434238434e-05, 2.429261803627014e-05, 2.597179263830185e-05, 2.7650967240333557e-05, 2.9330141842365265e-05, 3.100931644439697e-05, 3.268849104642868e-05, 3.436766564846039e-05, 3.6046840250492096e-05, 3.7726014852523804e-05, 3.940518945455551e-05, 4.108436405658722e-05, 4.276353865861893e-05, 4.4442713260650635e-05, 4.612188786268234e-05, 4.780106246471405e-05, 4.948023706674576e-05, 5.1159411668777466e-05, 5.2838586270809174e-05, 5.451776087284088e-05, 5.619693547487259e-05, 5.78761100769043e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 4.0, 7.0, 11.0, 13.0, 22.0, 29.0, 55.0, 130.0, 440.0, 107.0, 65.0, 35.0, 28.0, 9.0, 12.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6524066925048828e-05, -2.5626271963119507e-05, -2.4728477001190186e-05, -2.3830682039260864e-05, -2.2932887077331543e-05, -2.203509211540222e-05, -2.11372971534729e-05, -2.023950219154358e-05, -1.9341707229614258e-05, -1.8443912267684937e-05, -1.7546117305755615e-05, -1.6648322343826294e-05, -1.5750527381896973e-05, -1.4852732419967651e-05, -1.395493745803833e-05, -1.3057142496109009e-05, -1.2159347534179688e-05, -1.1261552572250366e-05, -1.0363757610321045e-05, -9.465962648391724e-06, -8.568167686462402e-06, -7.670372724533081e-06, -6.77257776260376e-06, -5.8747828006744385e-06, -4.976987838745117e-06, -4.079192876815796e-06, -3.1813979148864746e-06, -2.2836029529571533e-06, -1.385807991027832e-06, -4.880130290985107e-07, 4.0978193283081055e-07, 1.3075768947601318e-06, 2.205371856689453e-06, 3.1031668186187744e-06, 4.000961780548096e-06, 4.898756742477417e-06, 5.796551704406738e-06, 6.6943466663360596e-06, 7.592141628265381e-06, 8.489936590194702e-06, 9.387731552124023e-06, 1.0285526514053345e-05, 1.1183321475982666e-05, 1.2081116437911987e-05, 1.2978911399841309e-05, 1.387670636177063e-05, 1.4774501323699951e-05, 1.5672296285629272e-05, 1.6570091247558594e-05, 1.7467886209487915e-05, 1.8365681171417236e-05, 1.9263476133346558e-05, 2.016127109527588e-05, 2.10590660572052e-05, 2.195686101913452e-05, 2.2854655981063843e-05, 2.3752450942993164e-05, 2.4650245904922485e-05, 2.5548040866851807e-05, 2.6445835828781128e-05, 2.734363079071045e-05, 2.824142575263977e-05, 2.9139220714569092e-05, 3.0037015676498413e-05, 3.0934810638427734e-05]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 121.0, 854.0, 30.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07917436212301254, -0.07066558301448822, -0.062156811356544495, -0.05364803597331047, -0.04513926059007645, -0.03663048520684242, -0.0281217098236084, -0.019612934440374374, -0.01110415905714035, -0.0025953836739063263, 0.005913391709327698, 0.014422167092561722, 0.022930942475795746, 0.03143971785902977, 0.039948493242263794, 0.04845726862549782, 0.05696604400873184, 0.06547482311725616, 0.07398359477519989, 0.08249236643314362, 0.09100114554166794, 0.09950992465019226, 0.10801869630813599, 0.11652746796607971, 0.12503623962402344, 0.13354501128196716, 0.1420537829399109, 0.1505625694990158, 0.15907134115695953, 0.16758011281490326, 0.17608889937400818, 0.1845976710319519, 0.19310647249221802, 0.20161524415016174, 0.21012401580810547, 0.2186328023672104, 0.2271415740251541, 0.23565034568309784, 0.24415913224220276, 0.2526679039001465, 0.2611766755580902, 0.26968544721603394, 0.27819421887397766, 0.2867029905319214, 0.2952117919921875, 0.3037205636501312, 0.31222933530807495, 0.3207381069660187, 0.3292468786239624, 0.33775565028190613, 0.34626442193984985, 0.3547731935977936, 0.3632819652557373, 0.3717907667160034, 0.38029953837394714, 0.38880831003189087, 0.3973170816898346, 0.4058258533477783, 0.41433462500572205, 0.42284339666366577, 0.4313521981239319, 0.4398609697818756, 0.44836974143981934, 0.45687851309776306, 0.4653872847557068]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 10.0, 14.0, 11.0, 22.0, 24.0, 27.0, 38.0, 28.0, 39.0, 48.0, 59.0, 65.0, 50.0, 53.0, 48.0, 57.0, 54.0, 48.0, 47.0, 41.0, 36.0, 35.0, 21.0, 23.0, 22.0, 18.0, 17.0, 9.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15125852823257446, -0.14704565703868866, -0.14283278584480286, -0.13861992955207825, -0.13440705835819244, -0.13019418716430664, -0.12598131597042084, -0.12176844477653503, -0.11755558103322983, -0.11334270983934402, -0.10912984609603882, -0.10491697490215302, -0.10070410370826721, -0.096491239964962, -0.0922783687710762, -0.088065505027771, -0.08385263383388519, -0.07963976263999939, -0.07542689889669418, -0.07121402770280838, -0.06700116395950317, -0.06278829276561737, -0.05857542157173157, -0.05436255410313606, -0.05014968663454056, -0.04593681916594505, -0.04172395169734955, -0.037511080503463745, -0.03329821303486824, -0.029085345566272736, -0.02487247623503208, -0.020659606903791428, -0.016446739435195923, -0.012233871035277843, -0.008021002635359764, -0.0038081342354416847, 0.00040473416447639465, 0.004617601633071899, 0.008830470964312553, 0.013043340295553207, 0.017256207764148712, 0.021469075232744217, 0.02568194456398487, 0.029894813895225525, 0.03410768136382103, 0.038320548832416534, 0.04253342002630234, 0.04674628749489784, 0.05095915496349335, 0.05517202243208885, 0.05938488990068436, 0.06359776109457016, 0.06781062483787537, 0.07202349603176117, 0.07623636722564697, 0.08044923841953278, 0.08466210216283798, 0.08887497335672379, 0.09308783710002899, 0.0973007082939148, 0.1015135794878006, 0.1057264432311058, 0.10993931442499161, 0.11415217816829681, 0.11836504936218262]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 5.0, 10.0, 7.0, 12.0, 25.0, 23.0, 19.0, 41.0, 44.0, 735.0, 3518.0, 4094215.0, 93020.0, 2069.0, 274.0, 39.0, 35.0, 24.0, 28.0, 16.0, 16.0, 12.0, 10.0, 10.0, 9.0, 4.0, 8.0, 2.0, 10.0, 2.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0151824951171875, -0.014658451080322266, -0.014134407043457031, -0.013610363006591797, -0.013086318969726562, -0.012562274932861328, -0.012038230895996094, -0.01151418685913086, -0.010990142822265625, -0.01046609878540039, -0.009942054748535156, -0.009418010711669922, -0.008893966674804688, -0.008369922637939453, -0.007845878601074219, -0.007321834564208984, -0.00679779052734375, -0.006273746490478516, -0.005749702453613281, -0.005225658416748047, -0.0047016143798828125, -0.004177570343017578, -0.0036535263061523438, -0.0031294822692871094, -0.002605438232421875, -0.0020813941955566406, -0.0015573501586914062, -0.0010333061218261719, -0.0005092620849609375, 1.4781951904296875e-05, 0.0005388259887695312, 0.0010628700256347656, 0.0015869140625, 0.0021109580993652344, 0.0026350021362304688, 0.003159046173095703, 0.0036830902099609375, 0.004207134246826172, 0.004731178283691406, 0.005255222320556641, 0.005779266357421875, 0.006303310394287109, 0.006827354431152344, 0.007351398468017578, 0.007875442504882812, 0.008399486541748047, 0.008923530578613281, 0.009447574615478516, 0.00997161865234375, 0.010495662689208984, 0.011019706726074219, 0.011543750762939453, 0.012067794799804688, 0.012591838836669922, 0.013115882873535156, 0.01363992691040039, 0.014163970947265625, 0.01468801498413086, 0.015212059020996094, 0.015736103057861328, 0.016260147094726562, 0.016784191131591797, 0.01730823516845703, 0.017832279205322266, 0.0183563232421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 3.0, 5.0, 14.0, 10.0, 10.0, 9.0, 25.0, 89.0, 184.0, 266.0, 184.0, 71.0, 18.0, 9.0, 11.0, 10.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007389068603515625, -0.007132232189178467, -0.006875395774841309, -0.00661855936050415, -0.006361722946166992, -0.006104886531829834, -0.005848050117492676, -0.005591213703155518, -0.005334377288818359, -0.005077540874481201, -0.004820704460144043, -0.004563868045806885, -0.0043070316314697266, -0.004050195217132568, -0.00379335880279541, -0.003536522388458252, -0.0032796859741210938, -0.0030228495597839355, -0.0027660131454467773, -0.002509176731109619, -0.002252340316772461, -0.0019955039024353027, -0.0017386674880981445, -0.0014818310737609863, -0.0012249946594238281, -0.0009681582450866699, -0.0007113218307495117, -0.0004544854164123535, -0.0001976490020751953, 5.918741226196289e-05, 0.0003160238265991211, 0.0005728602409362793, 0.0008296966552734375, 0.0010865330696105957, 0.001343369483947754, 0.0016002058982849121, 0.0018570423126220703, 0.0021138787269592285, 0.0023707151412963867, 0.002627551555633545, 0.002884387969970703, 0.0031412243843078613, 0.0033980607986450195, 0.0036548972129821777, 0.003911733627319336, 0.004168570041656494, 0.004425406455993652, 0.0046822428703308105, 0.004939079284667969, 0.005195915699005127, 0.005452752113342285, 0.005709588527679443, 0.0059664249420166016, 0.00622326135635376, 0.006480097770690918, 0.006736934185028076, 0.006993770599365234, 0.007250607013702393, 0.007507443428039551, 0.007764279842376709, 0.008021116256713867, 0.008277952671051025, 0.008534789085388184, 0.008791625499725342, 0.0090484619140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 27.0, 97.0, 317.0, 678.0, 2795.0, 4186952.0, 2259.0, 639.0, 334.0, 108.0, 35.0, 11.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0201416015625, -0.019408464431762695, -0.01867532730102539, -0.017942190170288086, -0.01720905303955078, -0.016475915908813477, -0.015742778778076172, -0.015009641647338867, -0.014276504516601562, -0.013543367385864258, -0.012810230255126953, -0.012077093124389648, -0.011343955993652344, -0.010610818862915039, -0.009877681732177734, -0.00914454460144043, -0.008411407470703125, -0.00767827033996582, -0.006945133209228516, -0.006211996078491211, -0.005478858947753906, -0.0047457218170166016, -0.004012584686279297, -0.003279447555541992, -0.0025463104248046875, -0.0018131732940673828, -0.0010800361633300781, -0.00034689903259277344, 0.00038623809814453125, 0.001119375228881836, 0.0018525123596191406, 0.0025856494903564453, 0.00331878662109375, 0.004051923751831055, 0.004785060882568359, 0.005518198013305664, 0.006251335144042969, 0.0069844722747802734, 0.007717609405517578, 0.008450746536254883, 0.009183883666992188, 0.009917020797729492, 0.010650157928466797, 0.011383295059204102, 0.012116432189941406, 0.012849569320678711, 0.013582706451416016, 0.01431584358215332, 0.015048980712890625, 0.01578211784362793, 0.016515254974365234, 0.01724839210510254, 0.017981529235839844, 0.01871466636657715, 0.019447803497314453, 0.020180940628051758, 0.020914077758789062, 0.021647214889526367, 0.022380352020263672, 0.023113489151000977, 0.02384662628173828, 0.024579763412475586, 0.02531290054321289, 0.026046037673950195, 0.0267791748046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 16.0, 24.0, 351.0, 3635.0, 33.0, 11.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0094451904296875, -0.009190082550048828, -0.008934974670410156, -0.008679866790771484, -0.008424758911132812, -0.00816965103149414, -0.007914543151855469, -0.007659435272216797, -0.007404327392578125, -0.007149219512939453, -0.006894111633300781, -0.006639003753662109, -0.0063838958740234375, -0.006128787994384766, -0.005873680114746094, -0.005618572235107422, -0.00536346435546875, -0.005108356475830078, -0.004853248596191406, -0.004598140716552734, -0.0043430328369140625, -0.004087924957275391, -0.0038328170776367188, -0.003577709197998047, -0.003322601318359375, -0.003067493438720703, -0.0028123855590820312, -0.0025572776794433594, -0.0023021697998046875, -0.0020470619201660156, -0.0017919540405273438, -0.0015368461608886719, -0.00128173828125, -0.0010266304016113281, -0.0007715225219726562, -0.0005164146423339844, -0.0002613067626953125, -6.198883056640625e-06, 0.00024890899658203125, 0.0005040168762207031, 0.000759124755859375, 0.0010142326354980469, 0.0012693405151367188, 0.0015244483947753906, 0.0017795562744140625, 0.0020346641540527344, 0.0022897720336914062, 0.002544879913330078, 0.00279998779296875, 0.003055095672607422, 0.0033102035522460938, 0.0035653114318847656, 0.0038204193115234375, 0.004075527191162109, 0.004330635070800781, 0.004585742950439453, 0.004840850830078125, 0.005095958709716797, 0.005351066589355469, 0.005606174468994141, 0.0058612823486328125, 0.006116390228271484, 0.006371498107910156, 0.006626605987548828, 0.0068817138671875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 993.0, 14.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02370830811560154, -0.02196001075208187, -0.02021171525120735, -0.018463417887687683, -0.016715120524168015, -0.01496682409197092, -0.013218527659773827, -0.011470230296254158, -0.009721933864057064, -0.00797363743185997, -0.0062253400683403015, -0.0044770436361432076, -0.0027287467382848263, -0.000980449840426445, 0.000767846591770649, 0.0025161439552903175, 0.0042644403874874115, 0.006012737285345793, 0.007761034183204174, 0.009509330615401268, 0.011257627978920937, 0.01300592441111803, 0.014754220843315125, 0.016502518206834793, 0.01825081557035446, 0.01999911293387413, 0.02174740843474865, 0.023495705798268318, 0.025244003161787987, 0.026992298662662506, 0.028740596026182175, 0.030488893389701843, 0.03223719075322151, 0.03398548811674118, 0.03573378548026085, 0.03748208284378052, 0.03923037648200989, 0.040978673845529556, 0.042726971209049225, 0.04447526857256889, 0.04622356593608856, 0.04797186329960823, 0.0497201606631279, 0.05146845430135727, 0.05321675166487694, 0.054965049028396606, 0.056713346391916275, 0.058461643755435944, 0.060209937393665314, 0.06195823475718498, 0.06370653212070465, 0.06545482575893402, 0.06720312684774399, 0.06895142048597336, 0.07069972157478333, 0.0724480152130127, 0.07419631630182266, 0.07594460994005203, 0.077692911028862, 0.07944120466709137, 0.08118950575590134, 0.0829377993941307, 0.08468610048294067, 0.08643439412117004, 0.08818268775939941]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 12.0, 21.0, 24.0, 43.0, 38.0, 60.0, 80.0, 75.0, 86.0, 106.0, 109.0, 91.0, 67.0, 49.0, 39.0, 33.0, 24.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01140064001083374, -0.011000651866197586, -0.010600663721561432, -0.010200675576925278, -0.009800687432289124, -0.00940069928765297, -0.009000711143016815, -0.008600722998380661, -0.008200734853744507, -0.007800746709108353, -0.0074007585644721985, -0.007000770419836044, -0.00660078227519989, -0.006200794130563736, -0.005800805985927582, -0.005400817841291428, -0.0050008296966552734, -0.004600841552019119, -0.004200853407382965, -0.003800865262746811, -0.0034008771181106567, -0.0030008889734745026, -0.0026009008288383484, -0.002200912684202194, -0.00180092453956604, -0.0014009363949298859, -0.0010009482502937317, -0.0006009601056575775, -0.00020097196102142334, 0.00019901618361473083, 0.000599004328250885, 0.0009989924728870392, 0.0013989806175231934, 0.0017989687621593475, 0.0021989569067955017, 0.002598945051431656, 0.00299893319606781, 0.0033989213407039642, 0.0037989094853401184, 0.004198897629976273, 0.004598885774612427, 0.004998873919248581, 0.005398862063884735, 0.005798850208520889, 0.0061988383531570435, 0.006598826497793198, 0.006998814642429352, 0.007398802787065506, 0.00779879093170166, 0.008198779076337814, 0.008598767220973969, 0.008998755365610123, 0.009398743510246277, 0.009798731654882431, 0.010198719799518585, 0.01059870794415474, 0.010998696088790894, 0.011398684233427048, 0.011798672378063202, 0.012198660522699356, 0.01259864866733551, 0.012998636811971664, 0.013398624956607819, 0.013798613101243973, 0.014198601245880127]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 8.0, 8.0, 6.0, 14.0, 18.0, 26.0, 33.0, 46.0, 89.0, 143.0, 269.0, 466.0, 864.0, 1899.0, 4055.0, 11287.0, 63361.0, 927677.0, 25599.0, 6909.0, 2770.0, 1331.0, 721.0, 359.0, 198.0, 130.0, 93.0, 59.0, 34.0, 27.0, 17.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0181427001953125, -0.017628788948059082, -0.017114877700805664, -0.016600966453552246, -0.016087055206298828, -0.01557314395904541, -0.015059232711791992, -0.014545321464538574, -0.014031410217285156, -0.013517498970031738, -0.01300358772277832, -0.012489676475524902, -0.011975765228271484, -0.011461853981018066, -0.010947942733764648, -0.01043403148651123, -0.009920120239257812, -0.009406208992004395, -0.008892297744750977, -0.008378386497497559, -0.00786447525024414, -0.007350564002990723, -0.006836652755737305, -0.006322741508483887, -0.005808830261230469, -0.005294919013977051, -0.004781007766723633, -0.004267096519470215, -0.003753185272216797, -0.003239274024963379, -0.002725362777709961, -0.002211451530456543, -0.001697540283203125, -0.001183629035949707, -0.0006697177886962891, -0.0001558065414428711, 0.0003581047058105469, 0.0008720159530639648, 0.0013859272003173828, 0.0018998384475708008, 0.0024137496948242188, 0.0029276609420776367, 0.0034415721893310547, 0.003955483436584473, 0.004469394683837891, 0.004983305931091309, 0.0054972171783447266, 0.0060111284255981445, 0.0065250396728515625, 0.0070389509201049805, 0.0075528621673583984, 0.008066773414611816, 0.008580684661865234, 0.009094595909118652, 0.00960850715637207, 0.010122418403625488, 0.010636329650878906, 0.011150240898132324, 0.011664152145385742, 0.01217806339263916, 0.012691974639892578, 0.013205885887145996, 0.013719797134399414, 0.014233708381652832, 0.01474761962890625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 5.0, 14.0, 10.0, 10.0, 9.0, 25.0, 88.0, 182.0, 265.0, 188.0, 69.0, 20.0, 9.0, 11.0, 10.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007396697998046875, -0.007139742374420166, -0.006882786750793457, -0.006625831127166748, -0.006368875503540039, -0.00611191987991333, -0.005854964256286621, -0.005598008632659912, -0.005341053009033203, -0.005084097385406494, -0.004827141761779785, -0.004570186138153076, -0.004313230514526367, -0.004056274890899658, -0.0037993192672729492, -0.0035423636436462402, -0.0032854080200195312, -0.0030284523963928223, -0.0027714967727661133, -0.0025145411491394043, -0.0022575855255126953, -0.0020006299018859863, -0.0017436742782592773, -0.0014867186546325684, -0.0012297630310058594, -0.0009728074073791504, -0.0007158517837524414, -0.0004588961601257324, -0.00020194053649902344, 5.501508712768555e-05, 0.00031197071075439453, 0.0005689263343811035, 0.0008258819580078125, 0.0010828375816345215, 0.0013397932052612305, 0.0015967488288879395, 0.0018537044525146484, 0.0021106600761413574, 0.0023676156997680664, 0.0026245713233947754, 0.0028815269470214844, 0.0031384825706481934, 0.0033954381942749023, 0.0036523938179016113, 0.00390934944152832, 0.004166305065155029, 0.004423260688781738, 0.004680216312408447, 0.004937171936035156, 0.005194127559661865, 0.005451083183288574, 0.005708038806915283, 0.005964994430541992, 0.006221950054168701, 0.00647890567779541, 0.006735861301422119, 0.006992816925048828, 0.007249772548675537, 0.007506728172302246, 0.007763683795928955, 0.008020639419555664, 0.008277595043182373, 0.008534550666809082, 0.008791506290435791, 0.0090484619140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 8.0, 2.0, 10.0, 11.0, 11.0, 13.0, 20.0, 25.0, 31.0, 26.0, 44.0, 45.0, 71.0, 91.0, 131.0, 190.0, 343.0, 767.0, 2016.0, 31238.0, 1004130.0, 6436.0, 1385.0, 563.0, 241.0, 190.0, 115.0, 89.0, 60.0, 52.0, 40.0, 25.0, 24.0, 19.0, 21.0, 9.0, 13.0, 11.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0275421142578125, -0.026662826538085938, -0.025783538818359375, -0.024904251098632812, -0.02402496337890625, -0.023145675659179688, -0.022266387939453125, -0.021387100219726562, -0.0205078125, -0.019628524780273438, -0.018749237060546875, -0.017869949340820312, -0.01699066162109375, -0.016111373901367188, -0.015232086181640625, -0.014352798461914062, -0.0134735107421875, -0.012594223022460938, -0.011714935302734375, -0.010835647583007812, -0.00995635986328125, -0.009077072143554688, -0.008197784423828125, -0.0073184967041015625, -0.006439208984375, -0.0055599212646484375, -0.004680633544921875, -0.0038013458251953125, -0.00292205810546875, -0.0020427703857421875, -0.001163482666015625, -0.0002841949462890625, 0.0005950927734375, 0.0014743804931640625, 0.002353668212890625, 0.0032329559326171875, 0.00411224365234375, 0.0049915313720703125, 0.005870819091796875, 0.0067501068115234375, 0.00762939453125, 0.008508682250976562, 0.009387969970703125, 0.010267257690429688, 0.01114654541015625, 0.012025833129882812, 0.012905120849609375, 0.013784408569335938, 0.0146636962890625, 0.015542984008789062, 0.016422271728515625, 0.017301559448242188, 0.01818084716796875, 0.019060134887695312, 0.019939422607421875, 0.020818710327148438, 0.021697998046875, 0.022577285766601562, 0.023456573486328125, 0.024335861206054688, 0.02521514892578125, 0.026094436645507812, 0.026973724365234375, 0.027853012084960938, 0.0287322998046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 2.0, 10.0, 11.0, 11.0, 12.0, 15.0, 22.0, 23.0, 20.0, 21.0, 23.0, 35.0, 28.0, 35.0, 38.0, 36.0, 39.0, 29.0, 55.0, 43.0, 39.0, 51.0, 31.0, 27.0, 44.0, 37.0, 35.0, 27.0, 30.0, 26.0, 21.0, 17.0, 16.0, 17.0, 7.0, 12.0, 11.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.01953125, -0.01890707015991211, -0.01828289031982422, -0.017658710479736328, -0.017034530639648438, -0.016410350799560547, -0.015786170959472656, -0.015161991119384766, -0.014537811279296875, -0.013913631439208984, -0.013289451599121094, -0.012665271759033203, -0.012041091918945312, -0.011416912078857422, -0.010792732238769531, -0.01016855239868164, -0.00954437255859375, -0.00892019271850586, -0.008296012878417969, -0.007671833038330078, -0.0070476531982421875, -0.006423473358154297, -0.005799293518066406, -0.005175113677978516, -0.004550933837890625, -0.003926753997802734, -0.0033025741577148438, -0.002678394317626953, -0.0020542144775390625, -0.0014300346374511719, -0.0008058547973632812, -0.00018167495727539062, 0.0004425048828125, 0.0010666847229003906, 0.0016908645629882812, 0.002315044403076172, 0.0029392242431640625, 0.003563404083251953, 0.004187583923339844, 0.004811763763427734, 0.005435943603515625, 0.006060123443603516, 0.006684303283691406, 0.007308483123779297, 0.007932662963867188, 0.008556842803955078, 0.009181022644042969, 0.00980520248413086, 0.01042938232421875, 0.01105356216430664, 0.011677742004394531, 0.012301921844482422, 0.012926101684570312, 0.013550281524658203, 0.014174461364746094, 0.014798641204833984, 0.015422821044921875, 0.016047000885009766, 0.016671180725097656, 0.017295360565185547, 0.017919540405273438, 0.018543720245361328, 0.01916790008544922, 0.01979207992553711, 0.020416259765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 1.0, 7.0, 9.0, 18.0, 20.0, 18.0, 45.0, 45.0, 66.0, 185.0, 246.0, 851.0, 2367.0, 27037.0, 951864.0, 58576.0, 5323.0, 972.0, 451.0, 149.0, 104.0, 69.0, 37.0, 24.0, 10.0, 14.0, 15.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-1.0192394256591797e-05, -9.928829967975616e-06, -9.665265679359436e-06, -9.401701390743256e-06, -9.138137102127075e-06, -8.874572813510895e-06, -8.611008524894714e-06, -8.347444236278534e-06, -8.083879947662354e-06, -7.820315659046173e-06, -7.556751370429993e-06, -7.293187081813812e-06, -7.029622793197632e-06, -6.766058504581451e-06, -6.502494215965271e-06, -6.2389299273490906e-06, -5.97536563873291e-06, -5.71180135011673e-06, -5.448237061500549e-06, -5.184672772884369e-06, -4.9211084842681885e-06, -4.657544195652008e-06, -4.393979907035828e-06, -4.130415618419647e-06, -3.866851329803467e-06, -3.6032870411872864e-06, -3.339722752571106e-06, -3.0761584639549255e-06, -2.812594175338745e-06, -2.5490298867225647e-06, -2.2854655981063843e-06, -2.021901309490204e-06, -1.7583370208740234e-06, -1.494772732257843e-06, -1.2312084436416626e-06, -9.676441550254822e-07, -7.040798664093018e-07, -4.4051557779312134e-07, -1.7695128917694092e-07, 8.66129994392395e-08, 3.501772880554199e-07, 6.137415766716003e-07, 8.773058652877808e-07, 1.1408701539039612e-06, 1.4044344425201416e-06, 1.667998731136322e-06, 1.9315630197525024e-06, 2.195127308368683e-06, 2.4586915969848633e-06, 2.7222558856010437e-06, 2.985820174217224e-06, 3.2493844628334045e-06, 3.512948751449585e-06, 3.7765130400657654e-06, 4.040077328681946e-06, 4.303641617298126e-06, 4.567205905914307e-06, 4.830770194530487e-06, 5.0943344831466675e-06, 5.357898771762848e-06, 5.621463060379028e-06, 5.885027348995209e-06, 6.148591637611389e-06, 6.41215592622757e-06, 6.67572021484375e-06]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 5.0, 14.0, 10.0, 13.0, 14.0, 21.0, 24.0, 55.0, 59.0, 83.0, 86.0, 204.0, 99.0, 77.0, 65.0, 62.0, 21.0, 15.0, 12.0, 12.0, 2.0, 5.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.450580596923828e-06, -7.257796823978424e-06, -7.06501305103302e-06, -6.872229278087616e-06, -6.679445505142212e-06, -6.486661732196808e-06, -6.293877959251404e-06, -6.101094186306e-06, -5.908310413360596e-06, -5.715526640415192e-06, -5.522742867469788e-06, -5.3299590945243835e-06, -5.1371753215789795e-06, -4.9443915486335754e-06, -4.751607775688171e-06, -4.558824002742767e-06, -4.366040229797363e-06, -4.173256456851959e-06, -3.980472683906555e-06, -3.787688910961151e-06, -3.594905138015747e-06, -3.402121365070343e-06, -3.209337592124939e-06, -3.016553819179535e-06, -2.823770046234131e-06, -2.630986273288727e-06, -2.4382025003433228e-06, -2.2454187273979187e-06, -2.0526349544525146e-06, -1.8598511815071106e-06, -1.6670674085617065e-06, -1.4742836356163025e-06, -1.2814998626708984e-06, -1.0887160897254944e-06, -8.959323167800903e-07, -7.031485438346863e-07, -5.103647708892822e-07, -3.175809979438782e-07, -1.2479722499847412e-07, 6.798654794692993e-08, 2.60770320892334e-07, 4.5355409383773804e-07, 6.463378667831421e-07, 8.391216397285461e-07, 1.0319054126739502e-06, 1.2246891856193542e-06, 1.4174729585647583e-06, 1.6102567315101624e-06, 1.8030405044555664e-06, 1.9958242774009705e-06, 2.1886080503463745e-06, 2.3813918232917786e-06, 2.5741755962371826e-06, 2.7669593691825867e-06, 2.9597431421279907e-06, 3.1525269150733948e-06, 3.345310688018799e-06, 3.538094460964203e-06, 3.730878233909607e-06, 3.923662006855011e-06, 4.116445779800415e-06, 4.309229552745819e-06, 4.502013325691223e-06, 4.694797098636627e-06, 4.887580871582031e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 8.0, 14.0, 14.0, 22.0, 39.0, 66.0, 113.0, 194.0, 647.0, 23591.0, 1022085.0, 1133.0, 314.0, 126.0, 63.0, 32.0, 21.0, 20.0, 8.0, 7.0, 5.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8298625946044922e-05, -1.7710961401462555e-05, -1.7123296856880188e-05, -1.653563231229782e-05, -1.5947967767715454e-05, -1.5360303223133087e-05, -1.477263867855072e-05, -1.4184974133968353e-05, -1.3597309589385986e-05, -1.300964504480362e-05, -1.2421980500221252e-05, -1.1834315955638885e-05, -1.1246651411056519e-05, -1.0658986866474152e-05, -1.0071322321891785e-05, -9.483657777309418e-06, -8.89599323272705e-06, -8.308328688144684e-06, -7.720664143562317e-06, -7.13299959897995e-06, -6.545335054397583e-06, -5.957670509815216e-06, -5.370005965232849e-06, -4.782341420650482e-06, -4.194676876068115e-06, -3.6070123314857483e-06, -3.0193477869033813e-06, -2.4316832423210144e-06, -1.8440186977386475e-06, -1.2563541531562805e-06, -6.686896085739136e-07, -8.102506399154663e-08, 5.066394805908203e-07, 1.0943040251731873e-06, 1.6819685697555542e-06, 2.269633114337921e-06, 2.857297658920288e-06, 3.444962203502655e-06, 4.032626748085022e-06, 4.620291292667389e-06, 5.207955837249756e-06, 5.795620381832123e-06, 6.38328492641449e-06, 6.970949470996857e-06, 7.558614015579224e-06, 8.14627856016159e-06, 8.733943104743958e-06, 9.321607649326324e-06, 9.909272193908691e-06, 1.0496936738491058e-05, 1.1084601283073425e-05, 1.1672265827655792e-05, 1.225993037223816e-05, 1.2847594916820526e-05, 1.3435259461402893e-05, 1.402292400598526e-05, 1.4610588550567627e-05, 1.5198253095149994e-05, 1.578591763973236e-05, 1.6373582184314728e-05, 1.6961246728897095e-05, 1.754891127347946e-05, 1.813657581806183e-05, 1.8724240362644196e-05, 1.9311904907226562e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 10.0, 14.0, 21.0, 31.0, 28.0, 46.0, 72.0, 95.0, 386.0, 70.0, 71.0, 47.0, 34.0, 10.0, 13.0, 10.0, 3.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2635253369808197e-05, -1.2217089533805847e-05, -1.1798925697803497e-05, -1.1380761861801147e-05, -1.0962598025798798e-05, -1.0544434189796448e-05, -1.0126270353794098e-05, -9.708106517791748e-06, -9.289942681789398e-06, -8.871778845787048e-06, -8.453615009784698e-06, -8.035451173782349e-06, -7.617287337779999e-06, -7.199123501777649e-06, -6.780959665775299e-06, -6.362795829772949e-06, -5.944631993770599e-06, -5.5264681577682495e-06, -5.1083043217659e-06, -4.69014048576355e-06, -4.2719766497612e-06, -3.85381281375885e-06, -3.4356489777565002e-06, -3.0174851417541504e-06, -2.5993213057518005e-06, -2.1811574697494507e-06, -1.7629936337471008e-06, -1.344829797744751e-06, -9.266659617424011e-07, -5.085021257400513e-07, -9.033828973770142e-08, 3.2782554626464844e-07, 7.459893822669983e-07, 1.1641532182693481e-06, 1.582317054271698e-06, 2.000480890274048e-06, 2.4186447262763977e-06, 2.8368085622787476e-06, 3.2549723982810974e-06, 3.6731362342834473e-06, 4.091300070285797e-06, 4.509463906288147e-06, 4.927627742290497e-06, 5.345791578292847e-06, 5.7639554142951965e-06, 6.182119250297546e-06, 6.600283086299896e-06, 7.018446922302246e-06, 7.436610758304596e-06, 7.854774594306946e-06, 8.272938430309296e-06, 8.691102266311646e-06, 9.109266102313995e-06, 9.527429938316345e-06, 9.945593774318695e-06, 1.0363757610321045e-05, 1.0781921446323395e-05, 1.1200085282325745e-05, 1.1618249118328094e-05, 1.2036412954330444e-05, 1.2454576790332794e-05, 1.2872740626335144e-05, 1.3290904462337494e-05, 1.3709068298339844e-05]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 40.0, 599.0, 346.0, 21.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10943986475467682, -0.10366286337375641, -0.0978858694434166, -0.09210887551307678, -0.08633187413215637, -0.08055487275123596, -0.07477787882089615, -0.06900088489055634, -0.06322388350963593, -0.057446885854005814, -0.0516698881983757, -0.04589289054274559, -0.04011589288711548, -0.03433889523148537, -0.028561897575855255, -0.022784899920225143, -0.017007902264595032, -0.01123090460896492, -0.005453906953334808, 0.00032309070229530334, 0.006100088357925415, 0.011877086013555527, 0.01765408366918564, 0.02343108132481575, 0.029208078980445862, 0.034985076636075974, 0.040762074291706085, 0.0465390719473362, 0.05231606960296631, 0.05809306725859642, 0.06387006491422653, 0.06964705884456635, 0.07542404532432556, 0.08120104670524597, 0.08697804063558578, 0.0927550345659256, 0.09853203594684601, 0.10430903732776642, 0.11008603125810623, 0.11586302518844604, 0.12164002656936646, 0.12741702795028687, 0.13319402933120728, 0.1389710158109665, 0.1447480171918869, 0.1505250185728073, 0.15630200505256653, 0.16207900643348694, 0.16785600781440735, 0.17363300919532776, 0.17941001057624817, 0.18518699705600739, 0.1909639984369278, 0.1967409998178482, 0.20251798629760742, 0.20829498767852783, 0.21407198905944824, 0.21984899044036865, 0.22562599182128906, 0.23140297830104828, 0.2371799796819687, 0.2429569810628891, 0.24873396754264832, 0.2545109689235687, 0.26028797030448914]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 5.0, 9.0, 8.0, 16.0, 7.0, 12.0, 14.0, 18.0, 16.0, 10.0, 21.0, 22.0, 26.0, 35.0, 37.0, 35.0, 36.0, 49.0, 47.0, 46.0, 50.0, 41.0, 38.0, 38.0, 56.0, 37.0, 35.0, 23.0, 29.0, 29.0, 38.0, 17.0, 28.0, 10.0, 13.0, 7.0, 10.0, 9.0, 7.0, 9.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11164200305938721, -0.10829945653676987, -0.10495691001415253, -0.10161437094211578, -0.09827182441949844, -0.0949292778968811, -0.09158673882484436, -0.08824419230222702, -0.08490164577960968, -0.08155909925699234, -0.078216552734375, -0.07487401366233826, -0.07153146713972092, -0.06818892061710358, -0.06484638154506683, -0.06150383502244949, -0.05816128849983215, -0.05481874197721481, -0.05147619917988777, -0.04813365638256073, -0.04479110985994339, -0.04144856333732605, -0.03810602053999901, -0.03476347774267197, -0.031420931220054626, -0.028078386560082436, -0.024735841900110245, -0.021393297240138054, -0.018050752580165863, -0.014708207920193672, -0.011365663260221481, -0.00802311860024929, -0.0046805739402771, -0.0013380292803049088, 0.002004515379667282, 0.005347060039639473, 0.008689604699611664, 0.012032149359583855, 0.015374694019556046, 0.018717238679528236, 0.022059783339500427, 0.025402327999472618, 0.02874487265944481, 0.03208741545677185, 0.03542996197938919, 0.03877250850200653, 0.04211505129933357, 0.045457594096660614, 0.048800140619277954, 0.052142687141895294, 0.055485229939222336, 0.05882777273654938, 0.06217031925916672, 0.06551286578178406, 0.0688554048538208, 0.07219795137643814, 0.07554049789905548, 0.07888304442167282, 0.08222559094429016, 0.0855681300163269, 0.08891067653894424, 0.09225322306156158, 0.09559576213359833, 0.09893830865621567, 0.10228085517883301]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 2.0, 4.0, 2.0, 5.0, 4.0, 2.0, 4.0, 7.0, 12.0, 12.0, 11.0, 6.0, 22.0, 72.0, 195.0, 4193549.0, 181.0, 79.0, 21.0, 10.0, 9.0, 7.0, 16.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0014276504516601562, -0.001387074589729309, -0.001346498727798462, -0.0013059228658676147, -0.0012653470039367676, -0.0012247711420059204, -0.0011841952800750732, -0.001143619418144226, -0.001103043556213379, -0.0010624676942825317, -0.0010218918323516846, -0.0009813159704208374, -0.0009407401084899902, -0.0009001642465591431, -0.0008595883846282959, -0.0008190125226974487, -0.0007784366607666016, -0.0007378607988357544, -0.0006972849369049072, -0.0006567090749740601, -0.0006161332130432129, -0.0005755573511123657, -0.0005349814891815186, -0.0004944056272506714, -0.0004538297653198242, -0.00041325390338897705, -0.0003726780414581299, -0.0003321021795272827, -0.00029152631759643555, -0.0002509504556655884, -0.0002103745937347412, -0.00016979873180389404, -0.00012922286987304688, -8.864700794219971e-05, -4.807114601135254e-05, -7.495284080505371e-06, 3.30805778503418e-05, 7.365643978118896e-05, 0.00011423230171203613, 0.0001548081636428833, 0.00019538402557373047, 0.00023595988750457764, 0.0002765357494354248, 0.00031711161136627197, 0.00035768747329711914, 0.0003982633352279663, 0.0004388391971588135, 0.00047941505908966064, 0.0005199909210205078, 0.000560566782951355, 0.0006011426448822021, 0.0006417185068130493, 0.0006822943687438965, 0.0007228702306747437, 0.0007634460926055908, 0.000804021954536438, 0.0008445978164672852, 0.0008851736783981323, 0.0009257495403289795, 0.0009663254022598267, 0.0010069012641906738, 0.001047477126121521, 0.0010880529880523682, 0.0011286288499832153, 0.0011692047119140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 1.0, 5.0, 15.0, 11.0, 6.0, 11.0, 17.0, 66.0, 153.0, 264.0, 210.0, 100.0, 24.0, 11.0, 9.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007415771484375, -0.007160305976867676, -0.0069048404693603516, -0.006649374961853027, -0.006393909454345703, -0.006138443946838379, -0.005882978439331055, -0.0056275129318237305, -0.005372047424316406, -0.005116581916809082, -0.004861116409301758, -0.004605650901794434, -0.004350185394287109, -0.004094719886779785, -0.003839254379272461, -0.0035837888717651367, -0.0033283233642578125, -0.0030728578567504883, -0.002817392349243164, -0.00256192684173584, -0.0023064613342285156, -0.0020509958267211914, -0.0017955303192138672, -0.001540064811706543, -0.0012845993041992188, -0.0010291337966918945, -0.0007736682891845703, -0.0005182027816772461, -0.0002627372741699219, -7.271766662597656e-06, 0.00024819374084472656, 0.0005036592483520508, 0.000759124755859375, 0.0010145902633666992, 0.0012700557708740234, 0.0015255212783813477, 0.0017809867858886719, 0.002036452293395996, 0.0022919178009033203, 0.0025473833084106445, 0.0028028488159179688, 0.003058314323425293, 0.003313779830932617, 0.0035692453384399414, 0.0038247108459472656, 0.00408017635345459, 0.004335641860961914, 0.004591107368469238, 0.0048465728759765625, 0.005102038383483887, 0.005357503890991211, 0.005612969398498535, 0.005868434906005859, 0.006123900413513184, 0.006379365921020508, 0.006634831428527832, 0.006890296936035156, 0.0071457624435424805, 0.007401227951049805, 0.007656693458557129, 0.007912158966064453, 0.008167624473571777, 0.008423089981079102, 0.008678555488586426, 0.00893402099609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 17.0, 29.0, 43.0, 69.0, 81.0, 104.0, 88.0, 4193366.0, 105.0, 116.0, 80.0, 85.0, 43.0, 31.0, 17.0, 11.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.375810623168945e-05, -9.08728688955307e-05, -8.798763155937195e-05, -8.51023942232132e-05, -8.221715688705444e-05, -7.933191955089569e-05, -7.644668221473694e-05, -7.356144487857819e-05, -7.067620754241943e-05, -6.779097020626068e-05, -6.490573287010193e-05, -6.202049553394318e-05, -5.9135258197784424e-05, -5.625002086162567e-05, -5.336478352546692e-05, -5.0479546189308167e-05, -4.7594308853149414e-05, -4.470907151699066e-05, -4.182383418083191e-05, -3.893859684467316e-05, -3.6053359508514404e-05, -3.316812217235565e-05, -3.02828848361969e-05, -2.7397647500038147e-05, -2.4512410163879395e-05, -2.1627172827720642e-05, -1.874193549156189e-05, -1.5856698155403137e-05, -1.2971460819244385e-05, -1.0086223483085632e-05, -7.20098614692688e-06, -4.3157488107681274e-06, -1.430511474609375e-06, 1.4547258615493774e-06, 4.33996319770813e-06, 7.225200533866882e-06, 1.0110437870025635e-05, 1.2995675206184387e-05, 1.588091254234314e-05, 1.8766149878501892e-05, 2.1651387214660645e-05, 2.4536624550819397e-05, 2.742186188697815e-05, 3.0307099223136902e-05, 3.3192336559295654e-05, 3.607757389545441e-05, 3.896281123161316e-05, 4.184804856777191e-05, 4.4733285903930664e-05, 4.7618523240089417e-05, 5.050376057624817e-05, 5.338899791240692e-05, 5.6274235248565674e-05, 5.9159472584724426e-05, 6.204470992088318e-05, 6.492994725704193e-05, 6.781518459320068e-05, 7.070042192935944e-05, 7.358565926551819e-05, 7.647089660167694e-05, 7.93561339378357e-05, 8.224137127399445e-05, 8.51266086101532e-05, 8.801184594631195e-05, 9.08970832824707e-05]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4095.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [0.0, 4.0046870708465576e-07, 8.009374141693115e-07, 1.2014061212539673e-06, 1.601874828338623e-06, 2.002343535423279e-06, 2.4028122425079346e-06, 2.8032809495925903e-06, 3.203749656677246e-06, 3.604218363761902e-06, 4.004687070846558e-06, 4.405155777931213e-06, 4.805624485015869e-06, 5.206093192100525e-06, 5.606561899185181e-06, 6.0070306062698364e-06, 6.407499313354492e-06, 6.807968020439148e-06, 7.208436727523804e-06, 7.6089054346084595e-06, 8.009374141693115e-06, 8.409842848777771e-06, 8.810311555862427e-06, 9.210780262947083e-06, 9.611248970031738e-06, 1.0011717677116394e-05, 1.041218638420105e-05, 1.0812655091285706e-05, 1.1213123798370361e-05, 1.1613592505455017e-05, 1.2014061212539673e-05, 1.2414529919624329e-05, 1.2814998626708984e-05, 1.321546733379364e-05, 1.3615936040878296e-05, 1.4016404747962952e-05, 1.4416873455047607e-05, 1.4817342162132263e-05, 1.5217810869216919e-05, 1.5618279576301575e-05, 1.601874828338623e-05, 1.6419216990470886e-05, 1.6819685697555542e-05, 1.7220154404640198e-05, 1.7620623111724854e-05, 1.802109181880951e-05, 1.8421560525894165e-05, 1.882202923297882e-05, 1.9222497940063477e-05, 1.9622966647148132e-05, 2.0023435354232788e-05, 2.0423904061317444e-05, 2.08243727684021e-05, 2.1224841475486755e-05, 2.162531018257141e-05, 2.2025778889656067e-05, 2.2426247596740723e-05, 2.282671630382538e-05, 2.3227185010910034e-05, 2.362765371799469e-05, 2.4028122425079346e-05, 2.4428591132164e-05, 2.4829059839248657e-05, 2.5229528546333313e-05, 2.562999725341797e-05]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 39.0, 971.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014892354374751449, -0.00014188833301886916, -0.00013485312229022384, -0.0001278179115615785, -0.00012078269355697557, -0.00011374748282833025, -0.00010671226482372731, -9.967705409508198e-05, -9.264184336643666e-05, -8.560663263779134e-05, -7.857142190914601e-05, -7.153620390454307e-05, -6.450099317589775e-05, -5.746578244725242e-05, -5.043056808062829e-05, -4.339535371400416e-05, -3.6360142985358834e-05, -2.9324930437724106e-05, -2.2289717890089378e-05, -1.525450534245465e-05, -8.219292794819921e-06, -1.1840820661745965e-06, 5.851132300449535e-06, 1.2886346667073667e-05, 1.9921557395718992e-05, 2.695676994335372e-05, 3.399198249098845e-05, 4.102719685761258e-05, 4.8062407586257905e-05, 5.509761831490323e-05, 6.213283631950617e-05, 6.916804704815149e-05, 7.620325777679682e-05, 8.323846850544214e-05, 9.027367923408747e-05, 9.73088972386904e-05, 0.00010434410796733573, 0.00011137931869598106, 0.000118414536700584, 0.00012544974742922932, 0.00013248495815787464, 0.00013952016888651997, 0.0001465553796151653, 0.00015359059034381062, 0.00016062581562437117, 0.0001676610263530165, 0.00017469623708166182, 0.00018173144781030715, 0.00018876665853895247, 0.0001958018692675978, 0.00020283707999624312, 0.00020987229072488844, 0.00021690750145353377, 0.0002239427121821791, 0.00023097793746273965, 0.00023801314819138497, 0.0002450483734719455, 0.00025208358420059085, 0.0002591187949292362, 0.0002661540056578815, 0.0002731892163865268, 0.00028022442711517215, 0.00028725963784381747, 0.0002942948485724628, 0.0003013300593011081]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 7.0, 10.0, 48.0, 28.0, 92.0, 227.0, 99.0, 127.0, 182.0, 60.0, 43.0, 51.0, 4.0, 11.0, 0.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2351741790771484e-05, -2.1179206669330597e-05, -2.000667154788971e-05, -1.8834136426448822e-05, -1.7661601305007935e-05, -1.6489066183567047e-05, -1.531653106212616e-05, -1.4143995940685272e-05, -1.2971460819244385e-05, -1.1798925697803497e-05, -1.062639057636261e-05, -9.453855454921722e-06, -8.281320333480835e-06, -7.1087852120399475e-06, -5.93625009059906e-06, -4.763714969158173e-06, -3.591179847717285e-06, -2.4186447262763977e-06, -1.2461096048355103e-06, -7.35744833946228e-08, 1.0989606380462646e-06, 2.271495759487152e-06, 3.4440308809280396e-06, 4.616566002368927e-06, 5.7891011238098145e-06, 6.961636245250702e-06, 8.13417136669159e-06, 9.306706488132477e-06, 1.0479241609573364e-05, 1.1651776731014252e-05, 1.282431185245514e-05, 1.3996846973896027e-05, 1.5169382095336914e-05, 1.63419172167778e-05, 1.751445233821869e-05, 1.8686987459659576e-05, 1.9859522581100464e-05, 2.103205770254135e-05, 2.220459282398224e-05, 2.3377127945423126e-05, 2.4549663066864014e-05, 2.57221981883049e-05, 2.689473330974579e-05, 2.8067268431186676e-05, 2.9239803552627563e-05, 3.041233867406845e-05, 3.158487379550934e-05, 3.2757408916950226e-05, 3.392994403839111e-05, 3.5102479159832e-05, 3.627501428127289e-05, 3.7447549402713776e-05, 3.862008452415466e-05, 3.979261964559555e-05, 4.096515476703644e-05, 4.2137689888477325e-05, 4.331022500991821e-05, 4.44827601313591e-05, 4.565529525279999e-05, 4.6827830374240875e-05, 4.800036549568176e-05, 4.917290061712265e-05, 5.034543573856354e-05, 5.1517970860004425e-05, 5.269050598144531e-05]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 10.0, 5.0, 10.0, 8.0, 16.0, 17.0, 22.0, 25.0, 38.0, 49.0, 66.0, 80.0, 136.0, 205.0, 344.0, 504.0, 840.0, 1540.0, 3387.0, 9820.0, 64883.0, 933796.0, 21672.0, 5688.0, 2219.0, 1169.0, 684.0, 440.0, 278.0, 178.0, 114.0, 84.0, 59.0, 41.0, 31.0, 20.0, 19.0, 14.0, 11.0, 10.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020721435546875, -0.020058870315551758, -0.019396305084228516, -0.018733739852905273, -0.01807117462158203, -0.01740860939025879, -0.016746044158935547, -0.016083478927612305, -0.015420913696289062, -0.01475834846496582, -0.014095783233642578, -0.013433218002319336, -0.012770652770996094, -0.012108087539672852, -0.01144552230834961, -0.010782957077026367, -0.010120391845703125, -0.009457826614379883, -0.00879526138305664, -0.008132696151733398, -0.007470130920410156, -0.006807565689086914, -0.006145000457763672, -0.00548243522644043, -0.0048198699951171875, -0.004157304763793945, -0.003494739532470703, -0.002832174301147461, -0.0021696090698242188, -0.0015070438385009766, -0.0008444786071777344, -0.0001819133758544922, 0.00048065185546875, 0.0011432170867919922, 0.0018057823181152344, 0.0024683475494384766, 0.0031309127807617188, 0.003793478012084961, 0.004456043243408203, 0.005118608474731445, 0.0057811737060546875, 0.00644373893737793, 0.007106304168701172, 0.007768869400024414, 0.008431434631347656, 0.009093999862670898, 0.00975656509399414, 0.010419130325317383, 0.011081695556640625, 0.011744260787963867, 0.01240682601928711, 0.013069391250610352, 0.013731956481933594, 0.014394521713256836, 0.015057086944580078, 0.01571965217590332, 0.016382217407226562, 0.017044782638549805, 0.017707347869873047, 0.01836991310119629, 0.01903247833251953, 0.019695043563842773, 0.020357608795166016, 0.021020174026489258, 0.0216827392578125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 1.0, 5.0, 15.0, 11.0, 6.0, 11.0, 17.0, 66.0, 153.0, 263.0, 211.0, 100.0, 24.0, 11.0, 9.0, 13.0, 8.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007415771484375, -0.007160305976867676, -0.0069048404693603516, -0.006649374961853027, -0.006393909454345703, -0.006138443946838379, -0.005882978439331055, -0.0056275129318237305, -0.005372047424316406, -0.005116581916809082, -0.004861116409301758, -0.004605650901794434, -0.004350185394287109, -0.004094719886779785, -0.003839254379272461, -0.0035837888717651367, -0.0033283233642578125, -0.0030728578567504883, -0.002817392349243164, -0.00256192684173584, -0.0023064613342285156, -0.0020509958267211914, -0.0017955303192138672, -0.001540064811706543, -0.0012845993041992188, -0.0010291337966918945, -0.0007736682891845703, -0.0005182027816772461, -0.0002627372741699219, -7.271766662597656e-06, 0.00024819374084472656, 0.0005036592483520508, 0.000759124755859375, 0.0010145902633666992, 0.0012700557708740234, 0.0015255212783813477, 0.0017809867858886719, 0.002036452293395996, 0.0022919178009033203, 0.0025473833084106445, 0.0028028488159179688, 0.003058314323425293, 0.003313779830932617, 0.0035692453384399414, 0.0038247108459472656, 0.00408017635345459, 0.004335641860961914, 0.004591107368469238, 0.0048465728759765625, 0.005102038383483887, 0.005357503890991211, 0.005612969398498535, 0.005868434906005859, 0.006123900413513184, 0.006379365921020508, 0.006634831428527832, 0.006890296936035156, 0.0071457624435424805, 0.007401227951049805, 0.007656693458557129, 0.007912158966064453, 0.008167624473571777, 0.008423089981079102, 0.008678555488586426, 0.00893402099609375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 13.0, 11.0, 10.0, 11.0, 11.0, 24.0, 23.0, 31.0, 34.0, 52.0, 71.0, 83.0, 109.0, 151.0, 212.0, 352.0, 686.0, 1449.0, 8627.0, 1021664.0, 11448.0, 1540.0, 689.0, 377.0, 219.0, 139.0, 127.0, 81.0, 64.0, 46.0, 43.0, 32.0, 18.0, 25.0, 12.0, 12.0, 13.0, 4.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.0306854248046875, -0.029796838760375977, -0.028908252716064453, -0.02801966667175293, -0.027131080627441406, -0.026242494583129883, -0.02535390853881836, -0.024465322494506836, -0.023576736450195312, -0.02268815040588379, -0.021799564361572266, -0.020910978317260742, -0.02002239227294922, -0.019133806228637695, -0.018245220184326172, -0.01735663414001465, -0.016468048095703125, -0.015579462051391602, -0.014690876007080078, -0.013802289962768555, -0.012913703918457031, -0.012025117874145508, -0.011136531829833984, -0.010247945785522461, -0.009359359741210938, -0.008470773696899414, -0.007582187652587891, -0.006693601608276367, -0.005805015563964844, -0.00491642951965332, -0.004027843475341797, -0.0031392574310302734, -0.00225067138671875, -0.0013620853424072266, -0.0004734992980957031, 0.0004150867462158203, 0.0013036727905273438, 0.002192258834838867, 0.0030808448791503906, 0.003969430923461914, 0.0048580169677734375, 0.005746603012084961, 0.006635189056396484, 0.007523775100708008, 0.008412361145019531, 0.009300947189331055, 0.010189533233642578, 0.011078119277954102, 0.011966705322265625, 0.012855291366577148, 0.013743877410888672, 0.014632463455200195, 0.015521049499511719, 0.016409635543823242, 0.017298221588134766, 0.01818680763244629, 0.019075393676757812, 0.019963979721069336, 0.02085256576538086, 0.021741151809692383, 0.022629737854003906, 0.02351832389831543, 0.024406909942626953, 0.025295495986938477, 0.02618408203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 12.0, 12.0, 10.0, 10.0, 7.0, 20.0, 16.0, 17.0, 22.0, 29.0, 27.0, 29.0, 29.0, 35.0, 38.0, 45.0, 47.0, 42.0, 37.0, 31.0, 38.0, 44.0, 38.0, 30.0, 40.0, 28.0, 35.0, 34.0, 26.0, 18.0, 25.0, 20.0, 12.0, 18.0, 13.0, 12.0, 12.0, 3.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.02099609375, -0.020388364791870117, -0.019780635833740234, -0.01917290687561035, -0.01856517791748047, -0.017957448959350586, -0.017349720001220703, -0.01674199104309082, -0.016134262084960938, -0.015526533126831055, -0.014918804168701172, -0.014311075210571289, -0.013703346252441406, -0.013095617294311523, -0.01248788833618164, -0.011880159378051758, -0.011272430419921875, -0.010664701461791992, -0.01005697250366211, -0.009449243545532227, -0.008841514587402344, -0.008233785629272461, -0.007626056671142578, -0.007018327713012695, -0.0064105987548828125, -0.00580286979675293, -0.005195140838623047, -0.004587411880493164, -0.003979682922363281, -0.0033719539642333984, -0.0027642250061035156, -0.002156496047973633, -0.00154876708984375, -0.0009410381317138672, -0.0003333091735839844, 0.00027441978454589844, 0.0008821487426757812, 0.001489877700805664, 0.002097606658935547, 0.0027053356170654297, 0.0033130645751953125, 0.003920793533325195, 0.004528522491455078, 0.005136251449584961, 0.005743980407714844, 0.0063517093658447266, 0.006959438323974609, 0.007567167282104492, 0.008174896240234375, 0.008782625198364258, 0.00939035415649414, 0.009998083114624023, 0.010605812072753906, 0.011213541030883789, 0.011821269989013672, 0.012428998947143555, 0.013036727905273438, 0.01364445686340332, 0.014252185821533203, 0.014859914779663086, 0.015467643737792969, 0.01607537269592285, 0.016683101654052734, 0.017290830612182617, 0.0178985595703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 7.0, 7.0, 8.0, 8.0, 6.0, 20.0, 20.0, 24.0, 57.0, 99.0, 135.0, 329.0, 930.0, 9798.0, 976438.0, 56504.0, 3079.0, 566.0, 215.0, 98.0, 67.0, 44.0, 25.0, 17.0, 18.0, 5.0, 6.0, 5.0, 1.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.1861324310302734e-05, -1.1487863957881927e-05, -1.111440360546112e-05, -1.0740943253040314e-05, -1.0367482900619507e-05, -9.9940225481987e-06, -9.620562195777893e-06, -9.247101843357086e-06, -8.87364149093628e-06, -8.500181138515472e-06, -8.126720786094666e-06, -7.753260433673859e-06, -7.379800081253052e-06, -7.006339728832245e-06, -6.632879376411438e-06, -6.259419023990631e-06, -5.885958671569824e-06, -5.512498319149017e-06, -5.1390379667282104e-06, -4.7655776143074036e-06, -4.392117261886597e-06, -4.01865690946579e-06, -3.645196557044983e-06, -3.271736204624176e-06, -2.898275852203369e-06, -2.5248154997825623e-06, -2.1513551473617554e-06, -1.7778947949409485e-06, -1.4044344425201416e-06, -1.0309740900993347e-06, -6.575137376785278e-07, -2.8405338525772095e-07, 8.940696716308594e-08, 4.628673195838928e-07, 8.363276720046997e-07, 1.2097880244255066e-06, 1.5832483768463135e-06, 1.9567087292671204e-06, 2.3301690816879272e-06, 2.703629434108734e-06, 3.077089786529541e-06, 3.450550138950348e-06, 3.824010491371155e-06, 4.197470843791962e-06, 4.5709311962127686e-06, 4.9443915486335754e-06, 5.317851901054382e-06, 5.691312253475189e-06, 6.064772605895996e-06, 6.438232958316803e-06, 6.81169331073761e-06, 7.185153663158417e-06, 7.558614015579224e-06, 7.93207436800003e-06, 8.305534720420837e-06, 8.678995072841644e-06, 9.052455425262451e-06, 9.425915777683258e-06, 9.799376130104065e-06, 1.0172836482524872e-05, 1.0546296834945679e-05, 1.0919757187366486e-05, 1.1293217539787292e-05, 1.16666778922081e-05, 1.2040138244628906e-05]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 8.0, 3.0, 4.0, 3.0, 7.0, 10.0, 19.0, 16.0, 40.0, 42.0, 52.0, 86.0, 80.0, 143.0, 104.0, 102.0, 75.0, 53.0, 37.0, 26.0, 23.0, 20.0, 13.0, 7.0, 5.0, 3.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.331371307373047e-06, -7.101334631443024e-06, -6.8712979555130005e-06, -6.641261279582977e-06, -6.411224603652954e-06, -6.181187927722931e-06, -5.951151251792908e-06, -5.7211145758628845e-06, -5.491077899932861e-06, -5.261041224002838e-06, -5.031004548072815e-06, -4.800967872142792e-06, -4.5709311962127686e-06, -4.340894520282745e-06, -4.110857844352722e-06, -3.880821168422699e-06, -3.6507844924926758e-06, -3.4207478165626526e-06, -3.1907111406326294e-06, -2.960674464702606e-06, -2.730637788772583e-06, -2.50060111284256e-06, -2.2705644369125366e-06, -2.0405277609825134e-06, -1.8104910850524902e-06, -1.580454409122467e-06, -1.3504177331924438e-06, -1.1203810572624207e-06, -8.903443813323975e-07, -6.603077054023743e-07, -4.302710294723511e-07, -2.0023435354232788e-07, 2.9802322387695312e-08, 2.598389983177185e-07, 4.898756742477417e-07, 7.199123501777649e-07, 9.499490261077881e-07, 1.1799857020378113e-06, 1.4100223779678345e-06, 1.6400590538978577e-06, 1.8700957298278809e-06, 2.100132405757904e-06, 2.3301690816879272e-06, 2.5602057576179504e-06, 2.7902424335479736e-06, 3.020279109477997e-06, 3.25031578540802e-06, 3.4803524613380432e-06, 3.7103891372680664e-06, 3.94042581319809e-06, 4.170462489128113e-06, 4.400499165058136e-06, 4.630535840988159e-06, 4.860572516918182e-06, 5.0906091928482056e-06, 5.320645868778229e-06, 5.550682544708252e-06, 5.780719220638275e-06, 6.010755896568298e-06, 6.2407925724983215e-06, 6.470829248428345e-06, 6.700865924358368e-06, 6.930902600288391e-06, 7.160939276218414e-06, 7.3909759521484375e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 7.0, 11.0, 8.0, 11.0, 7.0, 23.0, 40.0, 55.0, 86.0, 191.0, 538.0, 5902.0, 1039334.0, 1630.0, 321.0, 156.0, 92.0, 41.0, 34.0, 17.0, 15.0, 7.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4020671844482422e-05, -2.317223697900772e-05, -2.232380211353302e-05, -2.147536724805832e-05, -2.0626932382583618e-05, -1.9778497517108917e-05, -1.8930062651634216e-05, -1.8081627786159515e-05, -1.7233192920684814e-05, -1.6384758055210114e-05, -1.5536323189735413e-05, -1.4687888324260712e-05, -1.383945345878601e-05, -1.299101859331131e-05, -1.2142583727836609e-05, -1.1294148862361908e-05, -1.0445713996887207e-05, -9.597279131412506e-06, -8.748844265937805e-06, -7.900409400463104e-06, -7.051974534988403e-06, -6.203539669513702e-06, -5.3551048040390015e-06, -4.5066699385643005e-06, -3.6582350730895996e-06, -2.8098002076148987e-06, -1.9613653421401978e-06, -1.1129304766654968e-06, -2.644956111907959e-07, 5.83939254283905e-07, 1.432374119758606e-06, 2.280808985233307e-06, 3.129243850708008e-06, 3.977678716182709e-06, 4.82611358165741e-06, 5.674548447132111e-06, 6.5229833126068115e-06, 7.3714181780815125e-06, 8.219853043556213e-06, 9.068287909030914e-06, 9.916722774505615e-06, 1.0765157639980316e-05, 1.1613592505455017e-05, 1.2462027370929718e-05, 1.3310462236404419e-05, 1.415889710187912e-05, 1.500733196735382e-05, 1.5855766832828522e-05, 1.6704201698303223e-05, 1.7552636563777924e-05, 1.8401071429252625e-05, 1.9249506294727325e-05, 2.0097941160202026e-05, 2.0946376025676727e-05, 2.1794810891151428e-05, 2.264324575662613e-05, 2.349168062210083e-05, 2.434011548757553e-05, 2.5188550353050232e-05, 2.6036985218524933e-05, 2.6885420083999634e-05, 2.7733854949474335e-05, 2.8582289814949036e-05, 2.9430724680423737e-05, 3.0279159545898438e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 10.0, 4.0, 6.0, 5.0, 13.0, 17.0, 22.0, 22.0, 39.0, 70.0, 83.0, 414.0, 94.0, 58.0, 44.0, 28.0, 15.0, 17.0, 12.0, 8.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6391277313232422e-05, -1.5811994671821594e-05, -1.5232712030410767e-05, -1.4653429388999939e-05, -1.4074146747589111e-05, -1.3494864106178284e-05, -1.2915581464767456e-05, -1.2336298823356628e-05, -1.17570161819458e-05, -1.1177733540534973e-05, -1.0598450899124146e-05, -1.0019168257713318e-05, -9.43988561630249e-06, -8.860602974891663e-06, -8.281320333480835e-06, -7.702037692070007e-06, -7.12275505065918e-06, -6.543472409248352e-06, -5.964189767837524e-06, -5.384907126426697e-06, -4.805624485015869e-06, -4.2263418436050415e-06, -3.647059202194214e-06, -3.0677765607833862e-06, -2.4884939193725586e-06, -1.909211277961731e-06, -1.3299286365509033e-06, -7.506459951400757e-07, -1.7136335372924805e-07, 4.079192876815796e-07, 9.872019290924072e-07, 1.5664845705032349e-06, 2.1457672119140625e-06, 2.72504985332489e-06, 3.3043324947357178e-06, 3.883615136146545e-06, 4.462897777557373e-06, 5.042180418968201e-06, 5.621463060379028e-06, 6.200745701789856e-06, 6.780028343200684e-06, 7.359310984611511e-06, 7.938593626022339e-06, 8.517876267433167e-06, 9.097158908843994e-06, 9.676441550254822e-06, 1.025572419166565e-05, 1.0835006833076477e-05, 1.1414289474487305e-05, 1.1993572115898132e-05, 1.257285475730896e-05, 1.3152137398719788e-05, 1.3731420040130615e-05, 1.4310702681541443e-05, 1.488998532295227e-05, 1.5469267964363098e-05, 1.6048550605773926e-05, 1.6627833247184753e-05, 1.720711588859558e-05, 1.778639853000641e-05, 1.8365681171417236e-05, 1.8944963812828064e-05, 1.952424645423889e-05, 2.010352909564972e-05, 2.0682811737060547e-05]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 82.0, 928.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39565974473953247, -0.3821330964565277, -0.36860647797584534, -0.3550798296928406, -0.3415532112121582, -0.32802656292915344, -0.3144999146461487, -0.3009732961654663, -0.28744664788246155, -0.2739199995994568, -0.2603933811187744, -0.24686673283576965, -0.2333400994539261, -0.21981346607208252, -0.20628683269023895, -0.19276019930839539, -0.17923356592655182, -0.16570693254470825, -0.15218029916286469, -0.13865366578102112, -0.12512701749801636, -0.11160038411617279, -0.09807375073432922, -0.08454710990190506, -0.07102047652006149, -0.05749383941292763, -0.04396720230579376, -0.030440568923950195, -0.01691393181681633, -0.0033872947096824646, 0.010139338672161102, 0.023665979504585266, 0.03719261288642883, 0.0507192499935627, 0.06424588710069656, 0.07777252048254013, 0.0912991613149643, 0.10482579469680786, 0.11835242807865143, 0.131879061460495, 0.14540570974349976, 0.15893234312534332, 0.1724589765071869, 0.18598562479019165, 0.19951225817203522, 0.21303889155387878, 0.22656552493572235, 0.24009215831756592, 0.2536187767982483, 0.26714542508125305, 0.2806720435619354, 0.2941986918449402, 0.30772531032562256, 0.3212519586086273, 0.3347786068916321, 0.34830522537231445, 0.3618318736553192, 0.375358521938324, 0.38888514041900635, 0.4024117887020111, 0.4159384071826935, 0.42946505546569824, 0.4429916739463806, 0.4565183222293854, 0.47004497051239014]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 7.0, 8.0, 7.0, 8.0, 8.0, 16.0, 13.0, 22.0, 16.0, 21.0, 19.0, 34.0, 36.0, 31.0, 40.0, 51.0, 36.0, 45.0, 41.0, 68.0, 49.0, 43.0, 40.0, 40.0, 37.0, 30.0, 23.0, 32.0, 24.0, 29.0, 21.0, 13.0, 12.0, 16.0, 13.0, 4.0, 11.0, 11.0, 3.0, 11.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.09758031368255615, -0.09430770576000214, -0.09103509783744812, -0.0877624899148941, -0.08448988199234009, -0.08121727406978607, -0.07794466614723206, -0.07467205822467804, -0.07139945030212402, -0.06812684237957001, -0.06485423445701599, -0.061581626534461975, -0.05830901861190796, -0.05503641068935394, -0.05176380276679993, -0.04849119484424591, -0.045218586921691895, -0.04194597899913788, -0.03867337107658386, -0.035400763154029846, -0.03212815523147583, -0.028855547308921814, -0.025582939386367798, -0.022310331463813782, -0.019037723541259766, -0.01576511561870575, -0.012492507696151733, -0.009219899773597717, -0.005947291851043701, -0.002674683928489685, 0.0005979239940643311, 0.003870531916618347, 0.007143139839172363, 0.01041574776172638, 0.013688355684280396, 0.01696096360683441, 0.020233571529388428, 0.023506179451942444, 0.02677878737449646, 0.030051395297050476, 0.03332400321960449, 0.03659661114215851, 0.039869219064712524, 0.04314182698726654, 0.04641443490982056, 0.04968704283237457, 0.05295965075492859, 0.056232258677482605, 0.05950486660003662, 0.06277747452259064, 0.06605008244514465, 0.06932269036769867, 0.07259529829025269, 0.0758679062128067, 0.07914051413536072, 0.08241312205791473, 0.08568572998046875, 0.08895833790302277, 0.09223094582557678, 0.0955035537481308, 0.09877616167068481, 0.10204876959323883, 0.10532137751579285, 0.10859398543834686, 0.11186659336090088]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 3.0, 1.0, 12.0, 9.0, 5.0, 4.0, 8.0, 8.0, 6.0, 8.0, 14.0, 11.0, 24.0, 21.0, 22.0, 23.0, 65.0, 225.0, 4192602.0, 610.0, 276.0, 112.0, 35.0, 16.0, 19.0, 22.0, 25.0, 10.0, 5.0, 7.0, 6.0, 10.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 6.0, 0.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0], "bins": [-0.0014333724975585938, -0.0013922303915023804, -0.001351088285446167, -0.0013099461793899536, -0.0012688040733337402, -0.0012276619672775269, -0.0011865198612213135, -0.0011453777551651, -0.0011042356491088867, -0.0010630935430526733, -0.00102195143699646, -0.0009808093309402466, -0.0009396672248840332, -0.0008985251188278198, -0.0008573830127716064, -0.0008162409067153931, -0.0007750988006591797, -0.0007339566946029663, -0.0006928145885467529, -0.0006516724824905396, -0.0006105303764343262, -0.0005693882703781128, -0.0005282461643218994, -0.00048710405826568604, -0.00044596195220947266, -0.0004048198461532593, -0.0003636777400970459, -0.0003225356340408325, -0.00028139352798461914, -0.00024025142192840576, -0.00019910931587219238, -0.000157967209815979, -0.00011682510375976562, -7.568299770355225e-05, -3.454089164733887e-05, 6.601214408874512e-06, 4.774332046508789e-05, 8.888542652130127e-05, 0.00013002753257751465, 0.00017116963863372803, 0.0002123117446899414, 0.0002534538507461548, 0.00029459595680236816, 0.00033573806285858154, 0.0003768801689147949, 0.0004180222749710083, 0.0004591643810272217, 0.0005003064870834351, 0.0005414485931396484, 0.0005825906991958618, 0.0006237328052520752, 0.0006648749113082886, 0.000706017017364502, 0.0007471591234207153, 0.0007883012294769287, 0.0008294433355331421, 0.0008705854415893555, 0.0009117275476455688, 0.0009528696537017822, 0.0009940117597579956, 0.001035153865814209, 0.0010762959718704224, 0.0011174380779266357, 0.0011585801839828491, 0.0011997222900390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 13.0, 11.0, 9.0, 9.0, 16.0, 57.0, 136.0, 257.0, 229.0, 109.0, 29.0, 12.0, 9.0, 12.0, 11.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161378860473633, -0.006906986236572266, -0.0066525936126708984, -0.006398200988769531, -0.006143808364868164, -0.005889415740966797, -0.00563502311706543, -0.0053806304931640625, -0.005126237869262695, -0.004871845245361328, -0.004617452621459961, -0.004363059997558594, -0.0041086673736572266, -0.0038542747497558594, -0.003599882125854492, -0.003345489501953125, -0.003091096878051758, -0.0028367042541503906, -0.0025823116302490234, -0.0023279190063476562, -0.002073526382446289, -0.0018191337585449219, -0.0015647411346435547, -0.0013103485107421875, -0.0010559558868408203, -0.0008015632629394531, -0.0005471706390380859, -0.00029277801513671875, -3.838539123535156e-05, 0.00021600723266601562, 0.0004703998565673828, 0.00072479248046875, 0.0009791851043701172, 0.0012335777282714844, 0.0014879703521728516, 0.0017423629760742188, 0.001996755599975586, 0.002251148223876953, 0.0025055408477783203, 0.0027599334716796875, 0.0030143260955810547, 0.003268718719482422, 0.003523111343383789, 0.0037775039672851562, 0.0040318965911865234, 0.004286289215087891, 0.004540681838989258, 0.004795074462890625, 0.005049467086791992, 0.005303859710693359, 0.0055582523345947266, 0.005812644958496094, 0.006067037582397461, 0.006321430206298828, 0.006575822830200195, 0.0068302154541015625, 0.00708460807800293, 0.007339000701904297, 0.007593393325805664, 0.007847785949707031, 0.008102178573608398, 0.008356571197509766, 0.008610963821411133, 0.0088653564453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 12.0, 35.0, 56.0, 82.0, 77.0, 170.0, 4191054.0, 2308.0, 143.0, 126.0, 103.0, 69.0, 23.0, 13.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004024505615234375, -0.0003880411386489868, -0.00037363171577453613, -0.00035922229290008545, -0.00034481287002563477, -0.0003304034471511841, -0.0003159940242767334, -0.0003015846014022827, -0.00028717517852783203, -0.00027276575565338135, -0.00025835633277893066, -0.00024394690990447998, -0.0002295374870300293, -0.0002151280641555786, -0.00020071864128112793, -0.00018630921840667725, -0.00017189979553222656, -0.00015749037265777588, -0.0001430809497833252, -0.0001286715269088745, -0.00011426210403442383, -9.985268115997314e-05, -8.544325828552246e-05, -7.103383541107178e-05, -5.6624412536621094e-05, -4.221498966217041e-05, -2.7805566787719727e-05, -1.3396143913269043e-05, 1.0132789611816406e-06, 1.5422701835632324e-05, 2.9832124710083008e-05, 4.424154758453369e-05, 5.8650970458984375e-05, 7.306039333343506e-05, 8.746981620788574e-05, 0.00010187923908233643, 0.00011628866195678711, 0.0001306980848312378, 0.00014510750770568848, 0.00015951693058013916, 0.00017392635345458984, 0.00018833577632904053, 0.0002027451992034912, 0.0002171546220779419, 0.00023156404495239258, 0.00024597346782684326, 0.00026038289070129395, 0.00027479231357574463, 0.0002892017364501953, 0.000303611159324646, 0.0003180205821990967, 0.00033243000507354736, 0.00034683942794799805, 0.00036124885082244873, 0.0003756582736968994, 0.0003900676965713501, 0.0004044771194458008, 0.00041888654232025146, 0.00043329596519470215, 0.00044770538806915283, 0.0004621148109436035, 0.0004765242338180542, 0.0004909336566925049, 0.0005053430795669556, 0.0005197525024414062]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4088.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014591217041015625, -0.00014322157949209213, -0.00014053098857402802, -0.0001378403976559639, -0.00013514980673789978, -0.00013245921581983566, -0.00012976862490177155, -0.00012707803398370743, -0.0001243874430656433, -0.00012169685214757919, -0.00011900626122951508, -0.00011631567031145096, -0.00011362507939338684, -0.00011093448847532272, -0.0001082438975572586, -0.00010555330663919449, -0.00010286271572113037, -0.00010017212480306625, -9.748153388500214e-05, -9.479094296693802e-05, -9.21003520488739e-05, -8.940976113080978e-05, -8.671917021274567e-05, -8.402857929468155e-05, -8.133798837661743e-05, -7.864739745855331e-05, -7.59568065404892e-05, -7.326621562242508e-05, -7.057562470436096e-05, -6.788503378629684e-05, -6.519444286823273e-05, -6.250385195016861e-05, -5.981326103210449e-05, -5.7122670114040375e-05, -5.443207919597626e-05, -5.174148827791214e-05, -4.905089735984802e-05, -4.6360306441783905e-05, -4.366971552371979e-05, -4.097912460565567e-05, -3.828853368759155e-05, -3.5597942769527435e-05, -3.290735185146332e-05, -3.02167609333992e-05, -2.7526170015335083e-05, -2.4835579097270966e-05, -2.2144988179206848e-05, -1.945439726114273e-05, -1.6763806343078613e-05, -1.4073215425014496e-05, -1.1382624506950378e-05, -8.692033588886261e-06, -6.0014426708221436e-06, -3.310851752758026e-06, -6.202608346939087e-07, 2.0703300833702087e-06, 4.760921001434326e-06, 7.451511919498444e-06, 1.0142102837562561e-05, 1.2832693755626678e-05, 1.5523284673690796e-05, 1.8213875591754913e-05, 2.090446650981903e-05, 2.3595057427883148e-05, 2.6285648345947266e-05]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 10.0, 864.0, 135.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002853727783076465, -0.0002710241242311895, -0.00025667547015473247, -0.00024232680152636021, -0.00022797813289798796, -0.00021362947882153094, -0.00019928082474507391, -0.0001849321706686169, -0.00017058350204024464, -0.00015623484796378762, -0.00014188617933541536, -0.00012753752525895834, -0.0001131888639065437, -9.884020255412906e-05, -8.449154847767204e-05, -7.01428871252574e-05, -5.5794225772842765e-05, -4.144556442042813e-05, -2.7096906705992296e-05, -1.2748248991556466e-05, 1.6004123608581722e-06, 1.594907371327281e-05, 3.0297727789729834e-05, 4.464638914214447e-05, 5.899505049455911e-05, 7.334371184697375e-05, 8.769237319938838e-05, 0.00010204102727584541, 0.00011638968862826005, 0.00013073834998067468, 0.0001450870040571317, 0.00015943567268550396, 0.00017378432676196098, 0.000188132980838418, 0.00020248164946679026, 0.00021683030354324728, 0.00023117897217161953, 0.00024552762624807656, 0.0002598762803245336, 0.0002742249344009906, 0.0002885736175812781, 0.0003029222716577351, 0.00031727092573419213, 0.00033161957981064916, 0.00034596826299093664, 0.00036031691706739366, 0.0003746655711438507, 0.0003890142252203077, 0.00040336287929676473, 0.00041771153337322176, 0.0004320601874496788, 0.00044640887062996626, 0.0004607575247064233, 0.0004751061787828803, 0.0004894548328593373, 0.0005038034869357944, 0.0005181521410122514, 0.0005325007950887084, 0.0005468494491651654, 0.0005611981032416224, 0.0005755467573180795, 0.0005898954113945365, 0.0006042440654709935, 0.0006185927777551115, 0.0006329414318315685]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 12.0, 25.0, 46.0, 97.0, 140.0, 181.0, 137.0, 177.0, 99.0, 48.0, 14.0, 10.0, 5.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00029224157333374023, -0.00028496887534856796, -0.0002776961773633957, -0.0002704234793782234, -0.00026315078139305115, -0.0002558780834078789, -0.0002486053854227066, -0.00024133268743753433, -0.00023405998945236206, -0.0002267872914671898, -0.00021951459348201752, -0.00021224189549684525, -0.00020496919751167297, -0.0001976964995265007, -0.00019042380154132843, -0.00018315110355615616, -0.0001758784055709839, -0.00016860570758581161, -0.00016133300960063934, -0.00015406031161546707, -0.0001467876136302948, -0.00013951491564512253, -0.00013224221765995026, -0.00012496951967477798, -0.00011769682168960571, -0.00011042412370443344, -0.00010315142571926117, -9.58787277340889e-05, -8.860602974891663e-05, -8.133333176374435e-05, -7.406063377857208e-05, -6.678793579339981e-05, -5.951523780822754e-05, -5.224253982305527e-05, -4.4969841837882996e-05, -3.7697143852710724e-05, -3.0424445867538452e-05, -2.315174788236618e-05, -1.587904989719391e-05, -8.606351912021637e-06, -1.3336539268493652e-06, 5.9390440583229065e-06, 1.3211742043495178e-05, 2.048444002866745e-05, 2.775713801383972e-05, 3.5029835999011993e-05, 4.2302533984184265e-05, 4.957523196935654e-05, 5.684792995452881e-05, 6.412062793970108e-05, 7.139332592487335e-05, 7.866602391004562e-05, 8.59387218952179e-05, 9.321141988039017e-05, 0.00010048411786556244, 0.00010775681585073471, 0.00011502951383590698, 0.00012230221182107925, 0.00012957490980625153, 0.0001368476077914238, 0.00014412030577659607, 0.00015139300376176834, 0.0001586657017469406, 0.00016593839973211288, 0.00017321109771728516]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 8.0, 2.0, 8.0, 10.0, 16.0, 17.0, 26.0, 29.0, 35.0, 67.0, 88.0, 111.0, 170.0, 242.0, 373.0, 534.0, 909.0, 1455.0, 2649.0, 5553.0, 15080.0, 153695.0, 833031.0, 20151.0, 6659.0, 3032.0, 1639.0, 976.0, 608.0, 430.0, 258.0, 200.0, 135.0, 84.0, 79.0, 50.0, 30.0, 27.0, 34.0, 12.0, 11.0, 8.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020172119140625, -0.01947927474975586, -0.01878643035888672, -0.018093585968017578, -0.017400741577148438, -0.016707897186279297, -0.016015052795410156, -0.015322208404541016, -0.014629364013671875, -0.013936519622802734, -0.013243675231933594, -0.012550830841064453, -0.011857986450195312, -0.011165142059326172, -0.010472297668457031, -0.00977945327758789, -0.00908660888671875, -0.00839376449584961, -0.007700920104980469, -0.007008075714111328, -0.0063152313232421875, -0.005622386932373047, -0.004929542541503906, -0.004236698150634766, -0.003543853759765625, -0.0028510093688964844, -0.0021581649780273438, -0.0014653205871582031, -0.0007724761962890625, -7.963180541992188e-05, 0.0006132125854492188, 0.0013060569763183594, 0.0019989013671875, 0.0026917457580566406, 0.0033845901489257812, 0.004077434539794922, 0.0047702789306640625, 0.005463123321533203, 0.006155967712402344, 0.006848812103271484, 0.007541656494140625, 0.008234500885009766, 0.008927345275878906, 0.009620189666748047, 0.010313034057617188, 0.011005878448486328, 0.011698722839355469, 0.01239156723022461, 0.01308441162109375, 0.01377725601196289, 0.014470100402832031, 0.015162944793701172, 0.015855789184570312, 0.016548633575439453, 0.017241477966308594, 0.017934322357177734, 0.018627166748046875, 0.019320011138916016, 0.020012855529785156, 0.020705699920654297, 0.021398544311523438, 0.022091388702392578, 0.02278423309326172, 0.02347707748413086, 0.024169921875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 13.0, 11.0, 9.0, 9.0, 16.0, 57.0, 136.0, 257.0, 229.0, 109.0, 29.0, 12.0, 9.0, 12.0, 11.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161378860473633, -0.006906986236572266, -0.0066525936126708984, -0.006398200988769531, -0.006143808364868164, -0.005889415740966797, -0.00563502311706543, -0.0053806304931640625, -0.005126237869262695, -0.004871845245361328, -0.004617452621459961, -0.004363059997558594, -0.0041086673736572266, -0.0038542747497558594, -0.003599882125854492, -0.003345489501953125, -0.003091096878051758, -0.0028367042541503906, -0.0025823116302490234, -0.0023279190063476562, -0.002073526382446289, -0.0018191337585449219, -0.0015647411346435547, -0.0013103485107421875, -0.0010559558868408203, -0.0008015632629394531, -0.0005471706390380859, -0.00029277801513671875, -3.838539123535156e-05, 0.00021600723266601562, 0.0004703998565673828, 0.00072479248046875, 0.0009791851043701172, 0.0012335777282714844, 0.0014879703521728516, 0.0017423629760742188, 0.001996755599975586, 0.002251148223876953, 0.0025055408477783203, 0.0027599334716796875, 0.0030143260955810547, 0.003268718719482422, 0.003523111343383789, 0.0037775039672851562, 0.0040318965911865234, 0.004286289215087891, 0.004540681838989258, 0.004795074462890625, 0.005049467086791992, 0.005303859710693359, 0.0055582523345947266, 0.005812644958496094, 0.006067037582397461, 0.006321430206298828, 0.006575822830200195, 0.0068302154541015625, 0.00708460807800293, 0.007339000701904297, 0.007593393325805664, 0.007847785949707031, 0.008102178573608398, 0.008356571197509766, 0.008610963821411133, 0.0088653564453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 9.0, 12.0, 14.0, 17.0, 22.0, 17.0, 19.0, 19.0, 24.0, 27.0, 32.0, 48.0, 77.0, 114.0, 233.0, 436.0, 1037.0, 2405.0, 170034.0, 868522.0, 3086.0, 1038.0, 534.0, 261.0, 149.0, 76.0, 48.0, 35.0, 38.0, 33.0, 15.0, 13.0, 14.0, 10.0, 18.0, 5.0, 8.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0293121337890625, -0.02836894989013672, -0.027425765991210938, -0.026482582092285156, -0.025539398193359375, -0.024596214294433594, -0.023653030395507812, -0.02270984649658203, -0.02176666259765625, -0.02082347869873047, -0.019880294799804688, -0.018937110900878906, -0.017993927001953125, -0.017050743103027344, -0.016107559204101562, -0.015164375305175781, -0.01422119140625, -0.013278007507324219, -0.012334823608398438, -0.011391639709472656, -0.010448455810546875, -0.009505271911621094, -0.008562088012695312, -0.007618904113769531, -0.00667572021484375, -0.005732536315917969, -0.0047893524169921875, -0.0038461685180664062, -0.002902984619140625, -0.0019598007202148438, -0.0010166168212890625, -7.343292236328125e-05, 0.0008697509765625, 0.0018129348754882812, 0.0027561187744140625, 0.0036993026733398438, 0.004642486572265625, 0.005585670471191406, 0.0065288543701171875, 0.007472038269042969, 0.00841522216796875, 0.009358406066894531, 0.010301589965820312, 0.011244773864746094, 0.012187957763671875, 0.013131141662597656, 0.014074325561523438, 0.015017509460449219, 0.015960693359375, 0.01690387725830078, 0.017847061157226562, 0.018790245056152344, 0.019733428955078125, 0.020676612854003906, 0.021619796752929688, 0.02256298065185547, 0.02350616455078125, 0.02444934844970703, 0.025392532348632812, 0.026335716247558594, 0.027278900146484375, 0.028222084045410156, 0.029165267944335938, 0.03010845184326172, 0.0310516357421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 5.0, 9.0, 12.0, 14.0, 17.0, 22.0, 16.0, 20.0, 17.0, 22.0, 24.0, 25.0, 28.0, 30.0, 29.0, 41.0, 35.0, 42.0, 36.0, 32.0, 47.0, 45.0, 34.0, 36.0, 42.0, 36.0, 32.0, 31.0, 29.0, 31.0, 30.0, 15.0, 13.0, 14.0, 10.0, 19.0, 4.0, 8.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0174102783203125, -0.016849994659423828, -0.016289710998535156, -0.015729427337646484, -0.015169143676757812, -0.01460886001586914, -0.014048576354980469, -0.013488292694091797, -0.012928009033203125, -0.012367725372314453, -0.011807441711425781, -0.01124715805053711, -0.010686874389648438, -0.010126590728759766, -0.009566307067871094, -0.009006023406982422, -0.00844573974609375, -0.007885456085205078, -0.007325172424316406, -0.006764888763427734, -0.0062046051025390625, -0.005644321441650391, -0.005084037780761719, -0.004523754119873047, -0.003963470458984375, -0.003403186798095703, -0.0028429031372070312, -0.0022826194763183594, -0.0017223358154296875, -0.0011620521545410156, -0.0006017684936523438, -4.1484832763671875e-05, 0.000518798828125, 0.0010790824890136719, 0.0016393661499023438, 0.0021996498107910156, 0.0027599334716796875, 0.0033202171325683594, 0.0038805007934570312, 0.004440784454345703, 0.005001068115234375, 0.005561351776123047, 0.006121635437011719, 0.006681919097900391, 0.0072422027587890625, 0.007802486419677734, 0.008362770080566406, 0.008923053741455078, 0.00948333740234375, 0.010043621063232422, 0.010603904724121094, 0.011164188385009766, 0.011724472045898438, 0.01228475570678711, 0.012845039367675781, 0.013405323028564453, 0.013965606689453125, 0.014525890350341797, 0.015086174011230469, 0.01564645767211914, 0.016206741333007812, 0.016767024993896484, 0.017327308654785156, 0.017887592315673828, 0.0184478759765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 1.0, 7.0, 5.0, 4.0, 4.0, 7.0, 10.0, 24.0, 35.0, 44.0, 86.0, 196.0, 344.0, 1235.0, 44626.0, 997557.0, 3239.0, 567.0, 241.0, 117.0, 63.0, 38.0, 25.0, 18.0, 11.0, 6.0, 8.0, 3.0, 7.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4007091522216797e-05, -1.3597309589385986e-05, -1.3187527656555176e-05, -1.2777745723724365e-05, -1.2367963790893555e-05, -1.1958181858062744e-05, -1.1548399925231934e-05, -1.1138617992401123e-05, -1.0728836059570312e-05, -1.0319054126739502e-05, -9.909272193908691e-06, -9.499490261077881e-06, -9.08970832824707e-06, -8.67992639541626e-06, -8.27014446258545e-06, -7.860362529754639e-06, -7.450580596923828e-06, -7.040798664093018e-06, -6.631016731262207e-06, -6.2212347984313965e-06, -5.811452865600586e-06, -5.401670932769775e-06, -4.991888999938965e-06, -4.582107067108154e-06, -4.172325134277344e-06, -3.762543201446533e-06, -3.3527612686157227e-06, -2.942979335784912e-06, -2.5331974029541016e-06, -2.123415470123291e-06, -1.7136335372924805e-06, -1.30385160446167e-06, -8.940696716308594e-07, -4.842877388000488e-07, -7.450580596923828e-08, 3.3527612686157227e-07, 7.450580596923828e-07, 1.1548399925231934e-06, 1.564621925354004e-06, 1.9744038581848145e-06, 2.384185791015625e-06, 2.7939677238464355e-06, 3.203749656677246e-06, 3.6135315895080566e-06, 4.023313522338867e-06, 4.433095455169678e-06, 4.842877388000488e-06, 5.252659320831299e-06, 5.662441253662109e-06, 6.07222318649292e-06, 6.4820051193237305e-06, 6.891787052154541e-06, 7.3015689849853516e-06, 7.711350917816162e-06, 8.121132850646973e-06, 8.530914783477783e-06, 8.940696716308594e-06, 9.350478649139404e-06, 9.760260581970215e-06, 1.0170042514801025e-05, 1.0579824447631836e-05, 1.0989606380462646e-05, 1.1399388313293457e-05, 1.1809170246124268e-05, 1.2218952178955078e-05]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 3.0, 4.0, 4.0, 7.0, 4.0, 6.0, 5.0, 18.0, 23.0, 29.0, 31.0, 56.0, 64.0, 69.0, 102.0, 146.0, 84.0, 74.0, 75.0, 40.0, 34.0, 30.0, 20.0, 14.0, 10.0, 7.0, 4.0, 5.0, 8.0, 4.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.165836334228516e-06, -7.927417755126953e-06, -7.68899917602539e-06, -7.450580596923828e-06, -7.212162017822266e-06, -6.973743438720703e-06, -6.735324859619141e-06, -6.496906280517578e-06, -6.258487701416016e-06, -6.020069122314453e-06, -5.781650543212891e-06, -5.543231964111328e-06, -5.304813385009766e-06, -5.066394805908203e-06, -4.827976226806641e-06, -4.589557647705078e-06, -4.351139068603516e-06, -4.112720489501953e-06, -3.874301910400391e-06, -3.635883331298828e-06, -3.3974647521972656e-06, -3.159046173095703e-06, -2.9206275939941406e-06, -2.682209014892578e-06, -2.4437904357910156e-06, -2.205371856689453e-06, -1.9669532775878906e-06, -1.7285346984863281e-06, -1.4901161193847656e-06, -1.2516975402832031e-06, -1.0132789611816406e-06, -7.748603820800781e-07, -5.364418029785156e-07, -2.980232238769531e-07, -5.960464477539063e-08, 1.7881393432617188e-07, 4.172325134277344e-07, 6.556510925292969e-07, 8.940696716308594e-07, 1.1324882507324219e-06, 1.3709068298339844e-06, 1.6093254089355469e-06, 1.8477439880371094e-06, 2.086162567138672e-06, 2.3245811462402344e-06, 2.562999725341797e-06, 2.8014183044433594e-06, 3.039836883544922e-06, 3.2782554626464844e-06, 3.516674041748047e-06, 3.7550926208496094e-06, 3.993511199951172e-06, 4.231929779052734e-06, 4.470348358154297e-06, 4.708766937255859e-06, 4.947185516357422e-06, 5.185604095458984e-06, 5.424022674560547e-06, 5.662441253662109e-06, 5.900859832763672e-06, 6.139278411865234e-06, 6.377696990966797e-06, 6.616115570068359e-06, 6.854534149169922e-06, 7.092952728271484e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 7.0, 5.0, 16.0, 20.0, 41.0, 92.0, 232.0, 632.0, 1028564.0, 18057.0, 510.0, 178.0, 78.0, 36.0, 17.0, 16.0, 7.0, 9.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6133995056152344e-05, -4.497729241847992e-05, -4.3820589780807495e-05, -4.266388714313507e-05, -4.1507184505462646e-05, -4.035048186779022e-05, -3.91937792301178e-05, -3.8037076592445374e-05, -3.688037395477295e-05, -3.5723671317100525e-05, -3.45669686794281e-05, -3.3410266041755676e-05, -3.225356340408325e-05, -3.109686076641083e-05, -2.9940158128738403e-05, -2.878345549106598e-05, -2.7626752853393555e-05, -2.647005021572113e-05, -2.5313347578048706e-05, -2.4156644940376282e-05, -2.2999942302703857e-05, -2.1843239665031433e-05, -2.068653702735901e-05, -1.9529834389686584e-05, -1.837313175201416e-05, -1.7216429114341736e-05, -1.605972647666931e-05, -1.4903023838996887e-05, -1.3746321201324463e-05, -1.2589618563652039e-05, -1.1432915925979614e-05, -1.027621328830719e-05, -9.119510650634766e-06, -7.962808012962341e-06, -6.806105375289917e-06, -5.649402737617493e-06, -4.492700099945068e-06, -3.335997462272644e-06, -2.1792948246002197e-06, -1.0225921869277954e-06, 1.341104507446289e-07, 1.2908130884170532e-06, 2.4475157260894775e-06, 3.604218363761902e-06, 4.760921001434326e-06, 5.9176236391067505e-06, 7.074326276779175e-06, 8.231028914451599e-06, 9.387731552124023e-06, 1.0544434189796448e-05, 1.1701136827468872e-05, 1.2857839465141296e-05, 1.401454210281372e-05, 1.5171244740486145e-05, 1.632794737815857e-05, 1.7484650015830994e-05, 1.8641352653503418e-05, 1.9798055291175842e-05, 2.0954757928848267e-05, 2.211146056652069e-05, 2.3268163204193115e-05, 2.442486584186554e-05, 2.5581568479537964e-05, 2.6738271117210388e-05, 2.7894973754882812e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 2.0, 8.0, 10.0, 12.0, 21.0, 36.0, 83.0, 463.0, 146.0, 71.0, 46.0, 17.0, 11.0, 7.0, 13.0, 7.0, 9.0, 3.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7358531951904297e-05, -2.6673078536987305e-05, -2.5987625122070312e-05, -2.530217170715332e-05, -2.4616718292236328e-05, -2.3931264877319336e-05, -2.3245811462402344e-05, -2.256035804748535e-05, -2.187490463256836e-05, -2.1189451217651367e-05, -2.0503997802734375e-05, -1.9818544387817383e-05, -1.913309097290039e-05, -1.84476375579834e-05, -1.7762184143066406e-05, -1.7076730728149414e-05, -1.6391277313232422e-05, -1.570582389831543e-05, -1.5020370483398438e-05, -1.4334917068481445e-05, -1.3649463653564453e-05, -1.2964010238647461e-05, -1.2278556823730469e-05, -1.1593103408813477e-05, -1.0907649993896484e-05, -1.0222196578979492e-05, -9.5367431640625e-06, -8.851289749145508e-06, -8.165836334228516e-06, -7.4803829193115234e-06, -6.794929504394531e-06, -6.109476089477539e-06, -5.424022674560547e-06, -4.738569259643555e-06, -4.0531158447265625e-06, -3.3676624298095703e-06, -2.682209014892578e-06, -1.996755599975586e-06, -1.3113021850585938e-06, -6.258487701416016e-07, 5.960464477539063e-08, 7.450580596923828e-07, 1.430511474609375e-06, 2.115964889526367e-06, 2.8014183044433594e-06, 3.4868717193603516e-06, 4.172325134277344e-06, 4.857778549194336e-06, 5.543231964111328e-06, 6.22868537902832e-06, 6.9141387939453125e-06, 7.599592208862305e-06, 8.285045623779297e-06, 8.970499038696289e-06, 9.655952453613281e-06, 1.0341405868530273e-05, 1.1026859283447266e-05, 1.1712312698364258e-05, 1.239776611328125e-05, 1.3083219528198242e-05, 1.3768672943115234e-05, 1.4454126358032227e-05, 1.5139579772949219e-05, 1.582503318786621e-05, 1.6510486602783203e-05]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 15.0, 833.0, 164.0, 3.0, 2.0, 2.0], "bins": [-0.5653712749481201, -0.5559164881706238, -0.5464617013931274, -0.5370069146156311, -0.5275521278381348, -0.5180974006652832, -0.5086426138877869, -0.49918779730796814, -0.4897330403327942, -0.48027825355529785, -0.4708234667778015, -0.46136870980262756, -0.4519139230251312, -0.4424591362476349, -0.43300434947013855, -0.4235495626926422, -0.4140947759151459, -0.40463998913764954, -0.3951852023601532, -0.38573044538497925, -0.3762756586074829, -0.3668208718299866, -0.35736608505249023, -0.3479112982749939, -0.33845651149749756, -0.3290017247200012, -0.3195469379425049, -0.31009218096733093, -0.3006373941898346, -0.29118260741233826, -0.2817278206348419, -0.2722730338573456, -0.26281827688217163, -0.2533634901046753, -0.24390871822834015, -0.2344539314508438, -0.22499915957450867, -0.21554437279701233, -0.206089586019516, -0.19663479924201965, -0.18718001246452332, -0.17772522568702698, -0.16827045381069183, -0.1588156670331955, -0.14936089515686035, -0.139906108379364, -0.13045132160186768, -0.12099654227495193, -0.11154177039861679, -0.10208699107170105, -0.09263220429420471, -0.08317742496728897, -0.07372264564037323, -0.06426786631345749, -0.05481308326125145, -0.04535830020904541, -0.03590352088212967, -0.02644873969256878, -0.01699395850300789, -0.007539177313446999, 0.0019156038761138916, 0.011370383203029633, 0.020825166255235672, 0.03027994930744171, 0.03973472863435745]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 8.0, 9.0, 4.0, 11.0, 12.0, 15.0, 17.0, 21.0, 19.0, 21.0, 29.0, 29.0, 50.0, 43.0, 43.0, 44.0, 47.0, 48.0, 52.0, 58.0, 37.0, 58.0, 39.0, 31.0, 39.0, 28.0, 31.0, 32.0, 20.0, 16.0, 14.0, 9.0, 7.0, 8.0, 13.0, 4.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0904165506362915, -0.08730985969305038, -0.08420316874980927, -0.08109647780656815, -0.07798978686332703, -0.0748831033706665, -0.07177641242742538, -0.06866972148418427, -0.06556303054094315, -0.062456339597702026, -0.05934964865446091, -0.056242961436510086, -0.05313627049326897, -0.05002957955002785, -0.046922892332077026, -0.04381620138883591, -0.04070951044559479, -0.03760281950235367, -0.03449612855911255, -0.03138944134116173, -0.02828275039792061, -0.02517605945467949, -0.02206937037408352, -0.01896268129348755, -0.01585599035024643, -0.012749300338327885, -0.00964261032640934, -0.006535920314490795, -0.0034292303025722504, -0.0003225402906537056, 0.002784149721264839, 0.005890838801860809, 0.008997529745101929, 0.012104219757020473, 0.015210909768939018, 0.01831759884953499, 0.021424289792776108, 0.024530980736017227, 0.027637669816613197, 0.030744358897209167, 0.03385104984045029, 0.036957740783691406, 0.040064431726932526, 0.04317111894488335, 0.046277809888124466, 0.049384500831365585, 0.052491188049316406, 0.055597878992557526, 0.058704569935798645, 0.061811260879039764, 0.06491795182228088, 0.068024642765522, 0.07113133370876312, 0.07423801720142365, 0.07734470814466476, 0.08045139908790588, 0.083558090031147, 0.08666478097438812, 0.08977147191762924, 0.09287816286087036, 0.09598484635353088, 0.099091537296772, 0.10219822824001312, 0.10530491918325424, 0.10841161012649536]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 8.0, 7.0, 7.0, 14.0, 9.0, 13.0, 26.0, 85.0, 2331.0, 4191427.0, 152.0, 74.0, 19.0, 10.0, 9.0, 12.0, 13.0, 3.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0007352828979492188, -0.0007142797112464905, -0.0006932765245437622, -0.0006722733378410339, -0.0006512701511383057, -0.0006302669644355774, -0.0006092637777328491, -0.0005882605910301208, -0.0005672574043273926, -0.0005462542176246643, -0.000525251030921936, -0.0005042478442192078, -0.0004832446575164795, -0.0004622414708137512, -0.00044123828411102295, -0.0004202350974082947, -0.0003992319107055664, -0.00037822872400283813, -0.00035722553730010986, -0.0003362223505973816, -0.0003152191638946533, -0.00029421597719192505, -0.0002732127904891968, -0.0002522096037864685, -0.00023120641708374023, -0.00021020323038101196, -0.0001892000436782837, -0.00016819685697555542, -0.00014719367027282715, -0.00012619048357009888, -0.0001051872968673706, -8.418411016464233e-05, -6.318092346191406e-05, -4.217773675918579e-05, -2.117455005645752e-05, -1.7136335372924805e-07, 2.0831823348999023e-05, 4.1835010051727295e-05, 6.283819675445557e-05, 8.384138345718384e-05, 0.00010484457015991211, 0.00012584775686264038, 0.00014685094356536865, 0.00016785413026809692, 0.0001888573169708252, 0.00020986050367355347, 0.00023086369037628174, 0.00025186687707901, 0.0002728700637817383, 0.00029387325048446655, 0.0003148764371871948, 0.0003358796238899231, 0.00035688281059265137, 0.00037788599729537964, 0.0003988891839981079, 0.0004198923707008362, 0.00044089555740356445, 0.0004618987441062927, 0.000482901930809021, 0.0005039051175117493, 0.0005249083042144775, 0.0005459114909172058, 0.0005669146776199341, 0.0005879178643226624, 0.0006089210510253906]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 12.0, 13.0, 9.0, 9.0, 16.0, 55.0, 129.0, 264.0, 225.0, 113.0, 31.0, 12.0, 9.0, 13.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161617279052734, -0.006907463073730469, -0.006653308868408203, -0.0063991546630859375, -0.006145000457763672, -0.005890846252441406, -0.005636692047119141, -0.005382537841796875, -0.005128383636474609, -0.004874229431152344, -0.004620075225830078, -0.0043659210205078125, -0.004111766815185547, -0.0038576126098632812, -0.0036034584045410156, -0.00334930419921875, -0.0030951499938964844, -0.0028409957885742188, -0.002586841583251953, -0.0023326873779296875, -0.002078533172607422, -0.0018243789672851562, -0.0015702247619628906, -0.001316070556640625, -0.0010619163513183594, -0.0008077621459960938, -0.0005536079406738281, -0.0002994537353515625, -4.5299530029296875e-05, 0.00020885467529296875, 0.0004630088806152344, 0.0007171630859375, 0.0009713172912597656, 0.0012254714965820312, 0.0014796257019042969, 0.0017337799072265625, 0.001987934112548828, 0.0022420883178710938, 0.0024962425231933594, 0.002750396728515625, 0.0030045509338378906, 0.0032587051391601562, 0.003512859344482422, 0.0037670135498046875, 0.004021167755126953, 0.004275321960449219, 0.004529476165771484, 0.00478363037109375, 0.005037784576416016, 0.005291938781738281, 0.005546092987060547, 0.0058002471923828125, 0.006054401397705078, 0.006308555603027344, 0.006562709808349609, 0.006816864013671875, 0.007071018218994141, 0.007325172424316406, 0.007579326629638672, 0.007833480834960938, 0.008087635040283203, 0.008341789245605469, 0.008595943450927734, 0.00885009765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 35.0, 45.0, 97.0, 128.0, 126.0, 4193410.0, 134.0, 105.0, 84.0, 53.0, 31.0, 18.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008306503295898438, -0.0008111335337162018, -0.0007916167378425598, -0.0007720999419689178, -0.0007525831460952759, -0.0007330663502216339, -0.0007135495543479919, -0.00069403275847435, -0.000674515962600708, -0.000654999166727066, -0.0006354823708534241, -0.0006159655749797821, -0.0005964487791061401, -0.0005769319832324982, -0.0005574151873588562, -0.0005378983914852142, -0.0005183815956115723, -0.0004988647997379303, -0.00047934800386428833, -0.00045983120799064636, -0.0004403144121170044, -0.0004207976162433624, -0.00040128082036972046, -0.0003817640244960785, -0.0003622472286224365, -0.00034273043274879456, -0.0003232136368751526, -0.0003036968410015106, -0.00028418004512786865, -0.0002646632492542267, -0.0002451464533805847, -0.00022562965750694275, -0.00020611286163330078, -0.0001865960657596588, -0.00016707926988601685, -0.00014756247401237488, -0.0001280456781387329, -0.00010852888226509094, -8.901208639144897e-05, -6.949529051780701e-05, -4.997849464416504e-05, -3.046169877052307e-05, -1.0944902896881104e-05, 8.571892976760864e-06, 2.8088688850402832e-05, 4.76054847240448e-05, 6.712228059768677e-05, 8.663907647132874e-05, 0.0001061558723449707, 0.00012567266821861267, 0.00014518946409225464, 0.0001647062599658966, 0.00018422305583953857, 0.00020373985171318054, 0.0002232566475868225, 0.00024277344346046448, 0.00026229023933410645, 0.0002818070352077484, 0.0003013238310813904, 0.00032084062695503235, 0.0003403574228286743, 0.0003598742187023163, 0.00037939101457595825, 0.0003989078104496002, 0.0004184246063232422]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4093.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.854534149169922e-06, -3.998167812824249e-06, -1.1418014764785767e-06, 1.714564859867096e-06, 4.5709311962127686e-06, 7.427297532558441e-06, 1.0283663868904114e-05, 1.3140030205249786e-05, 1.599639654159546e-05, 1.885276287794113e-05, 2.1709129214286804e-05, 2.4565495550632477e-05, 2.742186188697815e-05, 3.0278228223323822e-05, 3.3134594559669495e-05, 3.599096089601517e-05, 3.884732723236084e-05, 4.170369356870651e-05, 4.4560059905052185e-05, 4.741642624139786e-05, 5.027279257774353e-05, 5.31291589140892e-05, 5.5985525250434875e-05, 5.884189158678055e-05, 6.169825792312622e-05, 6.45546242594719e-05, 6.741099059581757e-05, 7.026735693216324e-05, 7.312372326850891e-05, 7.598008960485458e-05, 7.883645594120026e-05, 8.169282227754593e-05, 8.45491886138916e-05, 8.740555495023727e-05, 9.026192128658295e-05, 9.311828762292862e-05, 9.597465395927429e-05, 9.883102029561996e-05, 0.00010168738663196564, 0.00010454375296831131, 0.00010740011930465698, 0.00011025648564100266, 0.00011311285197734833, 0.000115969218313694, 0.00011882558465003967, 0.00012168195098638535, 0.00012453831732273102, 0.0001273946836590767, 0.00013025104999542236, 0.00013310741633176804, 0.0001359637826681137, 0.00013882014900445938, 0.00014167651534080505, 0.00014453288167715073, 0.0001473892480134964, 0.00015024561434984207, 0.00015310198068618774, 0.00015595834702253342, 0.0001588147133588791, 0.00016167107969522476, 0.00016452744603157043, 0.0001673838123679161, 0.00017024017870426178, 0.00017309654504060745, 0.00017595291137695312]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 980.0, 26.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007240754785016179, -0.0007026340463198721, -0.0006811925559304655, -0.0006597511237487197, -0.000638309633359313, -0.0006168682011775672, -0.0005954267689958215, -0.0005739852786064148, -0.000552543846424669, -0.0005311024142429233, -0.0005096609238535166, -0.0004882194916717708, -0.0004667780303861946, -0.00044533656910061836, -0.0004238951369188726, -0.00040245367563329637, -0.00038101221434772015, -0.0003595707530621439, -0.0003381292917765677, -0.00031668785959482193, -0.0002952463983092457, -0.0002738049370236695, -0.0002523635048419237, -0.0002309220435563475, -0.00020948058227077127, -0.00018803912098519504, -0.00016659767425153404, -0.00014515622751787305, -0.00012371476623229682, -0.00010227331222267821, -8.08318582130596e-05, -5.939041147939861e-05, -3.7948950193822384e-05, -1.6507496184203774e-05, 4.933957825414836e-06, 2.6375411835033447e-05, 4.781686584465206e-05, 6.925831985427067e-05, 9.069977386388928e-05, 0.00011214122059755027, 0.0001335826818831265, 0.00015502414316870272, 0.00017646558990236372, 0.0001979070366360247, 0.00021934849792160094, 0.00024078995920717716, 0.00026223139138892293, 0.00028367285267449915, 0.0003051143139600754, 0.0003265557752456516, 0.0003479972365312278, 0.0003694386687129736, 0.0003908801299985498, 0.00041232159128412604, 0.0004337630234658718, 0.00045520448475144804, 0.00047664594603702426, 0.00049808737821877, 0.0005195288686081767, 0.0005409703007899225, 0.0005624117329716682, 0.0005838532233610749, 0.0006052946555428207, 0.0006267360877245665, 0.0006481775781139731]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 2.0, 14.0, 27.0, 84.0, 106.0, 222.0, 159.0, 192.0, 91.0, 64.0, 13.0, 7.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014632940292358398, -0.00013832375407218933, -0.00013031810522079468, -0.00012231245636940002, -0.00011430680751800537, -0.00010630115866661072, -9.829550981521606e-05, -9.028986096382141e-05, -8.228421211242676e-05, -7.42785632610321e-05, -6.627291440963745e-05, -5.82672655582428e-05, -5.0261616706848145e-05, -4.225596785545349e-05, -3.425031900405884e-05, -2.6244670152664185e-05, -1.823902130126953e-05, -1.0233372449874878e-05, -2.2277235984802246e-06, 5.777925252914429e-06, 1.3783574104309082e-05, 2.1789222955703735e-05, 2.979487180709839e-05, 3.780052065849304e-05, 4.5806169509887695e-05, 5.381181836128235e-05, 6.1817467212677e-05, 6.982311606407166e-05, 7.782876491546631e-05, 8.583441376686096e-05, 9.384006261825562e-05, 0.00010184571146965027, 0.00010985136032104492, 0.00011785700917243958, 0.00012586265802383423, 0.00013386830687522888, 0.00014187395572662354, 0.0001498796045780182, 0.00015788525342941284, 0.0001658909022808075, 0.00017389655113220215, 0.0001819021999835968, 0.00018990784883499146, 0.0001979134976863861, 0.00020591914653778076, 0.00021392479538917542, 0.00022193044424057007, 0.00022993609309196472, 0.00023794174194335938, 0.00024594739079475403, 0.0002539530396461487, 0.00026195868849754333, 0.000269964337348938, 0.00027796998620033264, 0.0002859756350517273, 0.00029398128390312195, 0.0003019869327545166, 0.00030999258160591125, 0.0003179982304573059, 0.00032600387930870056, 0.0003340095281600952, 0.00034201517701148987, 0.0003500208258628845, 0.0003580264747142792, 0.00036603212356567383]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 7.0, 10.0, 4.0, 8.0, 9.0, 14.0, 10.0, 19.0, 35.0, 63.0, 108.0, 239.0, 488.0, 1033.0, 2908.0, 12267.0, 890052.0, 128634.0, 8578.0, 2330.0, 852.0, 402.0, 190.0, 99.0, 58.0, 26.0, 22.0, 14.0, 13.0, 10.0, 7.0, 5.0, 6.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03643798828125, -0.03539395332336426, -0.034349918365478516, -0.03330588340759277, -0.03226184844970703, -0.03121781349182129, -0.030173778533935547, -0.029129743576049805, -0.028085708618164062, -0.02704167366027832, -0.025997638702392578, -0.024953603744506836, -0.023909568786621094, -0.02286553382873535, -0.02182149887084961, -0.020777463912963867, -0.019733428955078125, -0.018689393997192383, -0.01764535903930664, -0.0166013240814209, -0.015557289123535156, -0.014513254165649414, -0.013469219207763672, -0.01242518424987793, -0.011381149291992188, -0.010337114334106445, -0.009293079376220703, -0.008249044418334961, -0.007205009460449219, -0.0061609745025634766, -0.005116939544677734, -0.004072904586791992, -0.00302886962890625, -0.001984834671020508, -0.0009407997131347656, 0.00010323524475097656, 0.0011472702026367188, 0.002191305160522461, 0.003235340118408203, 0.004279375076293945, 0.0053234100341796875, 0.00636744499206543, 0.007411479949951172, 0.008455514907836914, 0.009499549865722656, 0.010543584823608398, 0.01158761978149414, 0.012631654739379883, 0.013675689697265625, 0.014719724655151367, 0.01576375961303711, 0.01680779457092285, 0.017851829528808594, 0.018895864486694336, 0.019939899444580078, 0.02098393440246582, 0.022027969360351562, 0.023072004318237305, 0.024116039276123047, 0.02516007423400879, 0.02620410919189453, 0.027248144149780273, 0.028292179107666016, 0.029336214065551758, 0.0303802490234375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 12.0, 13.0, 9.0, 9.0, 16.0, 55.0, 129.0, 264.0, 225.0, 113.0, 31.0, 12.0, 9.0, 13.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007161617279052734, -0.006907463073730469, -0.006653308868408203, -0.0063991546630859375, -0.006145000457763672, -0.005890846252441406, -0.005636692047119141, -0.005382537841796875, -0.005128383636474609, -0.004874229431152344, -0.004620075225830078, -0.0043659210205078125, -0.004111766815185547, -0.0038576126098632812, -0.0036034584045410156, -0.00334930419921875, -0.0030951499938964844, -0.0028409957885742188, -0.002586841583251953, -0.0023326873779296875, -0.002078533172607422, -0.0018243789672851562, -0.0015702247619628906, -0.001316070556640625, -0.0010619163513183594, -0.0008077621459960938, -0.0005536079406738281, -0.0002994537353515625, -4.5299530029296875e-05, 0.00020885467529296875, 0.0004630088806152344, 0.0007171630859375, 0.0009713172912597656, 0.0012254714965820312, 0.0014796257019042969, 0.0017337799072265625, 0.001987934112548828, 0.0022420883178710938, 0.0024962425231933594, 0.002750396728515625, 0.0030045509338378906, 0.0032587051391601562, 0.003512859344482422, 0.0037670135498046875, 0.004021167755126953, 0.004275321960449219, 0.004529476165771484, 0.00478363037109375, 0.005037784576416016, 0.005291938781738281, 0.005546092987060547, 0.0058002471923828125, 0.006054401397705078, 0.006308555603027344, 0.006562709808349609, 0.006816864013671875, 0.007071018218994141, 0.007325172424316406, 0.007579326629638672, 0.007833480834960938, 0.008087635040283203, 0.008341789245605469, 0.008595943450927734, 0.00885009765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 7.0, 8.0, 12.0, 14.0, 26.0, 17.0, 28.0, 23.0, 34.0, 34.0, 56.0, 92.0, 180.0, 391.0, 876.0, 3224.0, 964860.0, 75165.0, 1939.0, 724.0, 286.0, 142.0, 70.0, 52.0, 33.0, 37.0, 24.0, 18.0, 23.0, 15.0, 24.0, 14.0, 14.0, 16.0, 9.0, 5.0, 6.0, 4.0, 6.0, 3.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0262908935546875, -0.025438547134399414, -0.024586200714111328, -0.023733854293823242, -0.022881507873535156, -0.02202916145324707, -0.021176815032958984, -0.0203244686126709, -0.019472122192382812, -0.018619775772094727, -0.01776742935180664, -0.016915082931518555, -0.01606273651123047, -0.015210390090942383, -0.014358043670654297, -0.013505697250366211, -0.012653350830078125, -0.011801004409790039, -0.010948657989501953, -0.010096311569213867, -0.009243965148925781, -0.008391618728637695, -0.007539272308349609, -0.0066869258880615234, -0.0058345794677734375, -0.0049822330474853516, -0.004129886627197266, -0.0032775402069091797, -0.0024251937866210938, -0.0015728473663330078, -0.0007205009460449219, 0.00013184547424316406, 0.00098419189453125, 0.001836538314819336, 0.002688884735107422, 0.003541231155395508, 0.004393577575683594, 0.00524592399597168, 0.006098270416259766, 0.0069506168365478516, 0.0078029632568359375, 0.008655309677124023, 0.00950765609741211, 0.010360002517700195, 0.011212348937988281, 0.012064695358276367, 0.012917041778564453, 0.013769388198852539, 0.014621734619140625, 0.015474081039428711, 0.016326427459716797, 0.017178773880004883, 0.01803112030029297, 0.018883466720581055, 0.01973581314086914, 0.020588159561157227, 0.021440505981445312, 0.0222928524017334, 0.023145198822021484, 0.02399754524230957, 0.024849891662597656, 0.025702238082885742, 0.026554584503173828, 0.027406930923461914, 0.02825927734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 7.0, 9.0, 12.0, 15.0, 25.0, 16.0, 28.0, 23.0, 31.0, 29.0, 31.0, 36.0, 40.0, 36.0, 36.0, 46.0, 42.0, 42.0, 31.0, 42.0, 29.0, 38.0, 30.0, 38.0, 30.0, 36.0, 25.0, 17.0, 24.0, 14.0, 25.0, 14.0, 16.0, 13.0, 9.0, 5.0, 6.0, 4.0, 6.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.016326904296875, -0.015796899795532227, -0.015266895294189453, -0.01473689079284668, -0.014206886291503906, -0.013676881790161133, -0.01314687728881836, -0.012616872787475586, -0.012086868286132812, -0.011556863784790039, -0.011026859283447266, -0.010496854782104492, -0.009966850280761719, -0.009436845779418945, -0.008906841278076172, -0.008376836776733398, -0.007846832275390625, -0.0073168277740478516, -0.006786823272705078, -0.006256818771362305, -0.005726814270019531, -0.005196809768676758, -0.004666805267333984, -0.004136800765991211, -0.0036067962646484375, -0.003076791763305664, -0.0025467872619628906, -0.002016782760620117, -0.0014867782592773438, -0.0009567737579345703, -0.0004267692565917969, 0.00010323524475097656, 0.00063323974609375, 0.0011632442474365234, 0.0016932487487792969, 0.0022232532501220703, 0.0027532577514648438, 0.003283262252807617, 0.0038132667541503906, 0.004343271255493164, 0.0048732757568359375, 0.005403280258178711, 0.005933284759521484, 0.006463289260864258, 0.006993293762207031, 0.007523298263549805, 0.008053302764892578, 0.008583307266235352, 0.009113311767578125, 0.009643316268920898, 0.010173320770263672, 0.010703325271606445, 0.011233329772949219, 0.011763334274291992, 0.012293338775634766, 0.012823343276977539, 0.013353347778320312, 0.013883352279663086, 0.01441335678100586, 0.014943361282348633, 0.015473365783691406, 0.01600337028503418, 0.016533374786376953, 0.017063379287719727, 0.0175933837890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 17.0, 9.0, 15.0, 18.0, 23.0, 20.0, 25.0, 32.0, 72.0, 93.0, 250.0, 414.0, 1661.0, 6416.0, 899259.0, 131110.0, 7112.0, 1013.0, 472.0, 150.0, 115.0, 45.0, 37.0, 19.0, 34.0, 16.0, 20.0, 17.0, 14.0, 6.0, 9.0, 3.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-06, -5.3942203521728516e-06, -5.185604095458984e-06, -4.976987838745117e-06, -4.76837158203125e-06, -4.559755325317383e-06, -4.351139068603516e-06, -4.1425228118896484e-06, -3.933906555175781e-06, -3.725290298461914e-06, -3.516674041748047e-06, -3.3080577850341797e-06, -3.0994415283203125e-06, -2.8908252716064453e-06, -2.682209014892578e-06, -2.473592758178711e-06, -2.2649765014648438e-06, -2.0563602447509766e-06, -1.8477439880371094e-06, -1.6391277313232422e-06, -1.430511474609375e-06, -1.2218952178955078e-06, -1.0132789611816406e-06, -8.046627044677734e-07, -5.960464477539062e-07, -3.8743019104003906e-07, -1.7881393432617188e-07, 2.9802322387695312e-08, 2.384185791015625e-07, 4.470348358154297e-07, 6.556510925292969e-07, 8.642673492431641e-07, 1.0728836059570312e-06, 1.2814998626708984e-06, 1.4901161193847656e-06, 1.6987323760986328e-06, 1.9073486328125e-06, 2.115964889526367e-06, 2.3245811462402344e-06, 2.5331974029541016e-06, 2.7418136596679688e-06, 2.950429916381836e-06, 3.159046173095703e-06, 3.3676624298095703e-06, 3.5762786865234375e-06, 3.7848949432373047e-06, 3.993511199951172e-06, 4.202127456665039e-06, 4.410743713378906e-06, 4.6193599700927734e-06, 4.827976226806641e-06, 5.036592483520508e-06, 5.245208740234375e-06, 5.453824996948242e-06, 5.662441253662109e-06, 5.8710575103759766e-06, 6.079673767089844e-06, 6.288290023803711e-06, 6.496906280517578e-06, 6.705522537231445e-06, 6.9141387939453125e-06, 7.12275505065918e-06, 7.331371307373047e-06, 7.539987564086914e-06, 7.748603820800781e-06]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 5.0, 12.0, 10.0, 10.0, 10.0, 22.0, 9.0, 10.0, 17.0, 20.0, 43.0, 30.0, 50.0, 61.0, 53.0, 50.0, 113.0, 69.0, 59.0, 54.0, 43.0, 41.0, 27.0, 24.0, 15.0, 24.0, 11.0, 16.0, 15.0, 14.0, 9.0, 15.0, 8.0, 5.0, 1.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3974647521972656e-06, -3.275461494922638e-06, -3.1534582376480103e-06, -3.0314549803733826e-06, -2.909451723098755e-06, -2.787448465824127e-06, -2.6654452085494995e-06, -2.543441951274872e-06, -2.421438694000244e-06, -2.2994354367256165e-06, -2.1774321794509888e-06, -2.055428922176361e-06, -1.9334256649017334e-06, -1.8114224076271057e-06, -1.689419150352478e-06, -1.5674158930778503e-06, -1.4454126358032227e-06, -1.323409378528595e-06, -1.2014061212539673e-06, -1.0794028639793396e-06, -9.57399606704712e-07, -8.353963494300842e-07, -7.133930921554565e-07, -5.913898348808289e-07, -4.6938657760620117e-07, -3.473833203315735e-07, -2.253800630569458e-07, -1.0337680578231812e-07, 1.862645149230957e-08, 1.4062970876693726e-07, 2.6263296604156494e-07, 3.8463622331619263e-07, 5.066394805908203e-07, 6.28642737865448e-07, 7.506459951400757e-07, 8.726492524147034e-07, 9.94652509689331e-07, 1.1166557669639587e-06, 1.2386590242385864e-06, 1.3606622815132141e-06, 1.4826655387878418e-06, 1.6046687960624695e-06, 1.7266720533370972e-06, 1.8486753106117249e-06, 1.9706785678863525e-06, 2.0926818251609802e-06, 2.214685082435608e-06, 2.3366883397102356e-06, 2.4586915969848633e-06, 2.580694854259491e-06, 2.7026981115341187e-06, 2.8247013688087463e-06, 2.946704626083374e-06, 3.0687078833580017e-06, 3.1907111406326294e-06, 3.312714397907257e-06, 3.4347176551818848e-06, 3.5567209124565125e-06, 3.67872416973114e-06, 3.800727427005768e-06, 3.9227306842803955e-06, 4.044733941555023e-06, 4.166737198829651e-06, 4.2887404561042786e-06, 4.410743713378906e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 7.0, 10.0, 13.0, 21.0, 28.0, 76.0, 225.0, 1763.0, 1044655.0, 1365.0, 213.0, 77.0, 36.0, 16.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.504753112792969e-05, -3.418140113353729e-05, -3.33152711391449e-05, -3.24491411447525e-05, -3.158301115036011e-05, -3.071688115596771e-05, -2.9850751161575317e-05, -2.8984621167182922e-05, -2.8118491172790527e-05, -2.7252361178398132e-05, -2.6386231184005737e-05, -2.5520101189613342e-05, -2.4653971195220947e-05, -2.3787841200828552e-05, -2.2921711206436157e-05, -2.2055581212043762e-05, -2.1189451217651367e-05, -2.0323321223258972e-05, -1.9457191228866577e-05, -1.8591061234474182e-05, -1.7724931240081787e-05, -1.6858801245689392e-05, -1.5992671251296997e-05, -1.5126541256904602e-05, -1.4260411262512207e-05, -1.3394281268119812e-05, -1.2528151273727417e-05, -1.1662021279335022e-05, -1.0795891284942627e-05, -9.929761290550232e-06, -9.063631296157837e-06, -8.197501301765442e-06, -7.331371307373047e-06, -6.465241312980652e-06, -5.599111318588257e-06, -4.732981324195862e-06, -3.866851329803467e-06, -3.0007213354110718e-06, -2.1345913410186768e-06, -1.2684613466262817e-06, -4.023313522338867e-07, 4.637986421585083e-07, 1.3299286365509033e-06, 2.1960586309432983e-06, 3.0621886253356934e-06, 3.928318619728088e-06, 4.794448614120483e-06, 5.660578608512878e-06, 6.5267086029052734e-06, 7.3928385972976685e-06, 8.258968591690063e-06, 9.125098586082458e-06, 9.991228580474854e-06, 1.0857358574867249e-05, 1.1723488569259644e-05, 1.2589618563652039e-05, 1.3455748558044434e-05, 1.4321878552436829e-05, 1.5188008546829224e-05, 1.605413854122162e-05, 1.6920268535614014e-05, 1.778639853000641e-05, 1.8652528524398804e-05, 1.95186585187912e-05, 2.0384788513183594e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 7.0, 7.0, 11.0, 20.0, 20.0, 23.0, 58.0, 84.0, 523.0, 93.0, 52.0, 27.0, 19.0, 14.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1696090698242188e-05, -2.1158717572689056e-05, -2.0621344447135925e-05, -2.0083971321582794e-05, -1.9546598196029663e-05, -1.9009225070476532e-05, -1.84718519449234e-05, -1.793447881937027e-05, -1.739710569381714e-05, -1.6859732568264008e-05, -1.6322359442710876e-05, -1.5784986317157745e-05, -1.5247613191604614e-05, -1.4710240066051483e-05, -1.4172866940498352e-05, -1.3635493814945221e-05, -1.309812068939209e-05, -1.2560747563838959e-05, -1.2023374438285828e-05, -1.1486001312732697e-05, -1.0948628187179565e-05, -1.0411255061626434e-05, -9.873881936073303e-06, -9.336508810520172e-06, -8.799135684967041e-06, -8.26176255941391e-06, -7.724389433860779e-06, -7.187016308307648e-06, -6.649643182754517e-06, -6.1122700572013855e-06, -5.574896931648254e-06, -5.037523806095123e-06, -4.500150680541992e-06, -3.962777554988861e-06, -3.42540442943573e-06, -2.888031303882599e-06, -2.3506581783294678e-06, -1.8132850527763367e-06, -1.2759119272232056e-06, -7.385388016700745e-07, -2.0116567611694336e-07, 3.3620744943618774e-07, 8.735805749893188e-07, 1.41095370054245e-06, 1.948326826095581e-06, 2.485699951648712e-06, 3.0230730772018433e-06, 3.5604462027549744e-06, 4.0978193283081055e-06, 4.6351924538612366e-06, 5.172565579414368e-06, 5.709938704967499e-06, 6.24731183052063e-06, 6.784684956073761e-06, 7.322058081626892e-06, 7.859431207180023e-06, 8.396804332733154e-06, 8.934177458286285e-06, 9.471550583839417e-06, 1.0008923709392548e-05, 1.0546296834945679e-05, 1.108366996049881e-05, 1.1621043086051941e-05, 1.2158416211605072e-05, 1.2695789337158203e-05]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 14.0, 83.0, 830.0, 83.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06314918398857117, -0.057644203305244446, -0.052139222621917725, -0.046634241938591, -0.04112926125526428, -0.03562428057193756, -0.03011929616332054, -0.02461431547999382, -0.0191093347966671, -0.013604354113340378, -0.008099372498691082, -0.002594390884041786, 0.002910589799284935, 0.008415570482611656, 0.013920553028583527, 0.019425533711910248, 0.02493051439523697, 0.03043549507856369, 0.03594047576189041, 0.04144545644521713, 0.046950437128543854, 0.052455417811870575, 0.057960402220487595, 0.06346538662910461, 0.06897036731243134, 0.07447534799575806, 0.07998032867908478, 0.0854853093624115, 0.09099029004573822, 0.09649527072906494, 0.10200025141239166, 0.10750523209571838, 0.1130102127790451, 0.11851519346237183, 0.12402017414569855, 0.12952515482902527, 0.135030135512352, 0.1405351161956787, 0.14604009687900543, 0.15154507756233215, 0.15705005824565887, 0.1625550389289856, 0.16806001961231232, 0.17356500029563904, 0.17906998097896576, 0.18457496166229248, 0.1900799423456192, 0.19558492302894592, 0.20108991861343384, 0.20659489929676056, 0.21209987998008728, 0.217604860663414, 0.22310984134674072, 0.22861482203006744, 0.23411980271339417, 0.2396247833967209, 0.2451297640800476, 0.2506347596645355, 0.25613972544670105, 0.26164472103118896, 0.2671496868133545, 0.2726546823978424, 0.27815964818000793, 0.28366464376449585, 0.2891696095466614]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 8.0, 13.0, 12.0, 8.0, 26.0, 27.0, 15.0, 29.0, 29.0, 38.0, 47.0, 56.0, 59.0, 69.0, 65.0, 61.0, 62.0, 51.0, 49.0, 52.0, 33.0, 32.0, 26.0, 23.0, 24.0, 10.0, 15.0, 17.0, 7.0, 11.0, 4.0, 10.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10185462236404419, -0.09835190325975418, -0.09484918415546417, -0.09134646505117416, -0.08784374594688416, -0.08434103429317474, -0.08083831518888474, -0.07733559608459473, -0.07383287698030472, -0.07033015787601471, -0.0668274387717247, -0.06332471966743469, -0.05982200428843498, -0.056319285184144974, -0.052816569805145264, -0.049313850700855255, -0.04581113159656525, -0.04230841249227524, -0.03880569338798523, -0.03530297800898552, -0.03180025890469551, -0.028297539800405502, -0.024794822558760643, -0.021292105317115784, -0.017789386212825775, -0.014286668039858341, -0.010783949866890907, -0.007281231693923473, -0.0037785135209560394, -0.0002757944166660309, 0.0032269228249788284, 0.006729640066623688, 0.010232359170913696, 0.01373507734388113, 0.017237795516848564, 0.020740512758493423, 0.024243231862783432, 0.02774595096707344, 0.0312486682087183, 0.03475138545036316, 0.03825410455465317, 0.041756823658943176, 0.045259542763233185, 0.048762258142232895, 0.0522649772465229, 0.05576769635081291, 0.05927041172981262, 0.06277313083410263, 0.06627584993839264, 0.06977856904268265, 0.07328128814697266, 0.07678400725126266, 0.08028672635555267, 0.08378943800926208, 0.0872921571135521, 0.0907948762178421, 0.09429759532213211, 0.09780031442642212, 0.10130303353071213, 0.10480575263500214, 0.10830846428871155, 0.11181119084358215, 0.11531390249729156, 0.11881662160158157, 0.12231934070587158]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 7.0, 5.0, 1.0, 4.0, 2.0, 9.0, 9.0, 12.0, 10.0, 7.0, 15.0, 24.0, 18.0, 11.0, 15.0, 17.0, 19.0, 20.0, 37.0, 38.0, 51.0, 71.0, 100.0, 118.0, 228.0, 767.0, 4187432.0, 3638.0, 793.0, 286.0, 116.0, 67.0, 52.0, 71.0, 39.0, 20.0, 20.0, 18.0, 22.0, 12.0, 7.0, 5.0, 9.0, 6.0, 11.0, 8.0, 8.0, 11.0, 4.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 5.0], "bins": [-0.0014867782592773438, -0.001444116234779358, -0.001401454210281372, -0.0013587921857833862, -0.0013161301612854004, -0.0012734681367874146, -0.0012308061122894287, -0.0011881440877914429, -0.001145482063293457, -0.0011028200387954712, -0.0010601580142974854, -0.0010174959897994995, -0.0009748339653015137, -0.0009321719408035278, -0.000889509916305542, -0.0008468478918075562, -0.0008041858673095703, -0.0007615238428115845, -0.0007188618183135986, -0.0006761997938156128, -0.000633537769317627, -0.0005908757448196411, -0.0005482137203216553, -0.0005055516958236694, -0.0004628896713256836, -0.00042022764682769775, -0.0003775656223297119, -0.0003349035978317261, -0.00029224157333374023, -0.0002495795488357544, -0.00020691752433776855, -0.00016425549983978271, -0.00012159347534179688, -7.893145084381104e-05, -3.6269426345825195e-05, 6.3925981521606445e-06, 4.9054622650146484e-05, 9.171664714813232e-05, 0.00013437867164611816, 0.000177040696144104, 0.00021970272064208984, 0.0002623647451400757, 0.0003050267696380615, 0.00034768879413604736, 0.0003903508186340332, 0.00043301284313201904, 0.0004756748676300049, 0.0005183368921279907, 0.0005609989166259766, 0.0006036609411239624, 0.0006463229656219482, 0.0006889849901199341, 0.0007316470146179199, 0.0007743090391159058, 0.0008169710636138916, 0.0008596330881118774, 0.0009022951126098633, 0.0009449571371078491, 0.000987619161605835, 0.0010302811861038208, 0.0010729432106018066, 0.0011156052350997925, 0.0011582672595977783, 0.0012009292840957642, 0.00124359130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 16.0, 8.0, 9.0, 16.0, 45.0, 123.0, 269.0, 220.0, 118.0, 42.0, 12.0, 10.0, 11.0, 11.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 7.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162570953369141, -0.006909370422363281, -0.006656169891357422, -0.0064029693603515625, -0.006149768829345703, -0.005896568298339844, -0.005643367767333984, -0.005390167236328125, -0.005136966705322266, -0.004883766174316406, -0.004630565643310547, -0.0043773651123046875, -0.004124164581298828, -0.0038709640502929688, -0.0036177635192871094, -0.00336456298828125, -0.0031113624572753906, -0.0028581619262695312, -0.002604961395263672, -0.0023517608642578125, -0.002098560333251953, -0.0018453598022460938, -0.0015921592712402344, -0.001338958740234375, -0.0010857582092285156, -0.0008325576782226562, -0.0005793571472167969, -0.0003261566162109375, -7.295608520507812e-05, 0.00018024444580078125, 0.0004334449768066406, 0.0006866455078125, 0.0009398460388183594, 0.0011930465698242188, 0.0014462471008300781, 0.0016994476318359375, 0.0019526481628417969, 0.0022058486938476562, 0.0024590492248535156, 0.002712249755859375, 0.0029654502868652344, 0.0032186508178710938, 0.003471851348876953, 0.0037250518798828125, 0.003978252410888672, 0.004231452941894531, 0.004484653472900391, 0.00473785400390625, 0.004991054534912109, 0.005244255065917969, 0.005497455596923828, 0.0057506561279296875, 0.006003856658935547, 0.006257057189941406, 0.006510257720947266, 0.006763458251953125, 0.007016658782958984, 0.007269859313964844, 0.007523059844970703, 0.0077762603759765625, 0.008029460906982422, 0.008282661437988281, 0.00853586196899414, 0.0087890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 19.0, 37.0, 66.0, 91.0, 136.0, 367.0, 1787.0, 4189489.0, 1623.0, 336.0, 129.0, 82.0, 50.0, 35.0, 22.0, 9.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0015964508056640625, -0.0015613436698913574, -0.0015262365341186523, -0.0014911293983459473, -0.0014560222625732422, -0.0014209151268005371, -0.001385807991027832, -0.001350700855255127, -0.0013155937194824219, -0.0012804865837097168, -0.0012453794479370117, -0.0012102723121643066, -0.0011751651763916016, -0.0011400580406188965, -0.0011049509048461914, -0.0010698437690734863, -0.0010347366333007812, -0.0009996294975280762, -0.0009645223617553711, -0.000929415225982666, -0.0008943080902099609, -0.0008592009544372559, -0.0008240938186645508, -0.0007889866828918457, -0.0007538795471191406, -0.0007187724113464355, -0.0006836652755737305, -0.0006485581398010254, -0.0006134510040283203, -0.0005783438682556152, -0.0005432367324829102, -0.0005081295967102051, -0.0004730224609375, -0.0004379153251647949, -0.00040280818939208984, -0.00036770105361938477, -0.0003325939178466797, -0.0002974867820739746, -0.00026237964630126953, -0.00022727251052856445, -0.00019216537475585938, -0.0001570582389831543, -0.00012195110321044922, -8.684396743774414e-05, -5.173683166503906e-05, -1.6629695892333984e-05, 1.8477439880371094e-05, 5.358457565307617e-05, 8.869171142578125e-05, 0.00012379884719848633, 0.0001589059829711914, 0.00019401311874389648, 0.00022912025451660156, 0.00026422739028930664, 0.0002993345260620117, 0.0003344416618347168, 0.0003695487976074219, 0.00040465593338012695, 0.00043976306915283203, 0.0004748702049255371, 0.0005099773406982422, 0.0005450844764709473, 0.0005801916122436523, 0.0006152987480163574, 0.0006504058837890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4048.0, 24.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020301342010498047, -0.00019025243818759918, -0.0001774914562702179, -0.0001647304743528366, -0.00015196949243545532, -0.00013920851051807404, -0.00012644752860069275, -0.00011368654668331146, -0.00010092556476593018, -8.816458284854889e-05, -7.54036009311676e-05, -6.264261901378632e-05, -4.988163709640503e-05, -3.712065517902374e-05, -2.4359673261642456e-05, -1.159869134426117e-05, 1.1622905731201172e-06, 1.3923272490501404e-05, 2.668425440788269e-05, 3.944523632526398e-05, 5.2206218242645264e-05, 6.496720016002655e-05, 7.772818207740784e-05, 9.048916399478912e-05, 0.00010325014591217041, 0.0001160111278295517, 0.00012877210974693298, 0.00014153309166431427, 0.00015429407358169556, 0.00016705505549907684, 0.00017981603741645813, 0.00019257701933383942, 0.0002053380012512207, 0.000218098983168602, 0.00023085996508598328, 0.00024362094700336456, 0.00025638192892074585, 0.00026914291083812714, 0.0002819038927555084, 0.0002946648746728897, 0.000307425856590271, 0.0003201868385076523, 0.00033294782042503357, 0.00034570880234241486, 0.00035846978425979614, 0.00037123076617717743, 0.0003839917480945587, 0.00039675273001194, 0.0004095137119293213, 0.0004222746938467026, 0.00043503567576408386, 0.00044779665768146515, 0.00046055763959884644, 0.0004733186215162277, 0.000486079603433609, 0.0004988405853509903, 0.0005116015672683716, 0.0005243625491857529, 0.0005371235311031342, 0.0005498845130205154, 0.0005626454949378967, 0.000575406476855278, 0.0005881674587726593, 0.0006009284406900406, 0.0006136894226074219]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 244.0, 733.0, 22.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001141307526268065, -0.0011142055736854672, -0.0010871035046875477, -0.00106000155210495, -0.0010328995995223522, -0.0010057975305244327, -0.000978695577941835, -0.0009515935671515763, -0.0009244915563613176, -0.000897389545571059, -0.0008702875347808003, -0.0008431855821982026, -0.000816083571407944, -0.0007889815606176853, -0.0007618796080350876, -0.0007347775972448289, -0.0007076755864545703, -0.0006805735756643116, -0.000653471564874053, -0.0006263696122914553, -0.0005992676015011966, -0.000572165590710938, -0.0005450636381283402, -0.0005179616273380816, -0.000490859616547823, -0.0004637576057575643, -0.0004366556240711361, -0.00040955364238470793, -0.0003824516315944493, -0.00035534962080419064, -0.00032824763911776245, -0.00030114565743133426, -0.0002740435884334147, -0.00024694157764315605, -0.00021983959595672786, -0.00019273759971838444, -0.00016563560348004103, -0.0001385336072416976, -0.00011143161100335419, -8.432961476501077e-05, -5.7227618526667356e-05, -3.012562228832394e-05, -3.023626049980521e-06, 2.4078370188362896e-05, 5.1180366426706314e-05, 7.828236266504973e-05, 0.00010538435890339315, 0.00013248635514173657, 0.00015958835138007998, 0.0001866903476184234, 0.00021379234385676682, 0.00024089434009511024, 0.00026799633633345366, 0.0002950983471237123, 0.0003222003288101405, 0.0003493023104965687, 0.0003764043212868273, 0.00040350633207708597, 0.00043060831376351416, 0.00045771029544994235, 0.000484812306240201, 0.0005119143170304596, 0.0005390163278207183, 0.000566118280403316, 0.0005932202911935747]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 5.0, 10.0, 27.0, 46.0, 66.0, 114.0, 153.0, 161.0, 126.0, 117.0, 77.0, 47.0, 26.0, 13.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0013595819473266602, -0.0013292189687490463, -0.0012988559901714325, -0.0012684930115938187, -0.0012381300330162048, -0.001207767054438591, -0.0011774040758609772, -0.0011470410972833633, -0.0011166781187057495, -0.0010863151401281357, -0.0010559521615505219, -0.001025589182972908, -0.0009952262043952942, -0.0009648632258176804, -0.0009345002472400665, -0.0009041372686624527, -0.0008737742900848389, -0.000843411311507225, -0.0008130483329296112, -0.0007826853543519974, -0.0007523223757743835, -0.0007219593971967697, -0.0006915964186191559, -0.000661233440041542, -0.0006308704614639282, -0.0006005074828863144, -0.0005701445043087006, -0.0005397815257310867, -0.0005094185471534729, -0.00047905556857585907, -0.00044869258999824524, -0.0004183296114206314, -0.0003879666328430176, -0.00035760365426540375, -0.0003272406756877899, -0.0002968776971101761, -0.00026651471853256226, -0.00023615173995494843, -0.0002057887613773346, -0.00017542578279972076, -0.00014506280422210693, -0.0001146998256444931, -8.433684706687927e-05, -5.397386848926544e-05, -2.361088991165161e-05, 6.752088665962219e-06, 3.711506724357605e-05, 6.747804582118988e-05, 9.784102439880371e-05, 0.00012820400297641754, 0.00015856698155403137, 0.0001889299601316452, 0.00021929293870925903, 0.00024965591728687286, 0.0002800188958644867, 0.0003103818744421005, 0.00034074485301971436, 0.0003711078315973282, 0.000401470810174942, 0.00043183378875255585, 0.0004621967673301697, 0.0004925597459077835, 0.0005229227244853973, 0.0005532857030630112, 0.000583648681640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 10.0, 13.0, 7.0, 10.0, 21.0, 23.0, 23.0, 47.0, 57.0, 57.0, 109.0, 164.0, 309.0, 458.0, 874.0, 1733.0, 3964.0, 11264.0, 80638.0, 914859.0, 22315.0, 6302.0, 2517.0, 1164.0, 628.0, 319.0, 184.0, 135.0, 80.0, 51.0, 38.0, 34.0, 19.0, 24.0, 27.0, 11.0, 9.0, 9.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.01837158203125, -0.01774311065673828, -0.017114639282226562, -0.016486167907714844, -0.015857696533203125, -0.015229225158691406, -0.014600753784179688, -0.013972282409667969, -0.01334381103515625, -0.012715339660644531, -0.012086868286132812, -0.011458396911621094, -0.010829925537109375, -0.010201454162597656, -0.009572982788085938, -0.008944511413574219, -0.0083160400390625, -0.007687568664550781, -0.0070590972900390625, -0.006430625915527344, -0.005802154541015625, -0.005173683166503906, -0.0045452117919921875, -0.003916740417480469, -0.00328826904296875, -0.0026597976684570312, -0.0020313262939453125, -0.0014028549194335938, -0.000774383544921875, -0.00014591217041015625, 0.0004825592041015625, 0.0011110305786132812, 0.001739501953125, 0.0023679733276367188, 0.0029964447021484375, 0.0036249160766601562, 0.004253387451171875, 0.004881858825683594, 0.0055103302001953125, 0.006138801574707031, 0.00676727294921875, 0.007395744323730469, 0.008024215698242188, 0.008652687072753906, 0.009281158447265625, 0.009909629821777344, 0.010538101196289062, 0.011166572570800781, 0.0117950439453125, 0.012423515319824219, 0.013051986694335938, 0.013680458068847656, 0.014308929443359375, 0.014937400817871094, 0.015565872192382812, 0.01619434356689453, 0.01682281494140625, 0.01745128631591797, 0.018079757690429688, 0.018708229064941406, 0.019336700439453125, 0.019965171813964844, 0.020593643188476562, 0.02122211456298828, 0.0218505859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 16.0, 8.0, 9.0, 16.0, 45.0, 123.0, 269.0, 220.0, 118.0, 42.0, 11.0, 11.0, 11.0, 11.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 7.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162570953369141, -0.006909370422363281, -0.006656169891357422, -0.0064029693603515625, -0.006149768829345703, -0.005896568298339844, -0.005643367767333984, -0.005390167236328125, -0.005136966705322266, -0.004883766174316406, -0.004630565643310547, -0.0043773651123046875, -0.004124164581298828, -0.0038709640502929688, -0.0036177635192871094, -0.00336456298828125, -0.0031113624572753906, -0.0028581619262695312, -0.002604961395263672, -0.0023517608642578125, -0.002098560333251953, -0.0018453598022460938, -0.0015921592712402344, -0.001338958740234375, -0.0010857582092285156, -0.0008325576782226562, -0.0005793571472167969, -0.0003261566162109375, -7.295608520507812e-05, 0.00018024444580078125, 0.0004334449768066406, 0.0006866455078125, 0.0009398460388183594, 0.0011930465698242188, 0.0014462471008300781, 0.0016994476318359375, 0.0019526481628417969, 0.0022058486938476562, 0.0024590492248535156, 0.002712249755859375, 0.0029654502868652344, 0.0032186508178710938, 0.003471851348876953, 0.0037250518798828125, 0.003978252410888672, 0.004231452941894531, 0.004484653472900391, 0.00473785400390625, 0.004991054534912109, 0.005244255065917969, 0.005497455596923828, 0.0057506561279296875, 0.006003856658935547, 0.006257057189941406, 0.006510257720947266, 0.006763458251953125, 0.007016658782958984, 0.007269859313964844, 0.007523059844970703, 0.0077762603759765625, 0.008029460906982422, 0.008282661437988281, 0.00853586196899414, 0.0087890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 17.0, 18.0, 9.0, 19.0, 24.0, 27.0, 21.0, 44.0, 38.0, 69.0, 140.0, 282.0, 709.0, 2291.0, 597852.0, 443244.0, 2288.0, 678.0, 281.0, 129.0, 86.0, 53.0, 33.0, 31.0, 27.0, 22.0, 14.0, 14.0, 15.0, 9.0, 5.0, 8.0, 4.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030914306640625, -0.029848098754882812, -0.028781890869140625, -0.027715682983398438, -0.02664947509765625, -0.025583267211914062, -0.024517059326171875, -0.023450851440429688, -0.0223846435546875, -0.021318435668945312, -0.020252227783203125, -0.019186019897460938, -0.01811981201171875, -0.017053604125976562, -0.015987396240234375, -0.014921188354492188, -0.01385498046875, -0.012788772583007812, -0.011722564697265625, -0.010656356811523438, -0.00959014892578125, -0.008523941040039062, -0.007457733154296875, -0.0063915252685546875, -0.0053253173828125, -0.0042591094970703125, -0.003192901611328125, -0.0021266937255859375, -0.00106048583984375, 5.7220458984375e-06, 0.001071929931640625, 0.0021381378173828125, 0.003204345703125, 0.0042705535888671875, 0.005336761474609375, 0.0064029693603515625, 0.00746917724609375, 0.008535385131835938, 0.009601593017578125, 0.010667800903320312, 0.0117340087890625, 0.012800216674804688, 0.013866424560546875, 0.014932632446289062, 0.01599884033203125, 0.017065048217773438, 0.018131256103515625, 0.019197463989257812, 0.020263671875, 0.021329879760742188, 0.022396087646484375, 0.023462295532226562, 0.02452850341796875, 0.025594711303710938, 0.026660919189453125, 0.027727127075195312, 0.0287933349609375, 0.029859542846679688, 0.030925750732421875, 0.03199195861816406, 0.03305816650390625, 0.03412437438964844, 0.035190582275390625, 0.03625679016113281, 0.037322998046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 10.0, 17.0, 18.0, 10.0, 18.0, 24.0, 28.0, 19.0, 39.0, 28.0, 31.0, 35.0, 42.0, 52.0, 51.0, 55.0, 59.0, 43.0, 39.0, 39.0, 40.0, 44.0, 40.0, 31.0, 30.0, 25.0, 23.0, 15.0, 13.0, 14.0, 10.0, 5.0, 8.0, 4.0, 5.0, 9.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0173187255859375, -0.016721248626708984, -0.01612377166748047, -0.015526294708251953, -0.014928817749023438, -0.014331340789794922, -0.013733863830566406, -0.01313638687133789, -0.012538909912109375, -0.01194143295288086, -0.011343955993652344, -0.010746479034423828, -0.010149002075195312, -0.009551525115966797, -0.008954048156738281, -0.008356571197509766, -0.00775909423828125, -0.007161617279052734, -0.006564140319824219, -0.005966663360595703, -0.0053691864013671875, -0.004771709442138672, -0.004174232482910156, -0.0035767555236816406, -0.002979278564453125, -0.0023818016052246094, -0.0017843246459960938, -0.0011868476867675781, -0.0005893707275390625, 8.106231689453125e-06, 0.0006055831909179688, 0.0012030601501464844, 0.001800537109375, 0.0023980140686035156, 0.0029954910278320312, 0.003592967987060547, 0.0041904449462890625, 0.004787921905517578, 0.005385398864746094, 0.005982875823974609, 0.006580352783203125, 0.007177829742431641, 0.007775306701660156, 0.008372783660888672, 0.008970260620117188, 0.009567737579345703, 0.010165214538574219, 0.010762691497802734, 0.01136016845703125, 0.011957645416259766, 0.012555122375488281, 0.013152599334716797, 0.013750076293945312, 0.014347553253173828, 0.014945030212402344, 0.01554250717163086, 0.016139984130859375, 0.01673746109008789, 0.017334938049316406, 0.017932415008544922, 0.018529891967773438, 0.019127368927001953, 0.01972484588623047, 0.020322322845458984, 0.0209197998046875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 11.0, 17.0, 14.0, 20.0, 46.0, 61.0, 111.0, 227.0, 531.0, 2243.0, 34725.0, 998807.0, 9618.0, 1303.0, 401.0, 156.0, 87.0, 54.0, 28.0, 22.0, 12.0, 14.0, 8.0, 5.0, 5.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1458061635494232e-05, -1.111440360546112e-05, -1.0770745575428009e-05, -1.0427087545394897e-05, -1.0083429515361786e-05, -9.739771485328674e-06, -9.396113455295563e-06, -9.052455425262451e-06, -8.70879739522934e-06, -8.365139365196228e-06, -8.021481335163116e-06, -7.677823305130005e-06, -7.334165275096893e-06, -6.990507245063782e-06, -6.64684921503067e-06, -6.303191184997559e-06, -5.959533154964447e-06, -5.6158751249313354e-06, -5.272217094898224e-06, -4.928559064865112e-06, -4.584901034832001e-06, -4.241243004798889e-06, -3.897584974765778e-06, -3.553926944732666e-06, -3.2102689146995544e-06, -2.866610884666443e-06, -2.5229528546333313e-06, -2.1792948246002197e-06, -1.8356367945671082e-06, -1.4919787645339966e-06, -1.148320734500885e-06, -8.046627044677734e-07, -4.6100467443466187e-07, -1.1734664440155029e-07, 2.2631138563156128e-07, 5.699694156646729e-07, 9.136274456977844e-07, 1.257285475730896e-06, 1.6009435057640076e-06, 1.944601535797119e-06, 2.2882595658302307e-06, 2.6319175958633423e-06, 2.975575625896454e-06, 3.3192336559295654e-06, 3.662891685962677e-06, 4.0065497159957886e-06, 4.3502077460289e-06, 4.693865776062012e-06, 5.037523806095123e-06, 5.381181836128235e-06, 5.7248398661613464e-06, 6.068497896194458e-06, 6.41215592622757e-06, 6.755813956260681e-06, 7.099471986293793e-06, 7.443130016326904e-06, 7.786788046360016e-06, 8.130446076393127e-06, 8.474104106426239e-06, 8.81776213645935e-06, 9.161420166492462e-06, 9.505078196525574e-06, 9.848736226558685e-06, 1.0192394256591797e-05]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 10.0, 10.0, 19.0, 19.0, 29.0, 38.0, 61.0, 53.0, 107.0, 91.0, 141.0, 112.0, 69.0, 56.0, 39.0, 28.0, 31.0, 16.0, 18.0, 7.0, 11.0, 4.0, 4.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.318092346191406e-06, -6.1336904764175415e-06, -5.949288606643677e-06, -5.764886736869812e-06, -5.580484867095947e-06, -5.3960829973220825e-06, -5.211681127548218e-06, -5.027279257774353e-06, -4.842877388000488e-06, -4.6584755182266235e-06, -4.474073648452759e-06, -4.289671778678894e-06, -4.105269908905029e-06, -3.9208680391311646e-06, -3.7364661693573e-06, -3.552064299583435e-06, -3.3676624298095703e-06, -3.1832605600357056e-06, -2.998858690261841e-06, -2.814456820487976e-06, -2.6300549507141113e-06, -2.4456530809402466e-06, -2.261251211166382e-06, -2.076849341392517e-06, -1.8924474716186523e-06, -1.7080456018447876e-06, -1.5236437320709229e-06, -1.339241862297058e-06, -1.1548399925231934e-06, -9.704381227493286e-07, -7.860362529754639e-07, -6.016343832015991e-07, -4.172325134277344e-07, -2.3283064365386963e-07, -4.842877388000488e-08, 1.3597309589385986e-07, 3.203749656677246e-07, 5.047768354415894e-07, 6.891787052154541e-07, 8.735805749893188e-07, 1.0579824447631836e-06, 1.2423843145370483e-06, 1.426786184310913e-06, 1.6111880540847778e-06, 1.7955899238586426e-06, 1.9799917936325073e-06, 2.164393663406372e-06, 2.348795533180237e-06, 2.5331974029541016e-06, 2.7175992727279663e-06, 2.902001142501831e-06, 3.086403012275696e-06, 3.2708048820495605e-06, 3.4552067518234253e-06, 3.63960862159729e-06, 3.824010491371155e-06, 4.0084123611450195e-06, 4.192814230918884e-06, 4.377216100692749e-06, 4.561617970466614e-06, 4.7460198402404785e-06, 4.930421710014343e-06, 5.114823579788208e-06, 5.299225449562073e-06, 5.4836273193359375e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 19.0, 26.0, 35.0, 80.0, 186.0, 880.0, 1032242.0, 14260.0, 490.0, 125.0, 72.0, 31.0, 33.0, 18.0, 12.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.2961368560791016e-05, -3.206636756658554e-05, -3.1171366572380066e-05, -3.027636557817459e-05, -2.9381364583969116e-05, -2.848636358976364e-05, -2.7591362595558167e-05, -2.669636160135269e-05, -2.5801360607147217e-05, -2.4906359612941742e-05, -2.4011358618736267e-05, -2.3116357624530792e-05, -2.2221356630325317e-05, -2.1326355636119843e-05, -2.0431354641914368e-05, -1.9536353647708893e-05, -1.8641352653503418e-05, -1.7746351659297943e-05, -1.6851350665092468e-05, -1.5956349670886993e-05, -1.5061348676681519e-05, -1.4166347682476044e-05, -1.3271346688270569e-05, -1.2376345694065094e-05, -1.1481344699859619e-05, -1.0586343705654144e-05, -9.69134271144867e-06, -8.796341717243195e-06, -7.90134072303772e-06, -7.006339728832245e-06, -6.11133873462677e-06, -5.216337740421295e-06, -4.32133674621582e-06, -3.4263357520103455e-06, -2.5313347578048706e-06, -1.6363337635993958e-06, -7.413327693939209e-07, 1.5366822481155396e-07, 1.0486692190170288e-06, 1.9436702132225037e-06, 2.8386712074279785e-06, 3.7336722016334534e-06, 4.628673195838928e-06, 5.523674190044403e-06, 6.418675184249878e-06, 7.313676178455353e-06, 8.208677172660828e-06, 9.103678166866302e-06, 9.998679161071777e-06, 1.0893680155277252e-05, 1.1788681149482727e-05, 1.2683682143688202e-05, 1.3578683137893677e-05, 1.4473684132099152e-05, 1.5368685126304626e-05, 1.62636861205101e-05, 1.7158687114715576e-05, 1.805368810892105e-05, 1.8948689103126526e-05, 1.9843690097332e-05, 2.0738691091537476e-05, 2.163369208574295e-05, 2.2528693079948425e-05, 2.34236940741539e-05, 2.4318695068359375e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 12.0, 14.0, 17.0, 31.0, 52.0, 67.0, 507.0, 72.0, 66.0, 32.0, 31.0, 19.0, 22.0, 11.0, 10.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.8537044525146484e-05, -1.8034130334854126e-05, -1.7531216144561768e-05, -1.702830195426941e-05, -1.652538776397705e-05, -1.6022473573684692e-05, -1.5519559383392334e-05, -1.5016645193099976e-05, -1.4513731002807617e-05, -1.4010816812515259e-05, -1.35079026222229e-05, -1.3004988431930542e-05, -1.2502074241638184e-05, -1.1999160051345825e-05, -1.1496245861053467e-05, -1.0993331670761108e-05, -1.049041748046875e-05, -9.987503290176392e-06, -9.484589099884033e-06, -8.981674909591675e-06, -8.478760719299316e-06, -7.975846529006958e-06, -7.4729323387146e-06, -6.970018148422241e-06, -6.467103958129883e-06, -5.964189767837524e-06, -5.461275577545166e-06, -4.958361387252808e-06, -4.455447196960449e-06, -3.952533006668091e-06, -3.4496188163757324e-06, -2.946704626083374e-06, -2.4437904357910156e-06, -1.9408762454986572e-06, -1.4379620552062988e-06, -9.350478649139404e-07, -4.3213367462158203e-07, 7.078051567077637e-08, 5.736947059631348e-07, 1.0766088962554932e-06, 1.5795230865478516e-06, 2.08243727684021e-06, 2.5853514671325684e-06, 3.0882656574249268e-06, 3.591179847717285e-06, 4.0940940380096436e-06, 4.597008228302002e-06, 5.09992241859436e-06, 5.602836608886719e-06, 6.105750799179077e-06, 6.6086649894714355e-06, 7.111579179763794e-06, 7.614493370056152e-06, 8.11740756034851e-06, 8.620321750640869e-06, 9.123235940933228e-06, 9.626150131225586e-06, 1.0129064321517944e-05, 1.0631978511810303e-05, 1.1134892702102661e-05, 1.163780689239502e-05, 1.2140721082687378e-05, 1.2643635272979736e-05, 1.3146549463272095e-05, 1.3649463653564453e-05]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 28.0, 133.0, 690.0, 120.0, 24.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10095751285552979, -0.09785737842321396, -0.09475723654031754, -0.09165710210800171, -0.08855696022510529, -0.08545682579278946, -0.08235669136047363, -0.07925654947757721, -0.07615640759468079, -0.07305627316236496, -0.06995613127946854, -0.06685599684715271, -0.06375585496425629, -0.06065572053194046, -0.057555582374334335, -0.05445544421672821, -0.051355309784412384, -0.04825517162680626, -0.045155033469200134, -0.04205489903688431, -0.038954757153987885, -0.03585462272167206, -0.03275448456406593, -0.02965434640645981, -0.026554208248853683, -0.02345407009124756, -0.020353931933641434, -0.017253795638680458, -0.014153657481074333, -0.011053519323468208, -0.007953383028507233, -0.004853244870901108, -0.001753106713294983, 0.0013470309786498547, 0.004447168670594692, 0.0075473058968782425, 0.010647444054484367, 0.013747582212090492, 0.016847718507051468, 0.019947856664657593, 0.023047994822263718, 0.026148132979869843, 0.029248271137475967, 0.03234840929508209, 0.03544854372739792, 0.03854868561029434, 0.04164882004261017, 0.04474895820021629, 0.04784909635782242, 0.05094923451542854, 0.05404937267303467, 0.057149507105350494, 0.06024964898824692, 0.06334978342056274, 0.06644992530345917, 0.069550059735775, 0.07265019416809082, 0.07575032860040665, 0.07885047048330307, 0.0819506049156189, 0.08505074679851532, 0.08815088123083115, 0.09125101566314697, 0.0943511575460434, 0.09745129942893982]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 5.0, 11.0, 10.0, 10.0, 7.0, 21.0, 21.0, 21.0, 23.0, 24.0, 36.0, 34.0, 44.0, 47.0, 50.0, 47.0, 46.0, 41.0, 58.0, 48.0, 45.0, 33.0, 54.0, 37.0, 42.0, 30.0, 21.0, 17.0, 14.0, 17.0, 18.0, 12.0, 13.0, 7.0, 2.0, 7.0, 1.0, 2.0, 6.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08758425712585449, -0.084969162940979, -0.08235406875610352, -0.07973897457122803, -0.07712388038635254, -0.07450878620147705, -0.07189369201660156, -0.06927859783172607, -0.06666350364685059, -0.0640484094619751, -0.06143331527709961, -0.05881822109222412, -0.05620312690734863, -0.053588032722473145, -0.050972938537597656, -0.04835784435272217, -0.04574275016784668, -0.04312765598297119, -0.0405125617980957, -0.037897467613220215, -0.03528237342834473, -0.03266727924346924, -0.03005218505859375, -0.02743709087371826, -0.024821996688842773, -0.022206902503967285, -0.019591808319091797, -0.01697671413421631, -0.01436161994934082, -0.011746525764465332, -0.009131431579589844, -0.0065163373947143555, -0.003901243209838867, -0.001286149024963379, 0.0013289451599121094, 0.003944039344787598, 0.006559133529663086, 0.009174227714538574, 0.011789321899414062, 0.01440441608428955, 0.01701951026916504, 0.019634604454040527, 0.022249698638916016, 0.024864792823791504, 0.027479887008666992, 0.03009498119354248, 0.03271007537841797, 0.03532516956329346, 0.037940263748168945, 0.040555357933044434, 0.04317045211791992, 0.04578554630279541, 0.0484006404876709, 0.05101573467254639, 0.053630828857421875, 0.05624592304229736, 0.05886101722717285, 0.06147611141204834, 0.06409120559692383, 0.06670629978179932, 0.0693213939666748, 0.07193648815155029, 0.07455158233642578, 0.07716667652130127, 0.07978177070617676]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 3.0, 7.0, 6.0, 11.0, 11.0, 8.0, 14.0, 15.0, 18.0, 19.0, 27.0, 44.0, 63.0, 79.0, 137.0, 169.0, 383.0, 1254.0, 15528.0, 4172339.0, 2448.0, 680.0, 306.0, 180.0, 124.0, 77.0, 67.0, 37.0, 33.0, 37.0, 18.0, 29.0, 18.0, 14.0, 15.0, 12.0, 11.0, 3.0, 10.0, 6.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0797119140625, -0.07698822021484375, -0.0742645263671875, -0.07154083251953125, -0.068817138671875, -0.06609344482421875, -0.0633697509765625, -0.06064605712890625, -0.05792236328125, -0.05519866943359375, -0.0524749755859375, -0.04975128173828125, -0.047027587890625, -0.04430389404296875, -0.0415802001953125, -0.03885650634765625, -0.0361328125, -0.03340911865234375, -0.0306854248046875, -0.02796173095703125, -0.025238037109375, -0.02251434326171875, -0.0197906494140625, -0.01706695556640625, -0.01434326171875, -0.01161956787109375, -0.0088958740234375, -0.00617218017578125, -0.003448486328125, -0.00072479248046875, 0.0019989013671875, 0.00472259521484375, 0.0074462890625, 0.01016998291015625, 0.0128936767578125, 0.01561737060546875, 0.018341064453125, 0.02106475830078125, 0.0237884521484375, 0.02651214599609375, 0.02923583984375, 0.03195953369140625, 0.0346832275390625, 0.03740692138671875, 0.040130615234375, 0.04285430908203125, 0.0455780029296875, 0.04830169677734375, 0.051025390625, 0.05374908447265625, 0.0564727783203125, 0.05919647216796875, 0.061920166015625, 0.06464385986328125, 0.0673675537109375, 0.07009124755859375, 0.07281494140625, 0.07553863525390625, 0.0782623291015625, 0.08098602294921875, 0.083709716796875, 0.08643341064453125, 0.0891571044921875, 0.09188079833984375, 0.0946044921875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 9.0, 15.0, 9.0, 9.0, 13.0, 45.0, 120.0, 257.0, 233.0, 122.0, 43.0, 11.0, 11.0, 11.0, 10.0, 9.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162809371948242, -0.006909847259521484, -0.0066568851470947266, -0.006403923034667969, -0.006150960922241211, -0.005897998809814453, -0.005645036697387695, -0.0053920745849609375, -0.00513911247253418, -0.004886150360107422, -0.004633188247680664, -0.004380226135253906, -0.0041272640228271484, -0.0038743019104003906, -0.003621339797973633, -0.003368377685546875, -0.003115415573120117, -0.0028624534606933594, -0.0026094913482666016, -0.0023565292358398438, -0.002103567123413086, -0.0018506050109863281, -0.0015976428985595703, -0.0013446807861328125, -0.0010917186737060547, -0.0008387565612792969, -0.0005857944488525391, -0.00033283233642578125, -7.987022399902344e-05, 0.00017309188842773438, 0.0004260540008544922, 0.00067901611328125, 0.0009319782257080078, 0.0011849403381347656, 0.0014379024505615234, 0.0016908645629882812, 0.001943826675415039, 0.002196788787841797, 0.0024497509002685547, 0.0027027130126953125, 0.0029556751251220703, 0.003208637237548828, 0.003461599349975586, 0.0037145614624023438, 0.0039675235748291016, 0.004220485687255859, 0.004473447799682617, 0.004726409912109375, 0.004979372024536133, 0.005232334136962891, 0.0054852962493896484, 0.005738258361816406, 0.005991220474243164, 0.006244182586669922, 0.00649714469909668, 0.0067501068115234375, 0.007003068923950195, 0.007256031036376953, 0.007508993148803711, 0.007761955261230469, 0.008014917373657227, 0.008267879486083984, 0.008520841598510742, 0.0087738037109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 8.0, 4.0, 4.0, 11.0, 13.0, 17.0, 25.0, 22.0, 29.0, 51.0, 51.0, 58.0, 116.0, 362.0, 2306.0, 30882.0, 4146628.0, 11877.0, 1163.0, 215.0, 121.0, 62.0, 62.0, 38.0, 24.0, 13.0, 23.0, 17.0, 12.0, 6.0, 5.0, 11.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0251617431640625, -0.024384021759033203, -0.023606300354003906, -0.02282857894897461, -0.022050857543945312, -0.021273136138916016, -0.02049541473388672, -0.019717693328857422, -0.018939971923828125, -0.018162250518798828, -0.01738452911376953, -0.016606807708740234, -0.015829086303710938, -0.01505136489868164, -0.014273643493652344, -0.013495922088623047, -0.01271820068359375, -0.011940479278564453, -0.011162757873535156, -0.01038503646850586, -0.009607315063476562, -0.008829593658447266, -0.008051872253417969, -0.007274150848388672, -0.006496429443359375, -0.005718708038330078, -0.004940986633300781, -0.004163265228271484, -0.0033855438232421875, -0.0026078224182128906, -0.0018301010131835938, -0.0010523796081542969, -0.000274658203125, 0.0005030632019042969, 0.0012807846069335938, 0.0020585060119628906, 0.0028362274169921875, 0.0036139488220214844, 0.004391670227050781, 0.005169391632080078, 0.005947113037109375, 0.006724834442138672, 0.007502555847167969, 0.008280277252197266, 0.009057998657226562, 0.00983572006225586, 0.010613441467285156, 0.011391162872314453, 0.01216888427734375, 0.012946605682373047, 0.013724327087402344, 0.01450204849243164, 0.015279769897460938, 0.016057491302490234, 0.01683521270751953, 0.017612934112548828, 0.018390655517578125, 0.019168376922607422, 0.01994609832763672, 0.020723819732666016, 0.021501541137695312, 0.02227926254272461, 0.023056983947753906, 0.023834705352783203, 0.0246124267578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 12.0, 12.0, 13.0, 14.0, 26.0, 55.0, 145.0, 600.0, 2208.0, 639.0, 189.0, 56.0, 12.0, 15.0, 7.0, 9.0, 7.0, 2.0, 2.0, 8.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01253509521484375, -0.012137889862060547, -0.011740684509277344, -0.01134347915649414, -0.010946273803710938, -0.010549068450927734, -0.010151863098144531, -0.009754657745361328, -0.009357452392578125, -0.008960247039794922, -0.008563041687011719, -0.008165836334228516, -0.0077686309814453125, -0.007371425628662109, -0.006974220275878906, -0.006577014923095703, -0.0061798095703125, -0.005782604217529297, -0.005385398864746094, -0.004988193511962891, -0.0045909881591796875, -0.004193782806396484, -0.0037965774536132812, -0.003399372100830078, -0.003002166748046875, -0.002604961395263672, -0.0022077560424804688, -0.0018105506896972656, -0.0014133453369140625, -0.0010161399841308594, -0.0006189346313476562, -0.00022172927856445312, 0.00017547607421875, 0.0005726814270019531, 0.0009698867797851562, 0.0013670921325683594, 0.0017642974853515625, 0.0021615028381347656, 0.0025587081909179688, 0.002955913543701172, 0.003353118896484375, 0.003750324249267578, 0.004147529602050781, 0.004544734954833984, 0.0049419403076171875, 0.005339145660400391, 0.005736351013183594, 0.006133556365966797, 0.00653076171875, 0.006927967071533203, 0.007325172424316406, 0.007722377777099609, 0.008119583129882812, 0.008516788482666016, 0.008913993835449219, 0.009311199188232422, 0.009708404541015625, 0.010105609893798828, 0.010502815246582031, 0.010900020599365234, 0.011297225952148438, 0.01169443130493164, 0.012091636657714844, 0.012488842010498047, 0.01288604736328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 10.0, 22.0, 104.0, 586.0, 211.0, 41.0, 17.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014731462113559246, -0.013573849573731422, -0.012416237965226173, -0.01125862542539835, -0.010101012885570526, -0.008943401277065277, -0.0077857887372374535, -0.0066281771287322044, -0.005470564588904381, -0.0043129525147378445, -0.0031553402077406645, -0.0019977279007434845, -0.0008401158265769482, 0.00031749624758958817, 0.0014751087874174118, 0.002632720395922661, 0.0037903329357504845, 0.004947945009917021, 0.006105557084083557, 0.007263169623911381, 0.008420782163739204, 0.009578393772244453, 0.010736006312072277, 0.011893617920577526, 0.01305123046040535, 0.014208843000233173, 0.015366454608738422, 0.016524067148566246, 0.017681678757071495, 0.018839292228221893, 0.019996903836727142, 0.02115451544523239, 0.02231213077902794, 0.023469742387533188, 0.024627355858683586, 0.025784967467188835, 0.026942579075694084, 0.028100192546844482, 0.02925780415534973, 0.03041541576385498, 0.03157302737236023, 0.03273063898086548, 0.03388825058937073, 0.03504586219787598, 0.036203477531671524, 0.03736108914017677, 0.03851870074868202, 0.03967631235718727, 0.04083392769098282, 0.04199153929948807, 0.04314915090799332, 0.044306762516498566, 0.04546437785029411, 0.04662198945879936, 0.04777960106730461, 0.04893721267580986, 0.05009482428431511, 0.05125243589282036, 0.05241004750132561, 0.053567662835121155, 0.054725274443626404, 0.05588288605213165, 0.0570404976606369, 0.05819810926914215, 0.0593557208776474]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 3.0, 3.0, 5.0, 7.0, 9.0, 12.0, 20.0, 17.0, 28.0, 24.0, 16.0, 28.0, 28.0, 58.0, 43.0, 50.0, 42.0, 28.0, 45.0, 47.0, 55.0, 53.0, 45.0, 40.0, 53.0, 34.0, 26.0, 26.0, 24.0, 30.0, 18.0, 19.0, 15.0, 14.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.03885149955749512, -0.0377403162419796, -0.03662913292646408, -0.03551795333623886, -0.03440677002072334, -0.033295586705207825, -0.032184407114982605, -0.031073223799467087, -0.02996204048395157, -0.02885085716843605, -0.02773967571556568, -0.026628494262695312, -0.025517310947179794, -0.024406127631664276, -0.023294946178793907, -0.022183764725923538, -0.02107258141040802, -0.019961398094892502, -0.018850216642022133, -0.017739035189151764, -0.016627851873636246, -0.015516669489443302, -0.014405487105250359, -0.013294304721057415, -0.012183122336864471, -0.011071939952671528, -0.009960757568478584, -0.00884957518428564, -0.007738392800092697, -0.006627210415899754, -0.00551602803170681, -0.004404845647513866, -0.003293663263320923, -0.0021824808791279793, -0.0010712984949350357, 3.988388925790787e-05, 0.0011510662734508514, 0.002262248657643795, 0.0033734310418367386, 0.004484613426029682, 0.005595795810222626, 0.006706978194415569, 0.007818160578608513, 0.008929342962801456, 0.0100405253469944, 0.011151707731187344, 0.012262890115380287, 0.01337407249957323, 0.014485254883766174, 0.015596437267959118, 0.01670761965215206, 0.01781880110502243, 0.01892998442053795, 0.020041167736053467, 0.021152349188923836, 0.022263530641794205, 0.023374713957309723, 0.02448589727282524, 0.02559707872569561, 0.02670826017856598, 0.027819443494081497, 0.028930626809597015, 0.030041808262467384, 0.031152989715337753, 0.03226417303085327]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 1.0, 8.0, 9.0, 10.0, 3.0, 20.0, 24.0, 26.0, 43.0, 51.0, 64.0, 99.0, 121.0, 203.0, 241.0, 333.0, 447.0, 691.0, 985.0, 1526.0, 2742.0, 5228.0, 14781.0, 174752.0, 813876.0, 18174.0, 5891.0, 2858.0, 1596.0, 1046.0, 756.0, 517.0, 401.0, 238.0, 214.0, 160.0, 103.0, 81.0, 66.0, 46.0, 28.0, 22.0, 27.0, 15.0, 13.0, 6.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.041656494140625, -0.04043436050415039, -0.03921222686767578, -0.03799009323120117, -0.03676795959472656, -0.03554582595825195, -0.034323692321777344, -0.033101558685302734, -0.031879425048828125, -0.030657291412353516, -0.029435157775878906, -0.028213024139404297, -0.026990890502929688, -0.025768756866455078, -0.02454662322998047, -0.02332448959350586, -0.02210235595703125, -0.02088022232055664, -0.01965808868408203, -0.018435955047607422, -0.017213821411132812, -0.015991687774658203, -0.014769554138183594, -0.013547420501708984, -0.012325286865234375, -0.011103153228759766, -0.009881019592285156, -0.008658885955810547, -0.0074367523193359375, -0.006214618682861328, -0.004992485046386719, -0.0037703514099121094, -0.0025482177734375, -0.0013260841369628906, -0.00010395050048828125, 0.0011181831359863281, 0.0023403167724609375, 0.003562450408935547, 0.004784584045410156, 0.006006717681884766, 0.007228851318359375, 0.008450984954833984, 0.009673118591308594, 0.010895252227783203, 0.012117385864257812, 0.013339519500732422, 0.014561653137207031, 0.01578378677368164, 0.01700592041015625, 0.01822805404663086, 0.01945018768310547, 0.020672321319580078, 0.021894454956054688, 0.023116588592529297, 0.024338722229003906, 0.025560855865478516, 0.026782989501953125, 0.028005123138427734, 0.029227256774902344, 0.030449390411376953, 0.03167152404785156, 0.03289365768432617, 0.03411579132080078, 0.03533792495727539, 0.03656005859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 16.0, 10.0, 8.0, 15.0, 43.0, 121.0, 252.0, 239.0, 122.0, 42.0, 11.0, 11.0, 12.0, 9.0, 9.0, 7.0, 3.0, 5.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007162928581237793, -0.006910085678100586, -0.006657242774963379, -0.006404399871826172, -0.006151556968688965, -0.005898714065551758, -0.005645871162414551, -0.005393028259277344, -0.005140185356140137, -0.00488734245300293, -0.004634499549865723, -0.004381656646728516, -0.004128813743591309, -0.0038759708404541016, -0.0036231279373168945, -0.0033702850341796875, -0.0031174421310424805, -0.0028645992279052734, -0.0026117563247680664, -0.0023589134216308594, -0.0021060705184936523, -0.0018532276153564453, -0.0016003847122192383, -0.0013475418090820312, -0.0010946989059448242, -0.0008418560028076172, -0.0005890130996704102, -0.0003361701965332031, -8.33272933959961e-05, 0.00016951560974121094, 0.00042235851287841797, 0.000675201416015625, 0.000928044319152832, 0.001180887222290039, 0.001433730125427246, 0.0016865730285644531, 0.0019394159317016602, 0.002192258834838867, 0.0024451017379760742, 0.0026979446411132812, 0.0029507875442504883, 0.0032036304473876953, 0.0034564733505249023, 0.0037093162536621094, 0.003962159156799316, 0.0042150020599365234, 0.0044678449630737305, 0.0047206878662109375, 0.0049735307693481445, 0.0052263736724853516, 0.005479216575622559, 0.005732059478759766, 0.005984902381896973, 0.00623774528503418, 0.006490588188171387, 0.006743431091308594, 0.006996273994445801, 0.007249116897583008, 0.007501959800720215, 0.007754802703857422, 0.008007645606994629, 0.008260488510131836, 0.008513331413269043, 0.00876617431640625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 6.0, 5.0, 13.0, 13.0, 16.0, 16.0, 24.0, 31.0, 46.0, 66.0, 85.0, 109.0, 143.0, 221.0, 352.0, 649.0, 1672.0, 41944.0, 997069.0, 3825.0, 886.0, 467.0, 255.0, 163.0, 130.0, 76.0, 60.0, 43.0, 52.0, 34.0, 29.0, 14.0, 11.0, 6.0, 9.0, 6.0, 1.0, 3.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039031982421875, -0.03769636154174805, -0.036360740661621094, -0.03502511978149414, -0.03368949890136719, -0.032353878021240234, -0.03101825714111328, -0.029682636260986328, -0.028347015380859375, -0.027011394500732422, -0.02567577362060547, -0.024340152740478516, -0.023004531860351562, -0.02166891098022461, -0.020333290100097656, -0.018997669219970703, -0.01766204833984375, -0.016326427459716797, -0.014990806579589844, -0.01365518569946289, -0.012319564819335938, -0.010983943939208984, -0.009648323059082031, -0.008312702178955078, -0.006977081298828125, -0.005641460418701172, -0.004305839538574219, -0.0029702186584472656, -0.0016345977783203125, -0.0002989768981933594, 0.0010366439819335938, 0.002372264862060547, 0.0037078857421875, 0.005043506622314453, 0.006379127502441406, 0.007714748382568359, 0.009050369262695312, 0.010385990142822266, 0.011721611022949219, 0.013057231903076172, 0.014392852783203125, 0.015728473663330078, 0.01706409454345703, 0.018399715423583984, 0.019735336303710938, 0.02107095718383789, 0.022406578063964844, 0.023742198944091797, 0.02507781982421875, 0.026413440704345703, 0.027749061584472656, 0.02908468246459961, 0.030420303344726562, 0.031755924224853516, 0.03309154510498047, 0.03442716598510742, 0.035762786865234375, 0.03709840774536133, 0.03843402862548828, 0.039769649505615234, 0.04110527038574219, 0.04244089126586914, 0.043776512145996094, 0.04511213302612305, 0.04644775390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 5.0, 11.0, 10.0, 9.0, 14.0, 16.0, 20.0, 25.0, 32.0, 35.0, 43.0, 45.0, 52.0, 45.0, 39.0, 35.0, 53.0, 64.0, 46.0, 46.0, 47.0, 42.0, 37.0, 38.0, 30.0, 23.0, 25.0, 31.0, 21.0, 20.0, 8.0, 6.0, 5.0, 9.0, 4.0, 1.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0171051025390625, -0.016519784927368164, -0.015934467315673828, -0.015349149703979492, -0.014763832092285156, -0.01417851448059082, -0.013593196868896484, -0.013007879257202148, -0.012422561645507812, -0.011837244033813477, -0.01125192642211914, -0.010666608810424805, -0.010081291198730469, -0.009495973587036133, -0.008910655975341797, -0.008325338363647461, -0.007740020751953125, -0.007154703140258789, -0.006569385528564453, -0.005984067916870117, -0.005398750305175781, -0.004813432693481445, -0.004228115081787109, -0.0036427974700927734, -0.0030574798583984375, -0.0024721622467041016, -0.0018868446350097656, -0.0013015270233154297, -0.0007162094116210938, -0.0001308917999267578, 0.0004544258117675781, 0.001039743423461914, 0.00162506103515625, 0.002210378646850586, 0.002795696258544922, 0.003381013870239258, 0.003966331481933594, 0.00455164909362793, 0.005136966705322266, 0.0057222843170166016, 0.0063076019287109375, 0.0068929195404052734, 0.007478237152099609, 0.008063554763793945, 0.008648872375488281, 0.009234189987182617, 0.009819507598876953, 0.010404825210571289, 0.010990142822265625, 0.011575460433959961, 0.012160778045654297, 0.012746095657348633, 0.013331413269042969, 0.013916730880737305, 0.01450204849243164, 0.015087366104125977, 0.015672683715820312, 0.01625800132751465, 0.016843318939208984, 0.01742863655090332, 0.018013954162597656, 0.018599271774291992, 0.019184589385986328, 0.019769906997680664, 0.020355224609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 4.0, 6.0, 9.0, 9.0, 9.0, 11.0, 7.0, 16.0, 22.0, 29.0, 31.0, 37.0, 55.0, 58.0, 103.0, 141.0, 314.0, 455.0, 1007.0, 3273.0, 16442.0, 970193.0, 48851.0, 4466.0, 1402.0, 596.0, 362.0, 162.0, 120.0, 78.0, 66.0, 44.0, 36.0, 25.0, 21.0, 24.0, 12.0, 3.0, 12.0, 10.0, 7.0, 1.0, 7.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8656253814697266e-05, -1.798197627067566e-05, -1.7307698726654053e-05, -1.6633421182632446e-05, -1.595914363861084e-05, -1.5284866094589233e-05, -1.4610588550567627e-05, -1.393631100654602e-05, -1.3262033462524414e-05, -1.2587755918502808e-05, -1.1913478374481201e-05, -1.1239200830459595e-05, -1.0564923286437988e-05, -9.890645742416382e-06, -9.216368198394775e-06, -8.542090654373169e-06, -7.867813110351562e-06, -7.193535566329956e-06, -6.51925802230835e-06, -5.844980478286743e-06, -5.170702934265137e-06, -4.49642539024353e-06, -3.822147846221924e-06, -3.1478703022003174e-06, -2.473592758178711e-06, -1.7993152141571045e-06, -1.125037670135498e-06, -4.507601261138916e-07, 2.2351741790771484e-07, 8.977949619293213e-07, 1.5720725059509277e-06, 2.246350049972534e-06, 2.9206275939941406e-06, 3.594905138015747e-06, 4.2691826820373535e-06, 4.94346022605896e-06, 5.617737770080566e-06, 6.292015314102173e-06, 6.966292858123779e-06, 7.640570402145386e-06, 8.314847946166992e-06, 8.989125490188599e-06, 9.663403034210205e-06, 1.0337680578231812e-05, 1.1011958122253418e-05, 1.1686235666275024e-05, 1.2360513210296631e-05, 1.3034790754318237e-05, 1.3709068298339844e-05, 1.438334584236145e-05, 1.5057623386383057e-05, 1.5731900930404663e-05, 1.640617847442627e-05, 1.7080456018447876e-05, 1.7754733562469482e-05, 1.842901110649109e-05, 1.9103288650512695e-05, 1.9777566194534302e-05, 2.0451843738555908e-05, 2.1126121282577515e-05, 2.180039882659912e-05, 2.2474676370620728e-05, 2.3148953914642334e-05, 2.382323145866394e-05, 2.4497509002685547e-05]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 10.0, 5.0, 16.0, 14.0, 18.0, 21.0, 20.0, 38.0, 25.0, 53.0, 96.0, 96.0, 140.0, 91.0, 79.0, 45.0, 33.0, 32.0, 18.0, 25.0, 20.0, 18.0, 11.0, 5.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.927417755126953e-06, -7.636845111846924e-06, -7.3462724685668945e-06, -7.055699825286865e-06, -6.765127182006836e-06, -6.474554538726807e-06, -6.183981895446777e-06, -5.893409252166748e-06, -5.602836608886719e-06, -5.3122639656066895e-06, -5.02169132232666e-06, -4.731118679046631e-06, -4.4405460357666016e-06, -4.149973392486572e-06, -3.859400749206543e-06, -3.5688281059265137e-06, -3.2782554626464844e-06, -2.987682819366455e-06, -2.6971101760864258e-06, -2.4065375328063965e-06, -2.115964889526367e-06, -1.8253922462463379e-06, -1.5348196029663086e-06, -1.2442469596862793e-06, -9.5367431640625e-07, -6.631016731262207e-07, -3.725290298461914e-07, -8.195638656616211e-08, 2.086162567138672e-07, 4.991888999938965e-07, 7.897615432739258e-07, 1.080334186553955e-06, 1.3709068298339844e-06, 1.6614794731140137e-06, 1.952052116394043e-06, 2.2426247596740723e-06, 2.5331974029541016e-06, 2.823770046234131e-06, 3.11434268951416e-06, 3.4049153327941895e-06, 3.6954879760742188e-06, 3.986060619354248e-06, 4.276633262634277e-06, 4.567205905914307e-06, 4.857778549194336e-06, 5.148351192474365e-06, 5.4389238357543945e-06, 5.729496479034424e-06, 6.020069122314453e-06, 6.310641765594482e-06, 6.601214408874512e-06, 6.891787052154541e-06, 7.18235969543457e-06, 7.4729323387146e-06, 7.763504981994629e-06, 8.054077625274658e-06, 8.344650268554688e-06, 8.635222911834717e-06, 8.925795555114746e-06, 9.216368198394775e-06, 9.506940841674805e-06, 9.797513484954834e-06, 1.0088086128234863e-05, 1.0378658771514893e-05, 1.0669231414794922e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 2.0, 3.0, 7.0, 8.0, 13.0, 17.0, 21.0, 22.0, 43.0, 58.0, 97.0, 160.0, 406.0, 2040.0, 1034552.0, 9792.0, 715.0, 223.0, 128.0, 65.0, 56.0, 30.0, 23.0, 16.0, 6.0, 10.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-8.761882781982422e-05, -8.52951779961586e-05, -8.297152817249298e-05, -8.064787834882736e-05, -7.832422852516174e-05, -7.600057870149612e-05, -7.36769288778305e-05, -7.135327905416489e-05, -6.902962923049927e-05, -6.670597940683365e-05, -6.438232958316803e-05, -6.205867975950241e-05, -5.973502993583679e-05, -5.741138011217117e-05, -5.5087730288505554e-05, -5.2764080464839935e-05, -5.0440430641174316e-05, -4.81167808175087e-05, -4.579313099384308e-05, -4.346948117017746e-05, -4.114583134651184e-05, -3.882218152284622e-05, -3.64985316991806e-05, -3.4174881875514984e-05, -3.1851232051849365e-05, -2.9527582228183746e-05, -2.7203932404518127e-05, -2.488028258085251e-05, -2.255663275718689e-05, -2.023298293352127e-05, -1.7909333109855652e-05, -1.5585683286190033e-05, -1.3262033462524414e-05, -1.0938383638858795e-05, -8.614733815193176e-06, -6.291083991527557e-06, -3.9674341678619385e-06, -1.6437843441963196e-06, 6.798654794692993e-07, 3.0035153031349182e-06, 5.327165126800537e-06, 7.650814950466156e-06, 9.974464774131775e-06, 1.2298114597797394e-05, 1.4621764421463013e-05, 1.694541424512863e-05, 1.926906406879425e-05, 2.159271389245987e-05, 2.3916363716125488e-05, 2.6240013539791107e-05, 2.8563663363456726e-05, 3.0887313187122345e-05, 3.3210963010787964e-05, 3.553461283445358e-05, 3.78582626581192e-05, 4.018191248178482e-05, 4.250556230545044e-05, 4.482921212911606e-05, 4.715286195278168e-05, 4.9476511776447296e-05, 5.1800161600112915e-05, 5.4123811423778534e-05, 5.644746124744415e-05, 5.877111107110977e-05, 6.109476089477539e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 7.0, 2.0, 5.0, 8.0, 8.0, 8.0, 21.0, 16.0, 23.0, 22.0, 44.0, 120.0, 346.0, 120.0, 81.0, 40.0, 35.0, 22.0, 14.0, 17.0, 8.0, 7.0, 4.0, 4.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.844499588012695e-05, -3.745127469301224e-05, -3.645755350589752e-05, -3.5463832318782806e-05, -3.447011113166809e-05, -3.3476389944553375e-05, -3.248266875743866e-05, -3.1488947570323944e-05, -3.049522638320923e-05, -2.9501505196094513e-05, -2.8507784008979797e-05, -2.7514062821865082e-05, -2.6520341634750366e-05, -2.552662044763565e-05, -2.4532899260520935e-05, -2.353917807340622e-05, -2.2545456886291504e-05, -2.155173569917679e-05, -2.0558014512062073e-05, -1.9564293324947357e-05, -1.857057213783264e-05, -1.7576850950717926e-05, -1.658312976360321e-05, -1.5589408576488495e-05, -1.459568738937378e-05, -1.3601966202259064e-05, -1.2608245015144348e-05, -1.1614523828029633e-05, -1.0620802640914917e-05, -9.627081453800201e-06, -8.633360266685486e-06, -7.63963907957077e-06, -6.645917892456055e-06, -5.652196705341339e-06, -4.6584755182266235e-06, -3.664754331111908e-06, -2.6710331439971924e-06, -1.6773119568824768e-06, -6.835907697677612e-07, 3.1013041734695435e-07, 1.30385160446167e-06, 2.2975727915763855e-06, 3.291293978691101e-06, 4.285015165805817e-06, 5.278736352920532e-06, 6.272457540035248e-06, 7.266178727149963e-06, 8.259899914264679e-06, 9.253621101379395e-06, 1.024734228849411e-05, 1.1241063475608826e-05, 1.2234784662723541e-05, 1.3228505849838257e-05, 1.4222227036952972e-05, 1.5215948224067688e-05, 1.6209669411182404e-05, 1.720339059829712e-05, 1.8197111785411835e-05, 1.919083297252655e-05, 2.0184554159641266e-05, 2.117827534675598e-05, 2.2171996533870697e-05, 2.3165717720985413e-05, 2.4159438908100128e-05, 2.5153160095214844e-05]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 30.0, 921.0, 62.0], "bins": [-0.558448314666748, -0.5495374798774719, -0.5406267046928406, -0.5317158699035645, -0.5228050947189331, -0.513894259929657, -0.5049834847450256, -0.4960726499557495, -0.4871618449687958, -0.47825103998184204, -0.4693402349948883, -0.46042943000793457, -0.45151859521865845, -0.4426077902317047, -0.433696985244751, -0.42478618025779724, -0.4158753752708435, -0.40696457028388977, -0.39805376529693604, -0.3891429603099823, -0.38023215532302856, -0.37132132053375244, -0.3624105155467987, -0.35349971055984497, -0.34458890557289124, -0.3356781005859375, -0.32676729559898376, -0.31785649061203003, -0.3089456558227539, -0.30003485083580017, -0.29112404584884644, -0.2822132408618927, -0.2733024060726166, -0.26439160108566284, -0.2554807960987091, -0.24656997621059418, -0.23765917122364044, -0.2287483662366867, -0.21983754634857178, -0.21092674136161804, -0.2020159512758255, -0.19310514628887177, -0.18419432640075684, -0.1752835214138031, -0.16637271642684937, -0.15746191143989563, -0.1485511064529419, -0.13964028656482697, -0.13072948157787323, -0.1218186765909195, -0.11290786415338516, -0.10399705171585083, -0.0950862467288971, -0.08617544174194336, -0.07726462930440903, -0.0683538168668747, -0.05944300442934036, -0.05053219571709633, -0.041621387004852295, -0.03271057829260826, -0.023799769580364227, -0.014888960868120193, -0.00597815215587616, 0.002932656556367874, 0.011843464337289333]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 7.0, 5.0, 12.0, 10.0, 11.0, 17.0, 17.0, 22.0, 23.0, 22.0, 44.0, 32.0, 36.0, 38.0, 39.0, 66.0, 53.0, 65.0, 54.0, 59.0, 51.0, 41.0, 51.0, 32.0, 33.0, 31.0, 21.0, 17.0, 16.0, 13.0, 17.0, 11.0, 3.0, 10.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08399641513824463, -0.08156851679086685, -0.07914061099290848, -0.0767127126455307, -0.07428480684757233, -0.07185690850019455, -0.06942901015281677, -0.0670011043548584, -0.06457320600748062, -0.062145303934812546, -0.05971740186214447, -0.05728950351476669, -0.05486160144209862, -0.05243369936943054, -0.050005801022052765, -0.04757789894938469, -0.045149996876716614, -0.04272209480404854, -0.04029419273138046, -0.037866294384002686, -0.03543839231133461, -0.033010490238666534, -0.030582590028643608, -0.028154689818620682, -0.025726787745952606, -0.02329888567328453, -0.020870985463261604, -0.018443085253238678, -0.016015183180570602, -0.013587282039225101, -0.0111593808978796, -0.008731480687856674, -0.006303578615188599, -0.0038756774738430977, -0.0014477763324975967, 0.0009801248088479042, 0.003408025950193405, 0.005835927091538906, 0.008263828232884407, 0.010691728442907333, 0.013119630515575409, 0.01554753165692091, 0.01797543279826641, 0.020403333008289337, 0.022831235080957413, 0.02525913715362549, 0.027687037363648415, 0.03011493757367134, 0.032542839646339417, 0.03497074171900749, 0.03739864379167557, 0.039826542139053345, 0.04225444421172142, 0.044682346284389496, 0.04711024463176727, 0.04953814670443535, 0.051966048777103424, 0.0543939508497715, 0.056821852922439575, 0.05924975126981735, 0.06167765334248543, 0.0641055554151535, 0.06653345376253128, 0.06896135210990906, 0.07138925790786743]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 5.0, 8.0, 7.0, 8.0, 5.0, 9.0, 15.0, 27.0, 24.0, 28.0, 44.0, 78.0, 274.0, 1536.0, 4191353.0, 497.0, 104.0, 44.0, 35.0, 34.0, 20.0, 19.0, 17.0, 14.0, 11.0, 5.0, 8.0, 8.0, 6.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.095703125, -2.024200439453125, -1.95269775390625, -1.881195068359375, -1.8096923828125, -1.738189697265625, -1.66668701171875, -1.595184326171875, -1.523681640625, -1.452178955078125, -1.38067626953125, -1.309173583984375, -1.2376708984375, -1.166168212890625, -1.09466552734375, -1.023162841796875, -0.95166015625, -0.880157470703125, -0.80865478515625, -0.737152099609375, -0.6656494140625, -0.594146728515625, -0.52264404296875, -0.451141357421875, -0.379638671875, -0.308135986328125, -0.23663330078125, -0.165130615234375, -0.0936279296875, -0.022125244140625, 0.04937744140625, 0.120880126953125, 0.1923828125, 0.263885498046875, 0.33538818359375, 0.406890869140625, 0.4783935546875, 0.549896240234375, 0.62139892578125, 0.692901611328125, 0.764404296875, 0.835906982421875, 0.90740966796875, 0.978912353515625, 1.0504150390625, 1.121917724609375, 1.19342041015625, 1.264923095703125, 1.33642578125, 1.407928466796875, 1.47943115234375, 1.550933837890625, 1.6224365234375, 1.693939208984375, 1.76544189453125, 1.836944580078125, 1.908447265625, 1.979949951171875, 2.05145263671875, 2.122955322265625, 2.1944580078125, 2.265960693359375, 2.33746337890625, 2.408966064453125, 2.48046875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 7.0, 12.0, 15.0, 5.0, 16.0, 39.0, 112.0, 216.0, 259.0, 145.0, 47.0, 14.0, 11.0, 13.0, 7.0, 10.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 3.0, 0.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007415771484375, -0.007163882255554199, -0.0069119930267333984, -0.006660103797912598, -0.006408214569091797, -0.006156325340270996, -0.005904436111450195, -0.0056525468826293945, -0.005400657653808594, -0.005148768424987793, -0.004896879196166992, -0.004644989967346191, -0.004393100738525391, -0.00414121150970459, -0.003889322280883789, -0.0036374330520629883, -0.0033855438232421875, -0.0031336545944213867, -0.002881765365600586, -0.002629876136779785, -0.0023779869079589844, -0.0021260976791381836, -0.0018742084503173828, -0.001622319221496582, -0.0013704299926757812, -0.0011185407638549805, -0.0008666515350341797, -0.0006147623062133789, -0.0003628730773925781, -0.00011098384857177734, 0.00014090538024902344, 0.0003927946090698242, 0.000644683837890625, 0.0008965730667114258, 0.0011484622955322266, 0.0014003515243530273, 0.0016522407531738281, 0.001904129981994629, 0.0021560192108154297, 0.0024079084396362305, 0.0026597976684570312, 0.002911686897277832, 0.003163576126098633, 0.0034154653549194336, 0.0036673545837402344, 0.003919243812561035, 0.004171133041381836, 0.004423022270202637, 0.0046749114990234375, 0.004926800727844238, 0.005178689956665039, 0.00543057918548584, 0.005682468414306641, 0.005934357643127441, 0.006186246871948242, 0.006438136100769043, 0.006690025329589844, 0.0069419145584106445, 0.007193803787231445, 0.007445693016052246, 0.007697582244873047, 0.007949471473693848, 0.008201360702514648, 0.00845324993133545, 0.00870513916015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 10.0, 11.0, 19.0, 18.0, 35.0, 49.0, 101.0, 145.0, 267.0, 603.0, 1485.0, 4477.0, 26272.0, 4135100.0, 19698.0, 3598.0, 1217.0, 497.0, 269.0, 132.0, 84.0, 51.0, 33.0, 29.0, 19.0, 13.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.04852294921875, -0.046929359436035156, -0.04533576965332031, -0.04374217987060547, -0.042148590087890625, -0.04055500030517578, -0.03896141052246094, -0.037367820739746094, -0.03577423095703125, -0.034180641174316406, -0.03258705139160156, -0.03099346160888672, -0.029399871826171875, -0.02780628204345703, -0.026212692260742188, -0.024619102478027344, -0.0230255126953125, -0.021431922912597656, -0.019838333129882812, -0.01824474334716797, -0.016651153564453125, -0.015057563781738281, -0.013463973999023438, -0.011870384216308594, -0.01027679443359375, -0.008683204650878906, -0.0070896148681640625, -0.005496025085449219, -0.003902435302734375, -0.0023088455200195312, -0.0007152557373046875, 0.0008783340454101562, 0.002471923828125, 0.004065513610839844, 0.0056591033935546875, 0.007252693176269531, 0.008846282958984375, 0.010439872741699219, 0.012033462524414062, 0.013627052307128906, 0.01522064208984375, 0.016814231872558594, 0.018407821655273438, 0.02000141143798828, 0.021595001220703125, 0.02318859100341797, 0.024782180786132812, 0.026375770568847656, 0.0279693603515625, 0.029562950134277344, 0.031156539916992188, 0.03275012969970703, 0.034343719482421875, 0.03593730926513672, 0.03753089904785156, 0.039124488830566406, 0.04071807861328125, 0.042311668395996094, 0.04390525817871094, 0.04549884796142578, 0.047092437744140625, 0.04868602752685547, 0.05027961730957031, 0.051873207092285156, 0.053466796875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 6.0, 6.0, 10.0, 5.0, 9.0, 10.0, 26.0, 60.0, 252.0, 3067.0, 407.0, 96.0, 35.0, 14.0, 9.0, 7.0, 7.0, 3.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.01409149169921875, -0.013717055320739746, -0.013342618942260742, -0.012968182563781738, -0.012593746185302734, -0.01221930980682373, -0.011844873428344727, -0.011470437049865723, -0.011096000671386719, -0.010721564292907715, -0.010347127914428711, -0.009972691535949707, -0.009598255157470703, -0.0092238187789917, -0.008849382400512695, -0.008474946022033691, -0.008100509643554688, -0.007726073265075684, -0.00735163688659668, -0.006977200508117676, -0.006602764129638672, -0.006228327751159668, -0.005853891372680664, -0.00547945499420166, -0.005105018615722656, -0.004730582237243652, -0.0043561458587646484, -0.0039817094802856445, -0.0036072731018066406, -0.0032328367233276367, -0.002858400344848633, -0.002483963966369629, -0.002109527587890625, -0.001735091209411621, -0.0013606548309326172, -0.0009862184524536133, -0.0006117820739746094, -0.00023734569549560547, 0.00013709068298339844, 0.0005115270614624023, 0.0008859634399414062, 0.0012603998184204102, 0.001634836196899414, 0.002009272575378418, 0.002383708953857422, 0.0027581453323364258, 0.0031325817108154297, 0.0035070180892944336, 0.0038814544677734375, 0.004255890846252441, 0.004630327224731445, 0.005004763603210449, 0.005379199981689453, 0.005753636360168457, 0.006128072738647461, 0.006502509117126465, 0.006876945495605469, 0.007251381874084473, 0.0076258182525634766, 0.00800025463104248, 0.008374691009521484, 0.008749127388000488, 0.009123563766479492, 0.009498000144958496, 0.0098724365234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 18.0, 111.0, 628.0, 153.0, 47.0, 22.0, 14.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055271510034799576, -0.048703815788030624, -0.04213612154126167, -0.03556842729449272, -0.02900073304772377, -0.02243303880095482, -0.015865344554185867, -0.009297650307416916, -0.0027299560606479645, 0.003837738186120987, 0.010405432432889938, 0.01697312667965889, 0.02354082092642784, 0.030108515173196793, 0.036676209419965744, 0.043243903666734695, 0.04981159791350365, 0.0563792921602726, 0.06294699013233185, 0.0695146769285202, 0.07608237862586975, 0.0826500654220581, 0.08921776711940765, 0.09578545391559601, 0.10235315561294556, 0.10892084985971451, 0.11548854410648346, 0.12205623835325241, 0.12862393260002136, 0.13519161939620972, 0.14175932109355927, 0.1483270227909088, 0.15489470958709717, 0.16146239638328552, 0.16803009808063507, 0.17459779977798462, 0.18116548657417297, 0.18773317337036133, 0.19430087506771088, 0.20086857676506042, 0.20743626356124878, 0.21400395035743713, 0.22057165205478668, 0.22713935375213623, 0.23370704054832458, 0.24027472734451294, 0.2468424290418625, 0.25341013073921204, 0.2599778175354004, 0.26654550433158875, 0.2731131911277771, 0.27968090772628784, 0.2862485945224762, 0.29281628131866455, 0.2993839979171753, 0.30595168471336365, 0.312519371509552, 0.31908705830574036, 0.3256547451019287, 0.33222246170043945, 0.3387901484966278, 0.34535783529281616, 0.3519255518913269, 0.35849323868751526, 0.3650609254837036]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 7.0, 8.0, 12.0, 11.0, 20.0, 16.0, 35.0, 35.0, 36.0, 40.0, 56.0, 52.0, 44.0, 49.0, 53.0, 51.0, 71.0, 60.0, 48.0, 46.0, 40.0, 47.0, 37.0, 22.0, 22.0, 15.0, 15.0, 11.0, 11.0, 6.0, 9.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035768866539001465, -0.0345376580953598, -0.03330644965171814, -0.03207524120807648, -0.030844032764434814, -0.029612824320793152, -0.02838161587715149, -0.027150407433509827, -0.025919198989868164, -0.0246879905462265, -0.02345678210258484, -0.022225573658943176, -0.020994365215301514, -0.01976315677165985, -0.01853194832801819, -0.017300739884376526, -0.016069531440734863, -0.0148383229970932, -0.013607114553451538, -0.012375906109809875, -0.011144697666168213, -0.00991348922252655, -0.008682280778884888, -0.007451072335243225, -0.0062198638916015625, -0.0049886554479599, -0.0037574470043182373, -0.0025262385606765747, -0.0012950301170349121, -6.382167339324951e-05, 0.001167386770248413, 0.0023985952138900757, 0.0036298036575317383, 0.004861012101173401, 0.0060922205448150635, 0.007323428988456726, 0.008554637432098389, 0.009785845875740051, 0.011017054319381714, 0.012248262763023376, 0.013479471206665039, 0.014710679650306702, 0.015941888093948364, 0.017173096537590027, 0.01840430498123169, 0.019635513424873352, 0.020866721868515015, 0.022097930312156677, 0.02332913875579834, 0.024560347199440002, 0.025791555643081665, 0.027022764086723328, 0.02825397253036499, 0.029485180974006653, 0.030716389417648315, 0.03194759786128998, 0.03317880630493164, 0.0344100147485733, 0.035641223192214966, 0.03687243163585663, 0.03810364007949829, 0.039334848523139954, 0.040566056966781616, 0.04179726541042328, 0.04302847385406494]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 7.0, 6.0, 11.0, 11.0, 20.0, 33.0, 38.0, 74.0, 128.0, 196.0, 376.0, 896.0, 2119.0, 6072.0, 26431.0, 954107.0, 44849.0, 8121.0, 2785.0, 1128.0, 536.0, 241.0, 138.0, 87.0, 43.0, 31.0, 12.0, 16.0, 11.0, 4.0, 3.0, 6.0, 1.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0655517578125, -0.0633382797241211, -0.06112480163574219, -0.05891132354736328, -0.056697845458984375, -0.05448436737060547, -0.05227088928222656, -0.050057411193847656, -0.04784393310546875, -0.045630455017089844, -0.04341697692871094, -0.04120349884033203, -0.038990020751953125, -0.03677654266357422, -0.03456306457519531, -0.032349586486816406, -0.0301361083984375, -0.027922630310058594, -0.025709152221679688, -0.02349567413330078, -0.021282196044921875, -0.01906871795654297, -0.016855239868164062, -0.014641761779785156, -0.01242828369140625, -0.010214805603027344, -0.008001327514648438, -0.005787849426269531, -0.003574371337890625, -0.0013608932495117188, 0.0008525848388671875, 0.0030660629272460938, 0.005279541015625, 0.007493019104003906, 0.009706497192382812, 0.011919975280761719, 0.014133453369140625, 0.01634693145751953, 0.018560409545898438, 0.020773887634277344, 0.02298736572265625, 0.025200843811035156, 0.027414321899414062, 0.02962779998779297, 0.031841278076171875, 0.03405475616455078, 0.03626823425292969, 0.038481712341308594, 0.0406951904296875, 0.042908668518066406, 0.04512214660644531, 0.04733562469482422, 0.049549102783203125, 0.05176258087158203, 0.05397605895996094, 0.056189537048339844, 0.05840301513671875, 0.060616493225097656, 0.06282997131347656, 0.06504344940185547, 0.06725692749023438, 0.06947040557861328, 0.07168388366699219, 0.0738973617553711, 0.07611083984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 2.0, 3.0, 10.0, 12.0, 12.0, 15.0, 14.0, 67.0, 136.0, 233.0, 216.0, 116.0, 46.0, 16.0, 11.0, 10.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007381439208984375, -0.007128655910491943, -0.006875872611999512, -0.00662308931350708, -0.0063703060150146484, -0.006117522716522217, -0.005864739418029785, -0.0056119561195373535, -0.005359172821044922, -0.00510638952255249, -0.004853606224060059, -0.004600822925567627, -0.004348039627075195, -0.004095256328582764, -0.003842473030090332, -0.0035896897315979004, -0.0033369064331054688, -0.003084123134613037, -0.0028313398361206055, -0.002578556537628174, -0.002325773239135742, -0.0020729899406433105, -0.001820206642150879, -0.0015674233436584473, -0.0013146400451660156, -0.001061856746673584, -0.0008090734481811523, -0.0005562901496887207, -0.00030350685119628906, -5.072355270385742e-05, 0.00020205974578857422, 0.00045484304428100586, 0.0007076263427734375, 0.0009604096412658691, 0.0012131929397583008, 0.0014659762382507324, 0.001718759536743164, 0.0019715428352355957, 0.0022243261337280273, 0.002477109432220459, 0.0027298927307128906, 0.0029826760292053223, 0.003235459327697754, 0.0034882426261901855, 0.003741025924682617, 0.003993809223175049, 0.0042465925216674805, 0.004499375820159912, 0.004752159118652344, 0.005004942417144775, 0.005257725715637207, 0.005510509014129639, 0.00576329231262207, 0.006016075611114502, 0.006268858909606934, 0.006521642208099365, 0.006774425506591797, 0.0070272088050842285, 0.00727999210357666, 0.007532775402069092, 0.0077855587005615234, 0.008038341999053955, 0.008291125297546387, 0.008543908596038818, 0.00879669189453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 5.0, 5.0, 8.0, 6.0, 13.0, 20.0, 23.0, 30.0, 34.0, 47.0, 51.0, 81.0, 130.0, 189.0, 275.0, 440.0, 776.0, 1612.0, 3682.0, 10355.0, 38986.0, 416877.0, 515853.0, 40892.0, 10645.0, 3739.0, 1571.0, 817.0, 473.0, 274.0, 199.0, 116.0, 86.0, 68.0, 43.0, 30.0, 21.0, 24.0, 17.0, 12.0, 9.0, 7.0, 9.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0298309326171875, -0.028927326202392578, -0.028023719787597656, -0.027120113372802734, -0.026216506958007812, -0.02531290054321289, -0.02440929412841797, -0.023505687713623047, -0.022602081298828125, -0.021698474884033203, -0.02079486846923828, -0.01989126205444336, -0.018987655639648438, -0.018084049224853516, -0.017180442810058594, -0.016276836395263672, -0.01537322998046875, -0.014469623565673828, -0.013566017150878906, -0.012662410736083984, -0.011758804321289062, -0.01085519790649414, -0.009951591491699219, -0.009047985076904297, -0.008144378662109375, -0.007240772247314453, -0.006337165832519531, -0.005433559417724609, -0.0045299530029296875, -0.0036263465881347656, -0.0027227401733398438, -0.0018191337585449219, -0.00091552734375, -1.1920928955078125e-05, 0.0008916854858398438, 0.0017952919006347656, 0.0026988983154296875, 0.0036025047302246094, 0.004506111145019531, 0.005409717559814453, 0.006313323974609375, 0.007216930389404297, 0.008120536804199219, 0.00902414321899414, 0.009927749633789062, 0.010831356048583984, 0.011734962463378906, 0.012638568878173828, 0.01354217529296875, 0.014445781707763672, 0.015349388122558594, 0.016252994537353516, 0.017156600952148438, 0.01806020736694336, 0.01896381378173828, 0.019867420196533203, 0.020771026611328125, 0.021674633026123047, 0.02257823944091797, 0.02348184585571289, 0.024385452270507812, 0.025289058685302734, 0.026192665100097656, 0.027096271514892578, 0.0279998779296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 9.0, 8.0, 9.0, 8.0, 7.0, 16.0, 20.0, 18.0, 29.0, 40.0, 34.0, 34.0, 35.0, 46.0, 53.0, 52.0, 45.0, 55.0, 46.0, 44.0, 53.0, 26.0, 44.0, 35.0, 46.0, 23.0, 21.0, 25.0, 14.0, 26.0, 15.0, 8.0, 8.0, 8.0, 7.0, 1.0, 3.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01538848876953125, -0.01487743854522705, -0.014366388320922852, -0.013855338096618652, -0.013344287872314453, -0.012833237648010254, -0.012322187423706055, -0.011811137199401855, -0.011300086975097656, -0.010789036750793457, -0.010277986526489258, -0.009766936302185059, -0.00925588607788086, -0.00874483585357666, -0.008233785629272461, -0.007722735404968262, -0.0072116851806640625, -0.006700634956359863, -0.006189584732055664, -0.005678534507751465, -0.005167484283447266, -0.004656434059143066, -0.004145383834838867, -0.003634333610534668, -0.0031232833862304688, -0.0026122331619262695, -0.0021011829376220703, -0.001590132713317871, -0.0010790824890136719, -0.0005680322647094727, -5.698204040527344e-05, 0.0004540681838989258, 0.000965118408203125, 0.0014761686325073242, 0.0019872188568115234, 0.0024982690811157227, 0.003009319305419922, 0.003520369529724121, 0.00403141975402832, 0.0045424699783325195, 0.005053520202636719, 0.005564570426940918, 0.006075620651245117, 0.006586670875549316, 0.007097721099853516, 0.007608771324157715, 0.008119821548461914, 0.008630871772766113, 0.009141921997070312, 0.009652972221374512, 0.010164022445678711, 0.01067507266998291, 0.01118612289428711, 0.011697173118591309, 0.012208223342895508, 0.012719273567199707, 0.013230323791503906, 0.013741374015808105, 0.014252424240112305, 0.014763474464416504, 0.015274524688720703, 0.015785574913024902, 0.0162966251373291, 0.0168076753616333, 0.0173187255859375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 8.0, 15.0, 23.0, 35.0, 57.0, 72.0, 106.0, 153.0, 278.0, 465.0, 831.0, 1750.0, 3743.0, 9810.0, 36135.0, 616434.0, 331763.0, 31021.0, 8824.0, 3425.0, 1628.0, 826.0, 391.0, 269.0, 151.0, 111.0, 61.0, 45.0, 28.0, 21.0, 16.0, 8.0, 7.0, 6.0, 7.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012264251708984375, -0.001188039779663086, -0.0011496543884277344, -0.0011112689971923828, -0.0010728836059570312, -0.0010344982147216797, -0.0009961128234863281, -0.0009577274322509766, -0.000919342041015625, -0.0008809566497802734, -0.0008425712585449219, -0.0008041858673095703, -0.0007658004760742188, -0.0007274150848388672, -0.0006890296936035156, -0.0006506443023681641, -0.0006122589111328125, -0.0005738735198974609, -0.0005354881286621094, -0.0004971027374267578, -0.00045871734619140625, -0.0004203319549560547, -0.0003819465637207031, -0.00034356117248535156, -0.00030517578125, -0.00026679039001464844, -0.00022840499877929688, -0.0001900196075439453, -0.00015163421630859375, -0.00011324882507324219, -7.486343383789062e-05, -3.647804260253906e-05, 1.9073486328125e-06, 4.029273986816406e-05, 7.867813110351562e-05, 0.00011706352233886719, 0.00015544891357421875, 0.0001938343048095703, 0.00023221969604492188, 0.00027060508728027344, 0.000308990478515625, 0.00034737586975097656, 0.0003857612609863281, 0.0004241466522216797, 0.00046253204345703125, 0.0005009174346923828, 0.0005393028259277344, 0.0005776882171630859, 0.0006160736083984375, 0.0006544589996337891, 0.0006928443908691406, 0.0007312297821044922, 0.0007696151733398438, 0.0008080005645751953, 0.0008463859558105469, 0.0008847713470458984, 0.00092315673828125, 0.0009615421295166016, 0.0009999275207519531, 0.0010383129119873047, 0.0010766983032226562, 0.0011150836944580078, 0.0011534690856933594, 0.001191854476928711, 0.0012302398681640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 1.0, 8.0, 5.0, 8.0, 6.0, 22.0, 123.0, 502.0, 232.0, 33.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.073713302612305e-05, -5.881674587726593e-05, -5.6896358728408813e-05, -5.49759715795517e-05, -5.305558443069458e-05, -5.113519728183746e-05, -4.921481013298035e-05, -4.729442298412323e-05, -4.537403583526611e-05, -4.3453648686408997e-05, -4.153326153755188e-05, -3.961287438869476e-05, -3.7692487239837646e-05, -3.577210009098053e-05, -3.385171294212341e-05, -3.1931325793266296e-05, -3.001093864440918e-05, -2.8090551495552063e-05, -2.6170164346694946e-05, -2.424977719783783e-05, -2.2329390048980713e-05, -2.0409002900123596e-05, -1.848861575126648e-05, -1.6568228602409363e-05, -1.4647841453552246e-05, -1.272745430469513e-05, -1.0807067155838013e-05, -8.886680006980896e-06, -6.966292858123779e-06, -5.045905709266663e-06, -3.125518560409546e-06, -1.2051314115524292e-06, 7.152557373046875e-07, 2.635642886161804e-06, 4.556030035018921e-06, 6.476417183876038e-06, 8.396804332733154e-06, 1.0317191481590271e-05, 1.2237578630447388e-05, 1.4157965779304504e-05, 1.607835292816162e-05, 1.7998740077018738e-05, 1.9919127225875854e-05, 2.183951437473297e-05, 2.3759901523590088e-05, 2.5680288672447205e-05, 2.760067582130432e-05, 2.9521062970161438e-05, 3.1441450119018555e-05, 3.336183726787567e-05, 3.528222441673279e-05, 3.7202611565589905e-05, 3.912299871444702e-05, 4.104338586330414e-05, 4.2963773012161255e-05, 4.488416016101837e-05, 4.680454730987549e-05, 4.8724934458732605e-05, 5.064532160758972e-05, 5.256570875644684e-05, 5.4486095905303955e-05, 5.640648305416107e-05, 5.832687020301819e-05, 6.0247257351875305e-05, 6.216764450073242e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 9.0, 11.0, 17.0, 11.0, 19.0, 17.0, 29.0, 39.0, 58.0, 94.0, 135.0, 180.0, 322.0, 584.0, 1201.0, 2511.0, 7219.0, 28643.0, 629008.0, 341937.0, 24906.0, 6571.0, 2396.0, 1133.0, 560.0, 307.0, 187.0, 135.0, 92.0, 52.0, 40.0, 30.0, 24.0, 14.0, 12.0, 14.0, 6.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012083053588867188, -0.0011692792177200317, -0.0011302530765533447, -0.0010912269353866577, -0.0010522007942199707, -0.0010131746530532837, -0.0009741485118865967, -0.0009351223707199097, -0.0008960962295532227, -0.0008570700883865356, -0.0008180439472198486, -0.0007790178060531616, -0.0007399916648864746, -0.0007009655237197876, -0.0006619393825531006, -0.0006229132413864136, -0.0005838871002197266, -0.0005448609590530396, -0.0005058348178863525, -0.00046680867671966553, -0.0004277825355529785, -0.0003887563943862915, -0.0003497302532196045, -0.0003107041120529175, -0.00027167797088623047, -0.00023265182971954346, -0.00019362568855285645, -0.00015459954738616943, -0.00011557340621948242, -7.654726505279541e-05, -3.75211238861084e-05, 1.5050172805786133e-06, 4.0531158447265625e-05, 7.955729961395264e-05, 0.00011858344078063965, 0.00015760958194732666, 0.00019663572311401367, 0.00023566186428070068, 0.0002746880054473877, 0.0003137141466140747, 0.0003527402877807617, 0.00039176642894744873, 0.00043079257011413574, 0.00046981871128082275, 0.0005088448524475098, 0.0005478709936141968, 0.0005868971347808838, 0.0006259232759475708, 0.0006649494171142578, 0.0007039755582809448, 0.0007430016994476318, 0.0007820278406143188, 0.0008210539817810059, 0.0008600801229476929, 0.0008991062641143799, 0.0009381324052810669, 0.000977158546447754, 0.001016184687614441, 0.001055210828781128, 0.001094236969947815, 0.001133263111114502, 0.001172289252281189, 0.001211315393447876, 0.001250341534614563, 0.00128936767578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 10.0, 7.0, 15.0, 23.0, 18.0, 18.0, 27.0, 41.0, 42.0, 64.0, 86.0, 75.0, 95.0, 92.0, 69.0, 49.0, 44.0, 52.0, 27.0, 22.0, 18.0, 20.0, 8.0, 11.0, 10.0, 4.0, 6.0, 4.0, 2.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007576942443847656, -0.000734962522983551, -0.0007122308015823364, -0.0006894990801811218, -0.0006667673587799072, -0.0006440356373786926, -0.000621303915977478, -0.0005985721945762634, -0.0005758404731750488, -0.0005531087517738342, -0.0005303770303726196, -0.000507645308971405, -0.00048491358757019043, -0.00046218186616897583, -0.00043945014476776123, -0.00041671842336654663, -0.00039398670196533203, -0.00037125498056411743, -0.00034852325916290283, -0.00032579153776168823, -0.00030305981636047363, -0.00028032809495925903, -0.00025759637355804443, -0.00023486465215682983, -0.00021213293075561523, -0.00018940120935440063, -0.00016666948795318604, -0.00014393776655197144, -0.00012120604515075684, -9.847432374954224e-05, -7.574260234832764e-05, -5.301088094711304e-05, -3.0279159545898438e-05, -7.547438144683838e-06, 1.5184283256530762e-05, 3.791600465774536e-05, 6.064772605895996e-05, 8.337944746017456e-05, 0.00010611116886138916, 0.00012884289026260376, 0.00015157461166381836, 0.00017430633306503296, 0.00019703805446624756, 0.00021976977586746216, 0.00024250149726867676, 0.00026523321866989136, 0.00028796494007110596, 0.00031069666147232056, 0.00033342838287353516, 0.00035616010427474976, 0.00037889182567596436, 0.00040162354707717896, 0.00042435526847839355, 0.00044708698987960815, 0.00046981871128082275, 0.0004925504326820374, 0.000515282154083252, 0.0005380138754844666, 0.0005607455968856812, 0.0005834773182868958, 0.0006062090396881104, 0.000628940761089325, 0.0006516724824905396, 0.0006744042038917542, 0.0006971359252929688]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 10.0, 16.0, 22.0, 30.0, 76.0, 159.0, 247.0, 197.0, 99.0, 43.0, 36.0, 24.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1494062840938568, -0.14543524384498596, -0.1414642184972763, -0.13749317824840546, -0.1335221529006958, -0.12955111265182495, -0.1255800873041153, -0.12160904705524445, -0.11763802170753479, -0.11366698890924454, -0.10969595611095428, -0.10572492331266403, -0.10175389051437378, -0.09778285771608353, -0.09381182491779327, -0.08984078466892242, -0.08586975187063217, -0.08189871907234192, -0.07792768627405167, -0.07395665347576141, -0.06998562067747116, -0.06601458787918091, -0.06204355135560036, -0.058072518557310104, -0.05410148575901985, -0.0501304529607296, -0.046159420162439346, -0.042188383638858795, -0.03821735084056854, -0.03424631804227829, -0.030275285243988037, -0.026304252445697784, -0.02233322709798813, -0.018362194299697876, -0.014391160570085049, -0.010420126840472221, -0.006449094042181969, -0.002478061243891716, 0.001492973417043686, 0.005464006215333939, 0.009435039013624191, 0.013406071811914444, 0.017377104610204697, 0.0213481392711401, 0.02531917206943035, 0.029290204867720604, 0.033261239528656006, 0.03723227232694626, 0.04120330512523651, 0.045174337923526764, 0.04914537072181702, 0.05311640352010727, 0.05708743631839752, 0.061058469116687775, 0.06502950191497803, 0.06900054216384888, 0.07297156751155853, 0.07694260030984879, 0.08091363310813904, 0.08488466590642929, 0.08885569870471954, 0.0928267315030098, 0.09679776430130005, 0.1007688045501709, 0.10473983734846115]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 4.0, 9.0, 17.0, 18.0, 15.0, 21.0, 19.0, 24.0, 33.0, 46.0, 39.0, 52.0, 64.0, 57.0, 65.0, 67.0, 59.0, 46.0, 45.0, 39.0, 27.0, 29.0, 29.0, 33.0, 19.0, 26.0, 22.0, 15.0, 5.0, 9.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.07515132427215576, -0.07287157326936722, -0.07059182226657867, -0.06831207126379013, -0.06603232026100159, -0.06375257670879364, -0.061472825706005096, -0.05919307470321655, -0.05691332370042801, -0.054633572697639465, -0.05235382169485092, -0.050074074417352676, -0.04779432341456413, -0.04551457241177559, -0.043234825134277344, -0.0409550741314888, -0.038675323128700256, -0.03639557212591171, -0.03411582112312317, -0.031836073845624924, -0.02955632284283638, -0.027276571840047836, -0.024996822699904442, -0.022717073559761047, -0.020437322556972504, -0.01815757155418396, -0.015877822414040565, -0.013598072342574596, -0.011318322271108627, -0.009038572199642658, -0.006758822128176689, -0.004479072988033295, -0.002199321985244751, 8.042808622121811e-05, 0.002360178157687187, 0.004639928229153156, 0.006919678300619125, 0.009199428372085094, 0.011479178443551064, 0.013758927583694458, 0.016038678586483, 0.018318429589271545, 0.02059817872941494, 0.022877927869558334, 0.025157678872346878, 0.027437429875135422, 0.029717179015278816, 0.03199692815542221, 0.034276679158210754, 0.0365564301609993, 0.03883618116378784, 0.04111592844128609, 0.04339567944407463, 0.045675430446863174, 0.04795517772436142, 0.05023492872714996, 0.05251467972993851, 0.05479443073272705, 0.057074181735515594, 0.05935392901301384, 0.06163368001580238, 0.06391342729330063, 0.06619317829608917, 0.06847292929887772, 0.07075268030166626]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 4.0, 3.0, 17.0, 16.0, 27.0, 47.0, 64.0, 178.0, 365.0, 24806.0, 4167989.0, 334.0, 158.0, 78.0, 51.0, 31.0, 26.0, 10.0, 9.0, 10.0, 5.0, 7.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.197021484375, -0.19024276733398438, -0.18346405029296875, -0.17668533325195312, -0.1699066162109375, -0.16312789916992188, -0.15634918212890625, -0.14957046508789062, -0.142791748046875, -0.13601303100585938, -0.12923431396484375, -0.12245559692382812, -0.1156768798828125, -0.10889816284179688, -0.10211944580078125, -0.09534072875976562, -0.08856201171875, -0.08178329467773438, -0.07500457763671875, -0.06822586059570312, -0.0614471435546875, -0.054668426513671875, -0.04788970947265625, -0.041110992431640625, -0.034332275390625, -0.027553558349609375, -0.02077484130859375, -0.013996124267578125, -0.0072174072265625, -0.000438690185546875, 0.00634002685546875, 0.013118743896484375, 0.0198974609375, 0.026676177978515625, 0.03345489501953125, 0.040233612060546875, 0.0470123291015625, 0.053791046142578125, 0.06056976318359375, 0.06734848022460938, 0.074127197265625, 0.08090591430664062, 0.08768463134765625, 0.09446334838867188, 0.1012420654296875, 0.10802078247070312, 0.11479949951171875, 0.12157821655273438, 0.12835693359375, 0.13513565063476562, 0.14191436767578125, 0.14869308471679688, 0.1554718017578125, 0.16225051879882812, 0.16902923583984375, 0.17580795288085938, 0.182586669921875, 0.18936538696289062, 0.19614410400390625, 0.20292282104492188, 0.2097015380859375, 0.21648025512695312, 0.22325897216796875, 0.23003768920898438, 0.23681640625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 10.0, 11.0, 10.0, 27.0, 34.0, 91.0, 127.0, 187.0, 190.0, 108.0, 65.0, 34.0, 17.0, 13.0, 6.0, 9.0, 7.0, 6.0, 4.0, 3.0, 7.0, 2.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007343292236328125, -0.007091224193572998, -0.006839156150817871, -0.006587088108062744, -0.006335020065307617, -0.00608295202255249, -0.005830883979797363, -0.005578815937042236, -0.005326747894287109, -0.005074679851531982, -0.0048226118087768555, -0.0045705437660217285, -0.0043184757232666016, -0.004066407680511475, -0.0038143396377563477, -0.0035622715950012207, -0.0033102035522460938, -0.003058135509490967, -0.00280606746673584, -0.002553999423980713, -0.002301931381225586, -0.002049863338470459, -0.001797795295715332, -0.001545727252960205, -0.0012936592102050781, -0.0010415911674499512, -0.0007895231246948242, -0.0005374550819396973, -0.0002853870391845703, -3.331899642944336e-05, 0.0002187490463256836, 0.00047081708908081055, 0.0007228851318359375, 0.0009749531745910645, 0.0012270212173461914, 0.0014790892601013184, 0.0017311573028564453, 0.0019832253456115723, 0.0022352933883666992, 0.002487361431121826, 0.002739429473876953, 0.00299149751663208, 0.003243565559387207, 0.003495633602142334, 0.003747701644897461, 0.003999769687652588, 0.004251837730407715, 0.004503905773162842, 0.004755973815917969, 0.005008041858673096, 0.005260109901428223, 0.00551217794418335, 0.0057642459869384766, 0.0060163140296936035, 0.0062683820724487305, 0.006520450115203857, 0.006772518157958984, 0.007024586200714111, 0.007276654243469238, 0.007528722286224365, 0.007780790328979492, 0.00803285837173462, 0.008284926414489746, 0.008536994457244873, 0.0087890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 10.0, 13.0, 23.0, 30.0, 44.0, 78.0, 121.0, 227.0, 361.0, 668.0, 1237.0, 2546.0, 5282.0, 13430.0, 44260.0, 813420.0, 3219677.0, 62861.0, 16543.0, 6500.0, 3004.0, 1545.0, 896.0, 551.0, 319.0, 210.0, 143.0, 91.0, 58.0, 40.0, 27.0, 20.0, 17.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.008575439453125, -0.008331239223480225, -0.00808703899383545, -0.007842838764190674, -0.0075986385345458984, -0.007354438304901123, -0.007110238075256348, -0.006866037845611572, -0.006621837615966797, -0.0063776373863220215, -0.006133437156677246, -0.005889236927032471, -0.005645036697387695, -0.00540083646774292, -0.0051566362380981445, -0.004912436008453369, -0.004668235778808594, -0.004424035549163818, -0.004179835319519043, -0.003935635089874268, -0.003691434860229492, -0.003447234630584717, -0.0032030344009399414, -0.002958834171295166, -0.0027146339416503906, -0.0024704337120056152, -0.00222623348236084, -0.0019820332527160645, -0.001737833023071289, -0.0014936327934265137, -0.0012494325637817383, -0.0010052323341369629, -0.0007610321044921875, -0.0005168318748474121, -0.0002726316452026367, -2.8431415557861328e-05, 0.00021576881408691406, 0.00045996904373168945, 0.0007041692733764648, 0.0009483695030212402, 0.0011925697326660156, 0.001436769962310791, 0.0016809701919555664, 0.0019251704216003418, 0.002169370651245117, 0.0024135708808898926, 0.002657771110534668, 0.0029019713401794434, 0.0031461715698242188, 0.003390371799468994, 0.0036345720291137695, 0.003878772258758545, 0.00412297248840332, 0.004367172718048096, 0.004611372947692871, 0.0048555731773376465, 0.005099773406982422, 0.005343973636627197, 0.005588173866271973, 0.005832374095916748, 0.0060765743255615234, 0.006320774555206299, 0.006564974784851074, 0.00680917501449585, 0.007053375244140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 1.0, 2.0, 7.0, 5.0, 6.0, 7.0, 7.0, 14.0, 16.0, 19.0, 22.0, 37.0, 52.0, 131.0, 368.0, 1107.0, 1390.0, 501.0, 172.0, 58.0, 27.0, 22.0, 18.0, 21.0, 5.0, 11.0, 8.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007122039794921875, -0.0068686604499816895, -0.006615281105041504, -0.006361901760101318, -0.006108522415161133, -0.005855143070220947, -0.005601763725280762, -0.005348384380340576, -0.005095005035400391, -0.004841625690460205, -0.0045882463455200195, -0.004334867000579834, -0.0040814876556396484, -0.003828108310699463, -0.0035747289657592773, -0.003321349620819092, -0.0030679702758789062, -0.0028145909309387207, -0.002561211585998535, -0.0023078322410583496, -0.002054452896118164, -0.0018010735511779785, -0.001547694206237793, -0.0012943148612976074, -0.0010409355163574219, -0.0007875561714172363, -0.0005341768264770508, -0.00028079748153686523, -2.7418136596679688e-05, 0.00022596120834350586, 0.0004793405532836914, 0.000732719898223877, 0.0009860992431640625, 0.001239478588104248, 0.0014928579330444336, 0.0017462372779846191, 0.0019996166229248047, 0.0022529959678649902, 0.0025063753128051758, 0.0027597546577453613, 0.003013134002685547, 0.0032665133476257324, 0.003519892692565918, 0.0037732720375061035, 0.004026651382446289, 0.004280030727386475, 0.00453341007232666, 0.004786789417266846, 0.005040168762207031, 0.005293548107147217, 0.005546927452087402, 0.005800306797027588, 0.0060536861419677734, 0.006307065486907959, 0.0065604448318481445, 0.00681382417678833, 0.007067203521728516, 0.007320582866668701, 0.007573962211608887, 0.007827341556549072, 0.008080720901489258, 0.008334100246429443, 0.008587479591369629, 0.008840858936309814, 0.00909423828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 9.0, 7.0, 15.0, 47.0, 85.0, 205.0, 257.0, 157.0, 78.0, 53.0, 32.0, 10.0, 19.0, 16.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0763329565525055, -0.07402196526527405, -0.0717109739780426, -0.06939999014139175, -0.06708899885416031, -0.06477800756692886, -0.06246701627969742, -0.06015602499246597, -0.057845037430524826, -0.05553404614329338, -0.053223058581352234, -0.05091206729412079, -0.04860107600688934, -0.046290088444948196, -0.04397909715771675, -0.041668109595775604, -0.03935711830854416, -0.037046127021312714, -0.03473513945937157, -0.03242414817214012, -0.030113158747553825, -0.02780216932296753, -0.025491178035736084, -0.023180188611149788, -0.020869199186563492, -0.018558209761977196, -0.0162472203373909, -0.013936229050159454, -0.011625239625573158, -0.009314250200986862, -0.0070032598450779915, -0.004692269489169121, -0.002381272614002228, -7.02827237546444e-05, 0.002240707166492939, 0.004551697056740522, 0.006862686946988106, 0.009173676371574402, 0.011484666727483273, 0.013795657083392143, 0.01610664650797844, 0.018417635932564735, 0.02072862535715103, 0.023039616644382477, 0.025350606068968773, 0.02766159549355507, 0.029972586780786514, 0.03228357434272766, 0.034594565629959106, 0.03690555691719055, 0.0392165444791317, 0.041527535766363144, 0.04383852332830429, 0.046149514615535736, 0.04846050590276718, 0.05077149718999863, 0.053082484751939774, 0.05539347603917122, 0.057704463601112366, 0.06001545488834381, 0.062326446175575256, 0.0646374374628067, 0.06694842129945755, 0.069259412586689, 0.07157040387392044]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 6.0, 11.0, 7.0, 17.0, 18.0, 20.0, 11.0, 23.0, 33.0, 30.0, 41.0, 35.0, 49.0, 60.0, 49.0, 55.0, 48.0, 64.0, 57.0, 48.0, 38.0, 35.0, 46.0, 33.0, 24.0, 26.0, 29.0, 16.0, 11.0, 13.0, 10.0, 8.0, 6.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031122207641601562, -0.0300825834274292, -0.029042961075901985, -0.02800333872437477, -0.026963714510202408, -0.025924090296030045, -0.02488446794450283, -0.023844845592975616, -0.022805221378803253, -0.02176559716463089, -0.020725974813103676, -0.019686352461576462, -0.0186467282474041, -0.017607104033231735, -0.01656748168170452, -0.015527858398854733, -0.014488235116004944, -0.013448611833155155, -0.012408988550305367, -0.011369365267455578, -0.01032974198460579, -0.009290118701756, -0.008250495418906212, -0.007210872136056423, -0.0061712488532066345, -0.005131625570356846, -0.004092002287507057, -0.0030523790046572685, -0.00201275572180748, -0.0009731324389576912, 6.649084389209747e-05, 0.0011061141267418861, 0.002145737409591675, 0.0031853606924414635, 0.004224983975291252, 0.005264607258141041, 0.0063042305409908295, 0.007343853823840618, 0.008383477106690407, 0.009423100389540195, 0.010462723672389984, 0.011502346955239773, 0.012541970238089561, 0.01358159352093935, 0.014621216803789139, 0.015660841017961502, 0.016700463369488716, 0.01774008572101593, 0.018779709935188293, 0.019819334149360657, 0.02085895650088787, 0.021898578852415085, 0.022938203066587448, 0.02397782728075981, 0.025017449632287025, 0.02605707198381424, 0.027096696197986603, 0.028136320412158966, 0.02917594276368618, 0.030215565115213394, 0.03125518932938576, 0.03229481354355812, 0.033334434032440186, 0.03437405824661255, 0.03541368246078491]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 9.0, 20.0, 29.0, 34.0, 49.0, 80.0, 85.0, 134.0, 188.0, 260.0, 408.0, 616.0, 950.0, 1478.0, 2593.0, 4866.0, 10977.0, 32896.0, 297758.0, 619453.0, 48792.0, 13367.0, 5621.0, 2880.0, 1720.0, 1054.0, 643.0, 462.0, 307.0, 220.0, 149.0, 120.0, 75.0, 65.0, 45.0, 34.0, 22.0, 25.0, 9.0, 5.0, 13.0, 4.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01190948486328125, -0.01150059700012207, -0.01109170913696289, -0.010682821273803711, -0.010273933410644531, -0.009865045547485352, -0.009456157684326172, -0.009047269821166992, -0.008638381958007812, -0.008229494094848633, -0.007820606231689453, -0.0074117183685302734, -0.007002830505371094, -0.006593942642211914, -0.006185054779052734, -0.005776166915893555, -0.005367279052734375, -0.004958391189575195, -0.004549503326416016, -0.004140615463256836, -0.0037317276000976562, -0.0033228397369384766, -0.002913951873779297, -0.002505064010620117, -0.0020961761474609375, -0.0016872882843017578, -0.0012784004211425781, -0.0008695125579833984, -0.00046062469482421875, -5.173683166503906e-05, 0.0003571510314941406, 0.0007660388946533203, 0.0011749267578125, 0.0015838146209716797, 0.0019927024841308594, 0.002401590347290039, 0.0028104782104492188, 0.0032193660736083984, 0.003628253936767578, 0.004037141799926758, 0.0044460296630859375, 0.004854917526245117, 0.005263805389404297, 0.0056726932525634766, 0.006081581115722656, 0.006490468978881836, 0.006899356842041016, 0.007308244705200195, 0.007717132568359375, 0.008126020431518555, 0.008534908294677734, 0.008943796157836914, 0.009352684020996094, 0.009761571884155273, 0.010170459747314453, 0.010579347610473633, 0.010988235473632812, 0.011397123336791992, 0.011806011199951172, 0.012214899063110352, 0.012623786926269531, 0.013032674789428711, 0.01344156265258789, 0.01385045051574707, 0.01425933837890625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 8.0, 16.0, 22.0, 52.0, 85.0, 136.0, 173.0, 153.0, 139.0, 77.0, 37.0, 12.0, 12.0, 8.0, 6.0, 7.0, 6.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007404327392578125, -0.007149875164031982, -0.00689542293548584, -0.006640970706939697, -0.006386518478393555, -0.006132066249847412, -0.0058776140213012695, -0.005623161792755127, -0.005368709564208984, -0.005114257335662842, -0.004859805107116699, -0.004605352878570557, -0.004350900650024414, -0.0040964484214782715, -0.003841996192932129, -0.0035875439643859863, -0.0033330917358398438, -0.003078639507293701, -0.0028241872787475586, -0.002569735050201416, -0.0023152828216552734, -0.002060830593109131, -0.0018063783645629883, -0.0015519261360168457, -0.0012974739074707031, -0.0010430216789245605, -0.000788569450378418, -0.0005341172218322754, -0.0002796649932861328, -2.5212764739990234e-05, 0.00022923946380615234, 0.0004836916923522949, 0.0007381439208984375, 0.00099259614944458, 0.0012470483779907227, 0.0015015006065368652, 0.0017559528350830078, 0.0020104050636291504, 0.002264857292175293, 0.0025193095207214355, 0.002773761749267578, 0.0030282139778137207, 0.0032826662063598633, 0.003537118434906006, 0.0037915706634521484, 0.004046022891998291, 0.004300475120544434, 0.004554927349090576, 0.004809379577636719, 0.005063831806182861, 0.005318284034729004, 0.0055727362632751465, 0.005827188491821289, 0.006081640720367432, 0.006336092948913574, 0.006590545177459717, 0.006844997406005859, 0.007099449634552002, 0.0073539018630981445, 0.007608354091644287, 0.00786280632019043, 0.008117258548736572, 0.008371710777282715, 0.008626163005828857, 0.008880615234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 10.0, 3.0, 9.0, 8.0, 6.0, 9.0, 13.0, 29.0, 34.0, 55.0, 73.0, 93.0, 123.0, 174.0, 261.0, 362.0, 532.0, 958.0, 1805.0, 3726.0, 9992.0, 38042.0, 259903.0, 629901.0, 75074.0, 16282.0, 5278.0, 2407.0, 1221.0, 700.0, 439.0, 306.0, 186.0, 140.0, 106.0, 72.0, 61.0, 46.0, 18.0, 17.0, 20.0, 14.0, 11.0, 9.0, 6.0, 12.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.01168060302734375, -0.011339068412780762, -0.010997533798217773, -0.010655999183654785, -0.010314464569091797, -0.009972929954528809, -0.00963139533996582, -0.009289860725402832, -0.008948326110839844, -0.008606791496276855, -0.008265256881713867, -0.007923722267150879, -0.007582187652587891, -0.007240653038024902, -0.006899118423461914, -0.006557583808898926, -0.0062160491943359375, -0.005874514579772949, -0.005532979965209961, -0.005191445350646973, -0.004849910736083984, -0.004508376121520996, -0.004166841506958008, -0.0038253068923950195, -0.0034837722778320312, -0.003142237663269043, -0.0028007030487060547, -0.0024591684341430664, -0.002117633819580078, -0.0017760992050170898, -0.0014345645904541016, -0.0010930299758911133, -0.000751495361328125, -0.0004099607467651367, -6.842613220214844e-05, 0.00027310848236083984, 0.0006146430969238281, 0.0009561777114868164, 0.0012977123260498047, 0.001639246940612793, 0.0019807815551757812, 0.0023223161697387695, 0.002663850784301758, 0.003005385398864746, 0.0033469200134277344, 0.0036884546279907227, 0.004029989242553711, 0.004371523857116699, 0.0047130584716796875, 0.005054593086242676, 0.005396127700805664, 0.005737662315368652, 0.006079196929931641, 0.006420731544494629, 0.006762266159057617, 0.0071038007736206055, 0.007445335388183594, 0.007786870002746582, 0.00812840461730957, 0.008469939231872559, 0.008811473846435547, 0.009153008460998535, 0.009494543075561523, 0.009836077690124512, 0.0101776123046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 2.0, 12.0, 13.0, 15.0, 22.0, 28.0, 23.0, 27.0, 23.0, 25.0, 51.0, 37.0, 46.0, 45.0, 55.0, 42.0, 53.0, 40.0, 44.0, 41.0, 36.0, 33.0, 39.0, 47.0, 31.0, 29.0, 19.0, 21.0, 18.0, 14.0, 13.0, 14.0, 4.0, 4.0, 3.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.016937255859375, -0.016460657119750977, -0.015984058380126953, -0.01550745964050293, -0.015030860900878906, -0.014554262161254883, -0.01407766342163086, -0.013601064682006836, -0.013124465942382812, -0.012647867202758789, -0.012171268463134766, -0.011694669723510742, -0.011218070983886719, -0.010741472244262695, -0.010264873504638672, -0.009788274765014648, -0.009311676025390625, -0.008835077285766602, -0.008358478546142578, -0.007881879806518555, -0.007405281066894531, -0.006928682327270508, -0.006452083587646484, -0.005975484848022461, -0.0054988861083984375, -0.005022287368774414, -0.004545688629150391, -0.004069089889526367, -0.0035924911499023438, -0.0031158924102783203, -0.002639293670654297, -0.0021626949310302734, -0.00168609619140625, -0.0012094974517822266, -0.0007328987121582031, -0.0002562999725341797, 0.00022029876708984375, 0.0006968975067138672, 0.0011734962463378906, 0.001650094985961914, 0.0021266937255859375, 0.002603292465209961, 0.0030798912048339844, 0.003556489944458008, 0.004033088684082031, 0.004509687423706055, 0.004986286163330078, 0.0054628849029541016, 0.005939483642578125, 0.0064160823822021484, 0.006892681121826172, 0.007369279861450195, 0.007845878601074219, 0.008322477340698242, 0.008799076080322266, 0.009275674819946289, 0.009752273559570312, 0.010228872299194336, 0.01070547103881836, 0.011182069778442383, 0.011658668518066406, 0.01213526725769043, 0.012611865997314453, 0.013088464736938477, 0.0135650634765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 11.0, 7.0, 13.0, 17.0, 18.0, 46.0, 63.0, 123.0, 216.0, 490.0, 1072.0, 2793.0, 8046.0, 40662.0, 840008.0, 133517.0, 14357.0, 4132.0, 1614.0, 650.0, 312.0, 132.0, 85.0, 49.0, 38.0, 14.0, 18.0, 11.0, 12.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0029125213623046875, -0.002826124429702759, -0.00273972749710083, -0.0026533305644989014, -0.0025669336318969727, -0.002480536699295044, -0.0023941397666931152, -0.0023077428340911865, -0.002221345901489258, -0.002134948968887329, -0.0020485520362854004, -0.0019621551036834717, -0.001875758171081543, -0.0017893612384796143, -0.0017029643058776855, -0.0016165673732757568, -0.0015301704406738281, -0.0014437735080718994, -0.0013573765754699707, -0.001270979642868042, -0.0011845827102661133, -0.0010981857776641846, -0.0010117888450622559, -0.0009253919124603271, -0.0008389949798583984, -0.0007525980472564697, -0.000666201114654541, -0.0005798041820526123, -0.0004934072494506836, -0.0004070103168487549, -0.00032061338424682617, -0.00023421645164489746, -0.00014781951904296875, -6.142258644104004e-05, 2.4974346160888672e-05, 0.00011137127876281738, 0.0001977682113647461, 0.0002841651439666748, 0.0003705620765686035, 0.0004569590091705322, 0.0005433559417724609, 0.0006297528743743896, 0.0007161498069763184, 0.0008025467395782471, 0.0008889436721801758, 0.0009753406047821045, 0.0010617375373840332, 0.001148134469985962, 0.0012345314025878906, 0.0013209283351898193, 0.001407325267791748, 0.0014937222003936768, 0.0015801191329956055, 0.0016665160655975342, 0.0017529129981994629, 0.0018393099308013916, 0.0019257068634033203, 0.002012103796005249, 0.0020985007286071777, 0.0021848976612091064, 0.002271294593811035, 0.002357691526412964, 0.0024440884590148926, 0.0025304853916168213, 0.00261688232421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 2.0, 6.0, 4.0, 9.0, 4.0, 7.0, 13.0, 17.0, 12.0, 8.0, 23.0, 22.0, 13.0, 45.0, 19.0, 24.0, 32.0, 42.0, 49.0, 26.0, 42.0, 50.0, 19.0, 46.0, 44.0, 51.0, 21.0, 54.0, 42.0, 13.0, 37.0, 37.0, 20.0, 28.0, 18.0, 25.0, 12.0, 11.0, 10.0, 6.0, 14.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.4570693969726562e-06, -3.355555236339569e-06, -3.254041075706482e-06, -3.1525269150733948e-06, -3.0510127544403076e-06, -2.9494985938072205e-06, -2.8479844331741333e-06, -2.746470272541046e-06, -2.644956111907959e-06, -2.543441951274872e-06, -2.4419277906417847e-06, -2.3404136300086975e-06, -2.2388994693756104e-06, -2.137385308742523e-06, -2.035871148109436e-06, -1.934356987476349e-06, -1.8328428268432617e-06, -1.7313286662101746e-06, -1.6298145055770874e-06, -1.5283003449440002e-06, -1.426786184310913e-06, -1.325272023677826e-06, -1.2237578630447388e-06, -1.1222437024116516e-06, -1.0207295417785645e-06, -9.192153811454773e-07, -8.177012205123901e-07, -7.16187059879303e-07, -6.146728992462158e-07, -5.131587386131287e-07, -4.116445779800415e-07, -3.1013041734695435e-07, -2.086162567138672e-07, -1.0710209608078003e-07, -5.587935447692871e-09, 9.592622518539429e-08, 1.9744038581848145e-07, 2.989545464515686e-07, 4.0046870708465576e-07, 5.019828677177429e-07, 6.034970283508301e-07, 7.050111889839172e-07, 8.065253496170044e-07, 9.080395102500916e-07, 1.0095536708831787e-06, 1.1110678315162659e-06, 1.212581992149353e-06, 1.3140961527824402e-06, 1.4156103134155273e-06, 1.5171244740486145e-06, 1.6186386346817017e-06, 1.7201527953147888e-06, 1.821666955947876e-06, 1.923181116580963e-06, 2.0246952772140503e-06, 2.1262094378471375e-06, 2.2277235984802246e-06, 2.3292377591133118e-06, 2.430751919746399e-06, 2.532266080379486e-06, 2.6337802410125732e-06, 2.7352944016456604e-06, 2.8368085622787476e-06, 2.9383227229118347e-06, 3.039836883544922e-06]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 5.0, 6.0, 16.0, 14.0, 30.0, 47.0, 52.0, 78.0, 128.0, 190.0, 294.0, 614.0, 1287.0, 3043.0, 9196.0, 47904.0, 810208.0, 150891.0, 16280.0, 4482.0, 1810.0, 822.0, 397.0, 301.0, 130.0, 92.0, 58.0, 45.0, 29.0, 34.0, 16.0, 13.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00278472900390625, -0.0027067363262176514, -0.0026287436485290527, -0.002550750970840454, -0.0024727582931518555, -0.002394765615463257, -0.002316772937774658, -0.0022387802600860596, -0.002160787582397461, -0.0020827949047088623, -0.0020048022270202637, -0.001926809549331665, -0.0018488168716430664, -0.0017708241939544678, -0.0016928315162658691, -0.0016148388385772705, -0.0015368461608886719, -0.0014588534832000732, -0.0013808608055114746, -0.001302868127822876, -0.0012248754501342773, -0.0011468827724456787, -0.00106889009475708, -0.0009908974170684814, -0.0009129047393798828, -0.0008349120616912842, -0.0007569193840026855, -0.0006789267063140869, -0.0006009340286254883, -0.0005229413509368896, -0.000444948673248291, -0.0003669559955596924, -0.00028896331787109375, -0.00021097064018249512, -0.00013297796249389648, -5.498528480529785e-05, 2.300739288330078e-05, 0.00010100007057189941, 0.00017899274826049805, 0.0002569854259490967, 0.0003349781036376953, 0.00041297078132629395, 0.0004909634590148926, 0.0005689561367034912, 0.0006469488143920898, 0.0007249414920806885, 0.0008029341697692871, 0.0008809268474578857, 0.0009589195251464844, 0.001036912202835083, 0.0011149048805236816, 0.0011928975582122803, 0.001270890235900879, 0.0013488829135894775, 0.0014268755912780762, 0.0015048682689666748, 0.0015828609466552734, 0.001660853624343872, 0.0017388463020324707, 0.0018168389797210693, 0.001894831657409668, 0.0019728243350982666, 0.0020508170127868652, 0.002128809690475464, 0.0022068023681640625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 0.0, 4.0, 11.0, 8.0, 4.0, 13.0, 22.0, 30.0, 40.0, 49.0, 107.0, 105.0, 104.0, 116.0, 97.0, 79.0, 57.0, 41.0, 28.0, 16.0, 17.0, 14.0, 8.0, 6.0, 3.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032978057861328125, -0.0032031238079071045, -0.0031084418296813965, -0.0030137598514556885, -0.0029190778732299805, -0.0028243958950042725, -0.0027297139167785645, -0.0026350319385528564, -0.0025403499603271484, -0.0024456679821014404, -0.0023509860038757324, -0.0022563040256500244, -0.0021616220474243164, -0.0020669400691986084, -0.0019722580909729004, -0.0018775761127471924, -0.0017828941345214844, -0.0016882121562957764, -0.0015935301780700684, -0.0014988481998443604, -0.0014041662216186523, -0.0013094842433929443, -0.0012148022651672363, -0.0011201202869415283, -0.0010254383087158203, -0.0009307563304901123, -0.0008360743522644043, -0.0007413923740386963, -0.0006467103958129883, -0.0005520284175872803, -0.00045734643936157227, -0.00036266446113586426, -0.00026798248291015625, -0.00017330050468444824, -7.861852645874023e-05, 1.6063451766967773e-05, 0.00011074542999267578, 0.0002054274082183838, 0.0003001093864440918, 0.0003947913646697998, 0.0004894733428955078, 0.0005841553211212158, 0.0006788372993469238, 0.0007735192775726318, 0.0008682012557983398, 0.0009628832340240479, 0.0010575652122497559, 0.0011522471904754639, 0.0012469291687011719, 0.0013416111469268799, 0.0014362931251525879, 0.001530975103378296, 0.001625657081604004, 0.001720339059829712, 0.00181502103805542, 0.001909703016281128, 0.002004384994506836, 0.002099066972732544, 0.002193748950958252, 0.00228843092918396, 0.002383112907409668, 0.002477794885635376, 0.002572476863861084, 0.002667158842086792, 0.0027618408203125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 4.0, 4.0, 23.0, 38.0, 152.0, 391.0, 231.0, 77.0, 42.0, 16.0, 11.0, 7.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10761038213968277, -0.10356015712022781, -0.09950992465019226, -0.0954596996307373, -0.09140946716070175, -0.0873592421412468, -0.08330900967121124, -0.07925878465175629, -0.07520855963230133, -0.07115833461284637, -0.06710810214281082, -0.06305787712335587, -0.05900764465332031, -0.054957419633865356, -0.0509071908891201, -0.04685696214437485, -0.042806729674339294, -0.03875650092959404, -0.034706272184848785, -0.03065604530274868, -0.026605816558003426, -0.02255558781325817, -0.018505360931158066, -0.014455132186412811, -0.010404903441667557, -0.0063546751625835896, -0.0023044468834996223, 0.0017457809299230576, 0.005796009674668312, 0.009846238419413567, 0.013896465301513672, 0.017946694046258926, 0.021996930241584778, 0.026047158986330032, 0.030097387731075287, 0.03414761275053024, 0.038197845220565796, 0.04224807024002075, 0.046298298984766006, 0.05034852772951126, 0.054398756474256516, 0.05844898521900177, 0.062499213963747025, 0.06654944270849228, 0.07059966772794724, 0.07464990019798279, 0.07870012521743774, 0.0827503502368927, 0.08680058270692825, 0.09085080772638321, 0.09490104019641876, 0.09895126521587372, 0.10300149768590927, 0.10705172270536423, 0.11110195517539978, 0.11515218019485474, 0.11920240521430969, 0.12325263023376465, 0.1273028552532196, 0.13135309517383575, 0.1354033201932907, 0.13945354521274567, 0.14350377023220062, 0.14755401015281677, 0.15160423517227173]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 7.0, 3.0, 4.0, 7.0, 13.0, 10.0, 13.0, 11.0, 15.0, 12.0, 20.0, 18.0, 22.0, 28.0, 31.0, 35.0, 37.0, 40.0, 39.0, 50.0, 60.0, 66.0, 61.0, 53.0, 38.0, 36.0, 41.0, 31.0, 20.0, 24.0, 24.0, 21.0, 16.0, 19.0, 10.0, 14.0, 14.0, 5.0, 7.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056395113468170166, -0.05458729341626167, -0.05277947336435318, -0.050971657037734985, -0.04916383698582649, -0.047356016933918, -0.045548200607299805, -0.04374038055539131, -0.04193256050348282, -0.040124740451574326, -0.03831692039966583, -0.03650910407304764, -0.034701284021139145, -0.03289346396923065, -0.031085645779967308, -0.029277827590703964, -0.02747000753879547, -0.025662187486886978, -0.023854369297623634, -0.02204655110836029, -0.020238731056451797, -0.018430911004543304, -0.01662309281527996, -0.014815273694694042, -0.013007454574108124, -0.011199635453522205, -0.009391816332936287, -0.0075839972123503685, -0.00577617809176445, -0.003968358971178532, -0.0021605398505926132, -0.0003527207300066948, 0.0014550983905792236, 0.003262917511165142, 0.0050707366317510605, 0.006878555752336979, 0.008686374872922897, 0.010494193993508816, 0.012302013114094734, 0.014109832234680653, 0.01591765135526657, 0.017725471407175064, 0.019533289596438408, 0.02134110778570175, 0.023148927837610245, 0.024956747889518738, 0.02676456607878208, 0.028572384268045425, 0.03038020431995392, 0.03218802437186241, 0.033995844423770905, 0.0358036607503891, 0.03761148080229759, 0.039419300854206085, 0.04122711718082428, 0.04303493723273277, 0.044842757284641266, 0.04665057733654976, 0.04845839738845825, 0.05026621371507645, 0.05207403376698494, 0.05388185381889343, 0.05568967014551163, 0.05749749019742012, 0.05930531024932861]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 16.0, 25.0, 36.0, 49.0, 94.0, 212.0, 568.0, 1558.0, 4551.0, 16145.0, 87498.0, 1683851.0, 2298952.0, 80493.0, 14010.0, 3870.0, 1354.0, 492.0, 196.0, 106.0, 64.0, 42.0, 28.0, 21.0, 10.0, 4.0, 8.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004486083984375, -0.004331529140472412, -0.004176974296569824, -0.004022419452667236, -0.0038678646087646484, -0.0037133097648620605, -0.0035587549209594727, -0.0034042000770568848, -0.003249645233154297, -0.003095090389251709, -0.002940535545349121, -0.002785980701446533, -0.0026314258575439453, -0.0024768710136413574, -0.0023223161697387695, -0.0021677613258361816, -0.0020132064819335938, -0.0018586516380310059, -0.001704096794128418, -0.00154954195022583, -0.0013949871063232422, -0.0012404322624206543, -0.0010858774185180664, -0.0009313225746154785, -0.0007767677307128906, -0.0006222128868103027, -0.00046765804290771484, -0.00031310319900512695, -0.00015854835510253906, -3.993511199951172e-06, 0.00015056133270263672, 0.0003051161766052246, 0.0004596710205078125, 0.0006142258644104004, 0.0007687807083129883, 0.0009233355522155762, 0.001077890396118164, 0.001232445240020752, 0.0013870000839233398, 0.0015415549278259277, 0.0016961097717285156, 0.0018506646156311035, 0.0020052194595336914, 0.0021597743034362793, 0.002314329147338867, 0.002468883991241455, 0.002623438835144043, 0.002777993679046631, 0.0029325485229492188, 0.0030871033668518066, 0.0032416582107543945, 0.0033962130546569824, 0.0035507678985595703, 0.003705322742462158, 0.003859877586364746, 0.004014432430267334, 0.004168987274169922, 0.00432354211807251, 0.004478096961975098, 0.0046326518058776855, 0.0047872066497802734, 0.004941761493682861, 0.005096316337585449, 0.005250871181488037, 0.005405426025390625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 9.0, 11.0, 28.0, 46.0, 58.0, 79.0, 106.0, 140.0, 129.0, 108.0, 86.0, 46.0, 40.0, 34.0, 20.0, 8.0, 10.0, 10.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007427215576171875, -0.007173478603363037, -0.006919741630554199, -0.006666004657745361, -0.0064122676849365234, -0.0061585307121276855, -0.005904793739318848, -0.00565105676651001, -0.005397319793701172, -0.005143582820892334, -0.004889845848083496, -0.004636108875274658, -0.00438237190246582, -0.004128634929656982, -0.0038748979568481445, -0.0036211609840393066, -0.0033674240112304688, -0.003113687038421631, -0.002859950065612793, -0.002606213092803955, -0.002352476119995117, -0.0020987391471862793, -0.0018450021743774414, -0.0015912652015686035, -0.0013375282287597656, -0.0010837912559509277, -0.0008300542831420898, -0.000576317310333252, -0.00032258033752441406, -6.884336471557617e-05, 0.00018489360809326172, 0.0004386305809020996, 0.0006923675537109375, 0.0009461045265197754, 0.0011998414993286133, 0.0014535784721374512, 0.001707315444946289, 0.001961052417755127, 0.002214789390563965, 0.0024685263633728027, 0.0027222633361816406, 0.0029760003089904785, 0.0032297372817993164, 0.0034834742546081543, 0.003737211227416992, 0.00399094820022583, 0.004244685173034668, 0.004498422145843506, 0.004752159118652344, 0.005005896091461182, 0.0052596330642700195, 0.005513370037078857, 0.005767107009887695, 0.006020843982696533, 0.006274580955505371, 0.006528317928314209, 0.006782054901123047, 0.007035791873931885, 0.007289528846740723, 0.0075432658195495605, 0.0077970027923583984, 0.008050739765167236, 0.008304476737976074, 0.008558213710784912, 0.00881195068359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 14.0, 15.0, 23.0, 45.0, 70.0, 128.0, 224.0, 398.0, 840.0, 1920.0, 5238.0, 17486.0, 90010.0, 3655546.0, 374765.0, 31616.0, 9429.0, 3482.0, 1412.0, 686.0, 339.0, 183.0, 135.0, 92.0, 65.0, 37.0, 23.0, 14.0, 10.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0050811767578125, -0.004915714263916016, -0.004750251770019531, -0.004584789276123047, -0.0044193267822265625, -0.004253864288330078, -0.004088401794433594, -0.003922939300537109, -0.003757476806640625, -0.0035920143127441406, -0.0034265518188476562, -0.003261089324951172, -0.0030956268310546875, -0.002930164337158203, -0.0027647018432617188, -0.0025992393493652344, -0.00243377685546875, -0.0022683143615722656, -0.0021028518676757812, -0.0019373893737792969, -0.0017719268798828125, -0.0016064643859863281, -0.0014410018920898438, -0.0012755393981933594, -0.001110076904296875, -0.0009446144104003906, -0.0007791519165039062, -0.0006136894226074219, -0.0004482269287109375, -0.0002827644348144531, -0.00011730194091796875, 4.8160552978515625e-05, 0.000213623046875, 0.0003790855407714844, 0.0005445480346679688, 0.0007100105285644531, 0.0008754730224609375, 0.0010409355163574219, 0.0012063980102539062, 0.0013718605041503906, 0.001537322998046875, 0.0017027854919433594, 0.0018682479858398438, 0.002033710479736328, 0.0021991729736328125, 0.002364635467529297, 0.0025300979614257812, 0.0026955604553222656, 0.00286102294921875, 0.0030264854431152344, 0.0031919479370117188, 0.003357410430908203, 0.0035228729248046875, 0.003688335418701172, 0.0038537979125976562, 0.004019260406494141, 0.004184722900390625, 0.004350185394287109, 0.004515647888183594, 0.004681110382080078, 0.0048465728759765625, 0.005012035369873047, 0.005177497863769531, 0.005342960357666016, 0.0055084228515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 5.0, 6.0, 8.0, 13.0, 19.0, 12.0, 26.0, 58.0, 136.0, 353.0, 960.0, 1305.0, 717.0, 235.0, 82.0, 35.0, 17.0, 11.0, 13.0, 10.0, 10.0, 7.0, 13.0, 3.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006290435791015625, -0.006067931652069092, -0.005845427513122559, -0.005622923374176025, -0.005400419235229492, -0.005177915096282959, -0.004955410957336426, -0.004732906818389893, -0.004510402679443359, -0.004287898540496826, -0.004065394401550293, -0.0038428902626037598, -0.0036203861236572266, -0.0033978819847106934, -0.00317537784576416, -0.002952873706817627, -0.0027303695678710938, -0.0025078654289245605, -0.0022853612899780273, -0.002062857151031494, -0.001840353012084961, -0.0016178488731384277, -0.0013953447341918945, -0.0011728405952453613, -0.0009503364562988281, -0.0007278323173522949, -0.0005053281784057617, -0.0002828240394592285, -6.031990051269531e-05, 0.0001621842384338379, 0.0003846883773803711, 0.0006071925163269043, 0.0008296966552734375, 0.0010522007942199707, 0.001274704933166504, 0.0014972090721130371, 0.0017197132110595703, 0.0019422173500061035, 0.0021647214889526367, 0.00238722562789917, 0.002609729766845703, 0.0028322339057922363, 0.0030547380447387695, 0.0032772421836853027, 0.003499746322631836, 0.003722250461578369, 0.003944754600524902, 0.0041672587394714355, 0.004389762878417969, 0.004612267017364502, 0.004834771156311035, 0.005057275295257568, 0.0052797794342041016, 0.005502283573150635, 0.005724787712097168, 0.005947291851043701, 0.006169795989990234, 0.006392300128936768, 0.006614804267883301, 0.006837308406829834, 0.007059812545776367, 0.0072823166847229, 0.007504820823669434, 0.007727324962615967, 0.0079498291015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 7.0, 34.0, 58.0, 140.0, 223.0, 236.0, 154.0, 57.0, 41.0, 9.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046362124383449554, -0.04495404660701752, -0.04354596510529518, -0.042137887328863144, -0.04072980582714081, -0.03932172805070877, -0.03791365027427673, -0.036505572497844696, -0.03509749099612236, -0.03368941321969032, -0.03228133171796799, -0.03087325394153595, -0.029465174302458763, -0.028057094663381577, -0.02664901688694954, -0.025240937247872353, -0.023832857608795166, -0.02242477796971798, -0.021016698330640793, -0.019608620554208755, -0.01820054091513157, -0.016792461276054382, -0.01538438256829977, -0.013976303860545158, -0.012568224221467972, -0.011160144582390785, -0.009752065874636173, -0.008343987166881561, -0.006935907527804375, -0.005527828354388475, -0.004119749180972576, -0.002711670473217964, -0.0013035908341407776, 0.00010448833927512169, 0.001512567512691021, 0.0029206466861069202, 0.0043287258595228195, 0.005736805032938719, 0.007144884206354618, 0.00855296291410923, 0.009961042553186417, 0.011369122192263603, 0.012777200900018215, 0.014185279607772827, 0.015593359246850014, 0.0170014388859272, 0.018409516662359238, 0.019817596301436424, 0.02122567594051361, 0.022633755579590797, 0.024041835218667984, 0.02544991299510002, 0.026857992634177208, 0.028266072273254395, 0.029674150049686432, 0.03108222968876362, 0.032490309327840805, 0.03389838710427284, 0.03530646860599518, 0.036714546382427216, 0.03812262415885925, 0.03953070566058159, 0.040938783437013626, 0.04234686493873596, 0.043754942715168]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 4.0, 7.0, 9.0, 11.0, 8.0, 8.0, 18.0, 17.0, 29.0, 31.0, 32.0, 31.0, 39.0, 39.0, 36.0, 46.0, 37.0, 51.0, 56.0, 47.0, 50.0, 47.0, 33.0, 40.0, 34.0, 44.0, 27.0, 24.0, 37.0, 17.0, 10.0, 9.0, 20.0, 7.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.023339927196502686, -0.022639479488134384, -0.021939033642411232, -0.02123858779668808, -0.02053814008831978, -0.019837692379951477, -0.019137246534228325, -0.018436800688505173, -0.01773635298013687, -0.01703590527176857, -0.016335459426045418, -0.015635013580322266, -0.014934565871953964, -0.014234119094908237, -0.01353367231786251, -0.012833225540816784, -0.012132778763771057, -0.01143233198672533, -0.010731885209679604, -0.010031438432633877, -0.00933099165558815, -0.008630544878542423, -0.007930098101496696, -0.00722965132445097, -0.006529204547405243, -0.005828757770359516, -0.005128310993313789, -0.004427864216268063, -0.003727417439222336, -0.003026970662176609, -0.0023265238851308823, -0.0016260771080851555, -0.0009256303310394287, -0.00022518355399370193, 0.00047526322305202484, 0.0011757100000977516, 0.0018761567771434784, 0.002576603554189205, 0.003277050331234932, 0.003977497108280659, 0.0046779438853263855, 0.005378390662372112, 0.006078837439417839, 0.006779284216463566, 0.007479730993509293, 0.00818017777055502, 0.008880624547600746, 0.009581071324646473, 0.0102815181016922, 0.010981964878737926, 0.011682411655783653, 0.01238285843282938, 0.013083305209875107, 0.013783751986920834, 0.01448419876396656, 0.015184645541012287, 0.015885092318058014, 0.016585540026426315, 0.017285985872149467, 0.01798643171787262, 0.01868687942624092, 0.019387327134609222, 0.020087772980332375, 0.020788218826055527, 0.021488666534423828]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 9.0, 20.0, 26.0, 24.0, 40.0, 57.0, 84.0, 126.0, 201.0, 356.0, 593.0, 1006.0, 1925.0, 3839.0, 8772.0, 24460.0, 92561.0, 441373.0, 363249.0, 74155.0, 20746.0, 7617.0, 3453.0, 1582.0, 877.0, 525.0, 294.0, 196.0, 139.0, 79.0, 53.0, 20.0, 26.0, 20.0, 14.0, 7.0, 7.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0053863525390625, -0.00520634651184082, -0.005026340484619141, -0.004846334457397461, -0.004666328430175781, -0.0044863224029541016, -0.004306316375732422, -0.004126310348510742, -0.0039463043212890625, -0.003766298294067383, -0.003586292266845703, -0.0034062862396240234, -0.0032262802124023438, -0.003046274185180664, -0.0028662681579589844, -0.0026862621307373047, -0.002506256103515625, -0.0023262500762939453, -0.0021462440490722656, -0.001966238021850586, -0.0017862319946289062, -0.0016062259674072266, -0.0014262199401855469, -0.0012462139129638672, -0.0010662078857421875, -0.0008862018585205078, -0.0007061958312988281, -0.0005261898040771484, -0.00034618377685546875, -0.00016617774963378906, 1.3828277587890625e-05, 0.0001938343048095703, 0.00037384033203125, 0.0005538463592529297, 0.0007338523864746094, 0.0009138584136962891, 0.0010938644409179688, 0.0012738704681396484, 0.0014538764953613281, 0.0016338825225830078, 0.0018138885498046875, 0.001993894577026367, 0.002173900604248047, 0.0023539066314697266, 0.0025339126586914062, 0.002713918685913086, 0.0028939247131347656, 0.0030739307403564453, 0.003253936767578125, 0.0034339427947998047, 0.0036139488220214844, 0.003793954849243164, 0.003973960876464844, 0.0041539669036865234, 0.004333972930908203, 0.004513978958129883, 0.0046939849853515625, 0.004873991012573242, 0.005053997039794922, 0.0052340030670166016, 0.005414009094238281, 0.005594015121459961, 0.005774021148681641, 0.00595402717590332, 0.006134033203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 23.0, 34.0, 45.0, 76.0, 77.0, 122.0, 146.0, 121.0, 102.0, 70.0, 45.0, 33.0, 28.0, 15.0, 9.0, 7.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00734710693359375, -0.007092714309692383, -0.006838321685791016, -0.0065839290618896484, -0.006329536437988281, -0.006075143814086914, -0.005820751190185547, -0.00556635856628418, -0.0053119659423828125, -0.005057573318481445, -0.004803180694580078, -0.004548788070678711, -0.004294395446777344, -0.0040400028228759766, -0.0037856101989746094, -0.003531217575073242, -0.003276824951171875, -0.003022432327270508, -0.0027680397033691406, -0.0025136470794677734, -0.0022592544555664062, -0.002004861831665039, -0.0017504692077636719, -0.0014960765838623047, -0.0012416839599609375, -0.0009872913360595703, -0.0007328987121582031, -0.00047850608825683594, -0.00022411346435546875, 3.0279159545898438e-05, 0.0002846717834472656, 0.0005390644073486328, 0.00079345703125, 0.0010478496551513672, 0.0013022422790527344, 0.0015566349029541016, 0.0018110275268554688, 0.002065420150756836, 0.002319812774658203, 0.0025742053985595703, 0.0028285980224609375, 0.0030829906463623047, 0.003337383270263672, 0.003591775894165039, 0.0038461685180664062, 0.0041005611419677734, 0.004354953765869141, 0.004609346389770508, 0.004863739013671875, 0.005118131637573242, 0.005372524261474609, 0.0056269168853759766, 0.005881309509277344, 0.006135702133178711, 0.006390094757080078, 0.006644487380981445, 0.0068988800048828125, 0.00715327262878418, 0.007407665252685547, 0.007662057876586914, 0.007916450500488281, 0.008170843124389648, 0.008425235748291016, 0.008679628372192383, 0.00893402099609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 11.0, 5.0, 8.0, 9.0, 13.0, 20.0, 17.0, 24.0, 33.0, 55.0, 61.0, 89.0, 103.0, 154.0, 231.0, 298.0, 514.0, 821.0, 1668.0, 4014.0, 14785.0, 92369.0, 679633.0, 213660.0, 28349.0, 6279.0, 2154.0, 1079.0, 687.0, 395.0, 272.0, 202.0, 144.0, 86.0, 80.0, 67.0, 48.0, 31.0, 28.0, 18.0, 9.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.01020050048828125, -0.009914755821228027, -0.009629011154174805, -0.009343266487121582, -0.00905752182006836, -0.008771777153015137, -0.008486032485961914, -0.008200287818908691, -0.007914543151855469, -0.007628798484802246, -0.0073430538177490234, -0.007057309150695801, -0.006771564483642578, -0.0064858198165893555, -0.006200075149536133, -0.00591433048248291, -0.0056285858154296875, -0.005342841148376465, -0.005057096481323242, -0.0047713518142700195, -0.004485607147216797, -0.004199862480163574, -0.0039141178131103516, -0.003628373146057129, -0.0033426284790039062, -0.0030568838119506836, -0.002771139144897461, -0.0024853944778442383, -0.0021996498107910156, -0.001913905143737793, -0.0016281604766845703, -0.0013424158096313477, -0.001056671142578125, -0.0007709264755249023, -0.0004851818084716797, -0.00019943714141845703, 8.630752563476562e-05, 0.0003720521926879883, 0.0006577968597412109, 0.0009435415267944336, 0.0012292861938476562, 0.001515030860900879, 0.0018007755279541016, 0.0020865201950073242, 0.002372264862060547, 0.0026580095291137695, 0.002943754196166992, 0.003229498863220215, 0.0035152435302734375, 0.00380098819732666, 0.004086732864379883, 0.0043724775314331055, 0.004658222198486328, 0.004943966865539551, 0.0052297115325927734, 0.005515456199645996, 0.005801200866699219, 0.006086945533752441, 0.006372690200805664, 0.006658434867858887, 0.006944179534912109, 0.007229924201965332, 0.007515668869018555, 0.007801413536071777, 0.008087158203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 2.0, 4.0, 8.0, 7.0, 11.0, 9.0, 7.0, 9.0, 12.0, 17.0, 16.0, 24.0, 34.0, 33.0, 28.0, 34.0, 36.0, 36.0, 50.0, 48.0, 32.0, 45.0, 35.0, 47.0, 42.0, 41.0, 38.0, 40.0, 42.0, 28.0, 26.0, 26.0, 17.0, 21.0, 16.0, 11.0, 16.0, 13.0, 7.0, 5.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013458251953125, -0.013055801391601562, -0.012653350830078125, -0.012250900268554688, -0.01184844970703125, -0.011445999145507812, -0.011043548583984375, -0.010641098022460938, -0.0102386474609375, -0.009836196899414062, -0.009433746337890625, -0.009031295776367188, -0.00862884521484375, -0.008226394653320312, -0.007823944091796875, -0.0074214935302734375, -0.00701904296875, -0.0066165924072265625, -0.006214141845703125, -0.0058116912841796875, -0.00540924072265625, -0.0050067901611328125, -0.004604339599609375, -0.0042018890380859375, -0.0037994384765625, -0.0033969879150390625, -0.002994537353515625, -0.0025920867919921875, -0.00218963623046875, -0.0017871856689453125, -0.001384735107421875, -0.0009822845458984375, -0.000579833984375, -0.0001773834228515625, 0.000225067138671875, 0.0006275177001953125, 0.00102996826171875, 0.0014324188232421875, 0.001834869384765625, 0.0022373199462890625, 0.0026397705078125, 0.0030422210693359375, 0.003444671630859375, 0.0038471221923828125, 0.00424957275390625, 0.0046520233154296875, 0.005054473876953125, 0.0054569244384765625, 0.005859375, 0.0062618255615234375, 0.006664276123046875, 0.0070667266845703125, 0.00746917724609375, 0.007871627807617188, 0.008274078369140625, 0.008676528930664062, 0.0090789794921875, 0.009481430053710938, 0.009883880615234375, 0.010286331176757812, 0.01068878173828125, 0.011091232299804688, 0.011493682861328125, 0.011896133422851562, 0.012298583984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 5.0, 11.0, 15.0, 18.0, 31.0, 32.0, 57.0, 77.0, 158.0, 304.0, 491.0, 1044.0, 2156.0, 5361.0, 16416.0, 68258.0, 506544.0, 358539.0, 63820.0, 15737.0, 5242.0, 2087.0, 967.0, 483.0, 254.0, 157.0, 104.0, 59.0, 40.0, 30.0, 15.0, 13.0, 11.0, 11.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001148223876953125, -0.0011071860790252686, -0.0010661482810974121, -0.0010251104831695557, -0.0009840726852416992, -0.0009430348873138428, -0.0009019970893859863, -0.0008609592914581299, -0.0008199214935302734, -0.000778883695602417, -0.0007378458976745605, -0.0006968080997467041, -0.0006557703018188477, -0.0006147325038909912, -0.0005736947059631348, -0.0005326569080352783, -0.0004916191101074219, -0.00045058131217956543, -0.000409543514251709, -0.00036850571632385254, -0.0003274679183959961, -0.00028643012046813965, -0.0002453923225402832, -0.00020435452461242676, -0.0001633167266845703, -0.00012227892875671387, -8.124113082885742e-05, -4.0203332901000977e-05, 8.344650268554688e-07, 4.1872262954711914e-05, 8.291006088256836e-05, 0.0001239478588104248, 0.00016498565673828125, 0.0002060234546661377, 0.00024706125259399414, 0.0002880990505218506, 0.00032913684844970703, 0.0003701746463775635, 0.0004112124443054199, 0.00045225024223327637, 0.0004932880401611328, 0.0005343258380889893, 0.0005753636360168457, 0.0006164014339447021, 0.0006574392318725586, 0.000698477029800415, 0.0007395148277282715, 0.0007805526256561279, 0.0008215904235839844, 0.0008626282215118408, 0.0009036660194396973, 0.0009447038173675537, 0.0009857416152954102, 0.0010267794132232666, 0.001067817211151123, 0.0011088550090789795, 0.001149892807006836, 0.0011909306049346924, 0.0012319684028625488, 0.0012730062007904053, 0.0013140439987182617, 0.0013550817966461182, 0.0013961195945739746, 0.001437157392501831, 0.0014781951904296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 12.0, 9.0, 9.0, 16.0, 11.0, 12.0, 29.0, 20.0, 30.0, 27.0, 30.0, 47.0, 35.0, 60.0, 56.0, 41.0, 74.0, 45.0, 67.0, 75.0, 35.0, 56.0, 26.0, 39.0, 35.0, 20.0, 8.0, 14.0, 19.0, 7.0, 8.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-06, -4.374422132968903e-06, -4.218891263008118e-06, -4.063360393047333e-06, -3.907829523086548e-06, -3.752298653125763e-06, -3.596767783164978e-06, -3.441236913204193e-06, -3.285706043243408e-06, -3.1301751732826233e-06, -2.9746443033218384e-06, -2.8191134333610535e-06, -2.6635825634002686e-06, -2.5080516934394836e-06, -2.3525208234786987e-06, -2.196989953517914e-06, -2.041459083557129e-06, -1.885928213596344e-06, -1.730397343635559e-06, -1.5748664736747742e-06, -1.4193356037139893e-06, -1.2638047337532043e-06, -1.1082738637924194e-06, -9.527429938316345e-07, -7.972121238708496e-07, -6.416812539100647e-07, -4.861503839492798e-07, -3.3061951398849487e-07, -1.7508864402770996e-07, -1.955777406692505e-08, 1.3597309589385986e-07, 2.915039658546448e-07, 4.470348358154297e-07, 6.025657057762146e-07, 7.580965757369995e-07, 9.136274456977844e-07, 1.0691583156585693e-06, 1.2246891856193542e-06, 1.3802200555801392e-06, 1.535750925540924e-06, 1.691281795501709e-06, 1.846812665462494e-06, 2.002343535423279e-06, 2.1578744053840637e-06, 2.3134052753448486e-06, 2.4689361453056335e-06, 2.6244670152664185e-06, 2.7799978852272034e-06, 2.9355287551879883e-06, 3.091059625148773e-06, 3.246590495109558e-06, 3.402121365070343e-06, 3.557652235031128e-06, 3.713183104991913e-06, 3.868713974952698e-06, 4.024244844913483e-06, 4.179775714874268e-06, 4.3353065848350525e-06, 4.490837454795837e-06, 4.646368324756622e-06, 4.801899194717407e-06, 4.957430064678192e-06, 5.112960934638977e-06, 5.268491804599762e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 5.0, 9.0, 9.0, 19.0, 35.0, 36.0, 49.0, 73.0, 111.0, 200.0, 303.0, 526.0, 1106.0, 2675.0, 8850.0, 43072.0, 317762.0, 591945.0, 63822.0, 11787.0, 3329.0, 1261.0, 619.0, 350.0, 194.0, 126.0, 68.0, 55.0, 45.0, 39.0, 14.0, 12.0, 7.0, 12.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001293182373046875, -0.0012454688549041748, -0.0011977553367614746, -0.0011500418186187744, -0.0011023283004760742, -0.001054614782333374, -0.0010069012641906738, -0.0009591877460479736, -0.0009114742279052734, -0.0008637607097625732, -0.000816047191619873, -0.0007683336734771729, -0.0007206201553344727, -0.0006729066371917725, -0.0006251931190490723, -0.0005774796009063721, -0.0005297660827636719, -0.0004820525646209717, -0.0004343390464782715, -0.0003866255283355713, -0.0003389120101928711, -0.0002911984920501709, -0.0002434849739074707, -0.0001957714557647705, -0.0001480579376220703, -0.00010034441947937012, -5.263090133666992e-05, -4.9173831939697266e-06, 4.279613494873047e-05, 9.050965309143066e-05, 0.00013822317123413086, 0.00018593668937683105, 0.00023365020751953125, 0.00028136372566223145, 0.00032907724380493164, 0.00037679076194763184, 0.00042450428009033203, 0.0004722177982330322, 0.0005199313163757324, 0.0005676448345184326, 0.0006153583526611328, 0.000663071870803833, 0.0007107853889465332, 0.0007584989070892334, 0.0008062124252319336, 0.0008539259433746338, 0.000901639461517334, 0.0009493529796600342, 0.0009970664978027344, 0.0010447800159454346, 0.0010924935340881348, 0.001140207052230835, 0.0011879205703735352, 0.0012356340885162354, 0.0012833476066589355, 0.0013310611248016357, 0.001378774642944336, 0.0014264881610870361, 0.0014742016792297363, 0.0015219151973724365, 0.0015696287155151367, 0.001617342233657837, 0.0016650557518005371, 0.0017127692699432373, 0.0017604827880859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 11.0, 19.0, 19.0, 21.0, 34.0, 42.0, 64.0, 67.0, 72.0, 82.0, 93.0, 78.0, 84.0, 57.0, 57.0, 39.0, 34.0, 20.0, 21.0, 14.0, 13.0, 18.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002040863037109375, -0.00197407603263855, -0.0019072890281677246, -0.0018405020236968994, -0.0017737150192260742, -0.001706928014755249, -0.0016401410102844238, -0.0015733540058135986, -0.0015065670013427734, -0.0014397799968719482, -0.001372992992401123, -0.0013062059879302979, -0.0012394189834594727, -0.0011726319789886475, -0.0011058449745178223, -0.001039057970046997, -0.0009722709655761719, -0.0009054839611053467, -0.0008386969566345215, -0.0007719099521636963, -0.0007051229476928711, -0.0006383359432220459, -0.0005715489387512207, -0.0005047619342803955, -0.0004379749298095703, -0.0003711879253387451, -0.0003044009208679199, -0.00023761391639709473, -0.00017082691192626953, -0.00010403990745544434, -3.725290298461914e-05, 2.9534101486206055e-05, 9.632110595703125e-05, 0.00016310811042785645, 0.00022989511489868164, 0.00029668211936950684, 0.00036346912384033203, 0.0004302561283111572, 0.0004970431327819824, 0.0005638301372528076, 0.0006306171417236328, 0.000697404146194458, 0.0007641911506652832, 0.0008309781551361084, 0.0008977651596069336, 0.0009645521640777588, 0.001031339168548584, 0.0010981261730194092, 0.0011649131774902344, 0.0012317001819610596, 0.0012984871864318848, 0.00136527419090271, 0.0014320611953735352, 0.0014988481998443604, 0.0015656352043151855, 0.0016324222087860107, 0.001699209213256836, 0.0017659962177276611, 0.0018327832221984863, 0.0018995702266693115, 0.0019663572311401367, 0.002033144235610962, 0.002099931240081787, 0.0021667182445526123, 0.0022335052490234375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 14.0, 24.0, 59.0, 131.0, 237.0, 297.0, 130.0, 46.0, 29.0, 12.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062259502708911896, -0.059788286685943604, -0.05731707066297531, -0.05484585091471672, -0.05237463489174843, -0.049903418868780136, -0.047432199120521545, -0.04496098309755325, -0.04248976707458496, -0.04001855105161667, -0.037547335028648376, -0.035076115280389786, -0.032604899257421494, -0.0301336832344532, -0.02766246534883976, -0.02519124746322632, -0.022720031440258026, -0.020248815417289734, -0.017777597531676292, -0.015306380577385426, -0.012835163623094559, -0.010363946668803692, -0.007892729714512825, -0.0054215118288993835, -0.0029502958059310913, -0.00047907885164022446, 0.0019921381026506424, 0.004463355056941509, 0.006934572011232376, 0.009405788965523243, 0.01187700591981411, 0.014348223805427551, 0.016819432377815247, 0.01929064840078354, 0.02176186628639698, 0.024233084172010422, 0.026704300194978714, 0.029175516217947006, 0.0316467359662056, 0.03411795198917389, 0.03658916801214218, 0.039060384035110474, 0.041531600058078766, 0.04400281980633736, 0.04647403582930565, 0.04894525185227394, 0.05141647160053253, 0.053887687623500824, 0.056358903646469116, 0.05883011966943741, 0.0613013356924057, 0.06377255171537399, 0.06624376773834229, 0.06871499121189117, 0.07118620723485947, 0.07365742325782776, 0.07612863928079605, 0.07859985530376434, 0.08107107132673264, 0.08354228734970093, 0.08601351082324982, 0.08848472684621811, 0.0909559428691864, 0.0934271588921547, 0.09589837491512299]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 8.0, 3.0, 5.0, 10.0, 16.0, 8.0, 15.0, 18.0, 19.0, 17.0, 30.0, 26.0, 21.0, 29.0, 37.0, 47.0, 58.0, 64.0, 72.0, 93.0, 61.0, 51.0, 38.0, 36.0, 34.0, 34.0, 20.0, 20.0, 16.0, 12.0, 16.0, 11.0, 8.0, 7.0, 8.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06331872940063477, -0.0614977590739727, -0.05967678874731064, -0.057855818420648575, -0.05603484809398651, -0.05421387776732445, -0.052392907440662384, -0.05057193711400032, -0.04875096678733826, -0.04692999646067619, -0.04510902613401413, -0.043288055807352066, -0.04146708548069, -0.03964611515402794, -0.037825144827365875, -0.03600417450070381, -0.03418320417404175, -0.032362233847379684, -0.03054126352071762, -0.028720293194055557, -0.026899322867393494, -0.02507835254073143, -0.023257382214069366, -0.021436411887407303, -0.01961544156074524, -0.017794471234083176, -0.015973500907421112, -0.014152530580759048, -0.012331560254096985, -0.010510589927434921, -0.008689619600772858, -0.006868649274110794, -0.0050476789474487305, -0.003226708620786667, -0.0014057382941246033, 0.00041523203253746033, 0.002236202359199524, 0.0040571726858615875, 0.005878143012523651, 0.007699113339185715, 0.009520083665847778, 0.011341053992509842, 0.013162024319171906, 0.014982994645833969, 0.016803964972496033, 0.018624935299158096, 0.02044590562582016, 0.022266875952482224, 0.024087846279144287, 0.02590881660580635, 0.027729786932468414, 0.029550757259130478, 0.03137172758579254, 0.033192697912454605, 0.03501366823911667, 0.03683463856577873, 0.038655608892440796, 0.04047657921910286, 0.04229754954576492, 0.04411851987242699, 0.04593949019908905, 0.047760460525751114, 0.04958143085241318, 0.05140240117907524, 0.053223371505737305]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 2.0, 13.0, 5.0, 19.0, 45.0, 41.0, 85.0, 160.0, 299.0, 698.0, 1813.0, 4740.0, 15642.0, 97897.0, 2179245.0, 1789983.0, 84968.0, 12716.0, 3573.0, 1348.0, 436.0, 228.0, 113.0, 57.0, 48.0, 33.0, 18.0, 15.0, 12.0, 7.0, 7.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004108428955078125, -0.0039560794830322266, -0.003803730010986328, -0.0036513805389404297, -0.0034990310668945312, -0.003346681594848633, -0.0031943321228027344, -0.003041982650756836, -0.0028896331787109375, -0.002737283706665039, -0.0025849342346191406, -0.002432584762573242, -0.0022802352905273438, -0.0021278858184814453, -0.001975536346435547, -0.0018231868743896484, -0.00167083740234375, -0.0015184879302978516, -0.0013661384582519531, -0.0012137889862060547, -0.0010614395141601562, -0.0009090900421142578, -0.0007567405700683594, -0.0006043910980224609, -0.0004520416259765625, -0.00029969215393066406, -0.00014734268188476562, 5.0067901611328125e-06, 0.00015735626220703125, 0.0003097057342529297, 0.0004620552062988281, 0.0006144046783447266, 0.000766754150390625, 0.0009191036224365234, 0.0010714530944824219, 0.0012238025665283203, 0.0013761520385742188, 0.0015285015106201172, 0.0016808509826660156, 0.001833200454711914, 0.0019855499267578125, 0.002137899398803711, 0.0022902488708496094, 0.002442598342895508, 0.0025949478149414062, 0.0027472972869873047, 0.002899646759033203, 0.0030519962310791016, 0.003204345703125, 0.0033566951751708984, 0.003509044647216797, 0.0036613941192626953, 0.0038137435913085938, 0.003966093063354492, 0.004118442535400391, 0.004270792007446289, 0.0044231414794921875, 0.004575490951538086, 0.004727840423583984, 0.004880189895629883, 0.005032539367675781, 0.00518488883972168, 0.005337238311767578, 0.0054895877838134766, 0.005641937255859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 13.0, 20.0, 30.0, 52.0, 67.0, 92.0, 104.0, 138.0, 132.0, 103.0, 84.0, 49.0, 35.0, 26.0, 11.0, 7.0, 10.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007305145263671875, -0.007050931453704834, -0.006796717643737793, -0.006542503833770752, -0.006288290023803711, -0.00603407621383667, -0.005779862403869629, -0.005525648593902588, -0.005271434783935547, -0.005017220973968506, -0.004763007164001465, -0.004508793354034424, -0.004254579544067383, -0.004000365734100342, -0.0037461519241333008, -0.0034919381141662598, -0.0032377243041992188, -0.0029835104942321777, -0.0027292966842651367, -0.0024750828742980957, -0.0022208690643310547, -0.0019666552543640137, -0.0017124414443969727, -0.0014582276344299316, -0.0012040138244628906, -0.0009498000144958496, -0.0006955862045288086, -0.0004413723945617676, -0.00018715858459472656, 6.705522537231445e-05, 0.00032126903533935547, 0.0005754828453063965, 0.0008296966552734375, 0.0010839104652404785, 0.0013381242752075195, 0.0015923380851745605, 0.0018465518951416016, 0.0021007657051086426, 0.0023549795150756836, 0.0026091933250427246, 0.0028634071350097656, 0.0031176209449768066, 0.0033718347549438477, 0.0036260485649108887, 0.0038802623748779297, 0.004134476184844971, 0.004388689994812012, 0.004642903804779053, 0.004897117614746094, 0.005151331424713135, 0.005405545234680176, 0.005659759044647217, 0.005913972854614258, 0.006168186664581299, 0.00642240047454834, 0.006676614284515381, 0.006930828094482422, 0.007185041904449463, 0.007439255714416504, 0.007693469524383545, 0.007947683334350586, 0.008201897144317627, 0.008456110954284668, 0.008710324764251709, 0.00896453857421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 15.0, 22.0, 42.0, 67.0, 162.0, 309.0, 571.0, 1288.0, 4493.0, 39978.0, 3992024.0, 143401.0, 8374.0, 1905.0, 743.0, 378.0, 196.0, 122.0, 56.0, 51.0, 22.0, 12.0, 10.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00928497314453125, -0.009009122848510742, -0.008733272552490234, -0.008457422256469727, -0.008181571960449219, -0.007905721664428711, -0.007629871368408203, -0.007354021072387695, -0.0070781707763671875, -0.00680232048034668, -0.006526470184326172, -0.006250619888305664, -0.005974769592285156, -0.0056989192962646484, -0.005423069000244141, -0.005147218704223633, -0.004871368408203125, -0.004595518112182617, -0.004319667816162109, -0.0040438175201416016, -0.0037679672241210938, -0.003492116928100586, -0.003216266632080078, -0.0029404163360595703, -0.0026645660400390625, -0.0023887157440185547, -0.002112865447998047, -0.001837015151977539, -0.0015611648559570312, -0.0012853145599365234, -0.0010094642639160156, -0.0007336139678955078, -0.000457763671875, -0.0001819133758544922, 9.393692016601562e-05, 0.00036978721618652344, 0.0006456375122070312, 0.0009214878082275391, 0.0011973381042480469, 0.0014731884002685547, 0.0017490386962890625, 0.0020248889923095703, 0.002300739288330078, 0.002576589584350586, 0.0028524398803710938, 0.0031282901763916016, 0.0034041404724121094, 0.003679990768432617, 0.003955841064453125, 0.004231691360473633, 0.004507541656494141, 0.0047833919525146484, 0.005059242248535156, 0.005335092544555664, 0.005610942840576172, 0.00588679313659668, 0.0061626434326171875, 0.006438493728637695, 0.006714344024658203, 0.006990194320678711, 0.007266044616699219, 0.0075418949127197266, 0.007817745208740234, 0.008093595504760742, 0.00836944580078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 9.0, 15.0, 31.0, 141.0, 665.0, 1562.0, 1166.0, 308.0, 75.0, 34.0, 18.0, 21.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00934600830078125, -0.009009361267089844, -0.008672714233398438, -0.008336067199707031, -0.007999420166015625, -0.007662773132324219, -0.0073261260986328125, -0.006989479064941406, -0.00665283203125, -0.006316184997558594, -0.0059795379638671875, -0.005642890930175781, -0.005306243896484375, -0.004969596862792969, -0.0046329498291015625, -0.004296302795410156, -0.00395965576171875, -0.0036230087280273438, -0.0032863616943359375, -0.0029497146606445312, -0.002613067626953125, -0.0022764205932617188, -0.0019397735595703125, -0.0016031265258789062, -0.0012664794921875, -0.0009298324584960938, -0.0005931854248046875, -0.00025653839111328125, 8.0108642578125e-05, 0.00041675567626953125, 0.0007534027099609375, 0.0010900497436523438, 0.00142669677734375, 0.0017633438110351562, 0.0020999908447265625, 0.0024366378784179688, 0.002773284912109375, 0.0031099319458007812, 0.0034465789794921875, 0.0037832260131835938, 0.004119873046875, 0.004456520080566406, 0.0047931671142578125, 0.005129814147949219, 0.005466461181640625, 0.005803108215332031, 0.0061397552490234375, 0.006476402282714844, 0.00681304931640625, 0.007149696350097656, 0.0074863433837890625, 0.007822990417480469, 0.008159637451171875, 0.008496284484863281, 0.008832931518554688, 0.009169578552246094, 0.0095062255859375, 0.009842872619628906, 0.010179519653320312, 0.010516166687011719, 0.010852813720703125, 0.011189460754394531, 0.011526107788085938, 0.011862754821777344, 0.01219940185546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 12.0, 72.0, 310.0, 428.0, 124.0, 25.0, 16.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05934443697333336, -0.056237686425447464, -0.05313093960285187, -0.05002418905496597, -0.04691743850708008, -0.04381069168448448, -0.04070394113659859, -0.03759719431400299, -0.034490443766117096, -0.0313836932182312, -0.028276946395635605, -0.02517019584774971, -0.022063447162508965, -0.01895669847726822, -0.015849947929382324, -0.012743199244141579, -0.009636450558900833, -0.0065297014079988, -0.0034229522570967674, -0.00031620264053344727, 0.0027905460447072983, 0.005897294729948044, 0.009004045277833939, 0.012110793963074684, 0.01521754264831543, 0.018324291333556175, 0.02143104001879692, 0.024537790566682816, 0.02764453925192356, 0.030751287937164307, 0.0338580384850502, 0.036964789032936096, 0.040071532130241394, 0.04317828267812729, 0.046285029500722885, 0.04939178004860878, 0.052498526871204376, 0.05560527741909027, 0.058712027966976166, 0.06181877851486206, 0.06492552161216736, 0.06803227216005325, 0.07113902270793915, 0.07424576580524445, 0.07735251635313034, 0.08045926690101624, 0.08356601744890213, 0.08667276799678802, 0.08977951854467392, 0.09288626909255981, 0.09599301964044571, 0.0990997701883316, 0.1022065132856369, 0.1053132638335228, 0.10842001438140869, 0.11152676492929459, 0.11463351547718048, 0.11774026602506638, 0.12084701657295227, 0.12395375967025757, 0.12706051766872406, 0.13016726076602936, 0.13327401876449585, 0.13638076186180115, 0.13948750495910645]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 4.0, 9.0, 7.0, 8.0, 9.0, 9.0, 12.0, 13.0, 31.0, 28.0, 23.0, 25.0, 26.0, 25.0, 30.0, 35.0, 43.0, 40.0, 48.0, 53.0, 44.0, 47.0, 50.0, 42.0, 47.0, 36.0, 38.0, 33.0, 28.0, 15.0, 21.0, 25.0, 15.0, 10.0, 17.0, 12.0, 7.0, 8.0, 8.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020757019519805908, -0.020089566707611084, -0.01942211575806141, -0.018754664808511734, -0.01808721199631691, -0.017419759184122086, -0.01675230823457241, -0.016084857285022736, -0.015417404472827911, -0.014749952591955662, -0.014082500711083412, -0.013415048830211163, -0.012747596949338913, -0.012080145068466663, -0.011412693187594414, -0.010745241306722164, -0.010077789425849915, -0.009410337544977665, -0.008742885664105415, -0.008075433783233166, -0.007407981902360916, -0.0067405300214886665, -0.006073078140616417, -0.005405626259744167, -0.004738174378871918, -0.004070722497999668, -0.0034032706171274185, -0.002735818736255169, -0.0020683668553829193, -0.0014009149745106697, -0.0007334630936384201, -6.60112127661705e-05, 0.0006014406681060791, 0.0012688925489783287, 0.0019363444298505783, 0.002603796310722828, 0.0032712481915950775, 0.003938700072467327, 0.004606151953339577, 0.005273603834211826, 0.005941055715084076, 0.0066085075959563255, 0.007275959476828575, 0.007943411357700825, 0.008610863238573074, 0.009278315119445324, 0.009945767000317574, 0.010613218881189823, 0.011280670762062073, 0.011948122642934322, 0.012615574523806572, 0.013283026404678822, 0.013950478285551071, 0.01461793016642332, 0.01528538204729557, 0.015952832996845245, 0.01662028580904007, 0.017287738621234894, 0.01795518957078457, 0.018622640520334244, 0.019290093332529068, 0.019957546144723892, 0.020624997094273567, 0.021292448043823242, 0.021959900856018066]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 2.0, 7.0, 5.0, 13.0, 9.0, 17.0, 19.0, 37.0, 36.0, 66.0, 77.0, 113.0, 165.0, 258.0, 339.0, 556.0, 915.0, 1493.0, 2569.0, 4973.0, 10781.0, 26944.0, 78453.0, 238079.0, 392982.0, 187874.0, 60600.0, 21765.0, 9061.0, 4294.0, 2247.0, 1330.0, 808.0, 529.0, 334.0, 228.0, 150.0, 105.0, 91.0, 63.0, 48.0, 28.0, 23.0, 16.0, 15.0, 10.0, 13.0, 6.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0037708282470703125, -0.0036506950855255127, -0.003530561923980713, -0.003410428762435913, -0.0032902956008911133, -0.0031701624393463135, -0.0030500292778015137, -0.002929896116256714, -0.002809762954711914, -0.0026896297931671143, -0.0025694966316223145, -0.0024493634700775146, -0.002329230308532715, -0.002209097146987915, -0.0020889639854431152, -0.0019688308238983154, -0.0018486976623535156, -0.0017285645008087158, -0.001608431339263916, -0.0014882981777191162, -0.0013681650161743164, -0.0012480318546295166, -0.0011278986930847168, -0.001007765531539917, -0.0008876323699951172, -0.0007674992084503174, -0.0006473660469055176, -0.0005272328853607178, -0.00040709972381591797, -0.00028696656227111816, -0.00016683340072631836, -4.6700239181518555e-05, 7.343292236328125e-05, 0.00019356608390808105, 0.00031369924545288086, 0.00043383240699768066, 0.0005539655685424805, 0.0006740987300872803, 0.0007942318916320801, 0.0009143650531768799, 0.0010344982147216797, 0.0011546313762664795, 0.0012747645378112793, 0.001394897699356079, 0.001515030860900879, 0.0016351640224456787, 0.0017552971839904785, 0.0018754303455352783, 0.001995563507080078, 0.002115696668624878, 0.0022358298301696777, 0.0023559629917144775, 0.0024760961532592773, 0.002596229314804077, 0.002716362476348877, 0.0028364956378936768, 0.0029566287994384766, 0.0030767619609832764, 0.003196895122528076, 0.003317028284072876, 0.0034371614456176758, 0.0035572946071624756, 0.0036774277687072754, 0.003797560930252075, 0.003917694091796875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 18.0, 21.0, 34.0, 52.0, 65.0, 106.0, 131.0, 129.0, 141.0, 104.0, 68.0, 33.0, 32.0, 21.0, 11.0, 6.0, 11.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00725555419921875, -0.007000565528869629, -0.006745576858520508, -0.006490588188171387, -0.006235599517822266, -0.0059806108474731445, -0.0057256221771240234, -0.005470633506774902, -0.005215644836425781, -0.00496065616607666, -0.004705667495727539, -0.004450678825378418, -0.004195690155029297, -0.003940701484680176, -0.0036857128143310547, -0.0034307241439819336, -0.0031757354736328125, -0.0029207468032836914, -0.0026657581329345703, -0.0024107694625854492, -0.002155780792236328, -0.001900792121887207, -0.001645803451538086, -0.0013908147811889648, -0.0011358261108398438, -0.0008808374404907227, -0.0006258487701416016, -0.00037086009979248047, -0.00011587142944335938, 0.00013911724090576172, 0.0003941059112548828, 0.0006490945816040039, 0.000904083251953125, 0.001159071922302246, 0.0014140605926513672, 0.0016690492630004883, 0.0019240379333496094, 0.0021790266036987305, 0.0024340152740478516, 0.0026890039443969727, 0.0029439926147460938, 0.003198981285095215, 0.003453969955444336, 0.003708958625793457, 0.003963947296142578, 0.004218935966491699, 0.00447392463684082, 0.004728913307189941, 0.0049839019775390625, 0.005238890647888184, 0.005493879318237305, 0.005748867988586426, 0.006003856658935547, 0.006258845329284668, 0.006513833999633789, 0.00676882266998291, 0.007023811340332031, 0.007278800010681152, 0.0075337886810302734, 0.0077887773513793945, 0.008043766021728516, 0.008298754692077637, 0.008553743362426758, 0.008808732032775879, 0.009063720703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 3.0, 7.0, 6.0, 13.0, 14.0, 19.0, 25.0, 30.0, 48.0, 71.0, 69.0, 122.0, 165.0, 236.0, 390.0, 690.0, 1205.0, 2461.0, 5405.0, 13299.0, 34592.0, 96284.0, 232401.0, 442292.0, 136232.0, 49525.0, 18374.0, 7333.0, 3313.0, 1633.0, 825.0, 464.0, 325.0, 198.0, 136.0, 95.0, 72.0, 40.0, 35.0, 27.0, 15.0, 17.0, 11.0, 10.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0043487548828125, -0.004221528768539429, -0.004094302654266357, -0.003967076539993286, -0.003839850425720215, -0.0037126243114471436, -0.0035853981971740723, -0.003458172082901001, -0.0033309459686279297, -0.0032037198543548584, -0.003076493740081787, -0.002949267625808716, -0.0028220415115356445, -0.0026948153972625732, -0.002567589282989502, -0.0024403631687164307, -0.0023131370544433594, -0.002185910940170288, -0.002058684825897217, -0.0019314587116241455, -0.0018042325973510742, -0.001677006483078003, -0.0015497803688049316, -0.0014225542545318604, -0.001295328140258789, -0.0011681020259857178, -0.0010408759117126465, -0.0009136497974395752, -0.0007864236831665039, -0.0006591975688934326, -0.0005319714546203613, -0.00040474534034729004, -0.00027751922607421875, -0.00015029311180114746, -2.3066997528076172e-05, 0.00010415911674499512, 0.0002313852310180664, 0.0003586113452911377, 0.000485837459564209, 0.0006130635738372803, 0.0007402896881103516, 0.0008675158023834229, 0.0009947419166564941, 0.0011219680309295654, 0.0012491941452026367, 0.001376420259475708, 0.0015036463737487793, 0.0016308724880218506, 0.0017580986022949219, 0.0018853247165679932, 0.0020125508308410645, 0.0021397769451141357, 0.002267003059387207, 0.0023942291736602783, 0.0025214552879333496, 0.002648681402206421, 0.002775907516479492, 0.0029031336307525635, 0.0030303597450256348, 0.003157585859298706, 0.0032848119735717773, 0.0034120380878448486, 0.00353926420211792, 0.003666490316390991, 0.0037937164306640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 11.0, 3.0, 11.0, 9.0, 8.0, 12.0, 11.0, 11.0, 19.0, 20.0, 24.0, 24.0, 21.0, 35.0, 40.0, 36.0, 42.0, 44.0, 47.0, 49.0, 51.0, 42.0, 43.0, 38.0, 29.0, 31.0, 35.0, 40.0, 33.0, 27.0, 20.0, 16.0, 20.0, 17.0, 20.0, 10.0, 6.0, 8.0, 16.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01067352294921875, -0.010328173637390137, -0.009982824325561523, -0.00963747501373291, -0.009292125701904297, -0.008946776390075684, -0.00860142707824707, -0.008256077766418457, -0.007910728454589844, -0.0075653791427612305, -0.007220029830932617, -0.006874680519104004, -0.006529331207275391, -0.006183981895446777, -0.005838632583618164, -0.005493283271789551, -0.0051479339599609375, -0.004802584648132324, -0.004457235336303711, -0.004111886024475098, -0.0037665367126464844, -0.003421187400817871, -0.003075838088989258, -0.0027304887771606445, -0.0023851394653320312, -0.002039790153503418, -0.0016944408416748047, -0.0013490915298461914, -0.0010037422180175781, -0.0006583929061889648, -0.00031304359436035156, 3.230571746826172e-05, 0.000377655029296875, 0.0007230043411254883, 0.0010683536529541016, 0.0014137029647827148, 0.0017590522766113281, 0.0021044015884399414, 0.0024497509002685547, 0.002795100212097168, 0.0031404495239257812, 0.0034857988357543945, 0.003831148147583008, 0.004176497459411621, 0.004521846771240234, 0.004867196083068848, 0.005212545394897461, 0.005557894706726074, 0.0059032440185546875, 0.006248593330383301, 0.006593942642211914, 0.006939291954040527, 0.007284641265869141, 0.007629990577697754, 0.007975339889526367, 0.00832068920135498, 0.008666038513183594, 0.009011387825012207, 0.00935673713684082, 0.009702086448669434, 0.010047435760498047, 0.01039278507232666, 0.010738134384155273, 0.011083483695983887, 0.0114288330078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 13.0, 10.0, 14.0, 22.0, 46.0, 63.0, 89.0, 148.0, 243.0, 383.0, 663.0, 1264.0, 2450.0, 5363.0, 12850.0, 36830.0, 135403.0, 596869.0, 180712.0, 47304.0, 15473.0, 6353.0, 2747.0, 1373.0, 757.0, 405.0, 270.0, 149.0, 80.0, 81.0, 45.0, 30.0, 18.0, 12.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013113021850585938, -0.0012684464454650879, -0.001225590705871582, -0.0011827349662780762, -0.0011398792266845703, -0.0010970234870910645, -0.0010541677474975586, -0.0010113120079040527, -0.0009684562683105469, -0.000925600528717041, -0.0008827447891235352, -0.0008398890495300293, -0.0007970333099365234, -0.0007541775703430176, -0.0007113218307495117, -0.0006684660911560059, -0.0006256103515625, -0.0005827546119689941, -0.0005398988723754883, -0.0004970431327819824, -0.00045418739318847656, -0.0004113316535949707, -0.00036847591400146484, -0.000325620174407959, -0.0002827644348144531, -0.00023990869522094727, -0.0001970529556274414, -0.00015419721603393555, -0.00011134147644042969, -6.848573684692383e-05, -2.562999725341797e-05, 1.722574234008789e-05, 6.008148193359375e-05, 0.00010293722152709961, 0.00014579296112060547, 0.00018864870071411133, 0.0002315044403076172, 0.00027436017990112305, 0.0003172159194946289, 0.00036007165908813477, 0.0004029273986816406, 0.0004457831382751465, 0.0004886388778686523, 0.0005314946174621582, 0.0005743503570556641, 0.0006172060966491699, 0.0006600618362426758, 0.0007029175758361816, 0.0007457733154296875, 0.0007886290550231934, 0.0008314847946166992, 0.0008743405342102051, 0.0009171962738037109, 0.0009600520133972168, 0.0010029077529907227, 0.0010457634925842285, 0.0010886192321777344, 0.0011314749717712402, 0.001174330711364746, 0.001217186450958252, 0.0012600421905517578, 0.0013028979301452637, 0.0013457536697387695, 0.0013886094093322754, 0.0014314651489257812]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 5.0, 13.0, 15.0, 17.0, 11.0, 22.0, 11.0, 27.0, 34.0, 37.0, 33.0, 42.0, 44.0, 23.0, 51.0, 50.0, 51.0, 63.0, 48.0, 50.0, 22.0, 55.0, 32.0, 32.0, 41.0, 23.0, 25.0, 12.0, 29.0, 19.0, 8.0, 11.0, 8.0, 4.0, 2.0, 7.0, 2.0, 6.0, 6.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.516674041748047e-06, -3.405846655368805e-06, -3.295019268989563e-06, -3.184191882610321e-06, -3.073364496231079e-06, -2.962537109851837e-06, -2.8517097234725952e-06, -2.7408823370933533e-06, -2.6300549507141113e-06, -2.5192275643348694e-06, -2.4084001779556274e-06, -2.2975727915763855e-06, -2.1867454051971436e-06, -2.0759180188179016e-06, -1.9650906324386597e-06, -1.8542632460594177e-06, -1.7434358596801758e-06, -1.6326084733009338e-06, -1.521781086921692e-06, -1.41095370054245e-06, -1.300126314163208e-06, -1.189298927783966e-06, -1.0784715414047241e-06, -9.676441550254822e-07, -8.568167686462402e-07, -7.459893822669983e-07, -6.351619958877563e-07, -5.243346095085144e-07, -4.1350722312927246e-07, -3.026798367500305e-07, -1.9185245037078857e-07, -8.102506399154663e-08, 2.9802322387695312e-08, 1.4062970876693726e-07, 2.514570951461792e-07, 3.6228448152542114e-07, 4.731118679046631e-07, 5.83939254283905e-07, 6.94766640663147e-07, 8.055940270423889e-07, 9.164214134216309e-07, 1.0272487998008728e-06, 1.1380761861801147e-06, 1.2489035725593567e-06, 1.3597309589385986e-06, 1.4705583453178406e-06, 1.5813857316970825e-06, 1.6922131180763245e-06, 1.8030405044555664e-06, 1.9138678908348083e-06, 2.0246952772140503e-06, 2.1355226635932922e-06, 2.246350049972534e-06, 2.357177436351776e-06, 2.468004822731018e-06, 2.57883220911026e-06, 2.689659595489502e-06, 2.800486981868744e-06, 2.911314368247986e-06, 3.0221417546272278e-06, 3.1329691410064697e-06, 3.2437965273857117e-06, 3.3546239137649536e-06, 3.4654513001441956e-06, 3.5762786865234375e-06]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 9.0, 18.0, 16.0, 29.0, 32.0, 93.0, 148.0, 338.0, 736.0, 1945.0, 6300.0, 26188.0, 161684.0, 688880.0, 131252.0, 22221.0, 5483.0, 1798.0, 716.0, 308.0, 129.0, 82.0, 39.0, 32.0, 17.0, 16.0, 9.0, 7.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00225830078125, -0.002202466130256653, -0.0021466314792633057, -0.0020907968282699585, -0.0020349621772766113, -0.001979127526283264, -0.001923292875289917, -0.0018674582242965698, -0.0018116235733032227, -0.0017557889223098755, -0.0016999542713165283, -0.0016441196203231812, -0.001588284969329834, -0.0015324503183364868, -0.0014766156673431396, -0.0014207810163497925, -0.0013649463653564453, -0.0013091117143630981, -0.001253277063369751, -0.0011974424123764038, -0.0011416077613830566, -0.0010857731103897095, -0.0010299384593963623, -0.0009741038084030151, -0.000918269157409668, -0.0008624345064163208, -0.0008065998554229736, -0.0007507652044296265, -0.0006949305534362793, -0.0006390959024429321, -0.000583261251449585, -0.0005274266004562378, -0.0004715919494628906, -0.00041575729846954346, -0.0003599226474761963, -0.0003040879964828491, -0.00024825334548950195, -0.00019241869449615479, -0.00013658404350280762, -8.074939250946045e-05, -2.491474151611328e-05, 3.091990947723389e-05, 8.675456047058105e-05, 0.00014258921146392822, 0.0001984238624572754, 0.00025425851345062256, 0.0003100931644439697, 0.0003659278154373169, 0.00042176246643066406, 0.00047759711742401123, 0.0005334317684173584, 0.0005892664194107056, 0.0006451010704040527, 0.0007009357213973999, 0.0007567703723907471, 0.0008126050233840942, 0.0008684396743774414, 0.0009242743253707886, 0.0009801089763641357, 0.001035943627357483, 0.00109177827835083, 0.0011476129293441772, 0.0012034475803375244, 0.0012592822313308716, 0.0013151168823242188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 9.0, 17.0, 21.0, 21.0, 17.0, 26.0, 48.0, 56.0, 75.0, 84.0, 82.0, 89.0, 98.0, 78.0, 72.0, 50.0, 38.0, 33.0, 17.0, 15.0, 10.0, 14.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002483367919921875, -0.0024108588695526123, -0.0023383498191833496, -0.002265840768814087, -0.0021933317184448242, -0.0021208226680755615, -0.002048313617706299, -0.001975804567337036, -0.0019032955169677734, -0.0018307864665985107, -0.001758277416229248, -0.0016857683658599854, -0.0016132593154907227, -0.00154075026512146, -0.0014682412147521973, -0.0013957321643829346, -0.0013232231140136719, -0.0012507140636444092, -0.0011782050132751465, -0.0011056959629058838, -0.001033186912536621, -0.0009606778621673584, -0.0008881688117980957, -0.000815659761428833, -0.0007431507110595703, -0.0006706416606903076, -0.0005981326103210449, -0.0005256235599517822, -0.00045311450958251953, -0.00038060545921325684, -0.00030809640884399414, -0.00023558735847473145, -0.00016307830810546875, -9.056925773620605e-05, -1.806020736694336e-05, 5.4448843002319336e-05, 0.00012695789337158203, 0.00019946694374084473, 0.0002719759941101074, 0.0003444850444793701, 0.0004169940948486328, 0.0004895031452178955, 0.0005620121955871582, 0.0006345212459564209, 0.0007070302963256836, 0.0007795393466949463, 0.000852048397064209, 0.0009245574474334717, 0.0009970664978027344, 0.001069575548171997, 0.0011420845985412598, 0.0012145936489105225, 0.0012871026992797852, 0.0013596117496490479, 0.0014321208000183105, 0.0015046298503875732, 0.001577138900756836, 0.0016496479511260986, 0.0017221570014953613, 0.001794666051864624, 0.0018671751022338867, 0.0019396841526031494, 0.002012193202972412, 0.002084702253341675, 0.0021572113037109375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 9.0, 18.0, 31.0, 71.0, 220.0, 359.0, 181.0, 72.0, 24.0, 10.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04073881357908249, -0.03827570006251335, -0.035812586545944214, -0.033349473029375076, -0.03088635765016079, -0.028423244133591652, -0.025960128754377365, -0.023497015237808228, -0.02103390172123909, -0.018570788204669952, -0.016107674688100815, -0.013644559308886528, -0.01118144579231739, -0.008718332275748253, -0.006255217827856541, -0.0037921033799648285, -0.001328989863395691, 0.001134124118834734, 0.003597238101065159, 0.006060352083295584, 0.008523466065526009, 0.010986579582095146, 0.013449694029986858, 0.01591280847787857, 0.018375921994447708, 0.020839035511016846, 0.023302149027585983, 0.02576526440680027, 0.028228377923369408, 0.030691491439938545, 0.03315460681915283, 0.03561772033572197, 0.03808082640171051, 0.04054393991827965, 0.043007053434848785, 0.04547016695141792, 0.04793328046798706, 0.0503963977098465, 0.052859511226415634, 0.05532262474298477, 0.05778573825955391, 0.06024885177612305, 0.06271196901798248, 0.06517507880926132, 0.06763819605112076, 0.0701013058423996, 0.07256442308425903, 0.07502754032611847, 0.07749065011739731, 0.07995376735925674, 0.08241687715053558, 0.08487999439239502, 0.08734310418367386, 0.0898062214255333, 0.09226933121681213, 0.09473244845867157, 0.097195565700531, 0.09965868294239044, 0.10212179273366928, 0.10458490997552872, 0.10704801976680756, 0.10951113700866699, 0.11197424679994583, 0.11443736404180527, 0.1169004738330841]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 7.0, 3.0, 6.0, 5.0, 10.0, 15.0, 10.0, 16.0, 13.0, 15.0, 22.0, 27.0, 29.0, 25.0, 20.0, 31.0, 41.0, 41.0, 58.0, 60.0, 69.0, 56.0, 61.0, 35.0, 38.0, 30.0, 33.0, 14.0, 23.0, 21.0, 17.0, 18.0, 24.0, 11.0, 13.0, 14.0, 8.0, 7.0, 7.0, 5.0, 7.0, 10.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.03861534595489502, -0.03742838278412819, -0.03624141961336136, -0.03505445271730423, -0.0338674895465374, -0.03268052637577057, -0.03149355947971344, -0.03030659630894661, -0.02911963313817978, -0.02793266996741295, -0.02674570493400097, -0.02555873990058899, -0.02437177672982216, -0.02318481355905533, -0.02199784852564335, -0.02081088349223137, -0.01962392032146454, -0.018436957150697708, -0.01724999211728573, -0.01606302708387375, -0.014876063913106918, -0.013689099811017513, -0.012502135708928108, -0.011315171606838703, -0.010128207504749298, -0.008941243402659893, -0.007754279300570488, -0.006567315198481083, -0.005380351096391678, -0.004193386994302273, -0.0030064228922128677, -0.0018194587901234627, -0.0006324946880340576, 0.0005544694140553474, 0.0017414335161447525, 0.0029283976182341576, 0.004115361720323563, 0.005302325822412968, 0.006489289924502373, 0.007676254026591778, 0.008863218128681183, 0.010050182230770588, 0.011237146332859993, 0.012424110434949398, 0.013611074537038803, 0.014798038639128208, 0.015985002741217613, 0.017171967774629593, 0.018358930945396423, 0.019545894116163254, 0.020732859149575233, 0.021919824182987213, 0.023106787353754044, 0.024293750524520874, 0.025480715557932854, 0.026667680591344833, 0.027854643762111664, 0.029041606932878494, 0.030228571966290474, 0.031415536999702454, 0.032602500170469284, 0.033789463341236115, 0.03497643023729324, 0.036163393408060074, 0.037350356578826904]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 11.0, 9.0, 17.0, 41.0, 97.0, 197.0, 310.0, 518.0, 972.0, 1897.0, 3573.0, 7771.0, 21326.0, 95203.0, 709223.0, 2688535.0, 556991.0, 79129.0, 17740.0, 5568.0, 2523.0, 1288.0, 658.0, 350.0, 143.0, 66.0, 42.0, 20.0, 16.0, 8.0, 11.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0032825469970703125, -0.0031899213790893555, -0.0030972957611083984, -0.0030046701431274414, -0.0029120445251464844, -0.0028194189071655273, -0.0027267932891845703, -0.0026341676712036133, -0.0025415420532226562, -0.0024489164352416992, -0.002356290817260742, -0.002263665199279785, -0.002171039581298828, -0.002078413963317871, -0.001985788345336914, -0.001893162727355957, -0.001800537109375, -0.001707911491394043, -0.001615285873413086, -0.001522660255432129, -0.0014300346374511719, -0.0013374090194702148, -0.0012447834014892578, -0.0011521577835083008, -0.0010595321655273438, -0.0009669065475463867, -0.0008742809295654297, -0.0007816553115844727, -0.0006890296936035156, -0.0005964040756225586, -0.0005037784576416016, -0.00041115283966064453, -0.0003185272216796875, -0.00022590160369873047, -0.00013327598571777344, -4.0650367736816406e-05, 5.1975250244140625e-05, 0.00014460086822509766, 0.0002372264862060547, 0.0003298521041870117, 0.00042247772216796875, 0.0005151033401489258, 0.0006077289581298828, 0.0007003545761108398, 0.0007929801940917969, 0.0008856058120727539, 0.000978231430053711, 0.001070857048034668, 0.001163482666015625, 0.001256108283996582, 0.001348733901977539, 0.001441359519958496, 0.0015339851379394531, 0.0016266107559204102, 0.0017192363739013672, 0.0018118619918823242, 0.0019044876098632812, 0.0019971132278442383, 0.0020897388458251953, 0.0021823644638061523, 0.0022749900817871094, 0.0023676156997680664, 0.0024602413177490234, 0.0025528669357299805, 0.0026454925537109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 5.0, 6.0, 13.0, 19.0, 28.0, 46.0, 78.0, 109.0, 109.0, 139.0, 137.0, 106.0, 82.0, 33.0, 35.0, 25.0, 11.0, 7.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007293701171875, -0.007038474082946777, -0.006783246994018555, -0.006528019905090332, -0.006272792816162109, -0.006017565727233887, -0.005762338638305664, -0.005507111549377441, -0.005251884460449219, -0.004996657371520996, -0.0047414302825927734, -0.004486203193664551, -0.004230976104736328, -0.0039757490158081055, -0.003720521926879883, -0.00346529483795166, -0.0032100677490234375, -0.002954840660095215, -0.002699613571166992, -0.0024443864822387695, -0.002189159393310547, -0.0019339323043823242, -0.0016787052154541016, -0.001423478126525879, -0.0011682510375976562, -0.0009130239486694336, -0.0006577968597412109, -0.0004025697708129883, -0.00014734268188476562, 0.00010788440704345703, 0.0003631114959716797, 0.0006183385848999023, 0.000873565673828125, 0.0011287927627563477, 0.0013840198516845703, 0.001639246940612793, 0.0018944740295410156, 0.0021497011184692383, 0.002404928207397461, 0.0026601552963256836, 0.0029153823852539062, 0.003170609474182129, 0.0034258365631103516, 0.0036810636520385742, 0.003936290740966797, 0.0041915178298950195, 0.004446744918823242, 0.004701972007751465, 0.0049571990966796875, 0.00521242618560791, 0.005467653274536133, 0.0057228803634643555, 0.005978107452392578, 0.006233334541320801, 0.0064885616302490234, 0.006743788719177246, 0.006999015808105469, 0.007254242897033691, 0.007509469985961914, 0.007764697074890137, 0.00801992416381836, 0.008275151252746582, 0.008530378341674805, 0.008785605430603027, 0.00904083251953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 15.0, 25.0, 37.0, 87.0, 159.0, 312.0, 12087.0, 4179898.0, 1242.0, 205.0, 120.0, 57.0, 29.0, 12.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0291595458984375, -0.028197050094604492, -0.027234554290771484, -0.026272058486938477, -0.02530956268310547, -0.02434706687927246, -0.023384571075439453, -0.022422075271606445, -0.021459579467773438, -0.02049708366394043, -0.019534587860107422, -0.018572092056274414, -0.017609596252441406, -0.0166471004486084, -0.01568460464477539, -0.014722108840942383, -0.013759613037109375, -0.012797117233276367, -0.01183462142944336, -0.010872125625610352, -0.009909629821777344, -0.008947134017944336, -0.007984638214111328, -0.00702214241027832, -0.0060596466064453125, -0.005097150802612305, -0.004134654998779297, -0.003172159194946289, -0.0022096633911132812, -0.0012471675872802734, -0.0002846717834472656, 0.0006778240203857422, 0.00164031982421875, 0.002602815628051758, 0.0035653114318847656, 0.0045278072357177734, 0.005490303039550781, 0.006452798843383789, 0.007415294647216797, 0.008377790451049805, 0.009340286254882812, 0.01030278205871582, 0.011265277862548828, 0.012227773666381836, 0.013190269470214844, 0.014152765274047852, 0.01511526107788086, 0.016077756881713867, 0.017040252685546875, 0.018002748489379883, 0.01896524429321289, 0.0199277400970459, 0.020890235900878906, 0.021852731704711914, 0.022815227508544922, 0.02377772331237793, 0.024740219116210938, 0.025702714920043945, 0.026665210723876953, 0.02762770652770996, 0.02859020233154297, 0.029552698135375977, 0.030515193939208984, 0.03147768974304199, 0.032440185546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 10.0, 19.0, 55.0, 239.0, 1018.0, 1830.0, 701.0, 142.0, 33.0, 11.0, 8.0, 7.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.018707275390625, -0.01834315061569214, -0.017979025840759277, -0.017614901065826416, -0.017250776290893555, -0.016886651515960693, -0.016522526741027832, -0.01615840196609497, -0.01579427719116211, -0.015430152416229248, -0.015066027641296387, -0.014701902866363525, -0.014337778091430664, -0.013973653316497803, -0.013609528541564941, -0.01324540376663208, -0.012881278991699219, -0.012517154216766357, -0.012153029441833496, -0.011788904666900635, -0.011424779891967773, -0.011060655117034912, -0.01069653034210205, -0.01033240556716919, -0.009968280792236328, -0.009604156017303467, -0.009240031242370605, -0.008875906467437744, -0.008511781692504883, -0.008147656917572021, -0.00778353214263916, -0.007419407367706299, -0.0070552825927734375, -0.006691157817840576, -0.006327033042907715, -0.0059629082679748535, -0.005598783493041992, -0.005234658718109131, -0.0048705339431762695, -0.004506409168243408, -0.004142284393310547, -0.0037781596183776855, -0.0034140348434448242, -0.003049910068511963, -0.0026857852935791016, -0.0023216605186462402, -0.001957535743713379, -0.0015934109687805176, -0.0012292861938476562, -0.0008651614189147949, -0.0005010366439819336, -0.00013691186904907227, 0.00022721290588378906, 0.0005913376808166504, 0.0009554624557495117, 0.001319587230682373, 0.0016837120056152344, 0.0020478367805480957, 0.002411961555480957, 0.0027760863304138184, 0.0031402111053466797, 0.003504335880279541, 0.0038684606552124023, 0.004232585430145264, 0.004596710205078125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 11.0, 8.0, 11.0, 19.0, 36.0, 68.0, 128.0, 164.0, 197.0, 157.0, 95.0, 61.0, 22.0, 10.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05580972880125046, -0.054664552211761475, -0.05351937562227249, -0.05237419903278351, -0.051229022443294525, -0.05008384585380554, -0.04893866926431656, -0.047793492674827576, -0.04664831608533859, -0.04550313949584961, -0.044357962906360626, -0.04321278631687164, -0.04206760972738266, -0.04092243313789368, -0.039777256548404694, -0.03863207995891571, -0.03748689964413643, -0.036341723054647446, -0.03519654646515846, -0.03405136987566948, -0.032906193286180496, -0.03176101669669151, -0.03061583824455738, -0.029470661655068398, -0.028325485065579414, -0.02718030847609043, -0.026035131886601448, -0.024889955297112465, -0.023744776844978333, -0.02259960025548935, -0.021454423666000366, -0.020309247076511383, -0.0191640704870224, -0.018018893897533417, -0.016873717308044434, -0.01572854071855545, -0.014583363197743893, -0.01343818660825491, -0.012293009087443352, -0.011147832497954369, -0.010002655908465385, -0.008857479318976402, -0.007712302263826132, -0.006567125208675861, -0.005421948619186878, -0.004276772029697895, -0.0031315949745476246, -0.001986417919397354, -0.000841241329908371, 0.00030393549241125584, 0.0014491123147308826, 0.0025942891370505095, 0.0037394659593701363, 0.004884642548859119, 0.00602981960400939, 0.00717499665915966, 0.008320173248648643, 0.009465349838137627, 0.01061052642762661, 0.011755703948438168, 0.01290088053792715, 0.014046057127416134, 0.015191234648227692, 0.016336411237716675, 0.017481587827205658]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 8.0, 8.0, 8.0, 7.0, 10.0, 8.0, 11.0, 17.0, 22.0, 25.0, 30.0, 26.0, 42.0, 27.0, 44.0, 31.0, 37.0, 51.0, 38.0, 36.0, 45.0, 43.0, 45.0, 50.0, 43.0, 45.0, 34.0, 28.0, 40.0, 21.0, 17.0, 19.0, 19.0, 14.0, 10.0, 13.0, 10.0, 12.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02270883321762085, -0.022083088755607605, -0.02145734243094921, -0.020831596106290817, -0.020205851644277573, -0.019580107182264328, -0.018954360857605934, -0.01832861453294754, -0.017702870070934296, -0.01707712560892105, -0.016451379284262657, -0.015825632959604263, -0.015199888497591019, -0.0145741431042552, -0.01394839771091938, -0.013322652317583561, -0.012696906924247742, -0.012071161530911922, -0.011445416137576103, -0.010819670744240284, -0.010193925350904465, -0.009568179957568645, -0.008942434564232826, -0.008316689170897007, -0.007690943777561188, -0.0070651983842253685, -0.006439452990889549, -0.00581370759755373, -0.005187962204217911, -0.0045622168108820915, -0.003936471417546272, -0.003310726024210453, -0.002684980630874634, -0.0020592352375388145, -0.0014334898442029953, -0.0008077444508671761, -0.0001819990575313568, 0.00044374633580446243, 0.0010694917291402817, 0.001695237122476101, 0.00232098251581192, 0.0029467279091477394, 0.0035724733024835587, 0.004198218695819378, 0.004823964089155197, 0.005449709482491016, 0.006075454875826836, 0.006701200269162655, 0.007326945662498474, 0.007952691055834293, 0.008578436449170113, 0.009204181842505932, 0.009829927235841751, 0.01045567262917757, 0.01108141802251339, 0.011707163415849209, 0.012332908809185028, 0.012958654202520847, 0.013584399595856667, 0.014210144989192486, 0.014835890382528305, 0.015461635775864124, 0.016087381169199944, 0.016713127493858337, 0.017338871955871582]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 13.0, 7.0, 18.0, 18.0, 34.0, 36.0, 57.0, 65.0, 91.0, 173.0, 249.0, 342.0, 497.0, 899.0, 1542.0, 3028.0, 6425.0, 15433.0, 44192.0, 142244.0, 395205.0, 295419.0, 91313.0, 29675.0, 10919.0, 4808.0, 2374.0, 1247.0, 782.0, 458.0, 339.0, 186.0, 117.0, 108.0, 64.0, 49.0, 29.0, 32.0, 23.0, 12.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004314422607421875, -0.004178822040557861, -0.004043221473693848, -0.003907620906829834, -0.0037720203399658203, -0.0036364197731018066, -0.003500819206237793, -0.0033652186393737793, -0.0032296180725097656, -0.003094017505645752, -0.0029584169387817383, -0.0028228163719177246, -0.002687215805053711, -0.0025516152381896973, -0.0024160146713256836, -0.00228041410446167, -0.0021448135375976562, -0.0020092129707336426, -0.001873612403869629, -0.0017380118370056152, -0.0016024112701416016, -0.0014668107032775879, -0.0013312101364135742, -0.0011956095695495605, -0.0010600090026855469, -0.0009244084358215332, -0.0007888078689575195, -0.0006532073020935059, -0.0005176067352294922, -0.0003820061683654785, -0.00024640560150146484, -0.00011080503463745117, 2.47955322265625e-05, 0.00016039609909057617, 0.00029599666595458984, 0.0004315972328186035, 0.0005671977996826172, 0.0007027983665466309, 0.0008383989334106445, 0.0009739995002746582, 0.0011096000671386719, 0.0012452006340026855, 0.0013808012008666992, 0.0015164017677307129, 0.0016520023345947266, 0.0017876029014587402, 0.001923203468322754, 0.0020588040351867676, 0.0021944046020507812, 0.002330005168914795, 0.0024656057357788086, 0.0026012063026428223, 0.002736806869506836, 0.0028724074363708496, 0.0030080080032348633, 0.003143608570098877, 0.0032792091369628906, 0.0034148097038269043, 0.003550410270690918, 0.0036860108375549316, 0.0038216114044189453, 0.003957211971282959, 0.004092812538146973, 0.004228413105010986, 0.004364013671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 20.0, 27.0, 58.0, 80.0, 99.0, 120.0, 138.0, 139.0, 105.0, 59.0, 42.0, 35.0, 23.0, 12.0, 13.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007266998291015625, -0.007012307643890381, -0.006757616996765137, -0.006502926349639893, -0.0062482357025146484, -0.005993545055389404, -0.00573885440826416, -0.005484163761138916, -0.005229473114013672, -0.004974782466888428, -0.004720091819763184, -0.0044654011726379395, -0.004210710525512695, -0.003956019878387451, -0.003701329231262207, -0.003446638584136963, -0.0031919479370117188, -0.0029372572898864746, -0.0026825666427612305, -0.0024278759956359863, -0.002173185348510742, -0.001918494701385498, -0.001663804054260254, -0.0014091134071350098, -0.0011544227600097656, -0.0008997321128845215, -0.0006450414657592773, -0.0003903508186340332, -0.00013566017150878906, 0.00011903047561645508, 0.0003737211227416992, 0.0006284117698669434, 0.0008831024169921875, 0.0011377930641174316, 0.0013924837112426758, 0.00164717435836792, 0.001901865005493164, 0.002156555652618408, 0.0024112462997436523, 0.0026659369468688965, 0.0029206275939941406, 0.0031753182411193848, 0.003430008888244629, 0.003684699535369873, 0.003939390182495117, 0.004194080829620361, 0.0044487714767456055, 0.00470346212387085, 0.004958152770996094, 0.005212843418121338, 0.005467534065246582, 0.005722224712371826, 0.00597691535949707, 0.0062316060066223145, 0.006486296653747559, 0.006740987300872803, 0.006995677947998047, 0.007250368595123291, 0.007505059242248535, 0.007759749889373779, 0.008014440536499023, 0.008269131183624268, 0.008523821830749512, 0.008778512477874756, 0.009033203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 9.0, 12.0, 14.0, 26.0, 35.0, 66.0, 76.0, 91.0, 144.0, 215.0, 297.0, 525.0, 1034.0, 2885.0, 14107.0, 100670.0, 700285.0, 195442.0, 25053.0, 4567.0, 1388.0, 597.0, 387.0, 210.0, 112.0, 83.0, 66.0, 53.0, 27.0, 24.0, 10.0, 11.0, 9.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007518768310546875, -0.007265269756317139, -0.007011771202087402, -0.006758272647857666, -0.00650477409362793, -0.006251275539398193, -0.005997776985168457, -0.005744278430938721, -0.005490779876708984, -0.005237281322479248, -0.004983782768249512, -0.004730284214019775, -0.004476785659790039, -0.004223287105560303, -0.003969788551330566, -0.00371628999710083, -0.0034627914428710938, -0.0032092928886413574, -0.002955794334411621, -0.0027022957801818848, -0.0024487972259521484, -0.002195298671722412, -0.0019418001174926758, -0.0016883015632629395, -0.0014348030090332031, -0.0011813044548034668, -0.0009278059005737305, -0.0006743073463439941, -0.0004208087921142578, -0.00016731023788452148, 8.618831634521484e-05, 0.00033968687057495117, 0.0005931854248046875, 0.0008466839790344238, 0.0011001825332641602, 0.0013536810874938965, 0.0016071796417236328, 0.0018606781959533691, 0.0021141767501831055, 0.002367675304412842, 0.002621173858642578, 0.0028746724128723145, 0.0031281709671020508, 0.003381669521331787, 0.0036351680755615234, 0.0038886666297912598, 0.004142165184020996, 0.004395663738250732, 0.004649162292480469, 0.004902660846710205, 0.005156159400939941, 0.005409657955169678, 0.005663156509399414, 0.00591665506362915, 0.006170153617858887, 0.006423652172088623, 0.006677150726318359, 0.006930649280548096, 0.007184147834777832, 0.007437646389007568, 0.007691144943237305, 0.007944643497467041, 0.008198142051696777, 0.008451640605926514, 0.00870513916015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 6.0, 4.0, 9.0, 8.0, 13.0, 15.0, 21.0, 16.0, 18.0, 33.0, 27.0, 34.0, 47.0, 61.0, 56.0, 40.0, 59.0, 55.0, 71.0, 53.0, 52.0, 53.0, 33.0, 40.0, 38.0, 37.0, 26.0, 23.0, 11.0, 12.0, 9.0, 9.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01279449462890625, -0.01235342025756836, -0.011912345886230469, -0.011471271514892578, -0.011030197143554688, -0.010589122772216797, -0.010148048400878906, -0.009706974029541016, -0.009265899658203125, -0.008824825286865234, -0.008383750915527344, -0.007942676544189453, -0.0075016021728515625, -0.007060527801513672, -0.006619453430175781, -0.006178379058837891, -0.0057373046875, -0.005296230316162109, -0.004855155944824219, -0.004414081573486328, -0.0039730072021484375, -0.003531932830810547, -0.0030908584594726562, -0.0026497840881347656, -0.002208709716796875, -0.0017676353454589844, -0.0013265609741210938, -0.0008854866027832031, -0.0004444122314453125, -3.337860107421875e-06, 0.00043773651123046875, 0.0008788108825683594, 0.00131988525390625, 0.0017609596252441406, 0.0022020339965820312, 0.002643108367919922, 0.0030841827392578125, 0.003525257110595703, 0.003966331481933594, 0.004407405853271484, 0.004848480224609375, 0.005289554595947266, 0.005730628967285156, 0.006171703338623047, 0.0066127777099609375, 0.007053852081298828, 0.007494926452636719, 0.00793600082397461, 0.0083770751953125, 0.00881814956665039, 0.009259223937988281, 0.009700298309326172, 0.010141372680664062, 0.010582447052001953, 0.011023521423339844, 0.011464595794677734, 0.011905670166015625, 0.012346744537353516, 0.012787818908691406, 0.013228893280029297, 0.013669967651367188, 0.014111042022705078, 0.014552116394042969, 0.01499319076538086, 0.01543426513671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 6.0, 10.0, 16.0, 12.0, 12.0, 27.0, 40.0, 65.0, 85.0, 119.0, 225.0, 319.0, 563.0, 975.0, 1988.0, 4015.0, 9436.0, 23828.0, 69410.0, 240658.0, 544790.0, 97648.0, 31869.0, 11990.0, 5115.0, 2319.0, 1245.0, 690.0, 382.0, 219.0, 141.0, 93.0, 62.0, 43.0, 38.0, 27.0, 14.0, 12.0, 14.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010242462158203125, -0.0009913593530654907, -0.0009584724903106689, -0.0009255856275558472, -0.0008926987648010254, -0.0008598119020462036, -0.0008269250392913818, -0.0007940381765365601, -0.0007611513137817383, -0.0007282644510269165, -0.0006953775882720947, -0.000662490725517273, -0.0006296038627624512, -0.0005967170000076294, -0.0005638301372528076, -0.0005309432744979858, -0.0004980564117431641, -0.0004651695489883423, -0.0004322826862335205, -0.00039939582347869873, -0.00036650896072387695, -0.0003336220979690552, -0.0003007352352142334, -0.0002678483724594116, -0.00023496150970458984, -0.00020207464694976807, -0.0001691877841949463, -0.0001363009214401245, -0.00010341405868530273, -7.052719593048096e-05, -3.764033317565918e-05, -4.753470420837402e-06, 2.8133392333984375e-05, 6.102025508880615e-05, 9.390711784362793e-05, 0.0001267939805984497, 0.00015968084335327148, 0.00019256770610809326, 0.00022545456886291504, 0.0002583414316177368, 0.0002912282943725586, 0.00032411515712738037, 0.00035700201988220215, 0.0003898888826370239, 0.0004227757453918457, 0.0004556626081466675, 0.0004885494709014893, 0.000521436333656311, 0.0005543231964111328, 0.0005872100591659546, 0.0006200969219207764, 0.0006529837846755981, 0.0006858706474304199, 0.0007187575101852417, 0.0007516443729400635, 0.0007845312356948853, 0.000817418098449707, 0.0008503049612045288, 0.0008831918239593506, 0.0009160786867141724, 0.0009489655494689941, 0.000981852412223816, 0.0010147392749786377, 0.0010476261377334595, 0.0010805130004882812]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 7.0, 2.0, 11.0, 12.0, 6.0, 13.0, 18.0, 18.0, 28.0, 27.0, 19.0, 17.0, 37.0, 40.0, 29.0, 51.0, 37.0, 53.0, 21.0, 51.0, 49.0, 34.0, 48.0, 53.0, 33.0, 30.0, 39.0, 46.0, 9.0, 33.0, 24.0, 10.0, 19.0, 19.0, 14.0, 11.0, 9.0, 8.0, 2.0, 6.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.2782554626464844e-06, -3.1767413020133972e-06, -3.07522714138031e-06, -2.973712980747223e-06, -2.8721988201141357e-06, -2.7706846594810486e-06, -2.6691704988479614e-06, -2.5676563382148743e-06, -2.466142177581787e-06, -2.3646280169487e-06, -2.263113856315613e-06, -2.1615996956825256e-06, -2.0600855350494385e-06, -1.9585713744163513e-06, -1.8570572137832642e-06, -1.755543053150177e-06, -1.6540288925170898e-06, -1.5525147318840027e-06, -1.4510005712509155e-06, -1.3494864106178284e-06, -1.2479722499847412e-06, -1.146458089351654e-06, -1.044943928718567e-06, -9.434297680854797e-07, -8.419156074523926e-07, -7.404014468193054e-07, -6.388872861862183e-07, -5.373731255531311e-07, -4.3585896492004395e-07, -3.343448042869568e-07, -2.3283064365386963e-07, -1.3131648302078247e-07, -2.9802322387695312e-08, 7.171183824539185e-08, 1.73225998878479e-07, 2.7474015951156616e-07, 3.762543201446533e-07, 4.777684807777405e-07, 5.792826414108276e-07, 6.807968020439148e-07, 7.82310962677002e-07, 8.838251233100891e-07, 9.853392839431763e-07, 1.0868534445762634e-06, 1.1883676052093506e-06, 1.2898817658424377e-06, 1.391395926475525e-06, 1.492910087108612e-06, 1.5944242477416992e-06, 1.6959384083747864e-06, 1.7974525690078735e-06, 1.8989667296409607e-06, 2.000480890274048e-06, 2.101995050907135e-06, 2.203509211540222e-06, 2.3050233721733093e-06, 2.4065375328063965e-06, 2.5080516934394836e-06, 2.609565854072571e-06, 2.711080014705658e-06, 2.812594175338745e-06, 2.9141083359718323e-06, 3.0156224966049194e-06, 3.1171366572380066e-06, 3.2186508178710938e-06]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 11.0, 10.0, 11.0, 14.0, 15.0, 23.0, 24.0, 41.0, 48.0, 74.0, 134.0, 160.0, 263.0, 422.0, 743.0, 1444.0, 3156.0, 7919.0, 21241.0, 65472.0, 242010.0, 556248.0, 99473.0, 30298.0, 10812.0, 4184.0, 1892.0, 950.0, 512.0, 307.0, 197.0, 121.0, 86.0, 60.0, 46.0, 33.0, 20.0, 16.0, 18.0, 8.0, 9.0, 9.0, 8.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0011358261108398438, -0.0011025816202163696, -0.0010693371295928955, -0.0010360926389694214, -0.0010028481483459473, -0.0009696036577224731, -0.000936359167098999, -0.0009031146764755249, -0.0008698701858520508, -0.0008366256952285767, -0.0008033812046051025, -0.0007701367139816284, -0.0007368922233581543, -0.0007036477327346802, -0.0006704032421112061, -0.0006371587514877319, -0.0006039142608642578, -0.0005706697702407837, -0.0005374252796173096, -0.0005041807889938354, -0.00047093629837036133, -0.0004376918077468872, -0.0004044473171234131, -0.00037120282649993896, -0.00033795833587646484, -0.0003047138452529907, -0.0002714693546295166, -0.00023822486400604248, -0.00020498037338256836, -0.00017173588275909424, -0.00013849139213562012, -0.000105246901512146, -7.200241088867188e-05, -3.8757920265197754e-05, -5.513429641723633e-06, 2.7731060981750488e-05, 6.097555160522461e-05, 9.422004222869873e-05, 0.00012746453285217285, 0.00016070902347564697, 0.0001939535140991211, 0.00022719800472259521, 0.00026044249534606934, 0.00029368698596954346, 0.0003269314765930176, 0.0003601759672164917, 0.0003934204578399658, 0.00042666494846343994, 0.00045990943908691406, 0.0004931539297103882, 0.0005263984203338623, 0.0005596429109573364, 0.0005928874015808105, 0.0006261318922042847, 0.0006593763828277588, 0.0006926208734512329, 0.000725865364074707, 0.0007591098546981812, 0.0007923543453216553, 0.0008255988359451294, 0.0008588433265686035, 0.0008920878171920776, 0.0009253323078155518, 0.0009585767984390259, 0.0009918212890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 6.0, 10.0, 11.0, 20.0, 23.0, 31.0, 25.0, 43.0, 47.0, 50.0, 53.0, 76.0, 71.0, 64.0, 64.0, 52.0, 62.0, 49.0, 39.0, 41.0, 25.0, 18.0, 16.0, 8.0, 10.0, 9.0, 9.0, 5.0, 2.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013856887817382812, -0.0013398975133895874, -0.0012941062450408936, -0.0012483149766921997, -0.0012025237083435059, -0.001156732439994812, -0.0011109411716461182, -0.0010651499032974243, -0.0010193586349487305, -0.0009735673666000366, -0.0009277760982513428, -0.0008819848299026489, -0.0008361935615539551, -0.0007904022932052612, -0.0007446110248565674, -0.0006988197565078735, -0.0006530284881591797, -0.0006072372198104858, -0.000561445951461792, -0.0005156546831130981, -0.0004698634147644043, -0.00042407214641571045, -0.0003782808780670166, -0.00033248960971832275, -0.0002866983413696289, -0.00024090707302093506, -0.0001951158046722412, -0.00014932453632354736, -0.00010353326797485352, -5.774199962615967e-05, -1.195073127746582e-05, 3.384053707122803e-05, 7.963180541992188e-05, 0.00012542307376861572, 0.00017121434211730957, 0.00021700561046600342, 0.00026279687881469727, 0.0003085881471633911, 0.00035437941551208496, 0.0004001706838607788, 0.00044596195220947266, 0.0004917532205581665, 0.0005375444889068604, 0.0005833357572555542, 0.000629127025604248, 0.0006749182939529419, 0.0007207095623016357, 0.0007665008306503296, 0.0008122920989990234, 0.0008580833673477173, 0.0009038746356964111, 0.000949665904045105, 0.0009954571723937988, 0.0010412484407424927, 0.0010870397090911865, 0.0011328309774398804, 0.0011786222457885742, 0.001224413514137268, 0.001270204782485962, 0.0013159960508346558, 0.0013617873191833496, 0.0014075785875320435, 0.0014533698558807373, 0.0014991611242294312, 0.001544952392578125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 14.0, 16.0, 31.0, 56.0, 79.0, 132.0, 238.0, 179.0, 91.0, 56.0, 39.0, 18.0, 13.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05052497237920761, -0.04925081506371498, -0.04797666147351265, -0.04670250415802002, -0.04542835056781769, -0.04415419325232506, -0.04288003593683243, -0.041605882346630096, -0.040331725031137466, -0.039057567715644836, -0.037783414125442505, -0.036509256809949875, -0.03523510321974754, -0.03396094590425491, -0.03268679231405258, -0.03141263499855995, -0.03013847954571247, -0.02886432409286499, -0.02759016864001751, -0.02631601318717003, -0.0250418558716774, -0.023767700418829918, -0.022493544965982437, -0.021219387650489807, -0.019945234060287476, -0.018671078607439995, -0.017396923154592514, -0.016122765839099884, -0.014848610386252403, -0.013574454933404922, -0.012300299480557442, -0.011026143096387386, -0.00975198857486248, -0.008477833122015, -0.007203676737844944, -0.005929521284997463, -0.004655365366488695, -0.003381209447979927, -0.0021070539951324463, -0.0008328976109623909, 0.0004412578418850899, 0.0017154136439785361, 0.0029895694460719824, 0.004263725131750107, 0.005537881050258875, 0.006812036968767643, 0.008086192421615124, 0.00936034880578518, 0.01063450425863266, 0.01190865971148014, 0.013182816095650196, 0.014456971548497677, 0.015731127932667732, 0.017005283385515213, 0.018279438838362694, 0.019553594291210175, 0.020827751606702805, 0.022101907059550285, 0.023376062512397766, 0.024650219827890396, 0.025924375280737877, 0.027198530733585358, 0.02847268618643284, 0.02974684163928032, 0.0310209970921278]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 5.0, 5.0, 9.0, 11.0, 13.0, 15.0, 15.0, 11.0, 22.0, 16.0, 29.0, 30.0, 34.0, 21.0, 32.0, 30.0, 34.0, 66.0, 93.0, 81.0, 57.0, 31.0, 39.0, 22.0, 32.0, 31.0, 21.0, 19.0, 19.0, 19.0, 16.0, 20.0, 12.0, 12.0, 4.0, 13.0, 7.0, 7.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03422337770462036, -0.03304683044552803, -0.0318702831864357, -0.03069373220205307, -0.02951718494296074, -0.028340637683868408, -0.027164088562130928, -0.025987539440393448, -0.024810992181301117, -0.023634444922208786, -0.022457895800471306, -0.021281346678733826, -0.020104799419641495, -0.018928252160549164, -0.017751703038811684, -0.016575153917074203, -0.015398606657981873, -0.014222058467566967, -0.013045510277152061, -0.011868962086737156, -0.01069241389632225, -0.009515865705907345, -0.00833931751549244, -0.007162769325077534, -0.005986221134662628, -0.004809672944247723, -0.003633124753832817, -0.0024565765634179115, -0.001280028373003006, -0.00010348018258810043, 0.0010730680078268051, 0.0022496161982417107, 0.003426164388656616, 0.004602712579071522, 0.005779260769486427, 0.006955808959901333, 0.008132357150316238, 0.009308905340731144, 0.01048545353114605, 0.011662001721560955, 0.01283854991197586, 0.014015098102390766, 0.015191646292805672, 0.016368195414543152, 0.017544742673635483, 0.018721289932727814, 0.019897839054465294, 0.021074388176202774, 0.022250935435295105, 0.023427482694387436, 0.024604031816124916, 0.025780580937862396, 0.026957128196954727, 0.028133675456047058, 0.02931022457778454, 0.03048677369952202, 0.03166332095861435, 0.03283986821770668, 0.03401641547679901, 0.03519296646118164, 0.03636951372027397, 0.0375460609793663, 0.03872261196374893, 0.03989915922284126, 0.041075706481933594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 9.0, 15.0, 26.0, 44.0, 61.0, 79.0, 132.0, 212.0, 393.0, 1208.0, 3823.0, 18501.0, 398648.0, 3593385.0, 164107.0, 9893.0, 2313.0, 603.0, 288.0, 157.0, 123.0, 77.0, 58.0, 33.0, 20.0, 21.0, 12.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00762176513671875, -0.007393479347229004, -0.007165193557739258, -0.006936907768249512, -0.006708621978759766, -0.0064803361892700195, -0.0062520503997802734, -0.006023764610290527, -0.005795478820800781, -0.005567193031311035, -0.005338907241821289, -0.005110621452331543, -0.004882335662841797, -0.004654049873352051, -0.004425764083862305, -0.004197478294372559, -0.0039691925048828125, -0.0037409067153930664, -0.0035126209259033203, -0.0032843351364135742, -0.003056049346923828, -0.002827763557434082, -0.002599477767944336, -0.00237119197845459, -0.0021429061889648438, -0.0019146203994750977, -0.0016863346099853516, -0.0014580488204956055, -0.0012297630310058594, -0.0010014772415161133, -0.0007731914520263672, -0.0005449056625366211, -0.000316619873046875, -8.83340835571289e-05, 0.0001399517059326172, 0.0003682374954223633, 0.0005965232849121094, 0.0008248090744018555, 0.0010530948638916016, 0.0012813806533813477, 0.0015096664428710938, 0.0017379522323608398, 0.001966238021850586, 0.002194523811340332, 0.002422809600830078, 0.0026510953903198242, 0.0028793811798095703, 0.0031076669692993164, 0.0033359527587890625, 0.0035642385482788086, 0.0037925243377685547, 0.004020810127258301, 0.004249095916748047, 0.004477381706237793, 0.004705667495727539, 0.004933953285217285, 0.005162239074707031, 0.005390524864196777, 0.0056188106536865234, 0.0058470964431762695, 0.006075382232666016, 0.006303668022155762, 0.006531953811645508, 0.006760239601135254, 0.006988525390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 10.0, 9.0, 9.0, 23.0, 27.0, 60.0, 67.0, 85.0, 126.0, 152.0, 116.0, 97.0, 90.0, 49.0, 26.0, 22.0, 16.0, 9.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007266998291015625, -0.007013142108917236, -0.006759285926818848, -0.006505429744720459, -0.00625157356262207, -0.005997717380523682, -0.005743861198425293, -0.005490005016326904, -0.005236148834228516, -0.004982292652130127, -0.004728436470031738, -0.00447458028793335, -0.004220724105834961, -0.003966867923736572, -0.0037130117416381836, -0.003459155559539795, -0.0032052993774414062, -0.0029514431953430176, -0.002697587013244629, -0.0024437308311462402, -0.0021898746490478516, -0.0019360184669494629, -0.0016821622848510742, -0.0014283061027526855, -0.0011744499206542969, -0.0009205937385559082, -0.0006667375564575195, -0.00041288137435913086, -0.0001590251922607422, 9.483098983764648e-05, 0.00034868717193603516, 0.0006025433540344238, 0.0008563995361328125, 0.0011102557182312012, 0.0013641119003295898, 0.0016179680824279785, 0.0018718242645263672, 0.002125680446624756, 0.0023795366287231445, 0.002633392810821533, 0.002887248992919922, 0.0031411051750183105, 0.0033949613571166992, 0.003648817539215088, 0.0039026737213134766, 0.004156529903411865, 0.004410386085510254, 0.004664242267608643, 0.004918098449707031, 0.00517195463180542, 0.005425810813903809, 0.005679666996002197, 0.005933523178100586, 0.006187379360198975, 0.006441235542297363, 0.006695091724395752, 0.006948947906494141, 0.007202804088592529, 0.007456660270690918, 0.007710516452789307, 0.007964372634887695, 0.008218228816986084, 0.008472084999084473, 0.008725941181182861, 0.00897979736328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 16.0, 23.0, 44.0, 70.0, 164.0, 297.0, 724.0, 2481.0, 22229.0, 3891278.0, 268545.0, 6138.0, 1291.0, 457.0, 227.0, 134.0, 58.0, 33.0, 26.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01273345947265625, -0.01239621639251709, -0.01205897331237793, -0.01172173023223877, -0.01138448715209961, -0.01104724407196045, -0.010710000991821289, -0.010372757911682129, -0.010035514831542969, -0.009698271751403809, -0.009361028671264648, -0.009023785591125488, -0.008686542510986328, -0.008349299430847168, -0.008012056350708008, -0.007674813270568848, -0.0073375701904296875, -0.007000327110290527, -0.006663084030151367, -0.006325840950012207, -0.005988597869873047, -0.005651354789733887, -0.0053141117095947266, -0.004976868629455566, -0.004639625549316406, -0.004302382469177246, -0.003965139389038086, -0.0036278963088989258, -0.0032906532287597656, -0.0029534101486206055, -0.0026161670684814453, -0.002278923988342285, -0.001941680908203125, -0.0016044378280639648, -0.0012671947479248047, -0.0009299516677856445, -0.0005927085876464844, -0.0002554655075073242, 8.177757263183594e-05, 0.0004190206527709961, 0.0007562637329101562, 0.0010935068130493164, 0.0014307498931884766, 0.0017679929733276367, 0.002105236053466797, 0.002442479133605957, 0.002779722213745117, 0.0031169652938842773, 0.0034542083740234375, 0.0037914514541625977, 0.004128694534301758, 0.004465937614440918, 0.004803180694580078, 0.005140423774719238, 0.0054776668548583984, 0.005814909934997559, 0.006152153015136719, 0.006489396095275879, 0.006826639175415039, 0.007163882255554199, 0.007501125335693359, 0.00783836841583252, 0.00817561149597168, 0.00851285457611084, 0.00885009765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 10.0, 18.0, 26.0, 57.0, 144.0, 342.0, 728.0, 1090.0, 849.0, 464.0, 176.0, 73.0, 30.0, 29.0, 14.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005584716796875, -0.005314230918884277, -0.005043745040893555, -0.004773259162902832, -0.004502773284912109, -0.004232287406921387, -0.003961801528930664, -0.0036913156509399414, -0.0034208297729492188, -0.003150343894958496, -0.0028798580169677734, -0.0026093721389770508, -0.002338886260986328, -0.0020684003829956055, -0.0017979145050048828, -0.0015274286270141602, -0.0012569427490234375, -0.0009864568710327148, -0.0007159709930419922, -0.00044548511505126953, -0.00017499923706054688, 9.548664093017578e-05, 0.00036597251892089844, 0.0006364583969116211, 0.0009069442749023438, 0.0011774301528930664, 0.001447916030883789, 0.0017184019088745117, 0.0019888877868652344, 0.002259373664855957, 0.0025298595428466797, 0.0028003454208374023, 0.003070831298828125, 0.0033413171768188477, 0.0036118030548095703, 0.003882288932800293, 0.004152774810791016, 0.004423260688781738, 0.004693746566772461, 0.004964232444763184, 0.005234718322753906, 0.005505204200744629, 0.0057756900787353516, 0.006046175956726074, 0.006316661834716797, 0.0065871477127075195, 0.006857633590698242, 0.007128119468688965, 0.0073986053466796875, 0.00766909122467041, 0.007939577102661133, 0.008210062980651855, 0.008480548858642578, 0.0087510347366333, 0.009021520614624023, 0.009292006492614746, 0.009562492370605469, 0.009832978248596191, 0.010103464126586914, 0.010373950004577637, 0.01064443588256836, 0.010914921760559082, 0.011185407638549805, 0.011455893516540527, 0.01172637939453125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 21.0, 22.0, 41.0, 64.0, 93.0, 107.0, 163.0, 130.0, 92.0, 92.0, 42.0, 42.0, 18.0, 17.0, 4.0, 14.0, 5.0, 1.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.02202855423092842, -0.020994314923882484, -0.0199600737541914, -0.018925834447145462, -0.017891593277454376, -0.01685735397040844, -0.015823114663362503, -0.014788874424993992, -0.01375463418662548, -0.01272039394825697, -0.011686153709888458, -0.010651914402842522, -0.00961767416447401, -0.0085834339261055, -0.007549194153398275, -0.0065149543806910515, -0.00548071414232254, -0.004446473903954029, -0.003412234131246805, -0.0023779941257089376, -0.00134375412017107, -0.0003095138818025589, 0.000724725890904665, 0.0017589656636118889, 0.0027932059019804, 0.0038274459075182676, 0.004861685913056135, 0.005895925685763359, 0.00693016592413187, 0.007964406162500381, 0.008998645469546318, 0.01003288570791483, 0.011067129671573639, 0.01210136990994215, 0.013135610148310661, 0.014169849455356598, 0.015204089693725109, 0.01623832993209362, 0.017272569239139557, 0.018306810408830643, 0.01934104971587658, 0.020375289022922516, 0.0214095301926136, 0.02244376949965954, 0.023478008806705475, 0.02451224997639656, 0.025546489283442497, 0.026580728590488434, 0.02761496976017952, 0.028649209067225456, 0.029683450236916542, 0.03071768954396248, 0.031751930713653564, 0.03278616815805435, 0.03382040932774544, 0.03485465049743652, 0.03588888794183731, 0.0369231291115284, 0.037957366555929184, 0.03899160772562027, 0.040025848895311356, 0.04106009006500244, 0.04209432750940323, 0.043128568679094315, 0.0441628098487854]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 10.0, 7.0, 12.0, 8.0, 12.0, 17.0, 17.0, 17.0, 20.0, 25.0, 34.0, 24.0, 41.0, 51.0, 57.0, 36.0, 45.0, 57.0, 60.0, 48.0, 45.0, 50.0, 40.0, 43.0, 34.0, 24.0, 26.0, 10.0, 16.0, 13.0, 14.0, 17.0, 10.0, 9.0, 10.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.019015789031982422, -0.01829322800040245, -0.01757066510617733, -0.01684810221195221, -0.016125541180372238, -0.015402979217469692, -0.014680417254567146, -0.0139578552916646, -0.013235293328762054, -0.012512731365859509, -0.011790169402956963, -0.011067607440054417, -0.01034504547715187, -0.009622483514249325, -0.008899921551346779, -0.008177359588444233, -0.007454797625541687, -0.006732235662639141, -0.006009673699736595, -0.005287111736834049, -0.004564549773931503, -0.0038419878110289574, -0.0031194258481264114, -0.0023968638852238655, -0.0016743019223213196, -0.0009517399594187737, -0.00022917799651622772, 0.0004933839663863182, 0.0012159459292888641, 0.00193850789219141, 0.002661069855093956, 0.003383631817996502, 0.004106193780899048, 0.004828755743801594, 0.00555131770670414, 0.006273879669606686, 0.006996441632509232, 0.0077190035954117775, 0.008441565558314323, 0.00916412752121687, 0.009886689484119415, 0.010609251447021961, 0.011331813409924507, 0.012054375372827053, 0.012776937335729599, 0.013499499298632145, 0.01422206126153469, 0.014944623224437237, 0.015667185187339783, 0.016389746218919754, 0.017112309113144875, 0.017834872007369995, 0.018557433038949966, 0.019279994070529938, 0.02000255696475506, 0.02072511985898018, 0.02144768089056015, 0.02217024192214012, 0.022892804816365242, 0.023615367710590363, 0.024337928742170334, 0.025060489773750305, 0.025783052667975426, 0.026505615562200546, 0.027228176593780518]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 7.0, 5.0, 8.0, 14.0, 18.0, 24.0, 18.0, 52.0, 57.0, 93.0, 137.0, 195.0, 366.0, 717.0, 1382.0, 3015.0, 7844.0, 24992.0, 107828.0, 497145.0, 316374.0, 61892.0, 16169.0, 5405.0, 2276.0, 1053.0, 585.0, 302.0, 194.0, 124.0, 74.0, 55.0, 36.0, 27.0, 13.0, 16.0, 14.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.007717132568359375, -0.00748896598815918, -0.007260799407958984, -0.007032632827758789, -0.006804466247558594, -0.0065762996673583984, -0.006348133087158203, -0.006119966506958008, -0.0058917999267578125, -0.005663633346557617, -0.005435466766357422, -0.0052073001861572266, -0.004979133605957031, -0.004750967025756836, -0.004522800445556641, -0.004294633865356445, -0.00406646728515625, -0.0038383007049560547, -0.0036101341247558594, -0.003381967544555664, -0.0031538009643554688, -0.0029256343841552734, -0.002697467803955078, -0.002469301223754883, -0.0022411346435546875, -0.002012968063354492, -0.0017848014831542969, -0.0015566349029541016, -0.0013284683227539062, -0.001100301742553711, -0.0008721351623535156, -0.0006439685821533203, -0.000415802001953125, -0.0001876354217529297, 4.0531158447265625e-05, 0.00026869773864746094, 0.0004968643188476562, 0.0007250308990478516, 0.0009531974792480469, 0.0011813640594482422, 0.0014095306396484375, 0.0016376972198486328, 0.0018658638000488281, 0.0020940303802490234, 0.0023221969604492188, 0.002550363540649414, 0.0027785301208496094, 0.0030066967010498047, 0.00323486328125, 0.0034630298614501953, 0.0036911964416503906, 0.003919363021850586, 0.004147529602050781, 0.0043756961822509766, 0.004603862762451172, 0.004832029342651367, 0.0050601959228515625, 0.005288362503051758, 0.005516529083251953, 0.0057446956634521484, 0.005972862243652344, 0.006201028823852539, 0.006429195404052734, 0.00665736198425293, 0.006885528564453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 15.0, 20.0, 33.0, 64.0, 81.0, 116.0, 96.0, 143.0, 119.0, 101.0, 69.0, 63.0, 20.0, 17.0, 19.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007251739501953125, -0.006996810436248779, -0.006741881370544434, -0.006486952304840088, -0.006232023239135742, -0.0059770941734313965, -0.005722165107727051, -0.005467236042022705, -0.005212306976318359, -0.004957377910614014, -0.004702448844909668, -0.004447519779205322, -0.0041925907135009766, -0.003937661647796631, -0.003682732582092285, -0.0034278035163879395, -0.0031728744506835938, -0.002917945384979248, -0.0026630163192749023, -0.0024080872535705566, -0.002153158187866211, -0.0018982291221618652, -0.0016433000564575195, -0.0013883709907531738, -0.0011334419250488281, -0.0008785128593444824, -0.0006235837936401367, -0.000368654727935791, -0.00011372566223144531, 0.0001412034034729004, 0.0003961324691772461, 0.0006510615348815918, 0.0009059906005859375, 0.0011609196662902832, 0.001415848731994629, 0.0016707777976989746, 0.0019257068634033203, 0.002180635929107666, 0.0024355649948120117, 0.0026904940605163574, 0.002945423126220703, 0.003200352191925049, 0.0034552812576293945, 0.0037102103233337402, 0.003965139389038086, 0.004220068454742432, 0.004474997520446777, 0.004729926586151123, 0.004984855651855469, 0.0052397847175598145, 0.00549471378326416, 0.005749642848968506, 0.0060045719146728516, 0.006259500980377197, 0.006514430046081543, 0.006769359111785889, 0.007024288177490234, 0.00727921724319458, 0.007534146308898926, 0.0077890753746032715, 0.008044004440307617, 0.008298933506011963, 0.008553862571716309, 0.008808791637420654, 0.009063720703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 9.0, 12.0, 9.0, 10.0, 16.0, 23.0, 27.0, 50.0, 50.0, 101.0, 120.0, 173.0, 314.0, 499.0, 798.0, 1657.0, 4854.0, 23852.0, 219051.0, 724908.0, 57892.0, 8941.0, 2410.0, 1124.0, 619.0, 342.0, 210.0, 139.0, 94.0, 64.0, 41.0, 38.0, 25.0, 21.0, 21.0, 12.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00908660888671875, -0.008795499801635742, -0.008504390716552734, -0.008213281631469727, -0.007922172546386719, -0.007631063461303711, -0.007339954376220703, -0.007048845291137695, -0.0067577362060546875, -0.00646662712097168, -0.006175518035888672, -0.005884408950805664, -0.005593299865722656, -0.0053021907806396484, -0.005011081695556641, -0.004719972610473633, -0.004428863525390625, -0.004137754440307617, -0.0038466453552246094, -0.0035555362701416016, -0.0032644271850585938, -0.002973318099975586, -0.002682209014892578, -0.0023910999298095703, -0.0020999908447265625, -0.0018088817596435547, -0.0015177726745605469, -0.001226663589477539, -0.0009355545043945312, -0.0006444454193115234, -0.0003533363342285156, -6.222724914550781e-05, 0.0002288818359375, 0.0005199909210205078, 0.0008111000061035156, 0.0011022090911865234, 0.0013933181762695312, 0.001684427261352539, 0.001975536346435547, 0.0022666454315185547, 0.0025577545166015625, 0.0028488636016845703, 0.003139972686767578, 0.003431081771850586, 0.0037221908569335938, 0.0040132999420166016, 0.004304409027099609, 0.004595518112182617, 0.004886627197265625, 0.005177736282348633, 0.005468845367431641, 0.0057599544525146484, 0.006051063537597656, 0.006342172622680664, 0.006633281707763672, 0.00692439079284668, 0.0072154998779296875, 0.007506608963012695, 0.007797718048095703, 0.008088827133178711, 0.008379936218261719, 0.008671045303344727, 0.008962154388427734, 0.009253263473510742, 0.00954437255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 4.0, 7.0, 13.0, 9.0, 18.0, 30.0, 30.0, 44.0, 32.0, 44.0, 69.0, 70.0, 61.0, 61.0, 65.0, 62.0, 58.0, 50.0, 55.0, 45.0, 31.0, 29.0, 22.0, 21.0, 16.0, 10.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01593017578125, -0.0154496431350708, -0.014969110488891602, -0.014488577842712402, -0.014008045196533203, -0.013527512550354004, -0.013046979904174805, -0.012566447257995605, -0.012085914611816406, -0.011605381965637207, -0.011124849319458008, -0.010644316673278809, -0.01016378402709961, -0.00968325138092041, -0.009202718734741211, -0.008722186088562012, -0.008241653442382812, -0.007761120796203613, -0.007280588150024414, -0.006800055503845215, -0.006319522857666016, -0.005838990211486816, -0.005358457565307617, -0.004877924919128418, -0.004397392272949219, -0.0039168596267700195, -0.0034363269805908203, -0.002955794334411621, -0.002475261688232422, -0.0019947290420532227, -0.0015141963958740234, -0.0010336637496948242, -0.000553131103515625, -7.259845733642578e-05, 0.00040793418884277344, 0.0008884668350219727, 0.0013689994812011719, 0.001849532127380371, 0.0023300647735595703, 0.0028105974197387695, 0.0032911300659179688, 0.003771662712097168, 0.004252195358276367, 0.004732728004455566, 0.005213260650634766, 0.005693793296813965, 0.006174325942993164, 0.006654858589172363, 0.0071353912353515625, 0.007615923881530762, 0.008096456527709961, 0.00857698917388916, 0.00905752182006836, 0.009538054466247559, 0.010018587112426758, 0.010499119758605957, 0.010979652404785156, 0.011460185050964355, 0.011940717697143555, 0.012421250343322754, 0.012901782989501953, 0.013382315635681152, 0.013862848281860352, 0.01434338092803955, 0.01482391357421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 5.0, 8.0, 5.0, 9.0, 16.0, 23.0, 42.0, 52.0, 70.0, 140.0, 235.0, 419.0, 814.0, 2102.0, 6603.0, 29399.0, 224223.0, 710576.0, 57515.0, 10814.0, 3096.0, 1150.0, 513.0, 258.0, 185.0, 86.0, 59.0, 35.0, 28.0, 12.0, 12.0, 16.0, 6.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.001682281494140625, -0.0016330629587173462, -0.0015838444232940674, -0.0015346258878707886, -0.0014854073524475098, -0.001436188817024231, -0.0013869702816009521, -0.0013377517461776733, -0.0012885332107543945, -0.0012393146753311157, -0.001190096139907837, -0.001140877604484558, -0.0010916590690612793, -0.0010424405336380005, -0.0009932219982147217, -0.0009440034627914429, -0.0008947849273681641, -0.0008455663919448853, -0.0007963478565216064, -0.0007471293210983276, -0.0006979107856750488, -0.00064869225025177, -0.0005994737148284912, -0.0005502551794052124, -0.0005010366439819336, -0.0004518181085586548, -0.000402599573135376, -0.00035338103771209717, -0.00030416250228881836, -0.00025494396686553955, -0.00020572543144226074, -0.00015650689601898193, -0.00010728836059570312, -5.8069825172424316e-05, -8.851289749145508e-06, 4.03672456741333e-05, 8.958578109741211e-05, 0.00013880431652069092, 0.00018802285194396973, 0.00023724138736724854, 0.00028645992279052734, 0.00033567845821380615, 0.00038489699363708496, 0.00043411552906036377, 0.0004833340644836426, 0.0005325525999069214, 0.0005817711353302002, 0.000630989670753479, 0.0006802082061767578, 0.0007294267416000366, 0.0007786452770233154, 0.0008278638124465942, 0.000877082347869873, 0.0009263008832931519, 0.0009755194187164307, 0.0010247379541397095, 0.0010739564895629883, 0.001123175024986267, 0.001172393560409546, 0.0012216120958328247, 0.0012708306312561035, 0.0013200491666793823, 0.0013692677021026611, 0.00141848623752594, 0.0014677047729492188]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 5.0, 2.0, 5.0, 8.0, 8.0, 8.0, 20.0, 11.0, 18.0, 15.0, 21.0, 16.0, 37.0, 33.0, 50.0, 30.0, 76.0, 43.0, 80.0, 55.0, 56.0, 69.0, 43.0, 53.0, 27.0, 32.0, 27.0, 42.0, 20.0, 13.0, 19.0, 9.0, 9.0, 9.0, 6.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.708766937255859e-06, -4.560686647891998e-06, -4.412606358528137e-06, -4.264526069164276e-06, -4.116445779800415e-06, -3.968365490436554e-06, -3.820285201072693e-06, -3.6722049117088318e-06, -3.5241246223449707e-06, -3.3760443329811096e-06, -3.2279640436172485e-06, -3.0798837542533875e-06, -2.9318034648895264e-06, -2.7837231755256653e-06, -2.635642886161804e-06, -2.487562596797943e-06, -2.339482307434082e-06, -2.191402018070221e-06, -2.04332172870636e-06, -1.8952414393424988e-06, -1.7471611499786377e-06, -1.5990808606147766e-06, -1.4510005712509155e-06, -1.3029202818870544e-06, -1.1548399925231934e-06, -1.0067597031593323e-06, -8.586794137954712e-07, -7.105991244316101e-07, -5.62518835067749e-07, -4.1443854570388794e-07, -2.6635825634002686e-07, -1.1827796697616577e-07, 2.9802322387695312e-08, 1.778826117515564e-07, 3.259629011154175e-07, 4.7404319047927856e-07, 6.221234798431396e-07, 7.702037692070007e-07, 9.182840585708618e-07, 1.066364347934723e-06, 1.214444637298584e-06, 1.362524926662445e-06, 1.5106052160263062e-06, 1.6586855053901672e-06, 1.8067657947540283e-06, 1.9548460841178894e-06, 2.1029263734817505e-06, 2.2510066628456116e-06, 2.3990869522094727e-06, 2.5471672415733337e-06, 2.695247530937195e-06, 2.843327820301056e-06, 2.991408109664917e-06, 3.139488399028778e-06, 3.287568688392639e-06, 3.4356489777565002e-06, 3.5837292671203613e-06, 3.7318095564842224e-06, 3.8798898458480835e-06, 4.027970135211945e-06, 4.176050424575806e-06, 4.324130713939667e-06, 4.472211003303528e-06, 4.620291292667389e-06, 4.76837158203125e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 4.0, 0.0, 7.0, 5.0, 24.0, 11.0, 27.0, 31.0, 44.0, 77.0, 85.0, 140.0, 253.0, 427.0, 916.0, 2108.0, 5885.0, 22629.0, 155876.0, 756513.0, 81469.0, 14421.0, 4229.0, 1631.0, 722.0, 398.0, 210.0, 131.0, 72.0, 61.0, 49.0, 27.0, 24.0, 14.0, 11.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001369476318359375, -0.0013243556022644043, -0.0012792348861694336, -0.0012341141700744629, -0.0011889934539794922, -0.0011438727378845215, -0.0010987520217895508, -0.00105363130569458, -0.0010085105895996094, -0.0009633898735046387, -0.000918269157409668, -0.0008731484413146973, -0.0008280277252197266, -0.0007829070091247559, -0.0007377862930297852, -0.0006926655769348145, -0.0006475448608398438, -0.000602424144744873, -0.0005573034286499023, -0.0005121827125549316, -0.00046706199645996094, -0.00042194128036499023, -0.00037682056427001953, -0.00033169984817504883, -0.0002865791320800781, -0.00024145841598510742, -0.00019633769989013672, -0.00015121698379516602, -0.00010609626770019531, -6.097555160522461e-05, -1.5854835510253906e-05, 2.9265880584716797e-05, 7.43865966796875e-05, 0.0001195073127746582, 0.0001646280288696289, 0.0002097487449645996, 0.0002548694610595703, 0.000299990177154541, 0.0003451108932495117, 0.0003902316093444824, 0.0004353523254394531, 0.00048047304153442383, 0.0005255937576293945, 0.0005707144737243652, 0.0006158351898193359, 0.0006609559059143066, 0.0007060766220092773, 0.000751197338104248, 0.0007963180541992188, 0.0008414387702941895, 0.0008865594863891602, 0.0009316802024841309, 0.0009768009185791016, 0.0010219216346740723, 0.001067042350769043, 0.0011121630668640137, 0.0011572837829589844, 0.001202404499053955, 0.0012475252151489258, 0.0012926459312438965, 0.0013377666473388672, 0.0013828873634338379, 0.0014280080795288086, 0.0014731287956237793, 0.00151824951171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 10.0, 16.0, 25.0, 23.0, 36.0, 57.0, 69.0, 75.0, 95.0, 108.0, 93.0, 76.0, 74.0, 56.0, 44.0, 36.0, 19.0, 11.0, 20.0, 11.0, 10.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0020904541015625, -0.0020330101251602173, -0.0019755661487579346, -0.0019181221723556519, -0.0018606781959533691, -0.0018032342195510864, -0.0017457902431488037, -0.001688346266746521, -0.0016309022903442383, -0.0015734583139419556, -0.0015160143375396729, -0.0014585703611373901, -0.0014011263847351074, -0.0013436824083328247, -0.001286238431930542, -0.0012287944555282593, -0.0011713504791259766, -0.0011139065027236938, -0.0010564625263214111, -0.0009990185499191284, -0.0009415745735168457, -0.000884130597114563, -0.0008266866207122803, -0.0007692426443099976, -0.0007117986679077148, -0.0006543546915054321, -0.0005969107151031494, -0.0005394667387008667, -0.000482022762298584, -0.00042457878589630127, -0.00036713480949401855, -0.00030969083309173584, -0.0002522468566894531, -0.0001948028802871704, -0.0001373589038848877, -7.991492748260498e-05, -2.2470951080322266e-05, 3.497302532196045e-05, 9.241700172424316e-05, 0.00014986097812652588, 0.0002073049545288086, 0.0002647489309310913, 0.000322192907333374, 0.00037963688373565674, 0.00043708086013793945, 0.0004945248365402222, 0.0005519688129425049, 0.0006094127893447876, 0.0006668567657470703, 0.000724300742149353, 0.0007817447185516357, 0.0008391886949539185, 0.0008966326713562012, 0.0009540766477584839, 0.0010115206241607666, 0.0010689646005630493, 0.001126408576965332, 0.0011838525533676147, 0.0012412965297698975, 0.0012987405061721802, 0.0013561844825744629, 0.0014136284589767456, 0.0014710724353790283, 0.001528516411781311, 0.0015859603881835938]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 26.0, 86.0, 198.0, 421.0, 166.0, 56.0, 19.0, 15.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0683184489607811, -0.06560777872800827, -0.06289711594581604, -0.06018644571304321, -0.057475775480270386, -0.05476510524749756, -0.05205443874001503, -0.0493437722325325, -0.046633101999759674, -0.04392243176698685, -0.04121176525950432, -0.03850109875202179, -0.03579042851924896, -0.033079758286476135, -0.030369091778993607, -0.02765842340886593, -0.02494775503873825, -0.022237086668610573, -0.019526418298482895, -0.016815749928355217, -0.014105081558227539, -0.011394413188099861, -0.008683744817972183, -0.005973076447844505, -0.0032624080777168274, -0.0005517397075891495, 0.0021589286625385284, 0.004869597032666206, 0.007580265402793884, 0.010290933772921562, 0.01300160214304924, 0.015712270513176918, 0.018422946333885193, 0.02113361470401287, 0.02384428307414055, 0.026554951444268227, 0.029265619814395905, 0.03197629004716873, 0.03468695655465126, 0.03739762306213379, 0.040108293294906616, 0.04281896352767944, 0.04552963003516197, 0.0482402965426445, 0.05095096677541733, 0.053661637008190155, 0.056372303515672684, 0.05908297002315521, 0.06179364025592804, 0.06450431048870087, 0.0672149807214737, 0.06992564350366592, 0.07263631373643875, 0.07534698396921158, 0.07805764675140381, 0.08076831698417664, 0.08347898721694946, 0.08618965744972229, 0.08890032768249512, 0.09161099046468735, 0.09432166069746017, 0.097032330930233, 0.09974299371242523, 0.10245366394519806, 0.10516433417797089]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 3.0, 5.0, 6.0, 12.0, 13.0, 14.0, 18.0, 26.0, 26.0, 26.0, 31.0, 29.0, 42.0, 77.0, 135.0, 154.0, 87.0, 38.0, 41.0, 33.0, 28.0, 24.0, 18.0, 21.0, 19.0, 17.0, 6.0, 14.0, 8.0, 7.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05504107475280762, -0.053425658494234085, -0.05181024223566055, -0.05019482597708702, -0.04857940971851349, -0.04696399345993996, -0.045348577201366425, -0.04373316094279289, -0.04211774468421936, -0.04050232842564583, -0.038886912167072296, -0.037271495908498764, -0.03565607964992523, -0.0340406633913517, -0.03242524713277817, -0.030809830874204636, -0.029194414615631104, -0.02757899835705757, -0.02596358209848404, -0.024348165839910507, -0.022732749581336975, -0.021117333322763443, -0.01950191706418991, -0.01788650080561638, -0.016271084547042847, -0.014655668288469315, -0.013040252029895782, -0.01142483577132225, -0.009809419512748718, -0.008194003254175186, -0.006578586995601654, -0.004963170737028122, -0.00334775447845459, -0.0017323382198810577, -0.00011692196130752563, 0.0014984942972660065, 0.0031139105558395386, 0.004729326814413071, 0.006344743072986603, 0.007960159331560135, 0.009575575590133667, 0.011190991848707199, 0.012806408107280731, 0.014421824365854263, 0.016037240624427795, 0.017652656883001328, 0.01926807314157486, 0.02088348940014839, 0.022498905658721924, 0.024114321917295456, 0.025729738175868988, 0.02734515443444252, 0.028960570693016052, 0.030575986951589584, 0.032191403210163116, 0.03380681946873665, 0.03542223572731018, 0.03703765198588371, 0.038653068244457245, 0.04026848450303078, 0.04188390076160431, 0.04349931702017784, 0.04511473327875137, 0.046730149537324905, 0.04834556579589844]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 7.0, 7.0, 10.0, 24.0, 28.0, 42.0, 55.0, 118.0, 270.0, 865.0, 1957.0, 4809.0, 15930.0, 95622.0, 1290094.0, 2515807.0, 236186.0, 22266.0, 6579.0, 2199.0, 700.0, 307.0, 129.0, 93.0, 61.0, 31.0, 24.0, 18.0, 20.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005218505859375, -0.005026519298553467, -0.004834532737731934, -0.0046425461769104, -0.004450559616088867, -0.004258573055267334, -0.004066586494445801, -0.0038745999336242676, -0.0036826133728027344, -0.003490626811981201, -0.003298640251159668, -0.0031066536903381348, -0.0029146671295166016, -0.0027226805686950684, -0.002530694007873535, -0.002338707447052002, -0.0021467208862304688, -0.0019547343254089355, -0.0017627477645874023, -0.0015707612037658691, -0.001378774642944336, -0.0011867880821228027, -0.0009948015213012695, -0.0008028149604797363, -0.0006108283996582031, -0.0004188418388366699, -0.00022685527801513672, -3.4868717193603516e-05, 0.0001571178436279297, 0.0003491044044494629, 0.0005410909652709961, 0.0007330775260925293, 0.0009250640869140625, 0.0011170506477355957, 0.001309037208557129, 0.0015010237693786621, 0.0016930103302001953, 0.0018849968910217285, 0.0020769834518432617, 0.002268970012664795, 0.002460956573486328, 0.0026529431343078613, 0.0028449296951293945, 0.0030369162559509277, 0.003228902816772461, 0.003420889377593994, 0.0036128759384155273, 0.0038048624992370605, 0.003996849060058594, 0.004188835620880127, 0.00438082218170166, 0.004572808742523193, 0.0047647953033447266, 0.00495678186416626, 0.005148768424987793, 0.005340754985809326, 0.005532741546630859, 0.005724728107452393, 0.005916714668273926, 0.006108701229095459, 0.006300687789916992, 0.006492674350738525, 0.006684660911560059, 0.006876647472381592, 0.007068634033203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 13.0, 4.0, 13.0, 17.0, 45.0, 63.0, 90.0, 116.0, 125.0, 125.0, 110.0, 95.0, 62.0, 42.0, 31.0, 23.0, 17.0, 7.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007251739501953125, -0.00699537992477417, -0.006739020347595215, -0.00648266077041626, -0.006226301193237305, -0.00596994161605835, -0.0057135820388793945, -0.0054572224617004395, -0.005200862884521484, -0.004944503307342529, -0.004688143730163574, -0.004431784152984619, -0.004175424575805664, -0.003919064998626709, -0.003662705421447754, -0.003406345844268799, -0.0031499862670898438, -0.0028936266899108887, -0.0026372671127319336, -0.0023809075355529785, -0.0021245479583740234, -0.0018681883811950684, -0.0016118288040161133, -0.0013554692268371582, -0.0010991096496582031, -0.000842750072479248, -0.000586390495300293, -0.0003300309181213379, -7.367134094238281e-05, 0.00018268823623657227, 0.00043904781341552734, 0.0006954073905944824, 0.0009517669677734375, 0.0012081265449523926, 0.0014644861221313477, 0.0017208456993103027, 0.001977205276489258, 0.002233564853668213, 0.002489924430847168, 0.002746284008026123, 0.003002643585205078, 0.003259003162384033, 0.0035153627395629883, 0.0037717223167419434, 0.0040280818939208984, 0.0042844414710998535, 0.004540801048278809, 0.004797160625457764, 0.005053520202636719, 0.005309879779815674, 0.005566239356994629, 0.005822598934173584, 0.006078958511352539, 0.006335318088531494, 0.006591677665710449, 0.006848037242889404, 0.007104396820068359, 0.0073607563972473145, 0.0076171159744262695, 0.007873475551605225, 0.00812983512878418, 0.008386194705963135, 0.00864255428314209, 0.008898913860321045, 0.0091552734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 8.0, 17.0, 32.0, 72.0, 196.0, 613.0, 3480.0, 4065049.0, 122162.0, 1904.0, 456.0, 157.0, 62.0, 37.0, 12.0, 13.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038604736328125, -0.03726673126220703, -0.03592872619628906, -0.034590721130371094, -0.033252716064453125, -0.031914710998535156, -0.030576705932617188, -0.02923870086669922, -0.02790069580078125, -0.02656269073486328, -0.025224685668945312, -0.023886680603027344, -0.022548675537109375, -0.021210670471191406, -0.019872665405273438, -0.01853466033935547, -0.0171966552734375, -0.01585865020751953, -0.014520645141601562, -0.013182640075683594, -0.011844635009765625, -0.010506629943847656, -0.009168624877929688, -0.007830619812011719, -0.00649261474609375, -0.005154609680175781, -0.0038166046142578125, -0.0024785995483398438, -0.001140594482421875, 0.00019741058349609375, 0.0015354156494140625, 0.0028734207153320312, 0.00421142578125, 0.005549430847167969, 0.0068874359130859375, 0.008225440979003906, 0.009563446044921875, 0.010901451110839844, 0.012239456176757812, 0.013577461242675781, 0.01491546630859375, 0.01625347137451172, 0.017591476440429688, 0.018929481506347656, 0.020267486572265625, 0.021605491638183594, 0.022943496704101562, 0.02428150177001953, 0.0256195068359375, 0.02695751190185547, 0.028295516967773438, 0.029633522033691406, 0.030971527099609375, 0.032309532165527344, 0.03364753723144531, 0.03498554229736328, 0.03632354736328125, 0.03766155242919922, 0.03899955749511719, 0.040337562561035156, 0.041675567626953125, 0.043013572692871094, 0.04435157775878906, 0.04568958282470703, 0.047027587890625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 9.0, 10.0, 12.0, 24.0, 36.0, 61.0, 114.0, 225.0, 490.0, 1115.0, 1069.0, 459.0, 216.0, 102.0, 62.0, 24.0, 17.0, 11.0, 5.0, 11.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0099945068359375, -0.009407281875610352, -0.008820056915283203, -0.008232831954956055, -0.007645606994628906, -0.007058382034301758, -0.006471157073974609, -0.005883932113647461, -0.0052967071533203125, -0.004709482192993164, -0.004122257232666016, -0.003535032272338867, -0.0029478073120117188, -0.0023605823516845703, -0.0017733573913574219, -0.0011861324310302734, -0.000598907470703125, -1.1682510375976562e-05, 0.0005755424499511719, 0.0011627674102783203, 0.0017499923706054688, 0.002337217330932617, 0.0029244422912597656, 0.003511667251586914, 0.0040988922119140625, 0.004686117172241211, 0.005273342132568359, 0.005860567092895508, 0.006447792053222656, 0.007035017013549805, 0.007622241973876953, 0.008209466934204102, 0.00879669189453125, 0.009383916854858398, 0.009971141815185547, 0.010558366775512695, 0.011145591735839844, 0.011732816696166992, 0.01232004165649414, 0.012907266616821289, 0.013494491577148438, 0.014081716537475586, 0.014668941497802734, 0.015256166458129883, 0.01584339141845703, 0.01643061637878418, 0.017017841339111328, 0.017605066299438477, 0.018192291259765625, 0.018779516220092773, 0.019366741180419922, 0.01995396614074707, 0.02054119110107422, 0.021128416061401367, 0.021715641021728516, 0.022302865982055664, 0.022890090942382812, 0.02347731590270996, 0.02406454086303711, 0.024651765823364258, 0.025238990783691406, 0.025826215744018555, 0.026413440704345703, 0.02700066566467285, 0.027587890625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 15.0, 46.0, 83.0, 135.0, 236.0, 208.0, 111.0, 63.0, 29.0, 14.0, 5.0, 10.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0895826444029808, -0.08583042770624161, -0.08207820355892181, -0.07832598686218262, -0.07457377016544342, -0.07082155346870422, -0.06706933677196503, -0.06331711262464523, -0.059564895927906036, -0.05581267923116684, -0.052060458809137344, -0.04830823838710785, -0.04455602169036865, -0.040803804993629456, -0.03705158457159996, -0.033299364149570465, -0.02954714745283127, -0.025794928893446922, -0.022042710334062576, -0.01829049177467823, -0.014538273215293884, -0.010786054655909538, -0.007033836096525192, -0.0032816175371408463, 0.00047060102224349976, 0.004222819581627846, 0.007975038141012192, 0.011727256700396538, 0.015479475259780884, 0.01923169381916523, 0.022983912378549576, 0.026736130937933922, 0.03048834204673767, 0.03424055874347687, 0.03799277916550636, 0.04174499958753586, 0.045497216284275055, 0.04924943298101425, 0.05300165340304375, 0.05675387382507324, 0.06050609052181244, 0.06425830721855164, 0.06801052391529083, 0.07176274806261063, 0.07551496475934982, 0.07926718145608902, 0.08301940560340881, 0.08677162230014801, 0.09052383899688721, 0.0942760556936264, 0.0980282723903656, 0.1017804965376854, 0.10553271323442459, 0.10928492993116379, 0.11303715407848358, 0.11678937077522278, 0.12054158747196198, 0.12429380416870117, 0.12804602086544037, 0.13179823756217957, 0.13555046916007996, 0.13930268585681915, 0.14305490255355835, 0.14680711925029755, 0.15055933594703674]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 9.0, 10.0, 21.0, 25.0, 21.0, 44.0, 46.0, 82.0, 83.0, 118.0, 125.0, 106.0, 79.0, 79.0, 50.0, 45.0, 17.0, 14.0, 12.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09496647119522095, -0.09070610255002975, -0.08644573390483856, -0.08218536525964737, -0.07792499661445618, -0.07366463541984558, -0.06940426677465439, -0.0651438981294632, -0.060883529484272, -0.05662316083908081, -0.05236279219388962, -0.048102427273988724, -0.04384205862879753, -0.03958168998360634, -0.035321325063705444, -0.03106095641851425, -0.02680058777332306, -0.022540219128131866, -0.018279852345585823, -0.014019484631717205, -0.009759116917848587, -0.005498748272657394, -0.001238381490111351, 0.0030219852924346924, 0.007282353937625885, 0.011542721651494503, 0.01580308936536312, 0.020063456147909164, 0.024323824793100357, 0.02858419343829155, 0.032844558358192444, 0.037104927003383636, 0.04136529564857483, 0.04562566429376602, 0.049886032938957214, 0.05414639785885811, 0.0584067665040493, 0.0626671314239502, 0.06692750006914139, 0.07118786871433258, 0.07544823735952377, 0.07970860600471497, 0.08396897464990616, 0.08822934329509735, 0.09248970448970795, 0.09675008058547974, 0.10101044178009033, 0.10527081042528152, 0.10953117907047272, 0.11379154771566391, 0.1180519163608551, 0.1223122850060463, 0.1265726536512375, 0.13083301484584808, 0.13509339094161987, 0.13935375213623047, 0.14361411333084106, 0.14787447452545166, 0.15213485062122345, 0.15639521181583405, 0.16065558791160583, 0.16491594910621643, 0.16917632520198822, 0.17343668639659882, 0.1776970624923706]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 3.0, 4.0, 3.0, 7.0, 7.0, 11.0, 12.0, 15.0, 20.0, 32.0, 36.0, 68.0, 103.0, 131.0, 219.0, 364.0, 719.0, 1394.0, 3265.0, 8669.0, 28501.0, 147383.0, 687477.0, 129846.0, 26105.0, 7989.0, 3097.0, 1374.0, 690.0, 358.0, 212.0, 141.0, 80.0, 47.0, 38.0, 33.0, 20.0, 13.0, 19.0, 13.0, 10.0, 2.0, 5.0, 2.0, 8.0, 1.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00792694091796875, -0.00761568546295166, -0.00730443000793457, -0.0069931745529174805, -0.006681919097900391, -0.006370663642883301, -0.006059408187866211, -0.005748152732849121, -0.005436897277832031, -0.005125641822814941, -0.0048143863677978516, -0.004503130912780762, -0.004191875457763672, -0.003880620002746582, -0.003569364547729492, -0.0032581090927124023, -0.0029468536376953125, -0.0026355981826782227, -0.002324342727661133, -0.002013087272644043, -0.0017018318176269531, -0.0013905763626098633, -0.0010793209075927734, -0.0007680654525756836, -0.00045680999755859375, -0.0001455545425415039, 0.00016570091247558594, 0.0004769563674926758, 0.0007882118225097656, 0.0010994672775268555, 0.0014107227325439453, 0.0017219781875610352, 0.002033233642578125, 0.002344489097595215, 0.0026557445526123047, 0.0029670000076293945, 0.0032782554626464844, 0.0035895109176635742, 0.003900766372680664, 0.004212021827697754, 0.004523277282714844, 0.004834532737731934, 0.0051457881927490234, 0.005457043647766113, 0.005768299102783203, 0.006079554557800293, 0.006390810012817383, 0.006702065467834473, 0.0070133209228515625, 0.007324576377868652, 0.007635831832885742, 0.007947087287902832, 0.008258342742919922, 0.008569598197937012, 0.008880853652954102, 0.009192109107971191, 0.009503364562988281, 0.009814620018005371, 0.010125875473022461, 0.01043713092803955, 0.01074838638305664, 0.01105964183807373, 0.01137089729309082, 0.01168215274810791, 0.011993408203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 12.0, 21.0, 29.0, 42.0, 86.0, 135.0, 137.0, 142.0, 125.0, 87.0, 63.0, 38.0, 37.0, 27.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006771087646484375, -0.006403505802154541, -0.006035923957824707, -0.005668342113494873, -0.005300760269165039, -0.004933178424835205, -0.004565596580505371, -0.004198014736175537, -0.003830432891845703, -0.003462851047515869, -0.003095269203186035, -0.002727687358856201, -0.002360105514526367, -0.001992523670196533, -0.0016249418258666992, -0.0012573599815368652, -0.0008897781372070312, -0.0005221962928771973, -0.00015461444854736328, 0.0002129673957824707, 0.0005805492401123047, 0.0009481310844421387, 0.0013157129287719727, 0.0016832947731018066, 0.0020508766174316406, 0.0024184584617614746, 0.0027860403060913086, 0.0031536221504211426, 0.0035212039947509766, 0.0038887858390808105, 0.0042563676834106445, 0.0046239495277404785, 0.0049915313720703125, 0.0053591132164001465, 0.0057266950607299805, 0.0060942769050598145, 0.0064618587493896484, 0.006829440593719482, 0.007197022438049316, 0.00756460428237915, 0.007932186126708984, 0.008299767971038818, 0.008667349815368652, 0.009034931659698486, 0.00940251350402832, 0.009770095348358154, 0.010137677192687988, 0.010505259037017822, 0.010872840881347656, 0.01124042272567749, 0.011608004570007324, 0.011975586414337158, 0.012343168258666992, 0.012710750102996826, 0.01307833194732666, 0.013445913791656494, 0.013813495635986328, 0.014181077480316162, 0.014548659324645996, 0.01491624116897583, 0.015283823013305664, 0.015651404857635498, 0.016018986701965332, 0.016386568546295166, 0.016754150390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 6.0, 4.0, 5.0, 7.0, 12.0, 10.0, 16.0, 10.0, 18.0, 28.0, 36.0, 55.0, 72.0, 114.0, 174.0, 303.0, 557.0, 1200.0, 2994.0, 11970.0, 90059.0, 872751.0, 54890.0, 8494.0, 2533.0, 955.0, 509.0, 269.0, 153.0, 108.0, 66.0, 39.0, 25.0, 27.0, 21.0, 13.0, 11.0, 10.0, 8.0, 9.0, 0.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01068878173828125, -0.010348320007324219, -0.010007858276367188, -0.009667396545410156, -0.009326934814453125, -0.008986473083496094, -0.008646011352539062, -0.008305549621582031, -0.007965087890625, -0.007624626159667969, -0.0072841644287109375, -0.006943702697753906, -0.006603240966796875, -0.006262779235839844, -0.0059223175048828125, -0.005581855773925781, -0.00524139404296875, -0.004900932312011719, -0.0045604705810546875, -0.004220008850097656, -0.003879547119140625, -0.0035390853881835938, -0.0031986236572265625, -0.0028581619262695312, -0.0025177001953125, -0.0021772384643554688, -0.0018367767333984375, -0.0014963150024414062, -0.001155853271484375, -0.0008153915405273438, -0.0004749298095703125, -0.00013446807861328125, 0.00020599365234375, 0.0005464553833007812, 0.0008869171142578125, 0.0012273788452148438, 0.001567840576171875, 0.0019083023071289062, 0.0022487640380859375, 0.0025892257690429688, 0.0029296875, 0.0032701492309570312, 0.0036106109619140625, 0.003951072692871094, 0.004291534423828125, 0.004631996154785156, 0.0049724578857421875, 0.005312919616699219, 0.00565338134765625, 0.005993843078613281, 0.0063343048095703125, 0.006674766540527344, 0.007015228271484375, 0.007355690002441406, 0.0076961517333984375, 0.008036613464355469, 0.0083770751953125, 0.008717536926269531, 0.009057998657226562, 0.009398460388183594, 0.009738922119140625, 0.010079383850097656, 0.010419845581054688, 0.010760307312011719, 0.01110076904296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0, 7.0, 7.0, 6.0, 5.0, 6.0, 16.0, 11.0, 21.0, 19.0, 24.0, 28.0, 35.0, 55.0, 56.0, 69.0, 76.0, 86.0, 79.0, 62.0, 58.0, 40.0, 39.0, 40.0, 27.0, 24.0, 22.0, 13.0, 10.0, 13.0, 8.0, 5.0, 4.0, 6.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0196380615234375, -0.018996000289916992, -0.018353939056396484, -0.017711877822875977, -0.01706981658935547, -0.01642775535583496, -0.015785694122314453, -0.015143632888793945, -0.014501571655273438, -0.01385951042175293, -0.013217449188232422, -0.012575387954711914, -0.011933326721191406, -0.011291265487670898, -0.01064920425415039, -0.010007143020629883, -0.009365081787109375, -0.008723020553588867, -0.00808095932006836, -0.0074388980865478516, -0.006796836853027344, -0.006154775619506836, -0.005512714385986328, -0.00487065315246582, -0.0042285919189453125, -0.0035865306854248047, -0.002944469451904297, -0.002302408218383789, -0.0016603469848632812, -0.0010182857513427734, -0.0003762245178222656, 0.0002658367156982422, 0.00090789794921875, 0.0015499591827392578, 0.0021920204162597656, 0.0028340816497802734, 0.0034761428833007812, 0.004118204116821289, 0.004760265350341797, 0.005402326583862305, 0.0060443878173828125, 0.00668644905090332, 0.007328510284423828, 0.007970571517944336, 0.008612632751464844, 0.009254693984985352, 0.00989675521850586, 0.010538816452026367, 0.011180877685546875, 0.011822938919067383, 0.01246500015258789, 0.013107061386108398, 0.013749122619628906, 0.014391183853149414, 0.015033245086669922, 0.01567530632019043, 0.016317367553710938, 0.016959428787231445, 0.017601490020751953, 0.01824355125427246, 0.01888561248779297, 0.019527673721313477, 0.020169734954833984, 0.020811796188354492, 0.021453857421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 10.0, 7.0, 17.0, 25.0, 30.0, 62.0, 91.0, 191.0, 418.0, 1355.0, 6181.0, 137906.0, 889755.0, 9698.0, 1797.0, 500.0, 200.0, 96.0, 72.0, 40.0, 28.0, 24.0, 9.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0046844482421875, -0.004538536071777344, -0.0043926239013671875, -0.004246711730957031, -0.004100799560546875, -0.003954887390136719, -0.0038089752197265625, -0.0036630630493164062, -0.00351715087890625, -0.0033712387084960938, -0.0032253265380859375, -0.0030794143676757812, -0.002933502197265625, -0.0027875900268554688, -0.0026416778564453125, -0.0024957656860351562, -0.002349853515625, -0.0022039413452148438, -0.0020580291748046875, -0.0019121170043945312, -0.001766204833984375, -0.0016202926635742188, -0.0014743804931640625, -0.0013284683227539062, -0.00118255615234375, -0.0010366439819335938, -0.0008907318115234375, -0.0007448196411132812, -0.000598907470703125, -0.00045299530029296875, -0.0003070831298828125, -0.00016117095947265625, -1.52587890625e-05, 0.00013065338134765625, 0.0002765655517578125, 0.00042247772216796875, 0.000568389892578125, 0.0007143020629882812, 0.0008602142333984375, 0.0010061264038085938, 0.00115203857421875, 0.0012979507446289062, 0.0014438629150390625, 0.0015897750854492188, 0.001735687255859375, 0.0018815994262695312, 0.0020275115966796875, 0.0021734237670898438, 0.0023193359375, 0.0024652481079101562, 0.0026111602783203125, 0.0027570724487304688, 0.002902984619140625, 0.0030488967895507812, 0.0031948089599609375, 0.0033407211303710938, 0.00348663330078125, 0.0036325454711914062, 0.0037784576416015625, 0.003924369812011719, 0.004070281982421875, 0.004216194152832031, 0.0043621063232421875, 0.004508018493652344, 0.0046539306640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 0.0, 4.0, 0.0, 7.0, 6.0, 7.0, 5.0, 7.0, 10.0, 13.0, 13.0, 11.0, 8.0, 24.0, 34.0, 37.0, 23.0, 47.0, 63.0, 41.0, 48.0, 33.0, 54.0, 94.0, 49.0, 33.0, 43.0, 31.0, 57.0, 34.0, 26.0, 17.0, 22.0, 22.0, 13.0, 13.0, 8.0, 9.0, 4.0, 6.0, 8.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.410743713378906e-06, -4.279427230358124e-06, -4.148110747337341e-06, -4.016794264316559e-06, -3.885477781295776e-06, -3.754161298274994e-06, -3.6228448152542114e-06, -3.491528332233429e-06, -3.3602118492126465e-06, -3.228895366191864e-06, -3.0975788831710815e-06, -2.966262400150299e-06, -2.8349459171295166e-06, -2.703629434108734e-06, -2.5723129510879517e-06, -2.440996468067169e-06, -2.3096799850463867e-06, -2.1783635020256042e-06, -2.0470470190048218e-06, -1.9157305359840393e-06, -1.7844140529632568e-06, -1.6530975699424744e-06, -1.521781086921692e-06, -1.3904646039009094e-06, -1.259148120880127e-06, -1.1278316378593445e-06, -9.96515154838562e-07, -8.651986718177795e-07, -7.338821887969971e-07, -6.025657057762146e-07, -4.7124922275543213e-07, -3.3993273973464966e-07, -2.086162567138672e-07, -7.729977369308472e-08, 5.4016709327697754e-08, 1.8533319234848022e-07, 3.166496753692627e-07, 4.4796615839004517e-07, 5.792826414108276e-07, 7.105991244316101e-07, 8.419156074523926e-07, 9.73232090473175e-07, 1.1045485734939575e-06, 1.23586505651474e-06, 1.3671815395355225e-06, 1.498498022556305e-06, 1.6298145055770874e-06, 1.7611309885978699e-06, 1.8924474716186523e-06, 2.023763954639435e-06, 2.1550804376602173e-06, 2.2863969206809998e-06, 2.4177134037017822e-06, 2.5490298867225647e-06, 2.680346369743347e-06, 2.8116628527641296e-06, 2.942979335784912e-06, 3.0742958188056946e-06, 3.205612301826477e-06, 3.3369287848472595e-06, 3.468245267868042e-06, 3.5995617508888245e-06, 3.730878233909607e-06, 3.862194716930389e-06, 3.993511199951172e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 7.0, 5.0, 13.0, 28.0, 47.0, 77.0, 89.0, 229.0, 357.0, 766.0, 1780.0, 5255.0, 22479.0, 733054.0, 256106.0, 20073.0, 4969.0, 1694.0, 728.0, 338.0, 173.0, 93.0, 58.0, 43.0, 21.0, 17.0, 16.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014171600341796875, -0.0013682395219802856, -0.0013193190097808838, -0.001270398497581482, -0.00122147798538208, -0.0011725574731826782, -0.0011236369609832764, -0.0010747164487838745, -0.0010257959365844727, -0.0009768754243850708, -0.0009279549121856689, -0.0008790343999862671, -0.0008301138877868652, -0.0007811933755874634, -0.0007322728633880615, -0.0006833523511886597, -0.0006344318389892578, -0.000585511326789856, -0.0005365908145904541, -0.00048767030239105225, -0.0004387497901916504, -0.00038982927799224854, -0.0003409087657928467, -0.0002919882535934448, -0.00024306774139404297, -0.0001941472291946411, -0.00014522671699523926, -9.63062047958374e-05, -4.738569259643555e-05, 1.5348196029663086e-06, 5.0455331802368164e-05, 9.937584400177002e-05, 0.00014829635620117188, 0.00019721686840057373, 0.0002461373805999756, 0.00029505789279937744, 0.0003439784049987793, 0.00039289891719818115, 0.000441819429397583, 0.0004907399415969849, 0.0005396604537963867, 0.0005885809659957886, 0.0006375014781951904, 0.0006864219903945923, 0.0007353425025939941, 0.000784263014793396, 0.0008331835269927979, 0.0008821040391921997, 0.0009310245513916016, 0.0009799450635910034, 0.0010288655757904053, 0.0010777860879898071, 0.001126706600189209, 0.0011756271123886108, 0.0012245476245880127, 0.0012734681367874146, 0.0013223886489868164, 0.0013713091611862183, 0.0014202296733856201, 0.001469150185585022, 0.0015180706977844238, 0.0015669912099838257, 0.0016159117221832275, 0.0016648322343826294, 0.0017137527465820312]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 9.0, 21.0, 14.0, 19.0, 45.0, 50.0, 118.0, 151.0, 175.0, 130.0, 101.0, 54.0, 36.0, 21.0, 10.0, 10.0, 17.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002475738525390625, -0.002370178699493408, -0.0022646188735961914, -0.0021590590476989746, -0.002053499221801758, -0.001947939395904541, -0.0018423795700073242, -0.0017368197441101074, -0.0016312599182128906, -0.0015257000923156738, -0.001420140266418457, -0.0013145804405212402, -0.0012090206146240234, -0.0011034607887268066, -0.0009979009628295898, -0.000892341136932373, -0.0007867813110351562, -0.0006812214851379395, -0.0005756616592407227, -0.00047010183334350586, -0.00036454200744628906, -0.00025898218154907227, -0.00015342235565185547, -4.786252975463867e-05, 5.7697296142578125e-05, 0.00016325712203979492, 0.0002688169479370117, 0.0003743767738342285, 0.0004799365997314453, 0.0005854964256286621, 0.0006910562515258789, 0.0007966160774230957, 0.0009021759033203125, 0.0010077357292175293, 0.001113295555114746, 0.0012188553810119629, 0.0013244152069091797, 0.0014299750328063965, 0.0015355348587036133, 0.00164109468460083, 0.0017466545104980469, 0.0018522143363952637, 0.0019577741622924805, 0.0020633339881896973, 0.002168893814086914, 0.002274453639984131, 0.0023800134658813477, 0.0024855732917785645, 0.0025911331176757812, 0.002696692943572998, 0.002802252769470215, 0.0029078125953674316, 0.0030133724212646484, 0.0031189322471618652, 0.003224492073059082, 0.003330051898956299, 0.0034356117248535156, 0.0035411715507507324, 0.0036467313766479492, 0.003752291202545166, 0.003857851028442383, 0.0039634108543396, 0.004068970680236816, 0.004174530506134033, 0.00428009033203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 10.0, 20.0, 50.0, 130.0, 588.0, 127.0, 47.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.17189592123031616, -0.16756770014762878, -0.1632394641637802, -0.15891124308109283, -0.15458300709724426, -0.15025478601455688, -0.1459265649318695, -0.14159832894802094, -0.13727010786533356, -0.13294188678264618, -0.1286136507987976, -0.12428542971611023, -0.11995720118284225, -0.11562897264957428, -0.1113007515668869, -0.10697252303361893, -0.10264429450035095, -0.09831606596708298, -0.093987837433815, -0.08965961635112762, -0.08533138781785965, -0.08100315928459167, -0.0766749382019043, -0.07234670966863632, -0.06801848113536835, -0.06369025260210037, -0.059362027794122696, -0.05503380298614502, -0.050705574452877045, -0.04637734591960907, -0.04204912111163139, -0.03772089630365372, -0.033392660319805145, -0.02906443364918232, -0.024736206978559494, -0.02040798030793667, -0.016079753637313843, -0.011751526966691017, -0.0074233002960681915, -0.003095073625445366, 0.0012331530451774597, 0.005561379715800285, 0.009889606386423111, 0.014217833057045937, 0.018546059727668762, 0.022874286398291588, 0.027202513068914413, 0.03153073787689209, 0.035858966410160065, 0.04018719494342804, 0.044515419751405716, 0.04884364455938339, 0.05317187309265137, 0.05750010162591934, 0.06182832643389702, 0.0661565512418747, 0.07048477977514267, 0.07481300830841064, 0.07914122939109802, 0.083469457924366, 0.08779768645763397, 0.09212591499090195, 0.09645414352416992, 0.1007823646068573, 0.10511059314012527]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 4.0, 6.0, 12.0, 17.0, 24.0, 26.0, 27.0, 26.0, 29.0, 44.0, 123.0, 300.0, 112.0, 38.0, 32.0, 25.0, 23.0, 22.0, 23.0, 14.0, 12.0, 9.0, 10.0, 4.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07029181718826294, -0.06805931776762009, -0.06582681089639664, -0.06359431147575378, -0.06136180832982063, -0.05912930518388748, -0.05689680576324463, -0.05466430261731148, -0.052431799471378326, -0.050199296325445175, -0.047966793179512024, -0.04573429375886917, -0.04350179061293602, -0.04126928746700287, -0.039036788046360016, -0.036804284900426865, -0.03457178175449371, -0.03233927860856056, -0.03010677732527256, -0.027874276041984558, -0.025641772896051407, -0.023409269750118256, -0.021176768466830254, -0.01894426718354225, -0.0167117640376091, -0.014479261822998524, -0.012246759608387947, -0.01001425739377737, -0.007781755179166794, -0.005549252964556217, -0.0033167507499456406, -0.0010842494666576385, 0.0011482536792755127, 0.0033807558938860893, 0.005613258108496666, 0.007845760323107243, 0.01007826253771782, 0.012310764752328396, 0.014543266966938972, 0.016775768250226974, 0.019008271396160126, 0.021240774542093277, 0.02347327582538128, 0.02570577710866928, 0.027938280254602432, 0.030170783400535583, 0.032403282821178436, 0.03463578596711159, 0.03686828911304474, 0.03910079225897789, 0.04133329540491104, 0.043565794825553894, 0.045798297971487045, 0.0480308011174202, 0.05026330053806305, 0.0524958036839962, 0.05472830682992935, 0.0569608099758625, 0.059193313121795654, 0.06142581254243851, 0.06365831196308136, 0.06589081883430481, 0.06812331825494766, 0.07035581767559052, 0.07258832454681396]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 2.0, 6.0, 11.0, 20.0, 11.0, 16.0, 16.0, 23.0, 24.0, 44.0, 56.0, 117.0, 280.0, 92.0, 41.0, 47.0, 31.0, 29.0, 29.0, 16.0, 14.0, 7.0, 7.0, 9.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00418853759765625, -0.004035472869873047, -0.0038824081420898438, -0.0037293434143066406, -0.0035762786865234375, -0.0034232139587402344, -0.0032701492309570312, -0.003117084503173828, -0.002964019775390625, -0.002810955047607422, -0.0026578903198242188, -0.0025048255920410156, -0.0023517608642578125, -0.0021986961364746094, -0.0020456314086914062, -0.0018925666809082031, -0.001739501953125, -0.0015864372253417969, -0.0014333724975585938, -0.0012803077697753906, -0.0011272430419921875, -0.0009741783142089844, -0.0008211135864257812, -0.0006680488586425781, -0.000514984130859375, -0.0003619194030761719, -0.00020885467529296875, -5.5789947509765625e-05, 9.72747802734375e-05, 0.0002503395080566406, 0.00040340423583984375, 0.0005564689636230469, 0.00070953369140625, 0.0008625984191894531, 0.0010156631469726562, 0.0011687278747558594, 0.0013217926025390625, 0.0014748573303222656, 0.0016279220581054688, 0.0017809867858886719, 0.001934051513671875, 0.002087116241455078, 0.0022401809692382812, 0.0023932456970214844, 0.0025463104248046875, 0.0026993751525878906, 0.0028524398803710938, 0.003005504608154297, 0.0031585693359375, 0.003311634063720703, 0.0034646987915039062, 0.0036177635192871094, 0.0037708282470703125, 0.003923892974853516, 0.004076957702636719, 0.004230022430419922, 0.004383087158203125, 0.004536151885986328, 0.004689216613769531, 0.004842281341552734, 0.0049953460693359375, 0.005148410797119141, 0.005301475524902344, 0.005454540252685547, 0.00560760498046875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 20.0, 11.0, 5.0, 15.0, 36.0, 31.0, 44.0, 100.0, 252.0, 844.0, 7848.0, 8369648.0, 8293.0, 921.0, 238.0, 92.0, 76.0, 31.0, 13.0, 13.0, 14.0, 2.0, 6.0, 2.0, 3.0, 2.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.05763475224375725, -0.05601182579994202, -0.05438889563083649, -0.052765969187021255, -0.051143042743206024, -0.049520112574100494, -0.04789718613028526, -0.04627425968647003, -0.0446513332426548, -0.04302840679883957, -0.04140547662973404, -0.03978255018591881, -0.03815962374210358, -0.03653669357299805, -0.034913767129182816, -0.033290840685367584, -0.031667910516262054, -0.030044982209801674, -0.028422055765986443, -0.026799127459526062, -0.02517620101571083, -0.02355327270925045, -0.02193034440279007, -0.020307417958974838, -0.018684491515159607, -0.017061563208699226, -0.015438636764883995, -0.013815708458423615, -0.012192782014608383, -0.010569853708148003, -0.008946926333010197, -0.007323998957872391, -0.005701072514057159, -0.0040781451389193535, -0.002455217530950904, -0.0008322899229824543, 0.0007906374521553516, 0.002413565292954445, 0.004036492668092251, 0.005659420043230057, 0.007282347418367863, 0.008905274793505669, 0.010528202168643475, 0.01215112954378128, 0.013774057850241661, 0.015396985225379467, 0.017019912600517273, 0.018642839044332504, 0.020265767350792885, 0.021888695657253265, 0.023511622101068497, 0.025134550407528877, 0.02675747685134411, 0.02838040515780449, 0.03000333160161972, 0.03162626177072525, 0.03324918821454048, 0.03487211465835571, 0.03649504482746124, 0.038117971271276474, 0.039740897715091705, 0.041363827884197235, 0.042986754328012466, 0.0446096807718277, 0.04623260721564293]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 2.0, 2.0, 4.0, 2.0, 9.0, 4.0, 7.0, 5.0, 8.0, 1.0, 5.0, 2.0, 4.0, 8.0, 2.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023277707397937775, -0.022740105167031288, -0.0222025029361248, -0.021664900705218315, -0.02112729847431183, -0.020589694380760193, -0.020052092149853706, -0.01951448991894722, -0.018976887688040733, -0.018439285457134247, -0.01790168322622776, -0.017364080995321274, -0.016826476901769638, -0.01628887467086315, -0.015751272439956665, -0.015213670209050179, -0.014676067978143692, -0.014138465747237206, -0.013600863516330719, -0.013063260354101658, -0.012525658123195171, -0.011988055892288685, -0.011450452730059624, -0.010912850499153137, -0.01037524826824665, -0.009837646037340164, -0.009300043806433678, -0.008762440644204617, -0.00822483841329813, -0.0076872361823916435, -0.00714963348582387, -0.006612030789256096, -0.00607442669570446, -0.005536824464797974, -0.0049992217682302, -0.004461619071662426, -0.0039240168407559395, -0.0033864143770188093, -0.002848811913281679, -0.002311209449544549, -0.0017736069858074188, -0.0012360045220702887, -0.0006984020583331585, -0.00016079959459602833, 0.00037680286914110184, 0.000914405332878232, 0.0014520077966153622, 0.0019896102603524923, 0.0025272127240896225, 0.0030648151878267527, 0.003602417651563883, 0.004140020348131657, 0.004677622579038143, 0.00521522480994463, 0.0057528275065124035, 0.006290430203080177, 0.006828032433986664, 0.00736563466489315, 0.007903236895799637, 0.008440840058028698, 0.008978442288935184, 0.009516044519841671, 0.010053647682070732, 0.010591249912977219, 0.011128852143883705]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 2.0, 5.0, 9.0, 6.0, 21.0, 14.0, 36.0, 52.0, 96.0, 170.0, 224.0, 389.0, 819.0, 1722.0, 4031.0, 10191.0, 30030.0, 100196.0, 221675.0, 105560.0, 31341.0, 10403.0, 3885.0, 1545.0, 754.0, 375.0, 204.0, 162.0, 90.0, 60.0, 46.0, 38.0, 22.0, 17.0, 17.0, 14.0, 6.0, 9.0, 6.0, 4.0, 2.0, 7.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0206298828125, -0.01995372772216797, -0.019277572631835938, -0.018601417541503906, -0.017925262451171875, -0.017249107360839844, -0.016572952270507812, -0.01589679718017578, -0.01522064208984375, -0.014544486999511719, -0.013868331909179688, -0.013192176818847656, -0.012516021728515625, -0.011839866638183594, -0.011163711547851562, -0.010487556457519531, -0.0098114013671875, -0.009135246276855469, -0.008459091186523438, -0.007782936096191406, -0.007106781005859375, -0.006430625915527344, -0.0057544708251953125, -0.005078315734863281, -0.00440216064453125, -0.0037260055541992188, -0.0030498504638671875, -0.0023736953735351562, -0.001697540283203125, -0.0010213851928710938, -0.0003452301025390625, 0.00033092498779296875, 0.001007080078125, 0.0016832351684570312, 0.0023593902587890625, 0.0030355453491210938, 0.003711700439453125, 0.004387855529785156, 0.0050640106201171875, 0.005740165710449219, 0.00641632080078125, 0.007092475891113281, 0.0077686309814453125, 0.008444786071777344, 0.009120941162109375, 0.009797096252441406, 0.010473251342773438, 0.011149406433105469, 0.0118255615234375, 0.012501716613769531, 0.013177871704101562, 0.013854026794433594, 0.014530181884765625, 0.015206336975097656, 0.015882492065429688, 0.01655864715576172, 0.01723480224609375, 0.01791095733642578, 0.018587112426757812, 0.019263267517089844, 0.019939422607421875, 0.020615577697753906, 0.021291732788085938, 0.02196788787841797, 0.02264404296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 7.0, 7.0, 10.0, 38.0, 50.0, 87.0, 101.0, 161.0, 162.0, 159.0, 83.0, 61.0, 33.0, 23.0, 13.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006114959716796875, -0.005738317966461182, -0.005361676216125488, -0.004985034465789795, -0.0046083927154541016, -0.004231750965118408, -0.003855109214782715, -0.0034784674644470215, -0.003101825714111328, -0.0027251839637756348, -0.0023485422134399414, -0.001971900463104248, -0.0015952587127685547, -0.0012186169624328613, -0.000841975212097168, -0.0004653334617614746, -8.869171142578125e-05, 0.0002879500389099121, 0.0006645917892456055, 0.0010412335395812988, 0.0014178752899169922, 0.0017945170402526855, 0.002171158790588379, 0.0025478005409240723, 0.0029244422912597656, 0.003301084041595459, 0.0036777257919311523, 0.004054367542266846, 0.004431009292602539, 0.004807651042938232, 0.005184292793273926, 0.005560934543609619, 0.0059375762939453125, 0.006314218044281006, 0.006690859794616699, 0.007067501544952393, 0.007444143295288086, 0.00782078504562378, 0.008197426795959473, 0.008574068546295166, 0.00895071029663086, 0.009327352046966553, 0.009703993797302246, 0.01008063554763794, 0.010457277297973633, 0.010833919048309326, 0.01121056079864502, 0.011587202548980713, 0.011963844299316406, 0.0123404860496521, 0.012717127799987793, 0.013093769550323486, 0.01347041130065918, 0.013847053050994873, 0.014223694801330566, 0.01460033655166626, 0.014976978302001953, 0.015353620052337646, 0.01573026180267334, 0.016106903553009033, 0.016483545303344727, 0.01686018705368042, 0.017236828804016113, 0.017613470554351807, 0.0179901123046875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 9.0, 6.0, 3.0, 15.0, 29.0, 126.0, 151.0, 75.0, 28.0, 9.0, 8.0, 8.0, 3.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03378673642873764, -0.03251172974705696, -0.031236721202731133, -0.029961712658405304, -0.028686705976724625, -0.027411699295043945, -0.026136690750718117, -0.024861682206392288, -0.02358667552471161, -0.02231166884303093, -0.0210366602987051, -0.019761651754379272, -0.018486645072698593, -0.017211638391017914, -0.015936629846692085, -0.014661622233688831, -0.013386614620685577, -0.012111607007682323, -0.01083659939467907, -0.009561591781675816, -0.008286584168672562, -0.007011576555669308, -0.005736568942666054, -0.0044615613296628, -0.003186553716659546, -0.001911546103656292, -0.000636538490653038, 0.0006384691223502159, 0.0019134767353534698, 0.003188484348356724, 0.004463491961359978, 0.005738499574363232, 0.007013507187366486, 0.00828851480036974, 0.009563522413372993, 0.010838530026376247, 0.012113537639379501, 0.013388545252382755, 0.01466355286538601, 0.015938561409711838, 0.017213568091392517, 0.018488574773073196, 0.019763583317399025, 0.021038591861724854, 0.022313598543405533, 0.023588605225086212, 0.02486361376941204, 0.02613862231373787, 0.02741362899541855, 0.028688635677099228, 0.029963644221425056, 0.031238652765750885, 0.032513659447431564, 0.033788666129112244, 0.03506367653608322, 0.0363386832177639, 0.03761368989944458, 0.03888869658112526, 0.04016370326280594, 0.041438713669776917, 0.042713720351457596, 0.043988727033138275, 0.04526373744010925, 0.04653874412178993, 0.04781375080347061]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 6.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 8.0, 12.0, 45.0, 106.0, 98.0, 80.0, 35.0, 14.0, 10.0, 4.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.031161367893218994, -0.030129114165902138, -0.02909686043858528, -0.028064606711268425, -0.02703235298395157, -0.026000099256634712, -0.024967845529317856, -0.023935591802001, -0.022903338074684143, -0.021871084347367287, -0.02083883062005043, -0.019806576892733574, -0.018774323165416718, -0.01774206943809986, -0.016709815710783005, -0.01567756198346615, -0.014645308256149292, -0.013613054528832436, -0.01258080080151558, -0.011548547074198723, -0.010516293346881866, -0.00948403961956501, -0.008451785892248154, -0.007419532164931297, -0.006387278437614441, -0.0053550247102975845, -0.004322770982980728, -0.0032905172556638718, -0.0022582635283470154, -0.001226009801030159, -0.0001937560737133026, 0.0008384976536035538, 0.0018707513809204102, 0.0029030051082372665, 0.003935258835554123, 0.004967512562870979, 0.005999766290187836, 0.007032020017504692, 0.008064273744821548, 0.009096527472138405, 0.010128781199455261, 0.011161034926772118, 0.012193288654088974, 0.01322554238140583, 0.014257796108722687, 0.015290049836039543, 0.0163223035633564, 0.017354557290673256, 0.018386811017990112, 0.01941906474530697, 0.020451318472623825, 0.02148357219994068, 0.022515825927257538, 0.023548079654574394, 0.02458033338189125, 0.025612587109208107, 0.026644840836524963, 0.02767709456384182, 0.028709348291158676, 0.029741602018475533, 0.03077385574579239, 0.031806111335754395, 0.0328383632004261, 0.03387061506509781, 0.034902870655059814]}, "eval/loss": 4.670431137084961, "eval/wer": 1.9589646965489884, "eval/runtime": 781.1725, "eval/samples_per_second": 3.382, "eval/steps_per_second": 0.283, "train/train_runtime": 6725.1387, "train/train_samples_per_second": 4.243, "train/train_steps_per_second": 0.177, "train/total_flos": 0.0, "train/train_loss": 4.647471772210753} \ No newline at end of file