diff --git "a/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" "b/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.1576, "train/learning_rate": 9.920000000000002e-06, "train/epoch": 0.28, "train/global_step": 500, "_runtime": 2485, "_timestamp": 1646043510, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 18.0, 102.0, 313.0, 369.0, 178.0, 29.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.22979736328125, -217.4264678955078, -212.62313842773438, -207.81982421875, -203.01649475097656, -198.21316528320312, -193.40985107421875, -188.6065216064453, -183.80319213867188, -178.99986267089844, -174.196533203125, -169.39321899414062, -164.5898895263672, -159.78656005859375, -154.98324584960938, -150.17991638183594, -145.3765869140625, -140.57325744628906, -135.76992797851562, -130.96661376953125, -126.16328430175781, -121.35995483398438, -116.55663299560547, -111.75331115722656, -106.94998168945312, -102.14665222167969, -97.34333038330078, -92.54000854492188, -87.73667907714844, -82.933349609375, -78.1300277709961, -73.32670593261719, -68.52339172363281, -63.72006607055664, -58.91674041748047, -54.1134147644043, -49.310089111328125, -44.50676345825195, -39.70343780517578, -34.90011215209961, -30.096786499023438, -25.293460845947266, -20.490135192871094, -15.686809539794922, -10.88348388671875, -6.080158233642578, -1.2768325805664062, 3.5264930725097656, 8.329818725585938, 13.13314437866211, 17.93647003173828, 22.739795684814453, 27.543121337890625, 32.3464469909668, 37.14977264404297, 41.95309829711914, 46.75642395019531, 51.559749603271484, 56.363075256347656, 61.16640090942383, 65.9697265625, 70.77305603027344, 75.57637786865234, 80.37969970703125, 85.18302917480469]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 3.0, 4.0, 8.0, 8.0, 12.0, 23.0, 19.0, 19.0, 18.0, 24.0, 23.0, 27.0, 36.0, 35.0, 54.0, 60.0, 60.0, 46.0, 55.0, 43.0, 44.0, 46.0, 56.0, 38.0, 31.0, 40.0, 30.0, 27.0, 18.0, 17.0, 16.0, 12.0, 10.0, 5.0, 7.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-80.72836303710938, -78.43955993652344, -76.1507568359375, -73.86195373535156, -71.57315063476562, -69.28434753417969, -66.99554443359375, -64.70674896240234, -62.417945861816406, -60.12914276123047, -57.84033966064453, -55.551536560058594, -53.26273727416992, -50.973934173583984, -48.68513107299805, -46.396331787109375, -44.10752487182617, -41.818721771240234, -39.5299186706543, -37.241119384765625, -34.95231628417969, -32.66351318359375, -30.374710083007812, -28.085908889770508, -25.79710578918457, -23.508302688598633, -21.219501495361328, -18.93069839477539, -16.641895294189453, -14.353094100952148, -12.064291000366211, -9.775489807128906, -7.486686706542969, -5.197884559631348, -2.9090819358825684, -0.6202793121337891, 1.668522834777832, 3.957324981689453, 6.246128082275391, 8.534929275512695, 10.823732376098633, 13.112534523010254, 15.401336669921875, 17.690139770507812, 19.97894287109375, 22.267744064331055, 24.556547164916992, 26.845348358154297, 29.134151458740234, 31.422954559326172, 33.71175765991211, 36.00055694580078, 38.28936004638672, 40.578163146972656, 42.866966247558594, 45.15576934814453, 47.44457244873047, 49.733375549316406, 52.022178649902344, 54.31098175048828, 56.59978103637695, 58.88858413696289, 61.17738723754883, 63.4661865234375, 65.75498962402344]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 9.0, 9.0, 14.0, 8.0, 11.0, 23.0, 20.0, 22.0, 32.0, 35.0, 44.0, 50.0, 54.0, 43.0, 55.0, 55.0, 53.0, 58.0, 48.0, 50.0, 60.0, 31.0, 39.0, 32.0, 33.0, 26.0, 21.0, 8.0, 13.0, 13.0, 8.0, 11.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.52734375, -7.34014892578125, -7.1529541015625, -6.96575927734375, -6.778564453125, -6.59136962890625, -6.4041748046875, -6.21697998046875, -6.02978515625, -5.84259033203125, -5.6553955078125, -5.46820068359375, -5.281005859375, -5.09381103515625, -4.9066162109375, -4.71942138671875, -4.5322265625, -4.34503173828125, -4.1578369140625, -3.97064208984375, -3.783447265625, -3.59625244140625, -3.4090576171875, -3.22186279296875, -3.03466796875, -2.84747314453125, -2.6602783203125, -2.47308349609375, -2.285888671875, -2.09869384765625, -1.9114990234375, -1.72430419921875, -1.537109375, -1.34991455078125, -1.1627197265625, -0.97552490234375, -0.788330078125, -0.60113525390625, -0.4139404296875, -0.22674560546875, -0.03955078125, 0.14764404296875, 0.3348388671875, 0.52203369140625, 0.709228515625, 0.89642333984375, 1.0836181640625, 1.27081298828125, 1.4580078125, 1.64520263671875, 1.8323974609375, 2.01959228515625, 2.206787109375, 2.39398193359375, 2.5811767578125, 2.76837158203125, 2.95556640625, 3.14276123046875, 3.3299560546875, 3.51715087890625, 3.704345703125, 3.89154052734375, 4.0787353515625, 4.26593017578125, 4.453125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 13.0, 11.0, 23.0, 27.0, 45.0, 59.0, 80.0, 95.0, 176.0, 236.0, 327.0, 531.0, 895.0, 1533.0, 3080.0, 6968.0, 22679.0, 120736.0, 1334738.0, 2360999.0, 281759.0, 39591.0, 10454.0, 4146.0, 2008.0, 1135.0, 633.0, 402.0, 276.0, 202.0, 137.0, 87.0, 70.0, 47.0, 27.0, 25.0, 12.0, 7.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.515625, -17.056884765625, -16.59814453125, -16.139404296875, -15.6806640625, -15.221923828125, -14.76318359375, -14.304443359375, -13.845703125, -13.386962890625, -12.92822265625, -12.469482421875, -12.0107421875, -11.552001953125, -11.09326171875, -10.634521484375, -10.17578125, -9.717041015625, -9.25830078125, -8.799560546875, -8.3408203125, -7.882080078125, -7.42333984375, -6.964599609375, -6.505859375, -6.047119140625, -5.58837890625, -5.129638671875, -4.6708984375, -4.212158203125, -3.75341796875, -3.294677734375, -2.8359375, -2.377197265625, -1.91845703125, -1.459716796875, -1.0009765625, -0.542236328125, -0.08349609375, 0.375244140625, 0.833984375, 1.292724609375, 1.75146484375, 2.210205078125, 2.6689453125, 3.127685546875, 3.58642578125, 4.045166015625, 4.50390625, 4.962646484375, 5.42138671875, 5.880126953125, 6.3388671875, 6.797607421875, 7.25634765625, 7.715087890625, 8.173828125, 8.632568359375, 9.09130859375, 9.550048828125, 10.0087890625, 10.467529296875, 10.92626953125, 11.385009765625, 11.84375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 6.0, 8.0, 7.0, 11.0, 26.0, 38.0, 48.0, 61.0, 90.0, 134.0, 212.0, 296.0, 451.0, 587.0, 583.0, 466.0, 320.0, 218.0, 152.0, 117.0, 67.0, 36.0, 42.0, 27.0, 24.0, 17.0, 6.0, 5.0, 6.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.40380859375, -16.7607421875, -16.11767578125, -15.474609375, -14.83154296875, -14.1884765625, -13.54541015625, -12.90234375, -12.25927734375, -11.6162109375, -10.97314453125, -10.330078125, -9.68701171875, -9.0439453125, -8.40087890625, -7.7578125, -7.11474609375, -6.4716796875, -5.82861328125, -5.185546875, -4.54248046875, -3.8994140625, -3.25634765625, -2.61328125, -1.97021484375, -1.3271484375, -0.68408203125, -0.041015625, 0.60205078125, 1.2451171875, 1.88818359375, 2.53125, 3.17431640625, 3.8173828125, 4.46044921875, 5.103515625, 5.74658203125, 6.3896484375, 7.03271484375, 7.67578125, 8.31884765625, 8.9619140625, 9.60498046875, 10.248046875, 10.89111328125, 11.5341796875, 12.17724609375, 12.8203125, 13.46337890625, 14.1064453125, 14.74951171875, 15.392578125, 16.03564453125, 16.6787109375, 17.32177734375, 17.96484375, 18.60791015625, 19.2509765625, 19.89404296875, 20.537109375, 21.18017578125, 21.8232421875, 22.46630859375, 23.109375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 7.0, 6.0, 14.0, 11.0, 18.0, 26.0, 32.0, 58.0, 98.0, 150.0, 183.0, 309.0, 507.0, 944.0, 2312.0, 19425.0, 3502329.0, 657279.0, 6949.0, 1599.0, 777.0, 440.0, 255.0, 178.0, 121.0, 78.0, 56.0, 32.0, 20.0, 15.0, 14.0, 11.0, 8.0, 3.0, 2.0, 1.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.21875, -58.13037109375, -56.0419921875, -53.95361328125, -51.865234375, -49.77685546875, -47.6884765625, -45.60009765625, -43.51171875, -41.42333984375, -39.3349609375, -37.24658203125, -35.158203125, -33.06982421875, -30.9814453125, -28.89306640625, -26.8046875, -24.71630859375, -22.6279296875, -20.53955078125, -18.451171875, -16.36279296875, -14.2744140625, -12.18603515625, -10.09765625, -8.00927734375, -5.9208984375, -3.83251953125, -1.744140625, 0.34423828125, 2.4326171875, 4.52099609375, 6.609375, 8.69775390625, 10.7861328125, 12.87451171875, 14.962890625, 17.05126953125, 19.1396484375, 21.22802734375, 23.31640625, 25.40478515625, 27.4931640625, 29.58154296875, 31.669921875, 33.75830078125, 35.8466796875, 37.93505859375, 40.0234375, 42.11181640625, 44.2001953125, 46.28857421875, 48.376953125, 50.46533203125, 52.5537109375, 54.64208984375, 56.73046875, 58.81884765625, 60.9072265625, 62.99560546875, 65.083984375, 67.17236328125, 69.2607421875, 71.34912109375, 73.4375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 167.0, 535.0, 268.0, 29.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-366.3058166503906, -359.3312683105469, -352.35675048828125, -345.3822021484375, -338.4076843261719, -331.4331359863281, -324.4586181640625, -317.48406982421875, -310.509521484375, -303.53497314453125, -296.5604553222656, -289.5859069824219, -282.61138916015625, -275.6368408203125, -268.6623229980469, -261.6877746582031, -254.7132568359375, -247.7387237548828, -240.76419067382812, -233.78965759277344, -226.81512451171875, -219.840576171875, -212.8660430908203, -205.89151000976562, -198.91697692871094, -191.94244384765625, -184.96791076660156, -177.99337768554688, -171.01882934570312, -164.0443115234375, -157.06976318359375, -150.09523010253906, -143.12071228027344, -136.14617919921875, -129.17164611816406, -122.19710540771484, -115.22257232666016, -108.24803924560547, -101.27349853515625, -94.29896545410156, -87.32443237304688, -80.34989929199219, -73.3753662109375, -66.40082550048828, -59.426292419433594, -52.451759338378906, -45.47722244262695, -38.502685546875, -31.528152465820312, -24.553617477416992, -17.579082489013672, -10.604547500610352, -3.6300125122070312, 3.3445205688476562, 10.31905746459961, 17.293594360351562, 24.26812744140625, 31.24266242980957, 38.21719741821289, 45.191734313964844, 52.16626739501953, 59.14080047607422, 66.11534118652344, 73.08987426757812, 80.06440734863281]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 8.0, 8.0, 14.0, 9.0, 11.0, 19.0, 14.0, 24.0, 20.0, 26.0, 17.0, 34.0, 30.0, 26.0, 30.0, 44.0, 46.0, 29.0, 32.0, 36.0, 34.0, 43.0, 45.0, 41.0, 43.0, 31.0, 25.0, 34.0, 23.0, 22.0, 18.0, 26.0, 14.0, 11.0, 17.0, 9.0, 15.0, 10.0, 15.0, 11.0, 10.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-55.38246154785156, -53.66963195800781, -51.95680236816406, -50.24397277832031, -48.53114318847656, -46.81831359863281, -45.10548400878906, -43.39265441894531, -41.67982482910156, -39.96699523925781, -38.25416564941406, -36.54133605957031, -34.82850646972656, -33.11567687988281, -31.402847290039062, -29.690017700195312, -27.977190017700195, -26.264360427856445, -24.551530838012695, -22.838701248168945, -21.125871658325195, -19.413043975830078, -17.700214385986328, -15.987383842468262, -14.274554252624512, -12.561724662780762, -10.848895072937012, -9.136066436767578, -7.42323637008667, -5.710407257080078, -3.997577667236328, -2.284748077392578, -0.5719184875488281, 1.1409109830856323, 2.8537404537200928, 4.566569805145264, 6.279399394989014, 7.9922285079956055, 9.705058097839355, 11.417887687683105, 13.130717277526855, 14.843546867370605, 16.55637550354004, 18.26920509338379, 19.98203468322754, 21.69486427307129, 23.40769386291504, 25.12052345275879, 26.83335304260254, 28.54618263244629, 30.25901222229004, 31.97184181213379, 33.684669494628906, 35.397499084472656, 37.110328674316406, 38.823158264160156, 40.535987854003906, 42.248817443847656, 43.961647033691406, 45.674476623535156, 47.387306213378906, 49.100135803222656, 50.812965393066406, 52.525794982910156, 54.238624572753906]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 8.0, 12.0, 15.0, 16.0, 12.0, 27.0, 24.0, 18.0, 23.0, 30.0, 31.0, 35.0, 33.0, 35.0, 46.0, 45.0, 36.0, 52.0, 48.0, 47.0, 36.0, 38.0, 35.0, 34.0, 36.0, 32.0, 25.0, 14.0, 23.0, 18.0, 14.0, 16.0, 8.0, 10.0, 13.0, 8.0, 6.0, 4.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.279296875, -5.12109375, -4.962890625, -4.8046875, -4.646484375, -4.48828125, -4.330078125, -4.171875, -4.013671875, -3.85546875, -3.697265625, -3.5390625, -3.380859375, -3.22265625, -3.064453125, -2.90625, -2.748046875, -2.58984375, -2.431640625, -2.2734375, -2.115234375, -1.95703125, -1.798828125, -1.640625, -1.482421875, -1.32421875, -1.166015625, -1.0078125, -0.849609375, -0.69140625, -0.533203125, -0.375, -0.216796875, -0.05859375, 0.099609375, 0.2578125, 0.416015625, 0.57421875, 0.732421875, 0.890625, 1.048828125, 1.20703125, 1.365234375, 1.5234375, 1.681640625, 1.83984375, 1.998046875, 2.15625, 2.314453125, 2.47265625, 2.630859375, 2.7890625, 2.947265625, 3.10546875, 3.263671875, 3.421875, 3.580078125, 3.73828125, 3.896484375, 4.0546875, 4.212890625, 4.37109375, 4.529296875, 4.6875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 3.0, 7.0, 30.0, 23.0, 38.0, 66.0, 79.0, 104.0, 169.0, 231.0, 338.0, 410.0, 632.0, 926.0, 1388.0, 1897.0, 2799.0, 4195.0, 6050.0, 8770.0, 12920.0, 19285.0, 29282.0, 45705.0, 74063.0, 136286.0, 311310.0, 161126.0, 82595.0, 50422.0, 31849.0, 21081.0, 14111.0, 9432.0, 6518.0, 4464.0, 2951.0, 2163.0, 1474.0, 1040.0, 735.0, 527.0, 319.0, 238.0, 156.0, 93.0, 81.0, 39.0, 37.0, 26.0, 18.0, 18.0, 16.0, 2.0, 5.0, 9.0, 6.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.90771484375, -0.8770523071289062, -0.8463897705078125, -0.8157272338867188, -0.785064697265625, -0.7544021606445312, -0.7237396240234375, -0.6930770874023438, -0.66241455078125, -0.6317520141601562, -0.6010894775390625, -0.5704269409179688, -0.539764404296875, -0.5091018676757812, -0.4784393310546875, -0.44777679443359375, -0.4171142578125, -0.38645172119140625, -0.3557891845703125, -0.32512664794921875, -0.294464111328125, -0.26380157470703125, -0.2331390380859375, -0.20247650146484375, -0.17181396484375, -0.14115142822265625, -0.1104888916015625, -0.07982635498046875, -0.049163818359375, -0.01850128173828125, 0.0121612548828125, 0.04282379150390625, 0.073486328125, 0.10414886474609375, 0.1348114013671875, 0.16547393798828125, 0.196136474609375, 0.22679901123046875, 0.2574615478515625, 0.28812408447265625, 0.31878662109375, 0.34944915771484375, 0.3801116943359375, 0.41077423095703125, 0.441436767578125, 0.47209930419921875, 0.5027618408203125, 0.5334243774414062, 0.5640869140625, 0.5947494506835938, 0.6254119873046875, 0.6560745239257812, 0.686737060546875, 0.7173995971679688, 0.7480621337890625, 0.7787246704101562, 0.80938720703125, 0.8400497436523438, 0.8707122802734375, 0.9013748168945312, 0.932037353515625, 0.9626998901367188, 0.9933624267578125, 1.0240249633789062, 1.0546875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 10.0, 6.0, 12.0, 13.0, 17.0, 13.0, 13.0, 18.0, 20.0, 23.0, 32.0, 18.0, 33.0, 28.0, 34.0, 37.0, 47.0, 38.0, 29.0, 39.0, 1063.0, 54.0, 35.0, 36.0, 40.0, 35.0, 32.0, 28.0, 26.0, 30.0, 25.0, 21.0, 17.0, 12.0, 18.0, 15.0, 13.0, 8.0, 14.0, 3.0, 6.0, 8.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.125, -3.02783203125, -2.9306640625, -2.83349609375, -2.736328125, -2.63916015625, -2.5419921875, -2.44482421875, -2.34765625, -2.25048828125, -2.1533203125, -2.05615234375, -1.958984375, -1.86181640625, -1.7646484375, -1.66748046875, -1.5703125, -1.47314453125, -1.3759765625, -1.27880859375, -1.181640625, -1.08447265625, -0.9873046875, -0.89013671875, -0.79296875, -0.69580078125, -0.5986328125, -0.50146484375, -0.404296875, -0.30712890625, -0.2099609375, -0.11279296875, -0.015625, 0.08154296875, 0.1787109375, 0.27587890625, 0.373046875, 0.47021484375, 0.5673828125, 0.66455078125, 0.76171875, 0.85888671875, 0.9560546875, 1.05322265625, 1.150390625, 1.24755859375, 1.3447265625, 1.44189453125, 1.5390625, 1.63623046875, 1.7333984375, 1.83056640625, 1.927734375, 2.02490234375, 2.1220703125, 2.21923828125, 2.31640625, 2.41357421875, 2.5107421875, 2.60791015625, 2.705078125, 2.80224609375, 2.8994140625, 2.99658203125, 3.09375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 6.0, 8.0, 7.0, 27.0, 31.0, 49.0, 99.0, 149.0, 208.0, 322.0, 545.0, 799.0, 1351.0, 2139.0, 3359.0, 5165.0, 8142.0, 12682.0, 20179.0, 32477.0, 54380.0, 97986.0, 232592.0, 1354517.0, 112790.0, 60717.0, 36023.0, 22241.0, 13940.0, 8790.0, 5570.0, 3596.0, 2323.0, 1449.0, 911.0, 580.0, 348.0, 244.0, 140.0, 86.0, 60.0, 44.0, 26.0, 12.0, 13.0, 7.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0577850341796875, -1.023773193359375, -0.9897613525390625, -0.95574951171875, -0.9217376708984375, -0.887725830078125, -0.8537139892578125, -0.8197021484375, -0.7856903076171875, -0.751678466796875, -0.7176666259765625, -0.68365478515625, -0.6496429443359375, -0.615631103515625, -0.5816192626953125, -0.547607421875, -0.5135955810546875, -0.479583740234375, -0.4455718994140625, -0.41156005859375, -0.3775482177734375, -0.343536376953125, -0.3095245361328125, -0.2755126953125, -0.2415008544921875, -0.207489013671875, -0.1734771728515625, -0.13946533203125, -0.1054534912109375, -0.071441650390625, -0.0374298095703125, -0.00341796875, 0.0305938720703125, 0.064605712890625, 0.0986175537109375, 0.13262939453125, 0.1666412353515625, 0.200653076171875, 0.2346649169921875, 0.2686767578125, 0.3026885986328125, 0.336700439453125, 0.3707122802734375, 0.40472412109375, 0.4387359619140625, 0.472747802734375, 0.5067596435546875, 0.540771484375, 0.5747833251953125, 0.608795166015625, 0.6428070068359375, 0.67681884765625, 0.7108306884765625, 0.744842529296875, 0.7788543701171875, 0.8128662109375, 0.8468780517578125, 0.880889892578125, 0.9149017333984375, 0.94891357421875, 0.9829254150390625, 1.016937255859375, 1.0509490966796875, 1.0849609375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 7.0, 10.0, 7.0, 3.0, 7.0, 9.0, 7.0, 11.0, 16.0, 15.0, 27.0, 27.0, 39.0, 36.0, 47.0, 50.0, 56.0, 64.0, 66.0, 96.0, 57.0, 46.0, 44.0, 39.0, 43.0, 38.0, 22.0, 20.0, 15.0, 5.0, 23.0, 9.0, 12.0, 7.0, 4.0, 4.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005035400390625, -0.0004878491163253784, -0.00047215819358825684, -0.00045646727085113525, -0.00044077634811401367, -0.0004250854253768921, -0.0004093945026397705, -0.0003937035799026489, -0.00037801265716552734, -0.00036232173442840576, -0.0003466308116912842, -0.0003309398889541626, -0.000315248966217041, -0.00029955804347991943, -0.00028386712074279785, -0.00026817619800567627, -0.0002524852752685547, -0.0002367943525314331, -0.00022110342979431152, -0.00020541250705718994, -0.00018972158432006836, -0.00017403066158294678, -0.0001583397388458252, -0.0001426488161087036, -0.00012695789337158203, -0.00011126697063446045, -9.557604789733887e-05, -7.988512516021729e-05, -6.41942024230957e-05, -4.850327968597412e-05, -3.281235694885254e-05, -1.7121434211730957e-05, -1.430511474609375e-06, 1.4260411262512207e-05, 2.995133399963379e-05, 4.564225673675537e-05, 6.133317947387695e-05, 7.702410221099854e-05, 9.271502494812012e-05, 0.0001084059476852417, 0.00012409687042236328, 0.00013978779315948486, 0.00015547871589660645, 0.00017116963863372803, 0.0001868605613708496, 0.0002025514841079712, 0.00021824240684509277, 0.00023393332958221436, 0.00024962425231933594, 0.0002653151750564575, 0.0002810060977935791, 0.0002966970205307007, 0.00031238794326782227, 0.00032807886600494385, 0.00034376978874206543, 0.000359460711479187, 0.0003751516342163086, 0.0003908425569534302, 0.00040653347969055176, 0.00042222440242767334, 0.0004379153251647949, 0.0004536062479019165, 0.0004692971706390381, 0.00048498809337615967, 0.0005006790161132812]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 4.0, 9.0, 4.0, 12.0, 20.0, 20.0, 23.0, 27.0, 37.0, 40.0, 47.0, 85.0, 86.0, 133.0, 169.0, 224.0, 299.0, 423.0, 792.0, 101271.0, 941869.0, 1157.0, 478.0, 312.0, 248.0, 175.0, 128.0, 89.0, 72.0, 61.0, 52.0, 32.0, 29.0, 21.0, 21.0, 11.0, 14.0, 9.0, 6.0, 5.0, 8.0, 4.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.009796142578125, -0.009491205215454102, -0.009186267852783203, -0.008881330490112305, -0.008576393127441406, -0.008271455764770508, -0.00796651840209961, -0.007661581039428711, -0.0073566436767578125, -0.007051706314086914, -0.006746768951416016, -0.006441831588745117, -0.006136894226074219, -0.00583195686340332, -0.005527019500732422, -0.0052220821380615234, -0.004917144775390625, -0.0046122074127197266, -0.004307270050048828, -0.00400233268737793, -0.0036973953247070312, -0.003392457962036133, -0.0030875205993652344, -0.002782583236694336, -0.0024776458740234375, -0.002172708511352539, -0.0018677711486816406, -0.0015628337860107422, -0.0012578964233398438, -0.0009529590606689453, -0.0006480216979980469, -0.00034308433532714844, -3.814697265625e-05, 0.00026679039001464844, 0.0005717277526855469, 0.0008766651153564453, 0.0011816024780273438, 0.0014865398406982422, 0.0017914772033691406, 0.002096414566040039, 0.0024013519287109375, 0.002706289291381836, 0.0030112266540527344, 0.003316164016723633, 0.0036211013793945312, 0.00392603874206543, 0.004230976104736328, 0.0045359134674072266, 0.004840850830078125, 0.0051457881927490234, 0.005450725555419922, 0.00575566291809082, 0.006060600280761719, 0.006365537643432617, 0.006670475006103516, 0.006975412368774414, 0.0072803497314453125, 0.007585287094116211, 0.00789022445678711, 0.008195161819458008, 0.008500099182128906, 0.008805036544799805, 0.009109973907470703, 0.009414911270141602, 0.0097198486328125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 8.0, 115.0, 569.0, 294.0, 25.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012511188397184014, -0.0012170454720035195, -0.0011829721042886376, -0.0011488987365737557, -0.001114825252443552, -0.0010807518847286701, -0.0010466785170137882, -0.0010126051492989063, -0.0009785317815840244, -0.0009444584138691425, -0.0009103850461542606, -0.0008763116202317178, -0.0008422382525168359, -0.000808164884801954, -0.0007740914588794112, -0.0007400180911645293, -0.0007059447234496474, -0.0006718713557347655, -0.0006377979880198836, -0.0006037245620973408, -0.0005696511943824589, -0.000535577826667577, -0.0005015044007450342, -0.0004674310330301523, -0.0004333576653152704, -0.0003992842976003885, -0.0003652109007816762, -0.0003311375039629638, -0.0002970641362480819, -0.0002629907685332, -0.00022891737171448767, -0.00019484398944769055, -0.00016077060718089342, -0.0001266972249140963, -9.262384264729917e-05, -5.8550460380502045e-05, -2.447707811370492e-05, 9.596304153092206e-06, 4.366968641988933e-05, 7.774306868668646e-05, 0.00011181645095348358, 0.0001458898332202807, 0.00017996321548707783, 0.00021403659775387496, 0.0002481099800206721, 0.000282183347735554, 0.00031625674455426633, 0.0003503301413729787, 0.0003844035090878606, 0.0004184768768027425, 0.00045255027362145483, 0.0004866236704401672, 0.0005206970381550491, 0.000554770405869931, 0.0005888438317924738, 0.0006229171995073557, 0.0006569905672222376, 0.0006910639349371195, 0.0007251373026520014, 0.0007592107285745442, 0.0007932840962894261, 0.000827357464004308, 0.0008614308899268508, 0.0008955042576417327, 0.0009295776253566146]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 4.0, 5.0, 1.0, 4.0, 5.0, 8.0, 13.0, 17.0, 13.0, 18.0, 10.0, 21.0, 25.0, 31.0, 33.0, 31.0, 39.0, 47.0, 44.0, 47.0, 46.0, 52.0, 33.0, 36.0, 40.0, 30.0, 36.0, 33.0, 41.0, 29.0, 27.0, 22.0, 26.0, 21.0, 22.0, 16.0, 15.0, 10.0, 11.0, 12.0, 5.0, 7.0, 4.0, 8.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027191638946533203, -0.0002636248245835304, -0.0002553332597017288, -0.0002470416948199272, -0.0002387501299381256, -0.000230458565056324, -0.0002221670001745224, -0.0002138754352927208, -0.0002055838704109192, -0.00019729230552911758, -0.00018900074064731598, -0.00018070917576551437, -0.00017241761088371277, -0.00016412604600191116, -0.00015583448112010956, -0.00014754291623830795, -0.00013925135135650635, -0.00013095978647470474, -0.00012266822159290314, -0.00011437665671110153, -0.00010608509182929993, -9.779352694749832e-05, -8.950196206569672e-05, -8.121039718389511e-05, -7.29188323020935e-05, -6.46272674202919e-05, -5.6335702538490295e-05, -4.804413765668869e-05, -3.9752572774887085e-05, -3.146100789308548e-05, -2.3169443011283875e-05, -1.487787812948227e-05, -6.586313247680664e-06, 1.7052516341209412e-06, 9.996816515922546e-06, 1.828838139772415e-05, 2.6579946279525757e-05, 3.487151116132736e-05, 4.316307604312897e-05, 5.145464092493057e-05, 5.974620580673218e-05, 6.803777068853378e-05, 7.632933557033539e-05, 8.4620900452137e-05, 9.29124653339386e-05, 0.0001012040302157402, 0.00010949559509754181, 0.00011778715997934341, 0.00012607872486114502, 0.00013437028974294662, 0.00014266185462474823, 0.00015095341950654984, 0.00015924498438835144, 0.00016753654927015305, 0.00017582811415195465, 0.00018411967903375626, 0.00019241124391555786, 0.00020070280879735947, 0.00020899437367916107, 0.00021728593856096268, 0.00022557750344276428, 0.0002338690683245659, 0.0002421606332063675, 0.0002504521980881691, 0.0002587437629699707]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 7.0, 8.0, 12.0, 15.0, 16.0, 12.0, 27.0, 24.0, 18.0, 23.0, 30.0, 31.0, 35.0, 33.0, 35.0, 46.0, 45.0, 36.0, 52.0, 48.0, 47.0, 36.0, 38.0, 35.0, 34.0, 36.0, 32.0, 25.0, 14.0, 23.0, 18.0, 14.0, 16.0, 8.0, 10.0, 13.0, 8.0, 7.0, 3.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.279296875, -5.12109375, -4.962890625, -4.8046875, -4.646484375, -4.48828125, -4.330078125, -4.171875, -4.013671875, -3.85546875, -3.697265625, -3.5390625, -3.380859375, -3.22265625, -3.064453125, -2.90625, -2.748046875, -2.58984375, -2.431640625, -2.2734375, -2.115234375, -1.95703125, -1.798828125, -1.640625, -1.482421875, -1.32421875, -1.166015625, -1.0078125, -0.849609375, -0.69140625, -0.533203125, -0.375, -0.216796875, -0.05859375, 0.099609375, 0.2578125, 0.416015625, 0.57421875, 0.732421875, 0.890625, 1.048828125, 1.20703125, 1.365234375, 1.5234375, 1.681640625, 1.83984375, 1.998046875, 2.15625, 2.314453125, 2.47265625, 2.630859375, 2.7890625, 2.947265625, 3.10546875, 3.263671875, 3.421875, 3.580078125, 3.73828125, 3.896484375, 4.0546875, 4.212890625, 4.37109375, 4.529296875, 4.6875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 12.0, 21.0, 27.0, 29.0, 48.0, 55.0, 87.0, 108.0, 169.0, 230.0, 300.0, 409.0, 571.0, 873.0, 1252.0, 1958.0, 3078.0, 5057.0, 10313.0, 29691.0, 724875.0, 227402.0, 20969.0, 8354.0, 4496.0, 2679.0, 1602.0, 1168.0, 786.0, 548.0, 395.0, 260.0, 193.0, 157.0, 98.0, 72.0, 47.0, 43.0, 33.0, 29.0, 19.0, 12.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.0, -33.93505859375, -32.8701171875, -31.80517578125, -30.740234375, -29.67529296875, -28.6103515625, -27.54541015625, -26.48046875, -25.41552734375, -24.3505859375, -23.28564453125, -22.220703125, -21.15576171875, -20.0908203125, -19.02587890625, -17.9609375, -16.89599609375, -15.8310546875, -14.76611328125, -13.701171875, -12.63623046875, -11.5712890625, -10.50634765625, -9.44140625, -8.37646484375, -7.3115234375, -6.24658203125, -5.181640625, -4.11669921875, -3.0517578125, -1.98681640625, -0.921875, 0.14306640625, 1.2080078125, 2.27294921875, 3.337890625, 4.40283203125, 5.4677734375, 6.53271484375, 7.59765625, 8.66259765625, 9.7275390625, 10.79248046875, 11.857421875, 12.92236328125, 13.9873046875, 15.05224609375, 16.1171875, 17.18212890625, 18.2470703125, 19.31201171875, 20.376953125, 21.44189453125, 22.5068359375, 23.57177734375, 24.63671875, 25.70166015625, 26.7666015625, 27.83154296875, 28.896484375, 29.96142578125, 31.0263671875, 32.09130859375, 33.15625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 10.0, 4.0, 6.0, 4.0, 15.0, 18.0, 21.0, 20.0, 27.0, 25.0, 32.0, 34.0, 36.0, 41.0, 57.0, 66.0, 148.0, 1669.0, 309.0, 100.0, 59.0, 54.0, 43.0, 46.0, 44.0, 29.0, 27.0, 25.0, 20.0, 18.0, 11.0, 19.0, 4.0, 6.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.796875, -22.176513671875, -21.55615234375, -20.935791015625, -20.3154296875, -19.695068359375, -19.07470703125, -18.454345703125, -17.833984375, -17.213623046875, -16.59326171875, -15.972900390625, -15.3525390625, -14.732177734375, -14.11181640625, -13.491455078125, -12.87109375, -12.250732421875, -11.63037109375, -11.010009765625, -10.3896484375, -9.769287109375, -9.14892578125, -8.528564453125, -7.908203125, -7.287841796875, -6.66748046875, -6.047119140625, -5.4267578125, -4.806396484375, -4.18603515625, -3.565673828125, -2.9453125, -2.324951171875, -1.70458984375, -1.084228515625, -0.4638671875, 0.156494140625, 0.77685546875, 1.397216796875, 2.017578125, 2.637939453125, 3.25830078125, 3.878662109375, 4.4990234375, 5.119384765625, 5.73974609375, 6.360107421875, 6.98046875, 7.600830078125, 8.22119140625, 8.841552734375, 9.4619140625, 10.082275390625, 10.70263671875, 11.322998046875, 11.943359375, 12.563720703125, 13.18408203125, 13.804443359375, 14.4248046875, 15.045166015625, 15.66552734375, 16.285888671875, 16.90625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 14.0, 12.0, 21.0, 21.0, 24.0, 20.0, 26.0, 33.0, 47.0, 49.0, 69.0, 153.0, 428.0, 3456.0, 3133949.0, 6329.0, 514.0, 177.0, 78.0, 46.0, 40.0, 28.0, 25.0, 24.0, 25.0, 26.0, 13.0, 13.0, 14.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.625, -66.90234375, -64.1796875, -61.45703125, -58.734375, -56.01171875, -53.2890625, -50.56640625, -47.84375, -45.12109375, -42.3984375, -39.67578125, -36.953125, -34.23046875, -31.5078125, -28.78515625, -26.0625, -23.33984375, -20.6171875, -17.89453125, -15.171875, -12.44921875, -9.7265625, -7.00390625, -4.28125, -1.55859375, 1.1640625, 3.88671875, 6.609375, 9.33203125, 12.0546875, 14.77734375, 17.5, 20.22265625, 22.9453125, 25.66796875, 28.390625, 31.11328125, 33.8359375, 36.55859375, 39.28125, 42.00390625, 44.7265625, 47.44921875, 50.171875, 52.89453125, 55.6171875, 58.33984375, 61.0625, 63.78515625, 66.5078125, 69.23046875, 71.953125, 74.67578125, 77.3984375, 80.12109375, 82.84375, 85.56640625, 88.2890625, 91.01171875, 93.734375, 96.45703125, 99.1796875, 101.90234375, 104.625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 14.0, 248.0, 667.0, 81.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.75102996826172, -85.73372650146484, -82.7164306640625, -79.69912719726562, -76.68183135986328, -73.6645278930664, -70.64723205566406, -67.62992858886719, -64.61262512207031, -61.5953254699707, -58.578025817871094, -55.56072235107422, -52.543426513671875, -49.526123046875, -46.50882339477539, -43.49152374267578, -40.47422790527344, -37.45692825317383, -34.43962860107422, -31.422327041625977, -28.405027389526367, -25.387727737426758, -22.370426177978516, -19.353126525878906, -16.335826873779297, -13.318527221679688, -10.301226615905762, -7.283926010131836, -4.266626358032227, -1.2493267059326172, 1.767974853515625, 4.785274505615234, 7.8025665283203125, 10.819866180419922, 13.837166786193848, 16.854467391967773, 19.871767044067383, 22.889066696166992, 25.906368255615234, 28.923667907714844, 31.940967559814453, 34.95826721191406, 37.97556686401367, 40.99286651611328, 44.010169982910156, 47.0274658203125, 50.044769287109375, 53.062068939208984, 56.079368591308594, 59.0966682434082, 62.11396789550781, 65.13127136230469, 68.14856719970703, 71.1658706665039, 74.18316650390625, 77.20046997070312, 80.2177734375, 83.23507690429688, 86.25237274169922, 89.2696762084961, 92.28697204589844, 95.30427551269531, 98.32157897949219, 101.33887481689453, 104.35617065429688]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 5.0, 6.0, 6.0, 7.0, 11.0, 13.0, 11.0, 7.0, 17.0, 15.0, 19.0, 28.0, 25.0, 29.0, 27.0, 25.0, 24.0, 30.0, 49.0, 28.0, 39.0, 36.0, 35.0, 37.0, 30.0, 38.0, 38.0, 34.0, 40.0, 37.0, 37.0, 24.0, 20.0, 17.0, 16.0, 16.0, 17.0, 13.0, 18.0, 13.0, 11.0, 9.0, 4.0, 10.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.125640869140625, -43.72932434082031, -42.3330078125, -40.93669509887695, -39.54037857055664, -38.14406204223633, -36.74774932861328, -35.35143280029297, -33.955116271972656, -32.558799743652344, -31.162485122680664, -29.766170501708984, -28.369853973388672, -26.97353744506836, -25.57722282409668, -24.180908203125, -22.784591674804688, -21.388275146484375, -19.991960525512695, -18.595645904541016, -17.199329376220703, -15.803013801574707, -14.406698226928711, -13.010382652282715, -11.614067077636719, -10.217751502990723, -8.821435928344727, -7.4251203536987305, -6.028804779052734, -4.632489204406738, -3.236173629760742, -1.839858055114746, -0.4435462951660156, 0.9527692794799805, 2.3490848541259766, 3.7454004287719727, 5.141716003417969, 6.538031578063965, 7.934347152709961, 9.330662727355957, 10.726978302001953, 12.12329387664795, 13.519609451293945, 14.915925025939941, 16.312240600585938, 17.70855712890625, 19.10487174987793, 20.50118637084961, 21.897502899169922, 23.293819427490234, 24.690134048461914, 26.086448669433594, 27.482765197753906, 28.87908172607422, 30.2753963470459, 31.671710968017578, 33.06802749633789, 34.4643440246582, 35.86065673828125, 37.25697326660156, 38.653289794921875, 40.04960632324219, 41.4459228515625, 42.84223556518555, 44.23855209350586]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 9.0, 12.0, 7.0, 14.0, 19.0, 24.0, 16.0, 15.0, 29.0, 18.0, 35.0, 38.0, 34.0, 39.0, 40.0, 36.0, 46.0, 44.0, 54.0, 40.0, 44.0, 41.0, 47.0, 38.0, 25.0, 43.0, 16.0, 22.0, 34.0, 17.0, 12.0, 13.0, 11.0, 11.0, 13.0, 9.0, 7.0, 4.0, 6.0, 3.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.88671875, -5.713134765625, -5.53955078125, -5.365966796875, -5.1923828125, -5.018798828125, -4.84521484375, -4.671630859375, -4.498046875, -4.324462890625, -4.15087890625, -3.977294921875, -3.8037109375, -3.630126953125, -3.45654296875, -3.282958984375, -3.109375, -2.935791015625, -2.76220703125, -2.588623046875, -2.4150390625, -2.241455078125, -2.06787109375, -1.894287109375, -1.720703125, -1.547119140625, -1.37353515625, -1.199951171875, -1.0263671875, -0.852783203125, -0.67919921875, -0.505615234375, -0.33203125, -0.158447265625, 0.01513671875, 0.188720703125, 0.3623046875, 0.535888671875, 0.70947265625, 0.883056640625, 1.056640625, 1.230224609375, 1.40380859375, 1.577392578125, 1.7509765625, 1.924560546875, 2.09814453125, 2.271728515625, 2.4453125, 2.618896484375, 2.79248046875, 2.966064453125, 3.1396484375, 3.313232421875, 3.48681640625, 3.660400390625, 3.833984375, 4.007568359375, 4.18115234375, 4.354736328125, 4.5283203125, 4.701904296875, 4.87548828125, 5.049072265625, 5.22265625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 12.0, 23.0, 24.0, 23.0, 51.0, 81.0, 100.0, 160.0, 253.0, 430.0, 732.0, 1433.0, 2913.0, 6396.0, 16299.0, 68876.0, 1748559.0, 2235883.0, 79695.0, 18215.0, 7103.0, 3204.0, 1657.0, 820.0, 471.0, 259.0, 185.0, 127.0, 76.0, 55.0, 27.0, 23.0, 21.0, 24.0, 9.0, 4.0, 10.0, 11.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.28125, -30.2734375, -29.265625, -28.2578125, -27.25, -26.2421875, -25.234375, -24.2265625, -23.21875, -22.2109375, -21.203125, -20.1953125, -19.1875, -18.1796875, -17.171875, -16.1640625, -15.15625, -14.1484375, -13.140625, -12.1328125, -11.125, -10.1171875, -9.109375, -8.1015625, -7.09375, -6.0859375, -5.078125, -4.0703125, -3.0625, -2.0546875, -1.046875, -0.0390625, 0.96875, 1.9765625, 2.984375, 3.9921875, 5.0, 6.0078125, 7.015625, 8.0234375, 9.03125, 10.0390625, 11.046875, 12.0546875, 13.0625, 14.0703125, 15.078125, 16.0859375, 17.09375, 18.1015625, 19.109375, 20.1171875, 21.125, 22.1328125, 23.140625, 24.1484375, 25.15625, 26.1640625, 27.171875, 28.1796875, 29.1875, 30.1953125, 31.203125, 32.2109375, 33.21875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 15.0, 28.0, 39.0, 45.0, 72.0, 161.0, 195.0, 372.0, 642.0, 772.0, 670.0, 411.0, 248.0, 155.0, 73.0, 65.0, 39.0, 24.0, 8.0, 11.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.8125, -26.68115234375, -25.5498046875, -24.41845703125, -23.287109375, -22.15576171875, -21.0244140625, -19.89306640625, -18.76171875, -17.63037109375, -16.4990234375, -15.36767578125, -14.236328125, -13.10498046875, -11.9736328125, -10.84228515625, -9.7109375, -8.57958984375, -7.4482421875, -6.31689453125, -5.185546875, -4.05419921875, -2.9228515625, -1.79150390625, -0.66015625, 0.47119140625, 1.6025390625, 2.73388671875, 3.865234375, 4.99658203125, 6.1279296875, 7.25927734375, 8.390625, 9.52197265625, 10.6533203125, 11.78466796875, 12.916015625, 14.04736328125, 15.1787109375, 16.31005859375, 17.44140625, 18.57275390625, 19.7041015625, 20.83544921875, 21.966796875, 23.09814453125, 24.2294921875, 25.36083984375, 26.4921875, 27.62353515625, 28.7548828125, 29.88623046875, 31.017578125, 32.14892578125, 33.2802734375, 34.41162109375, 35.54296875, 36.67431640625, 37.8056640625, 38.93701171875, 40.068359375, 41.19970703125, 42.3310546875, 43.46240234375, 44.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 6.0, 14.0, 25.0, 38.0, 77.0, 112.0, 225.0, 427.0, 1640.0, 2008467.0, 2180520.0, 1764.0, 424.0, 193.0, 107.0, 79.0, 39.0, 31.0, 28.0, 21.0, 12.0, 3.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-218.125, -213.16796875, -208.2109375, -203.25390625, -198.296875, -193.33984375, -188.3828125, -183.42578125, -178.46875, -173.51171875, -168.5546875, -163.59765625, -158.640625, -153.68359375, -148.7265625, -143.76953125, -138.8125, -133.85546875, -128.8984375, -123.94140625, -118.984375, -114.02734375, -109.0703125, -104.11328125, -99.15625, -94.19921875, -89.2421875, -84.28515625, -79.328125, -74.37109375, -69.4140625, -64.45703125, -59.5, -54.54296875, -49.5859375, -44.62890625, -39.671875, -34.71484375, -29.7578125, -24.80078125, -19.84375, -14.88671875, -9.9296875, -4.97265625, -0.015625, 4.94140625, 9.8984375, 14.85546875, 19.8125, 24.76953125, 29.7265625, 34.68359375, 39.640625, 44.59765625, 49.5546875, 54.51171875, 59.46875, 64.42578125, 69.3828125, 74.33984375, 79.296875, 84.25390625, 89.2109375, 94.16796875, 99.125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 17.0, 186.0, 595.0, 201.0, 17.0, 0.0, 1.0], "bins": [-532.6876220703125, -523.7340087890625, -514.7804565429688, -505.82684326171875, -496.87322998046875, -487.9196472167969, -478.9660339355469, -470.012451171875, -461.058837890625, -452.1052551269531, -443.1516418457031, -434.19805908203125, -425.24444580078125, -416.2908630371094, -407.3372497558594, -398.3836669921875, -389.4300537109375, -380.4764709472656, -371.5228576660156, -362.56927490234375, -353.61566162109375, -344.6620788574219, -335.7084655761719, -326.7548828125, -317.8013000488281, -308.84771728515625, -299.89410400390625, -290.9405212402344, -281.9869079589844, -273.0333251953125, -264.0797119140625, -255.12612915039062, -246.17251586914062, -237.2189178466797, -228.26531982421875, -219.3117218017578, -210.35812377929688, -201.40452575683594, -192.450927734375, -183.49734497070312, -174.54373168945312, -165.5901336669922, -156.63653564453125, -147.6829376220703, -138.72933959960938, -129.77574157714844, -120.82215118408203, -111.8685531616211, -102.91496276855469, -93.96136474609375, -85.00776672363281, -76.05416870117188, -67.10057067871094, -58.146976470947266, -49.193382263183594, -40.239784240722656, -31.28618621826172, -22.33258819580078, -13.378992080688477, -4.425395965576172, 4.528202056884766, 13.481800079345703, 22.435394287109375, 31.388992309570312, 40.34259033203125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 5.0, 3.0, 5.0, 4.0, 5.0, 7.0, 13.0, 13.0, 15.0, 18.0, 10.0, 29.0, 18.0, 24.0, 24.0, 33.0, 27.0, 41.0, 32.0, 37.0, 33.0, 43.0, 29.0, 29.0, 45.0, 36.0, 43.0, 41.0, 33.0, 28.0, 26.0, 26.0, 28.0, 18.0, 18.0, 25.0, 20.0, 17.0, 23.0, 14.0, 8.0, 14.0, 8.0, 7.0, 9.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-66.51805877685547, -64.4088134765625, -62.29957580566406, -60.19033432006836, -58.081092834472656, -55.97184753417969, -53.862606048583984, -51.75336456298828, -49.64412307739258, -47.534881591796875, -45.42564010620117, -43.31639862060547, -41.2071533203125, -39.09791564941406, -36.988670349121094, -34.87942886352539, -32.77018737792969, -30.660945892333984, -28.55170440673828, -26.442461013793945, -24.333219528198242, -22.22397804260254, -20.114734649658203, -18.0054931640625, -15.896251678466797, -13.787010192871094, -11.677767753601074, -9.568525314331055, -7.459283828735352, -5.350042343139648, -3.240799903869629, -1.1315574645996094, 0.977691650390625, 3.0869336128234863, 5.196175575256348, 7.305417537689209, 9.41465950012207, 11.523900985717773, 13.633143424987793, 15.742385864257812, 17.851627349853516, 19.96086883544922, 22.070110321044922, 24.179353713989258, 26.28859519958496, 28.397836685180664, 30.507080078125, 32.6163215637207, 34.725563049316406, 36.83480453491211, 38.94404602050781, 41.053287506103516, 43.16252899169922, 45.27177429199219, 47.38101577758789, 49.490257263183594, 51.5994987487793, 53.708740234375, 55.8179817199707, 57.927223205566406, 60.036468505859375, 62.14570617675781, 64.25495147705078, 66.36419677734375, 68.47343444824219]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 8.0, 10.0, 16.0, 8.0, 8.0, 16.0, 14.0, 19.0, 24.0, 29.0, 30.0, 24.0, 25.0, 35.0, 40.0, 41.0, 46.0, 29.0, 53.0, 52.0, 38.0, 50.0, 47.0, 59.0, 25.0, 33.0, 37.0, 25.0, 25.0, 26.0, 16.0, 15.0, 15.0, 15.0, 6.0, 12.0, 10.0, 5.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9453125, -6.758056640625, -6.57080078125, -6.383544921875, -6.1962890625, -6.009033203125, -5.82177734375, -5.634521484375, -5.447265625, -5.260009765625, -5.07275390625, -4.885498046875, -4.6982421875, -4.510986328125, -4.32373046875, -4.136474609375, -3.94921875, -3.761962890625, -3.57470703125, -3.387451171875, -3.2001953125, -3.012939453125, -2.82568359375, -2.638427734375, -2.451171875, -2.263916015625, -2.07666015625, -1.889404296875, -1.7021484375, -1.514892578125, -1.32763671875, -1.140380859375, -0.953125, -0.765869140625, -0.57861328125, -0.391357421875, -0.2041015625, -0.016845703125, 0.17041015625, 0.357666015625, 0.544921875, 0.732177734375, 0.91943359375, 1.106689453125, 1.2939453125, 1.481201171875, 1.66845703125, 1.855712890625, 2.04296875, 2.230224609375, 2.41748046875, 2.604736328125, 2.7919921875, 2.979248046875, 3.16650390625, 3.353759765625, 3.541015625, 3.728271484375, 3.91552734375, 4.102783203125, 4.2900390625, 4.477294921875, 4.66455078125, 4.851806640625, 5.0390625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 3.0, 19.0, 35.0, 45.0, 56.0, 98.0, 160.0, 253.0, 442.0, 803.0, 1351.0, 2254.0, 3679.0, 5837.0, 9803.0, 15974.0, 27142.0, 47222.0, 89102.0, 198968.0, 362060.0, 129223.0, 65178.0, 35904.0, 20958.0, 12449.0, 7626.0, 4725.0, 2914.0, 1687.0, 1103.0, 596.0, 348.0, 221.0, 90.0, 81.0, 49.0, 30.0, 19.0, 19.0, 7.0, 3.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.541015625, -1.49603271484375, -1.4510498046875, -1.40606689453125, -1.361083984375, -1.31610107421875, -1.2711181640625, -1.22613525390625, -1.18115234375, -1.13616943359375, -1.0911865234375, -1.04620361328125, -1.001220703125, -0.95623779296875, -0.9112548828125, -0.86627197265625, -0.8212890625, -0.77630615234375, -0.7313232421875, -0.68634033203125, -0.641357421875, -0.59637451171875, -0.5513916015625, -0.50640869140625, -0.46142578125, -0.41644287109375, -0.3714599609375, -0.32647705078125, -0.281494140625, -0.23651123046875, -0.1915283203125, -0.14654541015625, -0.1015625, -0.05657958984375, -0.0115966796875, 0.03338623046875, 0.078369140625, 0.12335205078125, 0.1683349609375, 0.21331787109375, 0.25830078125, 0.30328369140625, 0.3482666015625, 0.39324951171875, 0.438232421875, 0.48321533203125, 0.5281982421875, 0.57318115234375, 0.6181640625, 0.66314697265625, 0.7081298828125, 0.75311279296875, 0.798095703125, 0.84307861328125, 0.8880615234375, 0.93304443359375, 0.97802734375, 1.02301025390625, 1.0679931640625, 1.11297607421875, 1.157958984375, 1.20294189453125, 1.2479248046875, 1.29290771484375, 1.337890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 9.0, 7.0, 11.0, 10.0, 12.0, 13.0, 15.0, 17.0, 19.0, 27.0, 22.0, 27.0, 29.0, 32.0, 38.0, 31.0, 28.0, 48.0, 41.0, 1072.0, 41.0, 31.0, 41.0, 39.0, 39.0, 32.0, 33.0, 41.0, 32.0, 29.0, 19.0, 19.0, 23.0, 20.0, 14.0, 14.0, 11.0, 9.0, 7.0, 1.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.72265625, -3.608856201171875, -3.49505615234375, -3.381256103515625, -3.2674560546875, -3.153656005859375, -3.03985595703125, -2.926055908203125, -2.812255859375, -2.698455810546875, -2.58465576171875, -2.470855712890625, -2.3570556640625, -2.243255615234375, -2.12945556640625, -2.015655517578125, -1.90185546875, -1.788055419921875, -1.67425537109375, -1.560455322265625, -1.4466552734375, -1.332855224609375, -1.21905517578125, -1.105255126953125, -0.991455078125, -0.877655029296875, -0.76385498046875, -0.650054931640625, -0.5362548828125, -0.422454833984375, -0.30865478515625, -0.194854736328125, -0.0810546875, 0.032745361328125, 0.14654541015625, 0.260345458984375, 0.3741455078125, 0.487945556640625, 0.60174560546875, 0.715545654296875, 0.829345703125, 0.943145751953125, 1.05694580078125, 1.170745849609375, 1.2845458984375, 1.398345947265625, 1.51214599609375, 1.625946044921875, 1.73974609375, 1.853546142578125, 1.96734619140625, 2.081146240234375, 2.1949462890625, 2.308746337890625, 2.42254638671875, 2.536346435546875, 2.650146484375, 2.763946533203125, 2.87774658203125, 2.991546630859375, 3.1053466796875, 3.219146728515625, 3.33294677734375, 3.446746826171875, 3.560546875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 10.0, 13.0, 13.0, 19.0, 39.0, 54.0, 99.0, 142.0, 214.0, 367.0, 580.0, 887.0, 1473.0, 2327.0, 3742.0, 5752.0, 9002.0, 14583.0, 23968.0, 39298.0, 67321.0, 126158.0, 1391643.0, 191699.0, 88924.0, 49885.0, 29973.0, 18106.0, 11374.0, 7157.0, 4540.0, 2854.0, 1834.0, 1126.0, 740.0, 471.0, 268.0, 168.0, 121.0, 75.0, 43.0, 29.0, 14.0, 14.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3037109375, -1.263885498046875, -1.22406005859375, -1.184234619140625, -1.1444091796875, -1.104583740234375, -1.06475830078125, -1.024932861328125, -0.985107421875, -0.945281982421875, -0.90545654296875, -0.865631103515625, -0.8258056640625, -0.785980224609375, -0.74615478515625, -0.706329345703125, -0.66650390625, -0.626678466796875, -0.58685302734375, -0.547027587890625, -0.5072021484375, -0.467376708984375, -0.42755126953125, -0.387725830078125, -0.347900390625, -0.308074951171875, -0.26824951171875, -0.228424072265625, -0.1885986328125, -0.148773193359375, -0.10894775390625, -0.069122314453125, -0.029296875, 0.010528564453125, 0.05035400390625, 0.090179443359375, 0.1300048828125, 0.169830322265625, 0.20965576171875, 0.249481201171875, 0.289306640625, 0.329132080078125, 0.36895751953125, 0.408782958984375, 0.4486083984375, 0.488433837890625, 0.52825927734375, 0.568084716796875, 0.60791015625, 0.647735595703125, 0.68756103515625, 0.727386474609375, 0.7672119140625, 0.807037353515625, 0.84686279296875, 0.886688232421875, 0.926513671875, 0.966339111328125, 1.00616455078125, 1.045989990234375, 1.0858154296875, 1.125640869140625, 1.16546630859375, 1.205291748046875, 1.2451171875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 6.0, 9.0, 20.0, 22.0, 42.0, 44.0, 67.0, 111.0, 158.0, 135.0, 121.0, 77.0, 50.0, 38.0, 15.0, 20.0, 11.0, 7.0, 8.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009045600891113281, -0.0008700713515281677, -0.0008355826139450073, -0.0008010938763618469, -0.0007666051387786865, -0.0007321164011955261, -0.0006976276636123657, -0.0006631389260292053, -0.0006286501884460449, -0.0005941614508628845, -0.0005596727132797241, -0.0005251839756965637, -0.0004906952381134033, -0.0004562065005302429, -0.0004217177629470825, -0.0003872290253639221, -0.0003527402877807617, -0.0003182515501976013, -0.0002837628126144409, -0.0002492740750312805, -0.00021478533744812012, -0.00018029659986495972, -0.00014580786228179932, -0.00011131912469863892, -7.683038711547852e-05, -4.2341649532318115e-05, -7.852911949157715e-06, 2.6635825634002686e-05, 6.112456321716309e-05, 9.561330080032349e-05, 0.0001301020383834839, 0.0001645907759666443, 0.0001990795135498047, 0.0002335682511329651, 0.0002680569887161255, 0.0003025457262992859, 0.0003370344638824463, 0.0003715232014656067, 0.0004060119390487671, 0.0004405006766319275, 0.0004749894142150879, 0.0005094781517982483, 0.0005439668893814087, 0.0005784556269645691, 0.0006129443645477295, 0.0006474331021308899, 0.0006819218397140503, 0.0007164105772972107, 0.0007508993148803711, 0.0007853880524635315, 0.0008198767900466919, 0.0008543655276298523, 0.0008888542652130127, 0.0009233430027961731, 0.0009578317403793335, 0.000992320477962494, 0.0010268092155456543, 0.0010612979531288147, 0.001095786690711975, 0.0011302754282951355, 0.001164764165878296, 0.0011992529034614563, 0.0012337416410446167, 0.001268230378627777, 0.0013027191162109375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 4.0, 5.0, 11.0, 13.0, 28.0, 36.0, 44.0, 81.0, 121.0, 264.0, 726.0, 1042164.0, 4170.0, 380.0, 183.0, 95.0, 51.0, 40.0, 32.0, 24.0, 18.0, 10.0, 4.0, 6.0, 6.0, 8.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0294189453125, -0.02863931655883789, -0.02785968780517578, -0.027080059051513672, -0.026300430297851562, -0.025520801544189453, -0.024741172790527344, -0.023961544036865234, -0.023181915283203125, -0.022402286529541016, -0.021622657775878906, -0.020843029022216797, -0.020063400268554688, -0.019283771514892578, -0.01850414276123047, -0.01772451400756836, -0.01694488525390625, -0.01616525650024414, -0.015385627746582031, -0.014605998992919922, -0.013826370239257812, -0.013046741485595703, -0.012267112731933594, -0.011487483978271484, -0.010707855224609375, -0.009928226470947266, -0.009148597717285156, -0.008368968963623047, -0.0075893402099609375, -0.006809711456298828, -0.006030082702636719, -0.005250453948974609, -0.0044708251953125, -0.0036911964416503906, -0.0029115676879882812, -0.002131938934326172, -0.0013523101806640625, -0.0005726814270019531, 0.00020694732666015625, 0.0009865760803222656, 0.001766204833984375, 0.0025458335876464844, 0.0033254623413085938, 0.004105091094970703, 0.0048847198486328125, 0.005664348602294922, 0.006443977355957031, 0.007223606109619141, 0.00800323486328125, 0.00878286361694336, 0.009562492370605469, 0.010342121124267578, 0.011121749877929688, 0.011901378631591797, 0.012681007385253906, 0.013460636138916016, 0.014240264892578125, 0.015019893646240234, 0.015799522399902344, 0.016579151153564453, 0.017358779907226562, 0.018138408660888672, 0.01891803741455078, 0.01969766616821289, 0.020477294921875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 131.0, 854.0, 30.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002152507659047842, -0.0001232009381055832, -3.115111030638218e-05, 6.089871749281883e-05, 0.00015294854529201984, 0.00024499837309122086, 0.00033704820089042187, 0.0004290980286896229, 0.0005211478564888239, 0.0006131976842880249, 0.0007052475120872259, 0.0007972973398864269, 0.0008893471676856279, 0.000981396995484829, 0.00107344682328403, 0.001165496651083231, 0.001257546478882432, 0.001349596306681633, 0.001441646134480834, 0.001533695962280035, 0.001625745790079236, 0.001717795617878437, 0.001809845445677638, 0.001901895273476839, 0.00199394510127604, 0.002085994929075241, 0.002178044756874442, 0.002270094584673643, 0.002362144412472844, 0.002454194240272045, 0.002546244068071246, 0.002638293895870447, 0.002730343956500292, 0.002822393784299493, 0.002914443612098694, 0.003006493439897895, 0.003098543267697096, 0.003190593095496297, 0.003282642923295498, 0.003374692751094699, 0.0034667425788939, 0.003558792406693101, 0.003650842234492302, 0.003742892062291503, 0.003834941890090704, 0.003926991485059261, 0.004019041545689106, 0.004111091606318951, 0.004203141201287508, 0.004295190796256065, 0.00438724085688591, 0.004479290917515755, 0.004571340512484312, 0.004663390107452869, 0.004755440168082714, 0.004847490228712559, 0.004939539823681116, 0.0050315894186496735, 0.005123639479279518, 0.005215689539909363, 0.00530773913487792, 0.0053997887298464775, 0.005491838790476322, 0.005583888851106167, 0.005675938446074724]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 7.0, 4.0, 7.0, 2.0, 12.0, 5.0, 12.0, 14.0, 14.0, 10.0, 14.0, 31.0, 26.0, 32.0, 31.0, 26.0, 41.0, 29.0, 31.0, 34.0, 44.0, 44.0, 33.0, 36.0, 46.0, 29.0, 38.0, 36.0, 35.0, 29.0, 23.0, 27.0, 25.0, 16.0, 22.0, 13.0, 17.0, 18.0, 12.0, 11.0, 8.0, 9.0, 13.0, 3.0, 3.0, 3.0, 2.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00031554698944091797, -0.0003055613487958908, -0.00029557570815086365, -0.0002855900675058365, -0.0002756044268608093, -0.00026561878621578217, -0.000255633145570755, -0.00024564750492572784, -0.00023566186428070068, -0.00022567622363567352, -0.00021569058299064636, -0.0002057049423456192, -0.00019571930170059204, -0.00018573366105556488, -0.00017574802041053772, -0.00016576237976551056, -0.0001557767391204834, -0.00014579109847545624, -0.00013580545783042908, -0.00012581981718540192, -0.00011583417654037476, -0.0001058485358953476, -9.586289525032043e-05, -8.587725460529327e-05, -7.589161396026611e-05, -6.590597331523895e-05, -5.592033267021179e-05, -4.593469202518463e-05, -3.594905138015747e-05, -2.596341073513031e-05, -1.597777009010315e-05, -5.992129445075989e-06, 3.993511199951172e-06, 1.3979151844978333e-05, 2.3964792490005493e-05, 3.3950433135032654e-05, 4.3936073780059814e-05, 5.3921714425086975e-05, 6.390735507011414e-05, 7.38929957151413e-05, 8.387863636016846e-05, 9.386427700519562e-05, 0.00010384991765022278, 0.00011383555829524994, 0.0001238211989402771, 0.00013380683958530426, 0.00014379248023033142, 0.00015377812087535858, 0.00016376376152038574, 0.0001737494021654129, 0.00018373504281044006, 0.00019372068345546722, 0.00020370632410049438, 0.00021369196474552155, 0.0002236776053905487, 0.00023366324603557587, 0.00024364888668060303, 0.0002536345273256302, 0.00026362016797065735, 0.0002736058086156845, 0.00028359144926071167, 0.00029357708990573883, 0.000303562730550766, 0.00031354837119579315, 0.0003235340118408203]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 8.0, 10.0, 16.0, 8.0, 8.0, 16.0, 14.0, 19.0, 24.0, 29.0, 30.0, 24.0, 25.0, 35.0, 40.0, 41.0, 46.0, 29.0, 53.0, 52.0, 38.0, 50.0, 47.0, 59.0, 25.0, 33.0, 37.0, 25.0, 25.0, 26.0, 16.0, 15.0, 15.0, 15.0, 6.0, 12.0, 10.0, 5.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9453125, -6.758056640625, -6.57080078125, -6.383544921875, -6.1962890625, -6.009033203125, -5.82177734375, -5.634521484375, -5.447265625, -5.260009765625, -5.07275390625, -4.885498046875, -4.6982421875, -4.510986328125, -4.32373046875, -4.136474609375, -3.94921875, -3.761962890625, -3.57470703125, -3.387451171875, -3.2001953125, -3.012939453125, -2.82568359375, -2.638427734375, -2.451171875, -2.263916015625, -2.07666015625, -1.889404296875, -1.7021484375, -1.514892578125, -1.32763671875, -1.140380859375, -0.953125, -0.765869140625, -0.57861328125, -0.391357421875, -0.2041015625, -0.016845703125, 0.17041015625, 0.357666015625, 0.544921875, 0.732177734375, 0.91943359375, 1.106689453125, 1.2939453125, 1.481201171875, 1.66845703125, 1.855712890625, 2.04296875, 2.230224609375, 2.41748046875, 2.604736328125, 2.7919921875, 2.979248046875, 3.16650390625, 3.353759765625, 3.541015625, 3.728271484375, 3.91552734375, 4.102783203125, 4.2900390625, 4.477294921875, 4.66455078125, 4.851806640625, 5.0390625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 15.0, 19.0, 18.0, 37.0, 38.0, 50.0, 88.0, 125.0, 135.0, 234.0, 338.0, 526.0, 993.0, 1833.0, 4162.0, 11821.0, 39580.0, 165749.0, 539543.0, 210350.0, 48888.0, 14177.0, 4932.0, 2080.0, 1059.0, 574.0, 382.0, 229.0, 178.0, 123.0, 64.0, 54.0, 52.0, 39.0, 20.0, 20.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2734375, -6.08087158203125, -5.8883056640625, -5.69573974609375, -5.503173828125, -5.31060791015625, -5.1180419921875, -4.92547607421875, -4.73291015625, -4.54034423828125, -4.3477783203125, -4.15521240234375, -3.962646484375, -3.77008056640625, -3.5775146484375, -3.38494873046875, -3.1923828125, -2.99981689453125, -2.8072509765625, -2.61468505859375, -2.422119140625, -2.22955322265625, -2.0369873046875, -1.84442138671875, -1.65185546875, -1.45928955078125, -1.2667236328125, -1.07415771484375, -0.881591796875, -0.68902587890625, -0.4964599609375, -0.30389404296875, -0.111328125, 0.08123779296875, 0.2738037109375, 0.46636962890625, 0.658935546875, 0.85150146484375, 1.0440673828125, 1.23663330078125, 1.42919921875, 1.62176513671875, 1.8143310546875, 2.00689697265625, 2.199462890625, 2.39202880859375, 2.5845947265625, 2.77716064453125, 2.9697265625, 3.16229248046875, 3.3548583984375, 3.54742431640625, 3.739990234375, 3.93255615234375, 4.1251220703125, 4.31768798828125, 4.51025390625, 4.70281982421875, 4.8953857421875, 5.08795166015625, 5.280517578125, 5.47308349609375, 5.6656494140625, 5.85821533203125, 6.05078125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 0.0, 5.0, 6.0, 3.0, 12.0, 9.0, 17.0, 6.0, 10.0, 15.0, 17.0, 21.0, 17.0, 37.0, 36.0, 43.0, 42.0, 40.0, 56.0, 82.0, 256.0, 1720.0, 112.0, 63.0, 39.0, 43.0, 43.0, 32.0, 51.0, 32.0, 28.0, 23.0, 24.0, 19.0, 15.0, 9.0, 14.0, 9.0, 5.0, 11.0, 9.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.03125, -19.409423828125, -18.78759765625, -18.165771484375, -17.5439453125, -16.922119140625, -16.30029296875, -15.678466796875, -15.056640625, -14.434814453125, -13.81298828125, -13.191162109375, -12.5693359375, -11.947509765625, -11.32568359375, -10.703857421875, -10.08203125, -9.460205078125, -8.83837890625, -8.216552734375, -7.5947265625, -6.972900390625, -6.35107421875, -5.729248046875, -5.107421875, -4.485595703125, -3.86376953125, -3.241943359375, -2.6201171875, -1.998291015625, -1.37646484375, -0.754638671875, -0.1328125, 0.489013671875, 1.11083984375, 1.732666015625, 2.3544921875, 2.976318359375, 3.59814453125, 4.219970703125, 4.841796875, 5.463623046875, 6.08544921875, 6.707275390625, 7.3291015625, 7.950927734375, 8.57275390625, 9.194580078125, 9.81640625, 10.438232421875, 11.06005859375, 11.681884765625, 12.3037109375, 12.925537109375, 13.54736328125, 14.169189453125, 14.791015625, 15.412841796875, 16.03466796875, 16.656494140625, 17.2783203125, 17.900146484375, 18.52197265625, 19.143798828125, 19.765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 11.0, 12.0, 6.0, 10.0, 6.0, 15.0, 13.0, 22.0, 26.0, 26.0, 28.0, 50.0, 61.0, 61.0, 88.0, 165.0, 334.0, 1033.0, 6514.0, 3075329.0, 59019.0, 1731.0, 528.0, 171.0, 104.0, 77.0, 51.0, 47.0, 31.0, 28.0, 10.0, 17.0, 7.0, 7.0, 16.0, 10.0, 9.0, 6.0, 6.0, 4.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-45.375, -43.9443359375, -42.513671875, -41.0830078125, -39.65234375, -38.2216796875, -36.791015625, -35.3603515625, -33.9296875, -32.4990234375, -31.068359375, -29.6376953125, -28.20703125, -26.7763671875, -25.345703125, -23.9150390625, -22.484375, -21.0537109375, -19.623046875, -18.1923828125, -16.76171875, -15.3310546875, -13.900390625, -12.4697265625, -11.0390625, -9.6083984375, -8.177734375, -6.7470703125, -5.31640625, -3.8857421875, -2.455078125, -1.0244140625, 0.40625, 1.8369140625, 3.267578125, 4.6982421875, 6.12890625, 7.5595703125, 8.990234375, 10.4208984375, 11.8515625, 13.2822265625, 14.712890625, 16.1435546875, 17.57421875, 19.0048828125, 20.435546875, 21.8662109375, 23.296875, 24.7275390625, 26.158203125, 27.5888671875, 29.01953125, 30.4501953125, 31.880859375, 33.3115234375, 34.7421875, 36.1728515625, 37.603515625, 39.0341796875, 40.46484375, 41.8955078125, 43.326171875, 44.7568359375, 46.1875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 108.0, 879.0, 27.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.258917808532715, -6.570531368255615, -1.8821449279785156, 2.806241035461426, 7.494627952575684, 12.183014869689941, 16.87139892578125, 21.55978775024414, 26.248172760009766, 30.936559677124023, 35.62494659423828, 40.313331604003906, 45.00171661376953, 49.69010543823242, 54.37849044799805, 59.06687927246094, 63.75526428222656, 68.44364929199219, 73.13203430175781, 77.82041931152344, 82.5088119506836, 87.19719696044922, 91.88558197021484, 96.573974609375, 101.26235961914062, 105.95074462890625, 110.63912963867188, 115.3275146484375, 120.01590728759766, 124.70429229736328, 129.39266967773438, 134.08106994628906, 138.7694549560547, 143.4578399658203, 148.14622497558594, 152.83460998535156, 157.5229949951172, 162.21139526367188, 166.8997802734375, 171.58816528320312, 176.27655029296875, 180.96493530273438, 185.6533203125, 190.34170532226562, 195.03009033203125, 199.71847534179688, 204.4068603515625, 209.0952606201172, 213.78363037109375, 218.47201538085938, 223.160400390625, 227.84878540039062, 232.53717041015625, 237.22555541992188, 241.9139404296875, 246.6023406982422, 251.2907257080078, 255.97911071777344, 260.6675109863281, 265.35589599609375, 270.0442810058594, 274.732666015625, 279.4210510253906, 284.10943603515625, 288.7978210449219]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 6.0, 8.0, 14.0, 19.0, 11.0, 18.0, 17.0, 24.0, 9.0, 29.0, 36.0, 39.0, 40.0, 34.0, 35.0, 32.0, 33.0, 47.0, 43.0, 34.0, 26.0, 46.0, 38.0, 32.0, 42.0, 38.0, 33.0, 27.0, 28.0, 18.0, 24.0, 18.0, 17.0, 13.0, 13.0, 8.0, 7.0, 6.0, 7.0, 4.0, 7.0, 2.0, 2.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-64.68431854248047, -62.79274368286133, -60.90116882324219, -59.00959777832031, -57.11802291870117, -55.22644805908203, -53.33487319946289, -51.44329833984375, -49.551727294921875, -47.660152435302734, -45.768577575683594, -43.87700653076172, -41.98543167114258, -40.09385681152344, -38.2022819519043, -36.310707092285156, -34.419132232666016, -32.527557373046875, -30.635984420776367, -28.744409561157227, -26.85283660888672, -24.961261749267578, -23.069686889648438, -21.178112030029297, -19.28653907775879, -17.39496421813965, -15.50339126586914, -13.61181640625, -11.720242500305176, -9.828668594360352, -7.937093734741211, -6.045519828796387, -4.1539459228515625, -2.262371778488159, -0.37079763412475586, 1.5207767486572266, 3.412350654602051, 5.303924560546875, 7.195499420166016, 9.08707332611084, 10.978647232055664, 12.870221138000488, 14.761795043945312, 16.653369903564453, 18.544944763183594, 20.4365177154541, 22.328092575073242, 24.21966552734375, 26.11124038696289, 28.00281524658203, 29.89438819885254, 31.78596305847168, 33.67753601074219, 35.56911087036133, 37.46068572998047, 39.35226058959961, 41.24383544921875, 43.13541030883789, 45.02698516845703, 46.918556213378906, 48.81013107299805, 50.70170593261719, 52.59328079223633, 54.48485565185547, 56.376426696777344]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 6.0, 19.0, 11.0, 11.0, 15.0, 18.0, 22.0, 19.0, 31.0, 23.0, 27.0, 36.0, 38.0, 37.0, 39.0, 30.0, 49.0, 47.0, 55.0, 41.0, 52.0, 44.0, 42.0, 39.0, 31.0, 29.0, 26.0, 29.0, 21.0, 19.0, 10.0, 15.0, 14.0, 13.0, 10.0, 5.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.078125, -6.88555908203125, -6.6929931640625, -6.50042724609375, -6.307861328125, -6.11529541015625, -5.9227294921875, -5.73016357421875, -5.53759765625, -5.34503173828125, -5.1524658203125, -4.95989990234375, -4.767333984375, -4.57476806640625, -4.3822021484375, -4.18963623046875, -3.9970703125, -3.80450439453125, -3.6119384765625, -3.41937255859375, -3.226806640625, -3.03424072265625, -2.8416748046875, -2.64910888671875, -2.45654296875, -2.26397705078125, -2.0714111328125, -1.87884521484375, -1.686279296875, -1.49371337890625, -1.3011474609375, -1.10858154296875, -0.916015625, -0.72344970703125, -0.5308837890625, -0.33831787109375, -0.145751953125, 0.04681396484375, 0.2393798828125, 0.43194580078125, 0.62451171875, 0.81707763671875, 1.0096435546875, 1.20220947265625, 1.394775390625, 1.58734130859375, 1.7799072265625, 1.97247314453125, 2.1650390625, 2.35760498046875, 2.5501708984375, 2.74273681640625, 2.935302734375, 3.12786865234375, 3.3204345703125, 3.51300048828125, 3.70556640625, 3.89813232421875, 4.0906982421875, 4.28326416015625, 4.475830078125, 4.66839599609375, 4.8609619140625, 5.05352783203125, 5.24609375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 13.0, 7.0, 8.0, 17.0, 14.0, 19.0, 17.0, 33.0, 39.0, 50.0, 66.0, 82.0, 146.0, 240.0, 480.0, 1290.0, 7568.0, 78921.0, 1831308.0, 2160487.0, 101629.0, 9047.0, 1552.0, 474.0, 240.0, 141.0, 91.0, 65.0, 54.0, 32.0, 34.0, 18.0, 17.0, 18.0, 8.0, 9.0, 11.0, 2.0, 7.0, 5.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.46875, -18.79833984375, -18.1279296875, -17.45751953125, -16.787109375, -16.11669921875, -15.4462890625, -14.77587890625, -14.10546875, -13.43505859375, -12.7646484375, -12.09423828125, -11.423828125, -10.75341796875, -10.0830078125, -9.41259765625, -8.7421875, -8.07177734375, -7.4013671875, -6.73095703125, -6.060546875, -5.39013671875, -4.7197265625, -4.04931640625, -3.37890625, -2.70849609375, -2.0380859375, -1.36767578125, -0.697265625, -0.02685546875, 0.6435546875, 1.31396484375, 1.984375, 2.65478515625, 3.3251953125, 3.99560546875, 4.666015625, 5.33642578125, 6.0068359375, 6.67724609375, 7.34765625, 8.01806640625, 8.6884765625, 9.35888671875, 10.029296875, 10.69970703125, 11.3701171875, 12.04052734375, 12.7109375, 13.38134765625, 14.0517578125, 14.72216796875, 15.392578125, 16.06298828125, 16.7333984375, 17.40380859375, 18.07421875, 18.74462890625, 19.4150390625, 20.08544921875, 20.755859375, 21.42626953125, 22.0966796875, 22.76708984375, 23.4375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 10.0, 23.0, 45.0, 90.0, 165.0, 334.0, 581.0, 1008.0, 816.0, 461.0, 259.0, 132.0, 79.0, 36.0, 25.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-60.59375, -59.271484375, -57.94921875, -56.626953125, -55.3046875, -53.982421875, -52.66015625, -51.337890625, -50.015625, -48.693359375, -47.37109375, -46.048828125, -44.7265625, -43.404296875, -42.08203125, -40.759765625, -39.4375, -38.115234375, -36.79296875, -35.470703125, -34.1484375, -32.826171875, -31.50390625, -30.181640625, -28.859375, -27.537109375, -26.21484375, -24.892578125, -23.5703125, -22.248046875, -20.92578125, -19.603515625, -18.28125, -16.958984375, -15.63671875, -14.314453125, -12.9921875, -11.669921875, -10.34765625, -9.025390625, -7.703125, -6.380859375, -5.05859375, -3.736328125, -2.4140625, -1.091796875, 0.23046875, 1.552734375, 2.875, 4.197265625, 5.51953125, 6.841796875, 8.1640625, 9.486328125, 10.80859375, 12.130859375, 13.453125, 14.775390625, 16.09765625, 17.419921875, 18.7421875, 20.064453125, 21.38671875, 22.708984375, 24.03125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 15.0, 27.0, 77.0, 178.0, 410.0, 3985.0, 4175879.0, 12846.0, 529.0, 189.0, 85.0, 38.0, 16.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.875, -90.423828125, -84.97265625, -79.521484375, -74.0703125, -68.619140625, -63.16796875, -57.716796875, -52.265625, -46.814453125, -41.36328125, -35.912109375, -30.4609375, -25.009765625, -19.55859375, -14.107421875, -8.65625, -3.205078125, 2.24609375, 7.697265625, 13.1484375, 18.599609375, 24.05078125, 29.501953125, 34.953125, 40.404296875, 45.85546875, 51.306640625, 56.7578125, 62.208984375, 67.66015625, 73.111328125, 78.5625, 84.013671875, 89.46484375, 94.916015625, 100.3671875, 105.818359375, 111.26953125, 116.720703125, 122.171875, 127.623046875, 133.07421875, 138.525390625, 143.9765625, 149.427734375, 154.87890625, 160.330078125, 165.78125, 171.232421875, 176.68359375, 182.134765625, 187.5859375, 193.037109375, 198.48828125, 203.939453125, 209.390625, 214.841796875, 220.29296875, 225.744140625, 231.1953125, 236.646484375, 242.09765625, 247.548828125, 253.0]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 18.0, 192.0, 517.0, 255.0, 24.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.34708023071289, -50.33559036254883, -41.32410430908203, -32.31261444091797, -23.301124572753906, -14.289634704589844, -5.278148651123047, 3.7333412170410156, 12.744831085205078, 21.75632095336914, 30.76780891418457, 39.779296875, 48.79078674316406, 57.802276611328125, 66.81376647949219, 75.82525634765625, 84.83674621582031, 93.84823608398438, 102.85972595214844, 111.8712158203125, 120.88270568847656, 129.89419555664062, 138.90567016601562, 147.91717529296875, 156.92864990234375, 165.9401397705078, 174.95162963867188, 183.96311950683594, 192.974609375, 201.98609924316406, 210.99758911132812, 220.00906372070312, 229.02053833007812, 238.0320281982422, 247.04351806640625, 256.05499267578125, 265.0664978027344, 274.0779724121094, 283.0894775390625, 292.1009521484375, 301.1124572753906, 310.1239318847656, 319.13543701171875, 328.14691162109375, 337.1584167480469, 346.1698913574219, 355.181396484375, 364.19287109375, 373.204345703125, 382.2158203125, 391.2273254394531, 400.2388000488281, 409.25030517578125, 418.26177978515625, 427.2732849121094, 436.2847595214844, 445.2962646484375, 454.3077392578125, 463.3192443847656, 472.3307189941406, 481.34222412109375, 490.35369873046875, 499.3652038574219, 508.3766784667969, 517.38818359375]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 10.0, 3.0, 5.0, 7.0, 11.0, 10.0, 10.0, 15.0, 16.0, 24.0, 15.0, 21.0, 24.0, 28.0, 40.0, 35.0, 37.0, 38.0, 49.0, 45.0, 41.0, 47.0, 33.0, 40.0, 47.0, 31.0, 39.0, 42.0, 37.0, 22.0, 28.0, 38.0, 20.0, 18.0, 11.0, 28.0, 6.0, 7.0, 6.0, 9.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-78.26520538330078, -75.99034118652344, -73.71546936035156, -71.44060516357422, -69.16574096679688, -66.890869140625, -64.61600494384766, -62.34113693237305, -60.06626892089844, -57.79140090942383, -55.51653289794922, -53.241668701171875, -50.966800689697266, -48.691932678222656, -46.41706848144531, -44.1422004699707, -41.867332458496094, -39.592464447021484, -37.317596435546875, -35.04273223876953, -32.76786422729492, -30.492996215820312, -28.218130111694336, -25.94326400756836, -23.66839599609375, -21.39352798461914, -19.118661880493164, -16.843795776367188, -14.568927764892578, -12.294060707092285, -10.019193649291992, -7.744326591491699, -5.469459533691406, -3.1945924758911133, -0.9197254180908203, 1.3551416397094727, 3.6300086975097656, 5.904875755310059, 8.179742813110352, 10.454609870910645, 12.729476928710938, 15.00434398651123, 17.279211044311523, 19.5540771484375, 21.82894515991211, 24.10381317138672, 26.378679275512695, 28.653545379638672, 30.92841339111328, 33.20328140258789, 35.4781494140625, 37.753013610839844, 40.02788162231445, 42.30274963378906, 44.577613830566406, 46.852481842041016, 49.127349853515625, 51.402217864990234, 53.677085876464844, 55.95195007324219, 58.2268180847168, 60.501686096191406, 62.77655029296875, 65.05142211914062, 67.32628631591797]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 8.0, 10.0, 11.0, 13.0, 13.0, 16.0, 18.0, 28.0, 18.0, 28.0, 19.0, 35.0, 35.0, 37.0, 43.0, 41.0, 56.0, 47.0, 52.0, 43.0, 60.0, 42.0, 47.0, 32.0, 33.0, 28.0, 20.0, 28.0, 33.0, 15.0, 17.0, 9.0, 14.0, 14.0, 11.0, 8.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-7.80859375, -7.6038818359375, -7.399169921875, -7.1944580078125, -6.98974609375, -6.7850341796875, -6.580322265625, -6.3756103515625, -6.1708984375, -5.9661865234375, -5.761474609375, -5.5567626953125, -5.35205078125, -5.1473388671875, -4.942626953125, -4.7379150390625, -4.533203125, -4.3284912109375, -4.123779296875, -3.9190673828125, -3.71435546875, -3.5096435546875, -3.304931640625, -3.1002197265625, -2.8955078125, -2.6907958984375, -2.486083984375, -2.2813720703125, -2.07666015625, -1.8719482421875, -1.667236328125, -1.4625244140625, -1.2578125, -1.0531005859375, -0.848388671875, -0.6436767578125, -0.43896484375, -0.2342529296875, -0.029541015625, 0.1751708984375, 0.3798828125, 0.5845947265625, 0.789306640625, 0.9940185546875, 1.19873046875, 1.4034423828125, 1.608154296875, 1.8128662109375, 2.017578125, 2.2222900390625, 2.427001953125, 2.6317138671875, 2.83642578125, 3.0411376953125, 3.245849609375, 3.4505615234375, 3.6552734375, 3.8599853515625, 4.064697265625, 4.2694091796875, 4.47412109375, 4.6788330078125, 4.883544921875, 5.0882568359375, 5.29296875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 5.0, 7.0, 10.0, 10.0, 23.0, 28.0, 47.0, 79.0, 105.0, 166.0, 288.0, 437.0, 676.0, 1060.0, 1697.0, 2684.0, 4608.0, 7511.0, 12669.0, 20866.0, 36029.0, 64636.0, 135430.0, 390093.0, 184860.0, 79378.0, 42831.0, 24775.0, 14750.0, 8881.0, 5309.0, 3226.0, 1968.0, 1234.0, 803.0, 511.0, 325.0, 189.0, 116.0, 73.0, 49.0, 27.0, 19.0, 24.0, 10.0, 13.0, 10.0, 6.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.48828125, -1.4412689208984375, -1.394256591796875, -1.3472442626953125, -1.30023193359375, -1.2532196044921875, -1.206207275390625, -1.1591949462890625, -1.1121826171875, -1.0651702880859375, -1.018157958984375, -0.9711456298828125, -0.92413330078125, -0.8771209716796875, -0.830108642578125, -0.7830963134765625, -0.736083984375, -0.6890716552734375, -0.642059326171875, -0.5950469970703125, -0.54803466796875, -0.5010223388671875, -0.454010009765625, -0.4069976806640625, -0.3599853515625, -0.3129730224609375, -0.265960693359375, -0.2189483642578125, -0.17193603515625, -0.1249237060546875, -0.077911376953125, -0.0308990478515625, 0.01611328125, 0.0631256103515625, 0.110137939453125, 0.1571502685546875, 0.20416259765625, 0.2511749267578125, 0.298187255859375, 0.3451995849609375, 0.3922119140625, 0.4392242431640625, 0.486236572265625, 0.5332489013671875, 0.58026123046875, 0.6272735595703125, 0.674285888671875, 0.7212982177734375, 0.768310546875, 0.8153228759765625, 0.862335205078125, 0.9093475341796875, 0.95635986328125, 1.0033721923828125, 1.050384521484375, 1.0973968505859375, 1.1444091796875, 1.1914215087890625, 1.238433837890625, 1.2854461669921875, 1.33245849609375, 1.3794708251953125, 1.426483154296875, 1.4734954833984375, 1.5205078125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 5.0, 12.0, 6.0, 9.0, 15.0, 14.0, 12.0, 26.0, 28.0, 19.0, 17.0, 31.0, 30.0, 33.0, 35.0, 32.0, 35.0, 42.0, 45.0, 1075.0, 44.0, 42.0, 40.0, 35.0, 39.0, 36.0, 31.0, 37.0, 24.0, 26.0, 31.0, 14.0, 13.0, 22.0, 12.0, 12.0, 7.0, 8.0, 3.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.93621826171875, -3.8177490234375, -3.69927978515625, -3.580810546875, -3.46234130859375, -3.3438720703125, -3.22540283203125, -3.10693359375, -2.98846435546875, -2.8699951171875, -2.75152587890625, -2.633056640625, -2.51458740234375, -2.3961181640625, -2.27764892578125, -2.1591796875, -2.04071044921875, -1.9222412109375, -1.80377197265625, -1.685302734375, -1.56683349609375, -1.4483642578125, -1.32989501953125, -1.21142578125, -1.09295654296875, -0.9744873046875, -0.85601806640625, -0.737548828125, -0.61907958984375, -0.5006103515625, -0.38214111328125, -0.263671875, -0.14520263671875, -0.0267333984375, 0.09173583984375, 0.210205078125, 0.32867431640625, 0.4471435546875, 0.56561279296875, 0.68408203125, 0.80255126953125, 0.9210205078125, 1.03948974609375, 1.157958984375, 1.27642822265625, 1.3948974609375, 1.51336669921875, 1.6318359375, 1.75030517578125, 1.8687744140625, 1.98724365234375, 2.105712890625, 2.22418212890625, 2.3426513671875, 2.46112060546875, 2.57958984375, 2.69805908203125, 2.8165283203125, 2.93499755859375, 3.053466796875, 3.17193603515625, 3.2904052734375, 3.40887451171875, 3.52734375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 9.0, 4.0, 11.0, 15.0, 27.0, 40.0, 53.0, 94.0, 162.0, 241.0, 395.0, 634.0, 982.0, 1613.0, 2439.0, 3976.0, 6136.0, 9830.0, 16086.0, 26176.0, 43539.0, 75746.0, 150937.0, 1421417.0, 150263.0, 74965.0, 43040.0, 25722.0, 15598.0, 9986.0, 6244.0, 3966.0, 2494.0, 1572.0, 1017.0, 636.0, 398.0, 259.0, 147.0, 107.0, 65.0, 32.0, 20.0, 24.0, 9.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.4248046875, -1.3834991455078125, -1.342193603515625, -1.3008880615234375, -1.25958251953125, -1.2182769775390625, -1.176971435546875, -1.1356658935546875, -1.0943603515625, -1.0530548095703125, -1.011749267578125, -0.9704437255859375, -0.92913818359375, -0.8878326416015625, -0.846527099609375, -0.8052215576171875, -0.763916015625, -0.7226104736328125, -0.681304931640625, -0.6399993896484375, -0.59869384765625, -0.5573883056640625, -0.516082763671875, -0.4747772216796875, -0.4334716796875, -0.3921661376953125, -0.350860595703125, -0.3095550537109375, -0.26824951171875, -0.2269439697265625, -0.185638427734375, -0.1443328857421875, -0.10302734375, -0.0617218017578125, -0.020416259765625, 0.0208892822265625, 0.06219482421875, 0.1035003662109375, 0.144805908203125, 0.1861114501953125, 0.2274169921875, 0.2687225341796875, 0.310028076171875, 0.3513336181640625, 0.39263916015625, 0.4339447021484375, 0.475250244140625, 0.5165557861328125, 0.557861328125, 0.5991668701171875, 0.640472412109375, 0.6817779541015625, 0.72308349609375, 0.7643890380859375, 0.805694580078125, 0.8470001220703125, 0.8883056640625, 0.9296112060546875, 0.970916748046875, 1.0122222900390625, 1.05352783203125, 1.0948333740234375, 1.136138916015625, 1.1774444580078125, 1.21875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 8.0, 13.0, 11.0, 17.0, 23.0, 23.0, 40.0, 51.0, 73.0, 102.0, 104.0, 99.0, 105.0, 84.0, 53.0, 46.0, 26.0, 27.0, 17.0, 11.0, 6.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008997917175292969, -0.0008734986186027527, -0.0008472055196762085, -0.0008209124207496643, -0.0007946193218231201, -0.0007683262228965759, -0.0007420331239700317, -0.0007157400250434875, -0.0006894469261169434, -0.0006631538271903992, -0.000636860728263855, -0.0006105676293373108, -0.0005842745304107666, -0.0005579814314842224, -0.0005316883325576782, -0.000505395233631134, -0.00047910213470458984, -0.00045280903577804565, -0.00042651593685150146, -0.0004002228379249573, -0.0003739297389984131, -0.0003476366400718689, -0.0003213435411453247, -0.0002950504422187805, -0.00026875734329223633, -0.00024246424436569214, -0.00021617114543914795, -0.00018987804651260376, -0.00016358494758605957, -0.00013729184865951538, -0.00011099874973297119, -8.4705650806427e-05, -5.841255187988281e-05, -3.211945295333862e-05, -5.826354026794434e-06, 2.0466744899749756e-05, 4.6759843826293945e-05, 7.305294275283813e-05, 9.934604167938232e-05, 0.00012563914060592651, 0.0001519322395324707, 0.0001782253384590149, 0.00020451843738555908, 0.00023081153631210327, 0.00025710463523864746, 0.00028339773416519165, 0.00030969083309173584, 0.00033598393201828003, 0.0003622770309448242, 0.0003885701298713684, 0.0004148632287979126, 0.0004411563277244568, 0.000467449426651001, 0.0004937425255775452, 0.0005200356245040894, 0.0005463287234306335, 0.0005726218223571777, 0.0005989149212837219, 0.0006252080202102661, 0.0006515011191368103, 0.0006777942180633545, 0.0007040873169898987, 0.0007303804159164429, 0.0007566735148429871, 0.0007829666137695312]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 9.0, 4.0, 2.0, 5.0, 5.0, 7.0, 12.0, 11.0, 19.0, 22.0, 28.0, 46.0, 41.0, 67.0, 104.0, 134.0, 225.0, 498.0, 15981.0, 1028467.0, 1872.0, 384.0, 174.0, 114.0, 76.0, 52.0, 33.0, 35.0, 28.0, 33.0, 18.0, 17.0, 4.0, 7.0, 4.0, 7.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0172882080078125, -0.016753196716308594, -0.016218185424804688, -0.01568317413330078, -0.015148162841796875, -0.014613151550292969, -0.014078140258789062, -0.013543128967285156, -0.01300811767578125, -0.012473106384277344, -0.011938095092773438, -0.011403083801269531, -0.010868072509765625, -0.010333061218261719, -0.009798049926757812, -0.009263038635253906, -0.00872802734375, -0.008193016052246094, -0.0076580047607421875, -0.007122993469238281, -0.006587982177734375, -0.006052970886230469, -0.0055179595947265625, -0.004982948303222656, -0.00444793701171875, -0.003912925720214844, -0.0033779144287109375, -0.0028429031372070312, -0.002307891845703125, -0.0017728805541992188, -0.0012378692626953125, -0.0007028579711914062, -0.0001678466796875, 0.00036716461181640625, 0.0009021759033203125, 0.0014371871948242188, 0.001972198486328125, 0.0025072097778320312, 0.0030422210693359375, 0.0035772323608398438, 0.00411224365234375, 0.004647254943847656, 0.0051822662353515625, 0.005717277526855469, 0.006252288818359375, 0.006787300109863281, 0.0073223114013671875, 0.007857322692871094, 0.008392333984375, 0.008927345275878906, 0.009462356567382812, 0.009997367858886719, 0.010532379150390625, 0.011067390441894531, 0.011602401733398438, 0.012137413024902344, 0.01267242431640625, 0.013207435607910156, 0.013742446899414062, 0.014277458190917969, 0.014812469482421875, 0.015347480773925781, 0.015882492065429688, 0.016417503356933594, 0.0169525146484375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 20.0, 254.0, 654.0, 86.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011516035301610827, -0.0010810287203639746, -0.0010104540269821882, -0.00093987921718508, -0.0008693044073879719, -0.0007987295975908637, -0.0007281548460014164, -0.0006575800944119692, -0.000587005284614861, -0.0005164304748177528, -0.0004458557232283056, -0.00037528094253502786, -0.00030470616184175014, -0.00023413138114847243, -0.0001635566004551947, -9.298184886574745e-05, -2.240703906863928e-05, 4.816774162463844e-05, 0.00011874252231791615, 0.00018931730301119387, 0.0002598920837044716, 0.0003304668643977493, 0.000401041645091027, 0.0004716163966804743, 0.0005421912064775825, 0.0006127660162746906, 0.0006833407678641379, 0.0007539155194535851, 0.0008244903292506933, 0.0008950651390478015, 0.0009656398906372488, 0.001036214642226696, 0.0011067893356084824, 0.0011773641454055905, 0.0012479389552026987, 0.001318513648584485, 0.0013890884583815932, 0.0014596632681787014, 0.0015302379615604877, 0.001600812771357596, 0.001671387581154704, 0.0017419623909518123, 0.0018125372007489204, 0.0018831118941307068, 0.001953686587512493, 0.002024261513724923, 0.0020948362071067095, 0.0021654111333191395, 0.002235985826700926, 0.002306560520082712, 0.002377135446295142, 0.0024477101396769285, 0.0025182850658893585, 0.002588859759271145, 0.002659434452652931, 0.0027300091460347176, 0.0028005840722471476, 0.002871158765628934, 0.002941733691841364, 0.0030123083852231503, 0.0030828830786049366, 0.0031534580048173666, 0.003224032698199153, 0.003294607624411583, 0.0033651823177933693]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 6.0, 15.0, 7.0, 12.0, 10.0, 15.0, 11.0, 21.0, 11.0, 23.0, 19.0, 33.0, 24.0, 33.0, 27.0, 27.0, 25.0, 35.0, 34.0, 22.0, 31.0, 44.0, 39.0, 44.0, 37.0, 25.0, 29.0, 34.0, 36.0, 23.0, 30.0, 27.0, 25.0, 14.0, 29.0, 17.0, 17.0, 11.0, 10.0, 8.0, 12.0, 11.0, 9.0, 9.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.0002936720848083496, -0.00028464850038290024, -0.00027562491595745087, -0.0002666013315320015, -0.0002575777471065521, -0.00024855416268110275, -0.00023953057825565338, -0.000230506993830204, -0.00022148340940475464, -0.00021245982497930527, -0.0002034362405538559, -0.00019441265612840652, -0.00018538907170295715, -0.00017636548727750778, -0.0001673419028520584, -0.00015831831842660904, -0.00014929473400115967, -0.0001402711495757103, -0.00013124756515026093, -0.00012222398072481155, -0.00011320039629936218, -0.00010417681187391281, -9.515322744846344e-05, -8.612964302301407e-05, -7.71060585975647e-05, -6.808247417211533e-05, -5.9058889746665955e-05, -5.003530532121658e-05, -4.101172089576721e-05, -3.198813647031784e-05, -2.296455204486847e-05, -1.3940967619419098e-05, -4.9173831939697266e-06, 4.106201231479645e-06, 1.3129785656929016e-05, 2.2153370082378387e-05, 3.117695450782776e-05, 4.020053893327713e-05, 4.92241233587265e-05, 5.824770778417587e-05, 6.727129220962524e-05, 7.629487663507462e-05, 8.531846106052399e-05, 9.434204548597336e-05, 0.00010336562991142273, 0.0001123892143368721, 0.00012141279876232147, 0.00013043638318777084, 0.00013945996761322021, 0.00014848355203866959, 0.00015750713646411896, 0.00016653072088956833, 0.0001755543053150177, 0.00018457788974046707, 0.00019360147416591644, 0.00020262505859136581, 0.00021164864301681519, 0.00022067222744226456, 0.00022969581186771393, 0.0002387193962931633, 0.00024774298071861267, 0.00025676656514406204, 0.0002657901495695114, 0.0002748137339949608, 0.00028383731842041016]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 8.0, 10.0, 11.0, 13.0, 13.0, 16.0, 18.0, 28.0, 18.0, 28.0, 19.0, 35.0, 35.0, 37.0, 43.0, 41.0, 56.0, 47.0, 52.0, 43.0, 60.0, 42.0, 47.0, 32.0, 33.0, 28.0, 20.0, 28.0, 33.0, 15.0, 17.0, 9.0, 14.0, 14.0, 11.0, 8.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-7.80859375, -7.6038818359375, -7.399169921875, -7.1944580078125, -6.98974609375, -6.7850341796875, -6.580322265625, -6.3756103515625, -6.1708984375, -5.9661865234375, -5.761474609375, -5.5567626953125, -5.35205078125, -5.1473388671875, -4.942626953125, -4.7379150390625, -4.533203125, -4.3284912109375, -4.123779296875, -3.9190673828125, -3.71435546875, -3.5096435546875, -3.304931640625, -3.1002197265625, -2.8955078125, -2.6907958984375, -2.486083984375, -2.2813720703125, -2.07666015625, -1.8719482421875, -1.667236328125, -1.4625244140625, -1.2578125, -1.0531005859375, -0.848388671875, -0.6436767578125, -0.43896484375, -0.2342529296875, -0.029541015625, 0.1751708984375, 0.3798828125, 0.5845947265625, 0.789306640625, 0.9940185546875, 1.19873046875, 1.4034423828125, 1.608154296875, 1.8128662109375, 2.017578125, 2.2222900390625, 2.427001953125, 2.6317138671875, 2.83642578125, 3.0411376953125, 3.245849609375, 3.4505615234375, 3.6552734375, 3.8599853515625, 4.064697265625, 4.2694091796875, 4.47412109375, 4.6788330078125, 4.883544921875, 5.0882568359375, 5.29296875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 6.0, 4.0, 19.0, 29.0, 32.0, 55.0, 77.0, 124.0, 170.0, 384.0, 545.0, 918.0, 1621.0, 2715.0, 5318.0, 10518.0, 21595.0, 50711.0, 144609.0, 450546.0, 228281.0, 72675.0, 29032.0, 13299.0, 6802.0, 3624.0, 2007.0, 1067.0, 680.0, 422.0, 245.0, 145.0, 96.0, 49.0, 38.0, 31.0, 22.0, 20.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.23828125, -5.099273681640625, -4.96026611328125, -4.821258544921875, -4.6822509765625, -4.543243408203125, -4.40423583984375, -4.265228271484375, -4.126220703125, -3.987213134765625, -3.84820556640625, -3.709197998046875, -3.5701904296875, -3.431182861328125, -3.29217529296875, -3.153167724609375, -3.01416015625, -2.875152587890625, -2.73614501953125, -2.597137451171875, -2.4581298828125, -2.319122314453125, -2.18011474609375, -2.041107177734375, -1.902099609375, -1.763092041015625, -1.62408447265625, -1.485076904296875, -1.3460693359375, -1.207061767578125, -1.06805419921875, -0.929046630859375, -0.7900390625, -0.651031494140625, -0.51202392578125, -0.373016357421875, -0.2340087890625, -0.095001220703125, 0.04400634765625, 0.183013916015625, 0.322021484375, 0.461029052734375, 0.60003662109375, 0.739044189453125, 0.8780517578125, 1.017059326171875, 1.15606689453125, 1.295074462890625, 1.43408203125, 1.573089599609375, 1.71209716796875, 1.851104736328125, 1.9901123046875, 2.129119873046875, 2.26812744140625, 2.407135009765625, 2.546142578125, 2.685150146484375, 2.82415771484375, 2.963165283203125, 3.1021728515625, 3.241180419921875, 3.38018798828125, 3.519195556640625, 3.658203125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 8.0, 13.0, 20.0, 15.0, 18.0, 28.0, 30.0, 27.0, 30.0, 35.0, 41.0, 37.0, 41.0, 57.0, 66.0, 196.0, 1761.0, 137.0, 68.0, 47.0, 34.0, 44.0, 36.0, 43.0, 27.0, 35.0, 25.0, 19.0, 14.0, 14.0, 14.0, 8.0, 15.0, 6.0, 9.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.984375, -21.261474609375, -20.53857421875, -19.815673828125, -19.0927734375, -18.369873046875, -17.64697265625, -16.924072265625, -16.201171875, -15.478271484375, -14.75537109375, -14.032470703125, -13.3095703125, -12.586669921875, -11.86376953125, -11.140869140625, -10.41796875, -9.695068359375, -8.97216796875, -8.249267578125, -7.5263671875, -6.803466796875, -6.08056640625, -5.357666015625, -4.634765625, -3.911865234375, -3.18896484375, -2.466064453125, -1.7431640625, -1.020263671875, -0.29736328125, 0.425537109375, 1.1484375, 1.871337890625, 2.59423828125, 3.317138671875, 4.0400390625, 4.762939453125, 5.48583984375, 6.208740234375, 6.931640625, 7.654541015625, 8.37744140625, 9.100341796875, 9.8232421875, 10.546142578125, 11.26904296875, 11.991943359375, 12.71484375, 13.437744140625, 14.16064453125, 14.883544921875, 15.6064453125, 16.329345703125, 17.05224609375, 17.775146484375, 18.498046875, 19.220947265625, 19.94384765625, 20.666748046875, 21.3896484375, 22.112548828125, 22.83544921875, 23.558349609375, 24.28125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 18.0, 11.0, 7.0, 12.0, 20.0, 14.0, 22.0, 28.0, 43.0, 30.0, 47.0, 68.0, 93.0, 160.0, 216.0, 481.0, 1603.0, 22985.0, 3047818.0, 67922.0, 2608.0, 603.0, 293.0, 148.0, 86.0, 72.0, 46.0, 35.0, 34.0, 42.0, 20.0, 22.0, 15.0, 19.0, 15.0, 7.0, 10.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.3125, -33.19189453125, -32.0712890625, -30.95068359375, -29.830078125, -28.70947265625, -27.5888671875, -26.46826171875, -25.34765625, -24.22705078125, -23.1064453125, -21.98583984375, -20.865234375, -19.74462890625, -18.6240234375, -17.50341796875, -16.3828125, -15.26220703125, -14.1416015625, -13.02099609375, -11.900390625, -10.77978515625, -9.6591796875, -8.53857421875, -7.41796875, -6.29736328125, -5.1767578125, -4.05615234375, -2.935546875, -1.81494140625, -0.6943359375, 0.42626953125, 1.546875, 2.66748046875, 3.7880859375, 4.90869140625, 6.029296875, 7.14990234375, 8.2705078125, 9.39111328125, 10.51171875, 11.63232421875, 12.7529296875, 13.87353515625, 14.994140625, 16.11474609375, 17.2353515625, 18.35595703125, 19.4765625, 20.59716796875, 21.7177734375, 22.83837890625, 23.958984375, 25.07958984375, 26.2001953125, 27.32080078125, 28.44140625, 29.56201171875, 30.6826171875, 31.80322265625, 32.923828125, 34.04443359375, 35.1650390625, 36.28564453125, 37.40625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [5.0, 926.0, 87.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.113909721374512, -6.182736396789551, 2.74843692779541, 11.679610252380371, 20.610782623291016, 29.54195785522461, 38.47312927246094, 47.404300689697266, 56.33547592163086, 65.26664733886719, 74.19782257080078, 83.12899780273438, 92.06016540527344, 100.99134826660156, 109.92251586914062, 118.85368347167969, 127.78486633300781, 136.71603393554688, 145.647216796875, 154.57838439941406, 163.50955200195312, 172.44073486328125, 181.3719024658203, 190.30307006835938, 199.2342529296875, 208.16542053222656, 217.0966033935547, 226.02777099609375, 234.95895385742188, 243.89012145996094, 252.8212890625, 261.7524719238281, 270.68365478515625, 279.6148376464844, 288.5459899902344, 297.4771728515625, 306.4083557128906, 315.33953857421875, 324.27069091796875, 333.2018737792969, 342.133056640625, 351.0642395019531, 359.9953918457031, 368.92657470703125, 377.8577575683594, 386.7889404296875, 395.7200927734375, 404.6512756347656, 413.5824279785156, 422.51361083984375, 431.44476318359375, 440.3759460449219, 449.30712890625, 458.23828125, 467.1694641113281, 476.10064697265625, 485.03179931640625, 493.9629821777344, 502.8941345214844, 511.8253173828125, 520.7564697265625, 529.6876831054688, 538.6188354492188, 547.5499877929688, 556.481201171875]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 9.0, 10.0, 8.0, 17.0, 3.0, 10.0, 20.0, 19.0, 23.0, 20.0, 29.0, 28.0, 33.0, 41.0, 44.0, 51.0, 38.0, 53.0, 44.0, 41.0, 53.0, 42.0, 37.0, 39.0, 41.0, 32.0, 44.0, 20.0, 22.0, 27.0, 21.0, 19.0, 15.0, 10.0, 10.0, 10.0, 11.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-84.63715362548828, -82.20208740234375, -79.76702880859375, -77.33197021484375, -74.89690399169922, -72.46183776855469, -70.02677917480469, -67.59172058105469, -65.15665435791016, -62.72159194946289, -60.286529541015625, -57.85146713256836, -55.416404724121094, -52.98134231567383, -50.54627990722656, -48.1112174987793, -45.67615509033203, -43.241092681884766, -40.8060302734375, -38.370967864990234, -35.93590545654297, -33.5008430480957, -31.065780639648438, -28.630718231201172, -26.195655822753906, -23.76059341430664, -21.325531005859375, -18.89046859741211, -16.455406188964844, -14.020343780517578, -11.585281372070312, -9.150218963623047, -6.71514892578125, -4.280086517333984, -1.8450241088867188, 0.5900382995605469, 3.0251007080078125, 5.460163116455078, 7.895225524902344, 10.33028793334961, 12.765350341796875, 15.20041275024414, 17.635475158691406, 20.070537567138672, 22.505599975585938, 24.940662384033203, 27.37572479248047, 29.810787200927734, 32.245849609375, 34.680912017822266, 37.11597442626953, 39.5510368347168, 41.98609924316406, 44.42116165161133, 46.856224060058594, 49.29128646850586, 51.726348876953125, 54.16141128540039, 56.596473693847656, 59.03153610229492, 61.46659851074219, 63.90166091918945, 66.33672332763672, 68.77178955078125, 71.20684814453125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 10.0, 10.0, 7.0, 14.0, 14.0, 14.0, 15.0, 20.0, 20.0, 31.0, 22.0, 26.0, 32.0, 42.0, 42.0, 31.0, 56.0, 52.0, 53.0, 53.0, 52.0, 56.0, 48.0, 35.0, 28.0, 34.0, 25.0, 27.0, 23.0, 15.0, 21.0, 16.0, 17.0, 10.0, 13.0, 7.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.2421875, -8.02288818359375, -7.8035888671875, -7.58428955078125, -7.364990234375, -7.14569091796875, -6.9263916015625, -6.70709228515625, -6.48779296875, -6.26849365234375, -6.0491943359375, -5.82989501953125, -5.610595703125, -5.39129638671875, -5.1719970703125, -4.95269775390625, -4.7333984375, -4.51409912109375, -4.2947998046875, -4.07550048828125, -3.856201171875, -3.63690185546875, -3.4176025390625, -3.19830322265625, -2.97900390625, -2.75970458984375, -2.5404052734375, -2.32110595703125, -2.101806640625, -1.88250732421875, -1.6632080078125, -1.44390869140625, -1.224609375, -1.00531005859375, -0.7860107421875, -0.56671142578125, -0.347412109375, -0.12811279296875, 0.0911865234375, 0.31048583984375, 0.52978515625, 0.74908447265625, 0.9683837890625, 1.18768310546875, 1.406982421875, 1.62628173828125, 1.8455810546875, 2.06488037109375, 2.2841796875, 2.50347900390625, 2.7227783203125, 2.94207763671875, 3.161376953125, 3.38067626953125, 3.5999755859375, 3.81927490234375, 4.03857421875, 4.25787353515625, 4.4771728515625, 4.69647216796875, 4.915771484375, 5.13507080078125, 5.3543701171875, 5.57366943359375, 5.79296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 9.0, 11.0, 7.0, 8.0, 13.0, 13.0, 19.0, 16.0, 18.0, 23.0, 39.0, 28.0, 26.0, 38.0, 61.0, 124.0, 476.0, 5869.0, 590445.0, 3560565.0, 34690.0, 1225.0, 166.0, 78.0, 55.0, 42.0, 37.0, 21.0, 23.0, 20.0, 17.0, 23.0, 15.0, 14.0, 15.0, 8.0, 10.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0], "bins": [-50.8125, -49.549560546875, -48.28662109375, -47.023681640625, -45.7607421875, -44.497802734375, -43.23486328125, -41.971923828125, -40.708984375, -39.446044921875, -38.18310546875, -36.920166015625, -35.6572265625, -34.394287109375, -33.13134765625, -31.868408203125, -30.60546875, -29.342529296875, -28.07958984375, -26.816650390625, -25.5537109375, -24.290771484375, -23.02783203125, -21.764892578125, -20.501953125, -19.239013671875, -17.97607421875, -16.713134765625, -15.4501953125, -14.187255859375, -12.92431640625, -11.661376953125, -10.3984375, -9.135498046875, -7.87255859375, -6.609619140625, -5.3466796875, -4.083740234375, -2.82080078125, -1.557861328125, -0.294921875, 0.968017578125, 2.23095703125, 3.493896484375, 4.7568359375, 6.019775390625, 7.28271484375, 8.545654296875, 9.80859375, 11.071533203125, 12.33447265625, 13.597412109375, 14.8603515625, 16.123291015625, 17.38623046875, 18.649169921875, 19.912109375, 21.175048828125, 22.43798828125, 23.700927734375, 24.9638671875, 26.226806640625, 27.48974609375, 28.752685546875, 30.015625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 15.0, 18.0, 36.0, 70.0, 114.0, 213.0, 422.0, 742.0, 964.0, 683.0, 365.0, 205.0, 110.0, 60.0, 19.0, 15.0, 14.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.65625, -43.4931640625, -42.330078125, -41.1669921875, -40.00390625, -38.8408203125, -37.677734375, -36.5146484375, -35.3515625, -34.1884765625, -33.025390625, -31.8623046875, -30.69921875, -29.5361328125, -28.373046875, -27.2099609375, -26.046875, -24.8837890625, -23.720703125, -22.5576171875, -21.39453125, -20.2314453125, -19.068359375, -17.9052734375, -16.7421875, -15.5791015625, -14.416015625, -13.2529296875, -12.08984375, -10.9267578125, -9.763671875, -8.6005859375, -7.4375, -6.2744140625, -5.111328125, -3.9482421875, -2.78515625, -1.6220703125, -0.458984375, 0.7041015625, 1.8671875, 3.0302734375, 4.193359375, 5.3564453125, 6.51953125, 7.6826171875, 8.845703125, 10.0087890625, 11.171875, 12.3349609375, 13.498046875, 14.6611328125, 15.82421875, 16.9873046875, 18.150390625, 19.3134765625, 20.4765625, 21.6396484375, 22.802734375, 23.9658203125, 25.12890625, 26.2919921875, 27.455078125, 28.6181640625, 29.78125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 7.0, 10.0, 11.0, 27.0, 73.0, 175.0, 368.0, 1666.0, 4054035.0, 136641.0, 762.0, 276.0, 114.0, 65.0, 30.0, 16.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.375, -126.080078125, -120.78515625, -115.490234375, -110.1953125, -104.900390625, -99.60546875, -94.310546875, -89.015625, -83.720703125, -78.42578125, -73.130859375, -67.8359375, -62.541015625, -57.24609375, -51.951171875, -46.65625, -41.361328125, -36.06640625, -30.771484375, -25.4765625, -20.181640625, -14.88671875, -9.591796875, -4.296875, 0.998046875, 6.29296875, 11.587890625, 16.8828125, 22.177734375, 27.47265625, 32.767578125, 38.0625, 43.357421875, 48.65234375, 53.947265625, 59.2421875, 64.537109375, 69.83203125, 75.126953125, 80.421875, 85.716796875, 91.01171875, 96.306640625, 101.6015625, 106.896484375, 112.19140625, 117.486328125, 122.78125, 128.076171875, 133.37109375, 138.666015625, 143.9609375, 149.255859375, 154.55078125, 159.845703125, 165.140625, 170.435546875, 175.73046875, 181.025390625, 186.3203125, 191.615234375, 196.91015625, 202.205078125, 207.5]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 11.0, 17.0, 37.0, 95.0, 161.0, 189.0, 164.0, 149.0, 87.0, 60.0, 23.0, 16.0, 2.0, 2.0], "bins": [-197.8241729736328, -194.30081176757812, -190.77745056152344, -187.2540740966797, -183.730712890625, -180.2073516845703, -176.68399047851562, -173.16061401367188, -169.6372528076172, -166.1138916015625, -162.5905303955078, -159.06715393066406, -155.54379272460938, -152.0204315185547, -148.4970703125, -144.97369384765625, -141.45034790039062, -137.92698669433594, -134.40362548828125, -130.8802490234375, -127.35688781738281, -123.83352661132812, -120.31016540527344, -116.78679656982422, -113.263427734375, -109.74006652832031, -106.2166976928711, -102.6933364868164, -99.16996765136719, -95.6466064453125, -92.12324523925781, -88.5998764038086, -85.0765151977539, -81.55315399169922, -78.02978515625, -74.50642395019531, -70.9830551147461, -67.4596939086914, -63.93632888793945, -60.4129638671875, -56.88959503173828, -53.36623001098633, -49.842864990234375, -46.31950378417969, -42.79613494873047, -39.27277374267578, -35.74940872192383, -32.226043701171875, -28.702680587768555, -25.1793155670166, -21.65595245361328, -18.132587432861328, -14.609222412109375, -11.085857391357422, -7.562494277954102, -4.039129257202148, -0.5157642364501953, 3.0076003074645996, 6.5309648513793945, 10.054328918457031, 13.577693939208984, 17.101058959960938, 20.624422073364258, 24.14778709411621, 27.671152114868164]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 6.0, 4.0, 6.0, 9.0, 8.0, 12.0, 13.0, 12.0, 16.0, 19.0, 14.0, 22.0, 20.0, 19.0, 23.0, 32.0, 40.0, 37.0, 39.0, 32.0, 29.0, 23.0, 32.0, 43.0, 43.0, 38.0, 40.0, 50.0, 33.0, 31.0, 24.0, 26.0, 29.0, 17.0, 20.0, 23.0, 19.0, 11.0, 16.0, 12.0, 8.0, 8.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0], "bins": [-61.10663986206055, -59.26850891113281, -57.43037796020508, -55.592247009277344, -53.754112243652344, -51.915985107421875, -50.077850341796875, -48.23971939086914, -46.401588439941406, -44.56345748901367, -42.72532653808594, -40.8871955871582, -39.04906463623047, -37.21092987060547, -35.372798919677734, -33.53466796875, -31.696537017822266, -29.85840606689453, -28.020275115966797, -26.18214225769043, -24.344011306762695, -22.50588035583496, -20.667747497558594, -18.82961654663086, -16.991485595703125, -15.15335464477539, -13.31522274017334, -11.477090835571289, -9.638959884643555, -7.80082893371582, -5.9626970291137695, -4.124565124511719, -2.2864303588867188, -0.44829893112182617, 1.3898324966430664, 3.227963924407959, 5.066095352172852, 6.904226303100586, 8.742358207702637, 10.580490112304688, 12.418621063232422, 14.256752014160156, 16.09488296508789, 17.933015823364258, 19.771146774291992, 21.609277725219727, 23.447410583496094, 25.285541534423828, 27.123672485351562, 28.961803436279297, 30.79993438720703, 32.638065338134766, 34.4761962890625, 36.3143310546875, 38.152462005615234, 39.99059295654297, 41.8287239074707, 43.66685485839844, 45.50498580932617, 47.343116760253906, 49.181251525878906, 51.019378662109375, 52.857513427734375, 54.69564437866211, 56.533775329589844]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 16.0, 11.0, 11.0, 16.0, 21.0, 20.0, 24.0, 33.0, 25.0, 30.0, 28.0, 28.0, 40.0, 37.0, 42.0, 58.0, 50.0, 42.0, 54.0, 50.0, 43.0, 33.0, 40.0, 30.0, 34.0, 18.0, 18.0, 19.0, 21.0, 22.0, 23.0, 13.0, 10.0, 5.0, 12.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-8.3046875, -8.0850830078125, -7.865478515625, -7.6458740234375, -7.42626953125, -7.2066650390625, -6.987060546875, -6.7674560546875, -6.5478515625, -6.3282470703125, -6.108642578125, -5.8890380859375, -5.66943359375, -5.4498291015625, -5.230224609375, -5.0106201171875, -4.791015625, -4.5714111328125, -4.351806640625, -4.1322021484375, -3.91259765625, -3.6929931640625, -3.473388671875, -3.2537841796875, -3.0341796875, -2.8145751953125, -2.594970703125, -2.3753662109375, -2.15576171875, -1.9361572265625, -1.716552734375, -1.4969482421875, -1.27734375, -1.0577392578125, -0.838134765625, -0.6185302734375, -0.39892578125, -0.1793212890625, 0.040283203125, 0.2598876953125, 0.4794921875, 0.6990966796875, 0.918701171875, 1.1383056640625, 1.35791015625, 1.5775146484375, 1.797119140625, 2.0167236328125, 2.236328125, 2.4559326171875, 2.675537109375, 2.8951416015625, 3.11474609375, 3.3343505859375, 3.553955078125, 3.7735595703125, 3.9931640625, 4.2127685546875, 4.432373046875, 4.6519775390625, 4.87158203125, 5.0911865234375, 5.310791015625, 5.5303955078125, 5.75]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 15.0, 17.0, 19.0, 43.0, 63.0, 76.0, 155.0, 237.0, 376.0, 582.0, 961.0, 1644.0, 2645.0, 4634.0, 7890.0, 13324.0, 22290.0, 38706.0, 69603.0, 144694.0, 398448.0, 165240.0, 75709.0, 41658.0, 24359.0, 14423.0, 8392.0, 4898.0, 2956.0, 1686.0, 1044.0, 642.0, 379.0, 250.0, 163.0, 98.0, 82.0, 41.0, 33.0, 20.0, 12.0, 12.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.537109375, -1.483306884765625, -1.42950439453125, -1.375701904296875, -1.3218994140625, -1.268096923828125, -1.21429443359375, -1.160491943359375, -1.106689453125, -1.052886962890625, -0.99908447265625, -0.945281982421875, -0.8914794921875, -0.837677001953125, -0.78387451171875, -0.730072021484375, -0.67626953125, -0.622467041015625, -0.56866455078125, -0.514862060546875, -0.4610595703125, -0.407257080078125, -0.35345458984375, -0.299652099609375, -0.245849609375, -0.192047119140625, -0.13824462890625, -0.084442138671875, -0.0306396484375, 0.023162841796875, 0.07696533203125, 0.130767822265625, 0.1845703125, 0.238372802734375, 0.29217529296875, 0.345977783203125, 0.3997802734375, 0.453582763671875, 0.50738525390625, 0.561187744140625, 0.614990234375, 0.668792724609375, 0.72259521484375, 0.776397705078125, 0.8302001953125, 0.884002685546875, 0.93780517578125, 0.991607666015625, 1.04541015625, 1.099212646484375, 1.15301513671875, 1.206817626953125, 1.2606201171875, 1.314422607421875, 1.36822509765625, 1.422027587890625, 1.475830078125, 1.529632568359375, 1.58343505859375, 1.637237548828125, 1.6910400390625, 1.744842529296875, 1.79864501953125, 1.852447509765625, 1.90625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 2.0, 11.0, 8.0, 7.0, 6.0, 10.0, 13.0, 19.0, 29.0, 32.0, 27.0, 40.0, 40.0, 27.0, 28.0, 43.0, 42.0, 47.0, 1063.0, 43.0, 48.0, 47.0, 42.0, 45.0, 42.0, 36.0, 33.0, 45.0, 24.0, 22.0, 28.0, 11.0, 13.0, 11.0, 12.0, 5.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.03900146484375, -3.8944091796875, -3.74981689453125, -3.605224609375, -3.46063232421875, -3.3160400390625, -3.17144775390625, -3.02685546875, -2.88226318359375, -2.7376708984375, -2.59307861328125, -2.448486328125, -2.30389404296875, -2.1593017578125, -2.01470947265625, -1.8701171875, -1.72552490234375, -1.5809326171875, -1.43634033203125, -1.291748046875, -1.14715576171875, -1.0025634765625, -0.85797119140625, -0.71337890625, -0.56878662109375, -0.4241943359375, -0.27960205078125, -0.135009765625, 0.00958251953125, 0.1541748046875, 0.29876708984375, 0.443359375, 0.58795166015625, 0.7325439453125, 0.87713623046875, 1.021728515625, 1.16632080078125, 1.3109130859375, 1.45550537109375, 1.60009765625, 1.74468994140625, 1.8892822265625, 2.03387451171875, 2.178466796875, 2.32305908203125, 2.4676513671875, 2.61224365234375, 2.7568359375, 2.90142822265625, 3.0460205078125, 3.19061279296875, 3.335205078125, 3.47979736328125, 3.6243896484375, 3.76898193359375, 3.91357421875, 4.05816650390625, 4.2027587890625, 4.34735107421875, 4.491943359375, 4.63653564453125, 4.7811279296875, 4.92572021484375, 5.0703125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 8.0, 9.0, 16.0, 16.0, 33.0, 46.0, 80.0, 132.0, 206.0, 351.0, 566.0, 890.0, 1441.0, 2271.0, 3728.0, 6189.0, 10542.0, 18796.0, 32550.0, 58926.0, 113421.0, 1366009.0, 255428.0, 100768.0, 53500.0, 29723.0, 16977.0, 9791.0, 5705.0, 3400.0, 2107.0, 1349.0, 813.0, 518.0, 305.0, 214.0, 118.0, 73.0, 39.0, 30.0, 17.0, 12.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.4123077392578125, -1.361724853515625, -1.3111419677734375, -1.26055908203125, -1.2099761962890625, -1.159393310546875, -1.1088104248046875, -1.0582275390625, -1.0076446533203125, -0.957061767578125, -0.9064788818359375, -0.85589599609375, -0.8053131103515625, -0.754730224609375, -0.7041473388671875, -0.653564453125, -0.6029815673828125, -0.552398681640625, -0.5018157958984375, -0.45123291015625, -0.4006500244140625, -0.350067138671875, -0.2994842529296875, -0.2489013671875, -0.1983184814453125, -0.147735595703125, -0.0971527099609375, -0.04656982421875, 0.0040130615234375, 0.054595947265625, 0.1051788330078125, 0.15576171875, 0.2063446044921875, 0.256927490234375, 0.3075103759765625, 0.35809326171875, 0.4086761474609375, 0.459259033203125, 0.5098419189453125, 0.5604248046875, 0.6110076904296875, 0.661590576171875, 0.7121734619140625, 0.76275634765625, 0.8133392333984375, 0.863922119140625, 0.9145050048828125, 0.965087890625, 1.0156707763671875, 1.066253662109375, 1.1168365478515625, 1.16741943359375, 1.2180023193359375, 1.268585205078125, 1.3191680908203125, 1.3697509765625, 1.4203338623046875, 1.470916748046875, 1.5214996337890625, 1.57208251953125, 1.6226654052734375, 1.673248291015625, 1.7238311767578125, 1.7744140625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 6.0, 6.0, 5.0, 11.0, 9.0, 8.0, 14.0, 14.0, 15.0, 17.0, 27.0, 22.0, 53.0, 62.0, 69.0, 119.0, 125.0, 102.0, 61.0, 48.0, 49.0, 29.0, 18.0, 15.0, 16.0, 15.0, 8.0, 7.0, 6.0, 8.0, 9.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007700920104980469, -0.0007467493414878845, -0.0007234066724777222, -0.0007000640034675598, -0.0006767213344573975, -0.0006533786654472351, -0.0006300359964370728, -0.0006066933274269104, -0.000583350658416748, -0.0005600079894065857, -0.0005366653203964233, -0.000513322651386261, -0.0004899799823760986, -0.0004666373133659363, -0.0004432946443557739, -0.00041995197534561157, -0.0003966093063354492, -0.00037326663732528687, -0.0003499239683151245, -0.00032658129930496216, -0.0003032386302947998, -0.00027989596128463745, -0.0002565532922744751, -0.00023321062326431274, -0.0002098679542541504, -0.00018652528524398804, -0.00016318261623382568, -0.00013983994722366333, -0.00011649727821350098, -9.315460920333862e-05, -6.981194019317627e-05, -4.6469271183013916e-05, -2.3126602172851562e-05, 2.1606683731079102e-07, 2.3558735847473145e-05, 4.69014048576355e-05, 7.024407386779785e-05, 9.35867428779602e-05, 0.00011692941188812256, 0.0001402720808982849, 0.00016361474990844727, 0.00018695741891860962, 0.00021030008792877197, 0.00023364275693893433, 0.0002569854259490967, 0.00028032809495925903, 0.0003036707639694214, 0.00032701343297958374, 0.0003503561019897461, 0.00037369877099990845, 0.0003970414400100708, 0.00042038410902023315, 0.0004437267780303955, 0.00046706944704055786, 0.0004904121160507202, 0.0005137547850608826, 0.0005370974540710449, 0.0005604401230812073, 0.0005837827920913696, 0.000607125461101532, 0.0006304681301116943, 0.0006538107991218567, 0.000677153468132019, 0.0007004961371421814, 0.0007238388061523438]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 5.0, 10.0, 7.0, 7.0, 20.0, 15.0, 32.0, 50.0, 52.0, 76.0, 152.0, 233.0, 534.0, 19660.0, 1025654.0, 1183.0, 316.0, 185.0, 102.0, 68.0, 30.0, 28.0, 25.0, 14.0, 13.0, 11.0, 8.0, 9.0, 6.0, 4.0, 4.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01540374755859375, -0.014838814735412598, -0.014273881912231445, -0.013708949089050293, -0.01314401626586914, -0.012579083442687988, -0.012014150619506836, -0.011449217796325684, -0.010884284973144531, -0.010319352149963379, -0.009754419326782227, -0.009189486503601074, -0.008624553680419922, -0.00805962085723877, -0.007494688034057617, -0.006929755210876465, -0.0063648223876953125, -0.00579988956451416, -0.005234956741333008, -0.0046700239181518555, -0.004105091094970703, -0.0035401582717895508, -0.0029752254486083984, -0.002410292625427246, -0.0018453598022460938, -0.0012804269790649414, -0.0007154941558837891, -0.00015056133270263672, 0.0004143714904785156, 0.000979304313659668, 0.0015442371368408203, 0.0021091699600219727, 0.002674102783203125, 0.0032390356063842773, 0.0038039684295654297, 0.004368901252746582, 0.004933834075927734, 0.005498766899108887, 0.006063699722290039, 0.006628632545471191, 0.007193565368652344, 0.007758498191833496, 0.008323431015014648, 0.0088883638381958, 0.009453296661376953, 0.010018229484558105, 0.010583162307739258, 0.01114809513092041, 0.011713027954101562, 0.012277960777282715, 0.012842893600463867, 0.01340782642364502, 0.013972759246826172, 0.014537692070007324, 0.015102624893188477, 0.01566755771636963, 0.01623249053955078, 0.016797423362731934, 0.017362356185913086, 0.01792728900909424, 0.01849222183227539, 0.019057154655456543, 0.019622087478637695, 0.020187020301818848, 0.020751953125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 94.0, 570.0, 323.0, 29.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000628731562756002, -0.0005643651238642633, -0.0004999986849725246, -0.0004356321878731251, -0.0003712657489813864, -0.00030689931008964777, -0.00024253284209407866, -0.00017816637409850955, -0.0001137999352067709, -4.9433481763117015e-05, 1.4932971680536866e-05, 7.929942512419075e-05, 0.00014366587856784463, 0.00020803231745958328, 0.0002723987854551524, 0.0003367652534507215, 0.00040113169234246016, 0.0004654981312341988, 0.0005298645701259375, 0.000594231067225337, 0.0006585975061170757, 0.0007229639450088143, 0.0007873304421082139, 0.0008516968809999526, 0.0009160633198916912, 0.0009804298169910908, 0.0010447961976751685, 0.001109162694774568, 0.0011735290754586458, 0.0012378955725580454, 0.001302262069657445, 0.0013666285667568445, 0.001430995063856244, 0.0014953615609556437, 0.0015597279416397214, 0.001624094438739121, 0.0016884608194231987, 0.0017528273165225983, 0.0018171938136219978, 0.0018815603107213974, 0.0019459266914054751, 0.002010293072089553, 0.0020746595691889524, 0.002139026066288352, 0.0022033925633877516, 0.0022677588276565075, 0.002332125324755907, 0.0023964918218553066, 0.002460858318954706, 0.0025252248160541058, 0.0025895913131535053, 0.0026539575774222612, 0.002718324074521661, 0.0027826905716210604, 0.00284705706872046, 0.0029114235658198595, 0.0029757898300886154, 0.003040156327188015, 0.0031045228242874146, 0.0031688890885561705, 0.00323325558565557, 0.0032976220827549696, 0.003361988579854369, 0.0034263550769537687, 0.0034907215740531683]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 1.0, 7.0, 10.0, 7.0, 5.0, 11.0, 16.0, 15.0, 18.0, 17.0, 17.0, 21.0, 31.0, 31.0, 24.0, 41.0, 25.0, 43.0, 37.0, 33.0, 40.0, 46.0, 48.0, 35.0, 34.0, 32.0, 41.0, 38.0, 31.0, 28.0, 33.0, 27.0, 30.0, 24.0, 14.0, 13.0, 14.0, 17.0, 9.0, 10.0, 5.0, 3.0, 7.0, 0.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003083944320678711, -0.0002981293946504593, -0.0002878643572330475, -0.0002775993198156357, -0.0002673342823982239, -0.00025706924498081207, -0.00024680420756340027, -0.00023653917014598846, -0.00022627413272857666, -0.00021600909531116486, -0.00020574405789375305, -0.00019547902047634125, -0.00018521398305892944, -0.00017494894564151764, -0.00016468390822410583, -0.00015441887080669403, -0.00014415383338928223, -0.00013388879597187042, -0.00012362375855445862, -0.00011335872113704681, -0.00010309368371963501, -9.28286463022232e-05, -8.25636088848114e-05, -7.22985714673996e-05, -6.203353404998779e-05, -5.176849663257599e-05, -4.1503459215164185e-05, -3.123842179775238e-05, -2.0973384380340576e-05, -1.0708346962928772e-05, -4.4330954551696777e-07, 9.821727871894836e-06, 2.008676528930664e-05, 3.0351802706718445e-05, 4.061684012413025e-05, 5.088187754154205e-05, 6.114691495895386e-05, 7.141195237636566e-05, 8.167698979377747e-05, 9.194202721118927e-05, 0.00010220706462860107, 0.00011247210204601288, 0.00012273713946342468, 0.0001330021768808365, 0.0001432672142982483, 0.0001535322517156601, 0.0001637972891330719, 0.0001740623265504837, 0.0001843273639678955, 0.0001945924013853073, 0.00020485743880271912, 0.00021512247622013092, 0.00022538751363754272, 0.00023565255105495453, 0.00024591758847236633, 0.00025618262588977814, 0.00026644766330718994, 0.00027671270072460175, 0.00028697773814201355, 0.00029724277555942535, 0.00030750781297683716, 0.00031777285039424896, 0.00032803788781166077, 0.00033830292522907257, 0.0003485679626464844]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 16.0, 11.0, 11.0, 16.0, 21.0, 20.0, 24.0, 33.0, 25.0, 30.0, 28.0, 28.0, 40.0, 37.0, 42.0, 58.0, 50.0, 42.0, 54.0, 50.0, 43.0, 33.0, 40.0, 30.0, 34.0, 18.0, 18.0, 19.0, 21.0, 22.0, 23.0, 13.0, 10.0, 5.0, 12.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-8.3046875, -8.0850830078125, -7.865478515625, -7.6458740234375, -7.42626953125, -7.2066650390625, -6.987060546875, -6.7674560546875, -6.5478515625, -6.3282470703125, -6.108642578125, -5.8890380859375, -5.66943359375, -5.4498291015625, -5.230224609375, -5.0106201171875, -4.791015625, -4.5714111328125, -4.351806640625, -4.1322021484375, -3.91259765625, -3.6929931640625, -3.473388671875, -3.2537841796875, -3.0341796875, -2.8145751953125, -2.594970703125, -2.3753662109375, -2.15576171875, -1.9361572265625, -1.716552734375, -1.4969482421875, -1.27734375, -1.0577392578125, -0.838134765625, -0.6185302734375, -0.39892578125, -0.1793212890625, 0.040283203125, 0.2598876953125, 0.4794921875, 0.6990966796875, 0.918701171875, 1.1383056640625, 1.35791015625, 1.5775146484375, 1.797119140625, 2.0167236328125, 2.236328125, 2.4559326171875, 2.675537109375, 2.8951416015625, 3.11474609375, 3.3343505859375, 3.553955078125, 3.7735595703125, 3.9931640625, 4.2127685546875, 4.432373046875, 4.6519775390625, 4.87158203125, 5.0911865234375, 5.310791015625, 5.5303955078125, 5.75]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 9.0, 14.0, 13.0, 20.0, 27.0, 33.0, 45.0, 66.0, 96.0, 132.0, 175.0, 294.0, 466.0, 784.0, 1379.0, 2685.0, 6076.0, 16084.0, 60719.0, 412690.0, 451348.0, 65519.0, 17064.0, 6419.0, 2702.0, 1467.0, 786.0, 485.0, 288.0, 202.0, 128.0, 85.0, 74.0, 46.0, 35.0, 22.0, 22.0, 17.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.66912841796875, -5.4593505859375, -5.24957275390625, -5.039794921875, -4.83001708984375, -4.6202392578125, -4.41046142578125, -4.20068359375, -3.99090576171875, -3.7811279296875, -3.57135009765625, -3.361572265625, -3.15179443359375, -2.9420166015625, -2.73223876953125, -2.5224609375, -2.31268310546875, -2.1029052734375, -1.89312744140625, -1.683349609375, -1.47357177734375, -1.2637939453125, -1.05401611328125, -0.84423828125, -0.63446044921875, -0.4246826171875, -0.21490478515625, -0.005126953125, 0.20465087890625, 0.4144287109375, 0.62420654296875, 0.833984375, 1.04376220703125, 1.2535400390625, 1.46331787109375, 1.673095703125, 1.88287353515625, 2.0926513671875, 2.30242919921875, 2.51220703125, 2.72198486328125, 2.9317626953125, 3.14154052734375, 3.351318359375, 3.56109619140625, 3.7708740234375, 3.98065185546875, 4.1904296875, 4.40020751953125, 4.6099853515625, 4.81976318359375, 5.029541015625, 5.23931884765625, 5.4490966796875, 5.65887451171875, 5.86865234375, 6.07843017578125, 6.2882080078125, 6.49798583984375, 6.707763671875, 6.91754150390625, 7.1273193359375, 7.33709716796875, 7.546875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 13.0, 13.0, 11.0, 13.0, 23.0, 26.0, 27.0, 39.0, 31.0, 40.0, 39.0, 48.0, 48.0, 68.0, 235.0, 1774.0, 113.0, 60.0, 43.0, 43.0, 51.0, 35.0, 31.0, 32.0, 31.0, 18.0, 25.0, 11.0, 20.0, 10.0, 18.0, 9.0, 7.0, 2.0, 6.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-23.890625, -23.150146484375, -22.40966796875, -21.669189453125, -20.9287109375, -20.188232421875, -19.44775390625, -18.707275390625, -17.966796875, -17.226318359375, -16.48583984375, -15.745361328125, -15.0048828125, -14.264404296875, -13.52392578125, -12.783447265625, -12.04296875, -11.302490234375, -10.56201171875, -9.821533203125, -9.0810546875, -8.340576171875, -7.60009765625, -6.859619140625, -6.119140625, -5.378662109375, -4.63818359375, -3.897705078125, -3.1572265625, -2.416748046875, -1.67626953125, -0.935791015625, -0.1953125, 0.545166015625, 1.28564453125, 2.026123046875, 2.7666015625, 3.507080078125, 4.24755859375, 4.988037109375, 5.728515625, 6.468994140625, 7.20947265625, 7.949951171875, 8.6904296875, 9.430908203125, 10.17138671875, 10.911865234375, 11.65234375, 12.392822265625, 13.13330078125, 13.873779296875, 14.6142578125, 15.354736328125, 16.09521484375, 16.835693359375, 17.576171875, 18.316650390625, 19.05712890625, 19.797607421875, 20.5380859375, 21.278564453125, 22.01904296875, 22.759521484375, 23.5]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 1.0, 9.0, 11.0, 13.0, 15.0, 15.0, 17.0, 25.0, 23.0, 50.0, 37.0, 65.0, 93.0, 148.0, 212.0, 425.0, 1377.0, 24349.0, 3097926.0, 18657.0, 1133.0, 435.0, 183.0, 128.0, 73.0, 55.0, 53.0, 37.0, 33.0, 18.0, 9.0, 14.0, 17.0, 10.0, 7.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-38.78125, -37.548828125, -36.31640625, -35.083984375, -33.8515625, -32.619140625, -31.38671875, -30.154296875, -28.921875, -27.689453125, -26.45703125, -25.224609375, -23.9921875, -22.759765625, -21.52734375, -20.294921875, -19.0625, -17.830078125, -16.59765625, -15.365234375, -14.1328125, -12.900390625, -11.66796875, -10.435546875, -9.203125, -7.970703125, -6.73828125, -5.505859375, -4.2734375, -3.041015625, -1.80859375, -0.576171875, 0.65625, 1.888671875, 3.12109375, 4.353515625, 5.5859375, 6.818359375, 8.05078125, 9.283203125, 10.515625, 11.748046875, 12.98046875, 14.212890625, 15.4453125, 16.677734375, 17.91015625, 19.142578125, 20.375, 21.607421875, 22.83984375, 24.072265625, 25.3046875, 26.537109375, 27.76953125, 29.001953125, 30.234375, 31.466796875, 32.69921875, 33.931640625, 35.1640625, 36.396484375, 37.62890625, 38.861328125, 40.09375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 461.0, 546.0, 8.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.848634719848633, -14.17556095123291, -9.502487182617188, -4.829413414001465, -0.1563396453857422, 4.516733169555664, 9.189807891845703, 13.862882614135742, 18.53595542907715, 23.209030151367188, 27.882102966308594, 32.55517578125, 37.228248596191406, 41.90132141113281, 46.574398040771484, 51.247474670410156, 55.92054748535156, 60.59362030029297, 65.26669311523438, 69.93976593017578, 74.61283874511719, 79.28591918945312, 83.95899200439453, 88.63206481933594, 93.30513763427734, 97.97821044921875, 102.65128326416016, 107.32435607910156, 111.9974365234375, 116.67050170898438, 121.34358215332031, 126.01665496826172, 130.68972778320312, 135.36280822753906, 140.03587341308594, 144.70895385742188, 149.38201904296875, 154.0550994873047, 158.72816467285156, 163.4012451171875, 168.07431030273438, 172.7473907470703, 177.4204559326172, 182.09353637695312, 186.7666015625, 191.43968200683594, 196.1127471923828, 200.78582763671875, 205.4589080810547, 210.13198852539062, 214.8050537109375, 219.47813415527344, 224.1511993408203, 228.82427978515625, 233.49734497070312, 238.17042541503906, 242.843505859375, 247.51658630371094, 252.1896514892578, 256.86273193359375, 261.5357971191406, 266.2088623046875, 270.8819580078125, 275.5550231933594, 280.22808837890625]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 11.0, 11.0, 10.0, 15.0, 22.0, 25.0, 26.0, 34.0, 26.0, 41.0, 36.0, 32.0, 49.0, 41.0, 47.0, 48.0, 49.0, 43.0, 38.0, 43.0, 45.0, 27.0, 45.0, 30.0, 35.0, 29.0, 18.0, 17.0, 23.0, 13.0, 7.0, 13.0, 7.0, 1.0, 9.0, 8.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.12337493896484, -67.60015106201172, -65.07691955566406, -62.55369567871094, -60.03047180175781, -57.50724792480469, -54.9840202331543, -52.460792541503906, -49.93756866455078, -47.414344787597656, -44.891117095947266, -42.367889404296875, -39.84466552734375, -37.321441650390625, -34.798213958740234, -32.274986267089844, -29.75176239013672, -27.22853660583496, -24.705310821533203, -22.182085037231445, -19.658859252929688, -17.13563346862793, -14.612407684326172, -12.089181900024414, -9.565956115722656, -7.042730331420898, -4.519504547119141, -1.9962787628173828, 0.526947021484375, 3.050172805786133, 5.573398590087891, 8.096624374389648, 10.619850158691406, 13.143075942993164, 15.666301727294922, 18.18952751159668, 20.712753295898438, 23.235979080200195, 25.759204864501953, 28.28243064880371, 30.80565643310547, 33.328880310058594, 35.852108001708984, 38.375335693359375, 40.8985595703125, 43.421783447265625, 45.945011138916016, 48.468238830566406, 50.99146270751953, 53.514686584472656, 56.03791427612305, 58.56114196777344, 61.08436584472656, 63.60758972167969, 66.13081359863281, 68.65404510498047, 71.1772689819336, 73.70049285888672, 76.22372436523438, 78.7469482421875, 81.27017211914062, 83.79339599609375, 86.31661987304688, 88.83985137939453, 91.36307525634766]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 6.0, 16.0, 8.0, 13.0, 14.0, 19.0, 25.0, 25.0, 28.0, 26.0, 26.0, 24.0, 32.0, 23.0, 51.0, 40.0, 59.0, 49.0, 46.0, 49.0, 45.0, 42.0, 40.0, 34.0, 37.0, 29.0, 19.0, 20.0, 24.0, 19.0, 21.0, 20.0, 21.0, 10.0, 7.0, 10.0, 6.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0], "bins": [-8.390625, -8.17041015625, -7.9501953125, -7.72998046875, -7.509765625, -7.28955078125, -7.0693359375, -6.84912109375, -6.62890625, -6.40869140625, -6.1884765625, -5.96826171875, -5.748046875, -5.52783203125, -5.3076171875, -5.08740234375, -4.8671875, -4.64697265625, -4.4267578125, -4.20654296875, -3.986328125, -3.76611328125, -3.5458984375, -3.32568359375, -3.10546875, -2.88525390625, -2.6650390625, -2.44482421875, -2.224609375, -2.00439453125, -1.7841796875, -1.56396484375, -1.34375, -1.12353515625, -0.9033203125, -0.68310546875, -0.462890625, -0.24267578125, -0.0224609375, 0.19775390625, 0.41796875, 0.63818359375, 0.8583984375, 1.07861328125, 1.298828125, 1.51904296875, 1.7392578125, 1.95947265625, 2.1796875, 2.39990234375, 2.6201171875, 2.84033203125, 3.060546875, 3.28076171875, 3.5009765625, 3.72119140625, 3.94140625, 4.16162109375, 4.3818359375, 4.60205078125, 4.822265625, 5.04248046875, 5.2626953125, 5.48291015625, 5.703125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 9.0, 6.0, 12.0, 6.0, 20.0, 29.0, 20.0, 23.0, 29.0, 47.0, 96.0, 139.0, 235.0, 608.0, 1743.0, 6052.0, 24436.0, 140076.0, 1209464.0, 2291875.0, 444746.0, 57454.0, 11969.0, 3244.0, 1027.0, 373.0, 190.0, 106.0, 64.0, 33.0, 23.0, 14.0, 16.0, 16.0, 17.0, 14.0, 10.0, 8.0, 9.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.859375, -14.41259765625, -13.9658203125, -13.51904296875, -13.072265625, -12.62548828125, -12.1787109375, -11.73193359375, -11.28515625, -10.83837890625, -10.3916015625, -9.94482421875, -9.498046875, -9.05126953125, -8.6044921875, -8.15771484375, -7.7109375, -7.26416015625, -6.8173828125, -6.37060546875, -5.923828125, -5.47705078125, -5.0302734375, -4.58349609375, -4.13671875, -3.68994140625, -3.2431640625, -2.79638671875, -2.349609375, -1.90283203125, -1.4560546875, -1.00927734375, -0.5625, -0.11572265625, 0.3310546875, 0.77783203125, 1.224609375, 1.67138671875, 2.1181640625, 2.56494140625, 3.01171875, 3.45849609375, 3.9052734375, 4.35205078125, 4.798828125, 5.24560546875, 5.6923828125, 6.13916015625, 6.5859375, 7.03271484375, 7.4794921875, 7.92626953125, 8.373046875, 8.81982421875, 9.2666015625, 9.71337890625, 10.16015625, 10.60693359375, 11.0537109375, 11.50048828125, 11.947265625, 12.39404296875, 12.8408203125, 13.28759765625, 13.734375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 13.0, 11.0, 22.0, 43.0, 64.0, 83.0, 105.0, 154.0, 292.0, 449.0, 649.0, 715.0, 538.0, 335.0, 221.0, 138.0, 92.0, 62.0, 30.0, 22.0, 18.0, 13.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.40625, -38.5521240234375, -37.697998046875, -36.8438720703125, -35.98974609375, -35.1356201171875, -34.281494140625, -33.4273681640625, -32.5732421875, -31.7191162109375, -30.864990234375, -30.0108642578125, -29.15673828125, -28.3026123046875, -27.448486328125, -26.5943603515625, -25.740234375, -24.8861083984375, -24.031982421875, -23.1778564453125, -22.32373046875, -21.4696044921875, -20.615478515625, -19.7613525390625, -18.9072265625, -18.0531005859375, -17.198974609375, -16.3448486328125, -15.49072265625, -14.6365966796875, -13.782470703125, -12.9283447265625, -12.07421875, -11.2200927734375, -10.365966796875, -9.5118408203125, -8.65771484375, -7.8035888671875, -6.949462890625, -6.0953369140625, -5.2412109375, -4.3870849609375, -3.532958984375, -2.6788330078125, -1.82470703125, -0.9705810546875, -0.116455078125, 0.7376708984375, 1.591796875, 2.4459228515625, 3.300048828125, 4.1541748046875, 5.00830078125, 5.8624267578125, 6.716552734375, 7.5706787109375, 8.4248046875, 9.2789306640625, 10.133056640625, 10.9871826171875, 11.84130859375, 12.6954345703125, 13.549560546875, 14.4036865234375, 15.2578125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 12.0, 21.0, 42.0, 60.0, 117.0, 260.0, 645.0, 34838.0, 4150404.0, 7011.0, 458.0, 176.0, 104.0, 55.0, 28.0, 21.0, 17.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.6875, -66.3740234375, -62.060546875, -57.7470703125, -53.43359375, -49.1201171875, -44.806640625, -40.4931640625, -36.1796875, -31.8662109375, -27.552734375, -23.2392578125, -18.92578125, -14.6123046875, -10.298828125, -5.9853515625, -1.671875, 2.6416015625, 6.955078125, 11.2685546875, 15.58203125, 19.8955078125, 24.208984375, 28.5224609375, 32.8359375, 37.1494140625, 41.462890625, 45.7763671875, 50.08984375, 54.4033203125, 58.716796875, 63.0302734375, 67.34375, 71.6572265625, 75.970703125, 80.2841796875, 84.59765625, 88.9111328125, 93.224609375, 97.5380859375, 101.8515625, 106.1650390625, 110.478515625, 114.7919921875, 119.10546875, 123.4189453125, 127.732421875, 132.0458984375, 136.359375, 140.6728515625, 144.986328125, 149.2998046875, 153.61328125, 157.9267578125, 162.240234375, 166.5537109375, 170.8671875, 175.1806640625, 179.494140625, 183.8076171875, 188.12109375, 192.4345703125, 196.748046875, 201.0615234375, 205.375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 9.0, 73.0, 262.0, 442.0, 190.0, 37.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-488.6776428222656, -480.0137023925781, -471.3497619628906, -462.6858215332031, -454.0218811035156, -445.3579406738281, -436.6940002441406, -428.030029296875, -419.3660888671875, -410.7021484375, -402.0382080078125, -393.374267578125, -384.7103271484375, -376.04638671875, -367.3824462890625, -358.718505859375, -350.0545654296875, -341.390625, -332.7266845703125, -324.062744140625, -315.3988037109375, -306.73486328125, -298.0709228515625, -289.406982421875, -280.7430419921875, -272.0791015625, -263.4151611328125, -254.751220703125, -246.0872802734375, -237.42333984375, -228.75938415527344, -220.09544372558594, -211.4315185546875, -202.767578125, -194.1036376953125, -185.439697265625, -176.7757568359375, -168.11181640625, -159.44786071777344, -150.78392028808594, -142.11997985839844, -133.45603942871094, -124.79209899902344, -116.1281509399414, -107.4642105102539, -98.8002700805664, -90.13632202148438, -81.47238159179688, -72.80844116210938, -64.14450073242188, -55.48055648803711, -46.816612243652344, -38.152671813964844, -29.488731384277344, -20.824787139892578, -12.160842895507812, -3.4969024658203125, 5.16703987121582, 13.830982208251953, 22.494924545288086, 31.15886688232422, 39.82280731201172, 48.486751556396484, 57.15069580078125, 65.81463623046875]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 9.0, 9.0, 13.0, 18.0, 15.0, 27.0, 10.0, 33.0, 24.0, 37.0, 38.0, 41.0, 27.0, 35.0, 40.0, 40.0, 43.0, 47.0, 42.0, 45.0, 40.0, 46.0, 39.0, 36.0, 25.0, 34.0, 25.0, 22.0, 24.0, 18.0, 21.0, 16.0, 13.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.26802062988281, -53.31504440307617, -51.36206817626953, -49.409088134765625, -47.456111907958984, -45.503135681152344, -43.5501594543457, -41.59718322753906, -39.644203186035156, -37.691226959228516, -35.738250732421875, -33.78527069091797, -31.832294464111328, -29.879318237304688, -27.926342010498047, -25.973363876342773, -24.020387649536133, -22.067411422729492, -20.11443328857422, -18.161457061767578, -16.208478927612305, -14.255502700805664, -12.302525520324707, -10.34954833984375, -8.396571159362793, -6.443593978881836, -4.490616798400879, -2.53764009475708, -0.584662914276123, 1.3683137893676758, 3.321290969848633, 5.27426815032959, 7.227245330810547, 9.180222511291504, 11.133199691772461, 13.086175918579102, 15.039154052734375, 16.992130279541016, 18.945106506347656, 20.89808464050293, 22.851062774658203, 24.804039001464844, 26.757017135620117, 28.709993362426758, 30.66297149658203, 32.61594772338867, 34.56892395019531, 36.52190399169922, 38.474876403808594, 40.427852630615234, 42.380828857421875, 44.33380889892578, 46.28678512573242, 48.23976135253906, 50.1927375793457, 52.145713806152344, 54.09869384765625, 56.05167007446289, 58.00464630126953, 59.95762634277344, 61.91060256958008, 63.86357879638672, 65.81655883789062, 67.76953125, 69.7225112915039]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 15.0, 16.0, 11.0, 17.0, 12.0, 38.0, 16.0, 30.0, 20.0, 27.0, 38.0, 36.0, 39.0, 35.0, 59.0, 68.0, 38.0, 45.0, 37.0, 48.0, 35.0, 40.0, 46.0, 28.0, 27.0, 16.0, 28.0, 17.0, 25.0, 11.0, 15.0, 15.0, 10.0, 8.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.4921875, -8.25860595703125, -8.0250244140625, -7.79144287109375, -7.557861328125, -7.32427978515625, -7.0906982421875, -6.85711669921875, -6.62353515625, -6.38995361328125, -6.1563720703125, -5.92279052734375, -5.689208984375, -5.45562744140625, -5.2220458984375, -4.98846435546875, -4.7548828125, -4.52130126953125, -4.2877197265625, -4.05413818359375, -3.820556640625, -3.58697509765625, -3.3533935546875, -3.11981201171875, -2.88623046875, -2.65264892578125, -2.4190673828125, -2.18548583984375, -1.951904296875, -1.71832275390625, -1.4847412109375, -1.25115966796875, -1.017578125, -0.78399658203125, -0.5504150390625, -0.31683349609375, -0.083251953125, 0.15032958984375, 0.3839111328125, 0.61749267578125, 0.85107421875, 1.08465576171875, 1.3182373046875, 1.55181884765625, 1.785400390625, 2.01898193359375, 2.2525634765625, 2.48614501953125, 2.7197265625, 2.95330810546875, 3.1868896484375, 3.42047119140625, 3.654052734375, 3.88763427734375, 4.1212158203125, 4.35479736328125, 4.58837890625, 4.82196044921875, 5.0555419921875, 5.28912353515625, 5.522705078125, 5.75628662109375, 5.9898681640625, 6.22344970703125, 6.45703125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 6.0, 5.0, 7.0, 13.0, 15.0, 21.0, 33.0, 46.0, 58.0, 104.0, 139.0, 251.0, 389.0, 654.0, 1031.0, 1620.0, 2647.0, 4309.0, 7175.0, 11570.0, 18867.0, 32507.0, 56615.0, 107190.0, 320433.0, 256991.0, 97662.0, 52422.0, 29754.0, 17764.0, 10937.0, 6746.0, 4060.0, 2490.0, 1497.0, 926.0, 551.0, 366.0, 208.0, 161.0, 101.0, 68.0, 45.0, 35.0, 20.0, 19.0, 12.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5087890625, -1.45477294921875, -1.4007568359375, -1.34674072265625, -1.292724609375, -1.23870849609375, -1.1846923828125, -1.13067626953125, -1.07666015625, -1.02264404296875, -0.9686279296875, -0.91461181640625, -0.860595703125, -0.80657958984375, -0.7525634765625, -0.69854736328125, -0.64453125, -0.59051513671875, -0.5364990234375, -0.48248291015625, -0.428466796875, -0.37445068359375, -0.3204345703125, -0.26641845703125, -0.21240234375, -0.15838623046875, -0.1043701171875, -0.05035400390625, 0.003662109375, 0.05767822265625, 0.1116943359375, 0.16571044921875, 0.2197265625, 0.27374267578125, 0.3277587890625, 0.38177490234375, 0.435791015625, 0.48980712890625, 0.5438232421875, 0.59783935546875, 0.65185546875, 0.70587158203125, 0.7598876953125, 0.81390380859375, 0.867919921875, 0.92193603515625, 0.9759521484375, 1.02996826171875, 1.083984375, 1.13800048828125, 1.1920166015625, 1.24603271484375, 1.300048828125, 1.35406494140625, 1.4080810546875, 1.46209716796875, 1.51611328125, 1.57012939453125, 1.6241455078125, 1.67816162109375, 1.732177734375, 1.78619384765625, 1.8402099609375, 1.89422607421875, 1.9482421875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 9.0, 6.0, 13.0, 12.0, 19.0, 12.0, 12.0, 20.0, 34.0, 35.0, 31.0, 17.0, 32.0, 31.0, 41.0, 48.0, 44.0, 48.0, 1065.0, 50.0, 49.0, 36.0, 41.0, 42.0, 42.0, 27.0, 34.0, 26.0, 30.0, 19.0, 19.0, 13.0, 9.0, 11.0, 16.0, 6.0, 3.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.87890625, -4.73175048828125, -4.5845947265625, -4.43743896484375, -4.290283203125, -4.14312744140625, -3.9959716796875, -3.84881591796875, -3.70166015625, -3.55450439453125, -3.4073486328125, -3.26019287109375, -3.113037109375, -2.96588134765625, -2.8187255859375, -2.67156982421875, -2.5244140625, -2.37725830078125, -2.2301025390625, -2.08294677734375, -1.935791015625, -1.78863525390625, -1.6414794921875, -1.49432373046875, -1.34716796875, -1.20001220703125, -1.0528564453125, -0.90570068359375, -0.758544921875, -0.61138916015625, -0.4642333984375, -0.31707763671875, -0.169921875, -0.02276611328125, 0.1243896484375, 0.27154541015625, 0.418701171875, 0.56585693359375, 0.7130126953125, 0.86016845703125, 1.00732421875, 1.15447998046875, 1.3016357421875, 1.44879150390625, 1.595947265625, 1.74310302734375, 1.8902587890625, 2.03741455078125, 2.1845703125, 2.33172607421875, 2.4788818359375, 2.62603759765625, 2.773193359375, 2.92034912109375, 3.0675048828125, 3.21466064453125, 3.36181640625, 3.50897216796875, 3.6561279296875, 3.80328369140625, 3.950439453125, 4.09759521484375, 4.2447509765625, 4.39190673828125, 4.5390625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 8.0, 13.0, 23.0, 46.0, 55.0, 92.0, 133.0, 215.0, 345.0, 560.0, 896.0, 1513.0, 2432.0, 3831.0, 6280.0, 10404.0, 17242.0, 29575.0, 50412.0, 94598.0, 230258.0, 1388801.0, 115048.0, 59486.0, 33979.0, 20104.0, 11921.0, 7085.0, 4481.0, 2787.0, 1702.0, 1034.0, 700.0, 365.0, 260.0, 165.0, 89.0, 76.0, 39.0, 26.0, 20.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7041015625, -1.652679443359375, -1.60125732421875, -1.549835205078125, -1.4984130859375, -1.446990966796875, -1.39556884765625, -1.344146728515625, -1.292724609375, -1.241302490234375, -1.18988037109375, -1.138458251953125, -1.0870361328125, -1.035614013671875, -0.98419189453125, -0.932769775390625, -0.88134765625, -0.829925537109375, -0.77850341796875, -0.727081298828125, -0.6756591796875, -0.624237060546875, -0.57281494140625, -0.521392822265625, -0.469970703125, -0.418548583984375, -0.36712646484375, -0.315704345703125, -0.2642822265625, -0.212860107421875, -0.16143798828125, -0.110015869140625, -0.05859375, -0.007171630859375, 0.04425048828125, 0.095672607421875, 0.1470947265625, 0.198516845703125, 0.24993896484375, 0.301361083984375, 0.352783203125, 0.404205322265625, 0.45562744140625, 0.507049560546875, 0.5584716796875, 0.609893798828125, 0.66131591796875, 0.712738037109375, 0.76416015625, 0.815582275390625, 0.86700439453125, 0.918426513671875, 0.9698486328125, 1.021270751953125, 1.07269287109375, 1.124114990234375, 1.175537109375, 1.226959228515625, 1.27838134765625, 1.329803466796875, 1.3812255859375, 1.432647705078125, 1.48406982421875, 1.535491943359375, 1.5869140625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 5.0, 9.0, 4.0, 6.0, 17.0, 19.0, 21.0, 30.0, 41.0, 66.0, 66.0, 92.0, 121.0, 114.0, 74.0, 59.0, 64.0, 36.0, 41.0, 25.0, 18.0, 17.0, 15.0, 4.0, 10.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.0012407302856445312, -0.001211114227771759, -0.0011814981698989868, -0.0011518821120262146, -0.0011222660541534424, -0.0010926499962806702, -0.001063033938407898, -0.0010334178805351257, -0.0010038018226623535, -0.0009741857647895813, -0.0009445697069168091, -0.0009149536490440369, -0.0008853375911712646, -0.0008557215332984924, -0.0008261054754257202, -0.000796489417552948, -0.0007668733596801758, -0.0007372573018074036, -0.0007076412439346313, -0.0006780251860618591, -0.0006484091281890869, -0.0006187930703163147, -0.0005891770124435425, -0.0005595609545707703, -0.000529944896697998, -0.0005003288388252258, -0.0004707127809524536, -0.0004410967230796814, -0.0004114806652069092, -0.00038186460733413696, -0.00035224854946136475, -0.00032263249158859253, -0.0002930164337158203, -0.0002634003758430481, -0.00023378431797027588, -0.00020416826009750366, -0.00017455220222473145, -0.00014493614435195923, -0.00011532008647918701, -8.57040286064148e-05, -5.608797073364258e-05, -2.647191286087036e-05, 3.1441450119018555e-06, 3.276020288467407e-05, 6.237626075744629e-05, 9.19923186302185e-05, 0.00012160837650299072, 0.00015122443437576294, 0.00018084049224853516, 0.00021045655012130737, 0.0002400726079940796, 0.0002696886658668518, 0.000299304723739624, 0.00032892078161239624, 0.00035853683948516846, 0.0003881528973579407, 0.0004177689552307129, 0.0004473850131034851, 0.0004770010709762573, 0.0005066171288490295, 0.0005362331867218018, 0.000565849244594574, 0.0005954653024673462, 0.0006250813603401184, 0.0006546974182128906]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 7.0, 3.0, 7.0, 13.0, 16.0, 19.0, 22.0, 28.0, 40.0, 58.0, 90.0, 161.0, 343.0, 1189.0, 1027915.0, 17541.0, 515.0, 225.0, 117.0, 62.0, 54.0, 21.0, 24.0, 22.0, 17.0, 6.0, 11.0, 9.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0143890380859375, -0.01372671127319336, -0.013064384460449219, -0.012402057647705078, -0.011739730834960938, -0.011077404022216797, -0.010415077209472656, -0.009752750396728516, -0.009090423583984375, -0.008428096771240234, -0.007765769958496094, -0.007103443145751953, -0.0064411163330078125, -0.005778789520263672, -0.005116462707519531, -0.004454135894775391, -0.00379180908203125, -0.0031294822692871094, -0.0024671554565429688, -0.0018048286437988281, -0.0011425018310546875, -0.0004801750183105469, 0.00018215179443359375, 0.0008444786071777344, 0.001506805419921875, 0.0021691322326660156, 0.0028314590454101562, 0.003493785858154297, 0.0041561126708984375, 0.004818439483642578, 0.005480766296386719, 0.006143093109130859, 0.006805419921875, 0.007467746734619141, 0.008130073547363281, 0.008792400360107422, 0.009454727172851562, 0.010117053985595703, 0.010779380798339844, 0.011441707611083984, 0.012104034423828125, 0.012766361236572266, 0.013428688049316406, 0.014091014862060547, 0.014753341674804688, 0.015415668487548828, 0.01607799530029297, 0.01674032211303711, 0.01740264892578125, 0.01806497573852539, 0.01872730255126953, 0.019389629364013672, 0.020051956176757812, 0.020714282989501953, 0.021376609802246094, 0.022038936614990234, 0.022701263427734375, 0.023363590240478516, 0.024025917053222656, 0.024688243865966797, 0.025350570678710938, 0.026012897491455078, 0.02667522430419922, 0.02733755111694336, 0.0279998779296875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 75.0, 274.0, 445.0, 177.0, 30.0, 5.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.0026572111528366804, -0.0026100443210452795, -0.0025628774892538786, -0.0025157108902931213, -0.0024685440585017204, -0.0024213772267103195, -0.0023742103949189186, -0.0023270437959581614, -0.0022798769641667604, -0.0022327101323753595, -0.0021855433005839586, -0.0021383767016232014, -0.0020912098698318005, -0.0020440430380403996, -0.0019968762062489986, -0.0019497094908729196, -0.0019025427754968405, -0.0018553759437054396, -0.0018082092283293605, -0.0017610423965379596, -0.0017138756811618805, -0.0016667088493704796, -0.0016195421339944005, -0.0015723753022029996, -0.0015252084704115987, -0.0014780416386201978, -0.0014308749232441187, -0.0013837080914527178, -0.0013365413760766387, -0.0012893745442852378, -0.0012422078289091587, -0.0011950409971177578, -0.0011478741653263569, -0.001100707333534956, -0.001053540618158877, -0.001006373786367476, -0.0009592070709913969, -0.0009120402974076569, -0.0008648735238239169, -0.000817706692032516, -0.0007705399766564369, -0.0007233732030726969, -0.0006762064294889569, -0.0006290396559052169, -0.0005818728823214769, -0.0005347061087377369, -0.0004875393060501665, -0.0004403725324664265, -0.0003932057588826865, -0.0003460389852989465, -0.0002988722117152065, -0.00025170540902763605, -0.00020453864999581128, -0.0001573718764120713, -0.00011020508827641606, -6.303831469267607e-05, -1.587154110893607e-05, 3.129523611278273e-05, 7.846201333450153e-05, 0.00012562879419419914, 0.00017279556777793914, 0.00021996234136167914, 0.00026712912949733436, 0.00031429590308107436, 0.00036146267666481435]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 5.0, 20.0, 14.0, 19.0, 18.0, 10.0, 27.0, 27.0, 42.0, 27.0, 42.0, 48.0, 44.0, 37.0, 42.0, 45.0, 46.0, 55.0, 41.0, 42.0, 31.0, 38.0, 24.0, 46.0, 29.0, 33.0, 21.0, 26.0, 19.0, 17.0, 12.0, 14.0, 12.0, 6.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043129920959472656, -0.00041876547038555145, -0.00040623173117637634, -0.00039369799196720123, -0.0003811642527580261, -0.000368630513548851, -0.0003560967743396759, -0.0003435630351305008, -0.0003310292959213257, -0.0003184955567121506, -0.00030596181750297546, -0.00029342807829380035, -0.00028089433908462524, -0.00026836059987545013, -0.000255826860666275, -0.00024329312145709991, -0.0002307593822479248, -0.0002182256430387497, -0.00020569190382957458, -0.00019315816462039948, -0.00018062442541122437, -0.00016809068620204926, -0.00015555694699287415, -0.00014302320778369904, -0.00013048946857452393, -0.00011795572936534882, -0.0001054219901561737, -9.28882509469986e-05, -8.035451173782349e-05, -6.782077252864838e-05, -5.5287033319473267e-05, -4.275329411029816e-05, -3.0219554901123047e-05, -1.7685815691947937e-05, -5.152076482772827e-06, 7.381662726402283e-06, 1.9915401935577393e-05, 3.24491411447525e-05, 4.498288035392761e-05, 5.751661956310272e-05, 7.005035877227783e-05, 8.258409798145294e-05, 9.511783719062805e-05, 0.00010765157639980316, 0.00012018531560897827, 0.00013271905481815338, 0.0001452527940273285, 0.0001577865332365036, 0.0001703202724456787, 0.00018285401165485382, 0.00019538775086402893, 0.00020792149007320404, 0.00022045522928237915, 0.00023298896849155426, 0.00024552270770072937, 0.0002580564469099045, 0.0002705901861190796, 0.0002831239253282547, 0.0002956576645374298, 0.0003081914037466049, 0.00032072514295578003, 0.00033325888216495514, 0.00034579262137413025, 0.00035832636058330536, 0.00037086009979248047]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 15.0, 16.0, 11.0, 17.0, 12.0, 38.0, 16.0, 30.0, 20.0, 27.0, 38.0, 36.0, 39.0, 35.0, 59.0, 68.0, 38.0, 45.0, 37.0, 49.0, 34.0, 40.0, 46.0, 28.0, 27.0, 16.0, 28.0, 17.0, 25.0, 11.0, 15.0, 15.0, 10.0, 8.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.4921875, -8.25860595703125, -8.0250244140625, -7.79144287109375, -7.557861328125, -7.32427978515625, -7.0906982421875, -6.85711669921875, -6.62353515625, -6.38995361328125, -6.1563720703125, -5.92279052734375, -5.689208984375, -5.45562744140625, -5.2220458984375, -4.98846435546875, -4.7548828125, -4.52130126953125, -4.2877197265625, -4.05413818359375, -3.820556640625, -3.58697509765625, -3.3533935546875, -3.11981201171875, -2.88623046875, -2.65264892578125, -2.4190673828125, -2.18548583984375, -1.951904296875, -1.71832275390625, -1.4847412109375, -1.25115966796875, -1.017578125, -0.78399658203125, -0.5504150390625, -0.31683349609375, -0.083251953125, 0.15032958984375, 0.3839111328125, 0.61749267578125, 0.85107421875, 1.08465576171875, 1.3182373046875, 1.55181884765625, 1.785400390625, 2.01898193359375, 2.2525634765625, 2.48614501953125, 2.7197265625, 2.95330810546875, 3.1868896484375, 3.42047119140625, 3.654052734375, 3.88763427734375, 4.1212158203125, 4.35479736328125, 4.58837890625, 4.82196044921875, 5.0555419921875, 5.28912353515625, 5.522705078125, 5.75628662109375, 5.9898681640625, 6.22344970703125, 6.45703125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 13.0, 14.0, 16.0, 16.0, 26.0, 26.0, 47.0, 99.0, 142.0, 243.0, 506.0, 1002.0, 2281.0, 5878.0, 16223.0, 53067.0, 200564.0, 486745.0, 201396.0, 53381.0, 16413.0, 5866.0, 2315.0, 1060.0, 528.0, 252.0, 146.0, 97.0, 44.0, 38.0, 27.0, 18.0, 14.0, 15.0, 7.0, 12.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.3203125, -5.174560546875, -5.02880859375, -4.883056640625, -4.7373046875, -4.591552734375, -4.44580078125, -4.300048828125, -4.154296875, -4.008544921875, -3.86279296875, -3.717041015625, -3.5712890625, -3.425537109375, -3.27978515625, -3.134033203125, -2.98828125, -2.842529296875, -2.69677734375, -2.551025390625, -2.4052734375, -2.259521484375, -2.11376953125, -1.968017578125, -1.822265625, -1.676513671875, -1.53076171875, -1.385009765625, -1.2392578125, -1.093505859375, -0.94775390625, -0.802001953125, -0.65625, -0.510498046875, -0.36474609375, -0.218994140625, -0.0732421875, 0.072509765625, 0.21826171875, 0.364013671875, 0.509765625, 0.655517578125, 0.80126953125, 0.947021484375, 1.0927734375, 1.238525390625, 1.38427734375, 1.530029296875, 1.67578125, 1.821533203125, 1.96728515625, 2.113037109375, 2.2587890625, 2.404541015625, 2.55029296875, 2.696044921875, 2.841796875, 2.987548828125, 3.13330078125, 3.279052734375, 3.4248046875, 3.570556640625, 3.71630859375, 3.862060546875, 4.0078125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 5.0, 6.0, 3.0, 14.0, 13.0, 21.0, 21.0, 29.0, 27.0, 38.0, 31.0, 47.0, 53.0, 50.0, 76.0, 156.0, 1789.0, 183.0, 64.0, 46.0, 43.0, 45.0, 46.0, 45.0, 30.0, 18.0, 22.0, 15.0, 16.0, 16.0, 10.0, 12.0, 12.0, 7.0, 7.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.640625, -21.81884765625, -20.9970703125, -20.17529296875, -19.353515625, -18.53173828125, -17.7099609375, -16.88818359375, -16.06640625, -15.24462890625, -14.4228515625, -13.60107421875, -12.779296875, -11.95751953125, -11.1357421875, -10.31396484375, -9.4921875, -8.67041015625, -7.8486328125, -7.02685546875, -6.205078125, -5.38330078125, -4.5615234375, -3.73974609375, -2.91796875, -2.09619140625, -1.2744140625, -0.45263671875, 0.369140625, 1.19091796875, 2.0126953125, 2.83447265625, 3.65625, 4.47802734375, 5.2998046875, 6.12158203125, 6.943359375, 7.76513671875, 8.5869140625, 9.40869140625, 10.23046875, 11.05224609375, 11.8740234375, 12.69580078125, 13.517578125, 14.33935546875, 15.1611328125, 15.98291015625, 16.8046875, 17.62646484375, 18.4482421875, 19.27001953125, 20.091796875, 20.91357421875, 21.7353515625, 22.55712890625, 23.37890625, 24.20068359375, 25.0224609375, 25.84423828125, 26.666015625, 27.48779296875, 28.3095703125, 29.13134765625, 29.953125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 9.0, 7.0, 12.0, 10.0, 11.0, 15.0, 17.0, 20.0, 21.0, 35.0, 42.0, 68.0, 94.0, 141.0, 219.0, 355.0, 1033.0, 13901.0, 3118565.0, 9171.0, 928.0, 408.0, 206.0, 96.0, 64.0, 53.0, 45.0, 42.0, 28.0, 17.0, 16.0, 11.0, 6.0, 3.0, 6.0, 2.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-50.84375, -49.44921875, -48.0546875, -46.66015625, -45.265625, -43.87109375, -42.4765625, -41.08203125, -39.6875, -38.29296875, -36.8984375, -35.50390625, -34.109375, -32.71484375, -31.3203125, -29.92578125, -28.53125, -27.13671875, -25.7421875, -24.34765625, -22.953125, -21.55859375, -20.1640625, -18.76953125, -17.375, -15.98046875, -14.5859375, -13.19140625, -11.796875, -10.40234375, -9.0078125, -7.61328125, -6.21875, -4.82421875, -3.4296875, -2.03515625, -0.640625, 0.75390625, 2.1484375, 3.54296875, 4.9375, 6.33203125, 7.7265625, 9.12109375, 10.515625, 11.91015625, 13.3046875, 14.69921875, 16.09375, 17.48828125, 18.8828125, 20.27734375, 21.671875, 23.06640625, 24.4609375, 25.85546875, 27.25, 28.64453125, 30.0390625, 31.43359375, 32.828125, 34.22265625, 35.6171875, 37.01171875, 38.40625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [602.0, 413.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.62917709350586, 0.27597999572753906, 10.181137084960938, 20.086294174194336, 29.991451263427734, 39.896610260009766, 49.80176544189453, 59.7069206237793, 69.61207580566406, 79.5172348022461, 89.42239379882812, 99.32754516601562, 109.23270416259766, 119.13786315917969, 129.0430145263672, 138.94818115234375, 148.85333251953125, 158.75848388671875, 168.6636505126953, 178.5688018798828, 188.47396850585938, 198.37911987304688, 208.28427124023438, 218.18942260742188, 228.09458923339844, 237.99974060058594, 247.9049072265625, 257.81005859375, 267.7152099609375, 277.620361328125, 287.5255432128906, 297.4306945800781, 307.33587646484375, 317.24102783203125, 327.14617919921875, 337.0513610839844, 346.9565124511719, 356.8616638183594, 366.7668151855469, 376.6719665527344, 386.5771484375, 396.4822998046875, 406.387451171875, 416.2926330566406, 426.1977844238281, 436.1029357910156, 446.0080871582031, 455.9132385253906, 465.8183898925781, 475.7235412597656, 485.6286926269531, 495.53387451171875, 505.43902587890625, 515.3441772460938, 525.2493286132812, 535.1544799804688, 545.0596313476562, 554.9647827148438, 564.8699340820312, 574.7750854492188, 584.6802368164062, 594.58544921875, 604.4906005859375, 614.395751953125, 624.3009033203125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 6.0, 8.0, 14.0, 17.0, 17.0, 15.0, 13.0, 31.0, 25.0, 33.0, 31.0, 40.0, 29.0, 31.0, 51.0, 35.0, 38.0, 41.0, 47.0, 52.0, 42.0, 40.0, 44.0, 33.0, 37.0, 31.0, 23.0, 32.0, 23.0, 17.0, 16.0, 14.0, 12.0, 8.0, 10.0, 8.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.72724914550781, -69.2081527709961, -66.68905639648438, -64.16995239257812, -61.650856018066406, -59.13175964355469, -56.61266326904297, -54.093563079833984, -51.574462890625, -49.05536651611328, -46.5362663269043, -44.01716995239258, -41.498069763183594, -38.978973388671875, -36.459877014160156, -33.94077682495117, -31.421680450439453, -28.9025821685791, -26.38348388671875, -23.86438751220703, -21.345287322998047, -18.826190948486328, -16.307092666625977, -13.787994384765625, -11.268896102905273, -8.749797821044922, -6.2307000160217285, -3.711602210998535, -1.1925039291381836, 1.326594352722168, 3.845691680908203, 6.364789962768555, 8.883888244628906, 11.402986526489258, 13.92208480834961, 16.441181182861328, 18.960281372070312, 21.47937774658203, 23.998476028442383, 26.517574310302734, 29.036672592163086, 31.555770874023438, 34.074867248535156, 36.59396743774414, 39.11306381225586, 41.632164001464844, 44.15126037597656, 46.67035675048828, 49.189456939697266, 51.708553314208984, 54.22765350341797, 56.74674987792969, 59.26585006713867, 61.78494644165039, 64.30404663085938, 66.8231430053711, 69.34223937988281, 71.86133575439453, 74.38043212890625, 76.8995361328125, 79.41863250732422, 81.93772888183594, 84.45682525634766, 86.97592163085938, 89.49502563476562]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 10.0, 15.0, 12.0, 16.0, 16.0, 21.0, 31.0, 24.0, 19.0, 23.0, 36.0, 36.0, 39.0, 38.0, 49.0, 61.0, 52.0, 38.0, 49.0, 41.0, 55.0, 36.0, 30.0, 42.0, 31.0, 25.0, 18.0, 23.0, 19.0, 14.0, 15.0, 13.0, 11.0, 12.0, 10.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6796875, -8.4375, -8.1953125, -7.953125, -7.7109375, -7.46875, -7.2265625, -6.984375, -6.7421875, -6.5, -6.2578125, -6.015625, -5.7734375, -5.53125, -5.2890625, -5.046875, -4.8046875, -4.5625, -4.3203125, -4.078125, -3.8359375, -3.59375, -3.3515625, -3.109375, -2.8671875, -2.625, -2.3828125, -2.140625, -1.8984375, -1.65625, -1.4140625, -1.171875, -0.9296875, -0.6875, -0.4453125, -0.203125, 0.0390625, 0.28125, 0.5234375, 0.765625, 1.0078125, 1.25, 1.4921875, 1.734375, 1.9765625, 2.21875, 2.4609375, 2.703125, 2.9453125, 3.1875, 3.4296875, 3.671875, 3.9140625, 4.15625, 4.3984375, 4.640625, 4.8828125, 5.125, 5.3671875, 5.609375, 5.8515625, 6.09375, 6.3359375, 6.578125, 6.8203125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 7.0, 7.0, 12.0, 7.0, 12.0, 16.0, 13.0, 21.0, 27.0, 29.0, 32.0, 38.0, 60.0, 85.0, 188.0, 386.0, 1205.0, 6000.0, 47584.0, 1090346.0, 2845948.0, 184314.0, 14399.0, 2296.0, 602.0, 216.0, 108.0, 71.0, 51.0, 47.0, 20.0, 26.0, 16.0, 19.0, 15.0, 15.0, 7.0, 13.0, 8.0, 7.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-25.140625, -24.44677734375, -23.7529296875, -23.05908203125, -22.365234375, -21.67138671875, -20.9775390625, -20.28369140625, -19.58984375, -18.89599609375, -18.2021484375, -17.50830078125, -16.814453125, -16.12060546875, -15.4267578125, -14.73291015625, -14.0390625, -13.34521484375, -12.6513671875, -11.95751953125, -11.263671875, -10.56982421875, -9.8759765625, -9.18212890625, -8.48828125, -7.79443359375, -7.1005859375, -6.40673828125, -5.712890625, -5.01904296875, -4.3251953125, -3.63134765625, -2.9375, -2.24365234375, -1.5498046875, -0.85595703125, -0.162109375, 0.53173828125, 1.2255859375, 1.91943359375, 2.61328125, 3.30712890625, 4.0009765625, 4.69482421875, 5.388671875, 6.08251953125, 6.7763671875, 7.47021484375, 8.1640625, 8.85791015625, 9.5517578125, 10.24560546875, 10.939453125, 11.63330078125, 12.3271484375, 13.02099609375, 13.71484375, 14.40869140625, 15.1025390625, 15.79638671875, 16.490234375, 17.18408203125, 17.8779296875, 18.57177734375, 19.265625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 11.0, 6.0, 15.0, 21.0, 27.0, 27.0, 42.0, 80.0, 98.0, 111.0, 127.0, 174.0, 217.0, 298.0, 347.0, 410.0, 422.0, 368.0, 337.0, 236.0, 169.0, 123.0, 96.0, 90.0, 63.0, 26.0, 35.0, 26.0, 20.0, 9.0, 6.0, 9.0, 9.0, 9.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.0, -18.4864501953125, -17.972900390625, -17.4593505859375, -16.94580078125, -16.4322509765625, -15.918701171875, -15.4051513671875, -14.8916015625, -14.3780517578125, -13.864501953125, -13.3509521484375, -12.83740234375, -12.3238525390625, -11.810302734375, -11.2967529296875, -10.783203125, -10.2696533203125, -9.756103515625, -9.2425537109375, -8.72900390625, -8.2154541015625, -7.701904296875, -7.1883544921875, -6.6748046875, -6.1612548828125, -5.647705078125, -5.1341552734375, -4.62060546875, -4.1070556640625, -3.593505859375, -3.0799560546875, -2.56640625, -2.0528564453125, -1.539306640625, -1.0257568359375, -0.51220703125, 0.0013427734375, 0.514892578125, 1.0284423828125, 1.5419921875, 2.0555419921875, 2.569091796875, 3.0826416015625, 3.59619140625, 4.1097412109375, 4.623291015625, 5.1368408203125, 5.650390625, 6.1639404296875, 6.677490234375, 7.1910400390625, 7.70458984375, 8.2181396484375, 8.731689453125, 9.2452392578125, 9.7587890625, 10.2723388671875, 10.785888671875, 11.2994384765625, 11.81298828125, 12.3265380859375, 12.840087890625, 13.3536376953125, 13.8671875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 4.0, 10.0, 14.0, 21.0, 24.0, 23.0, 45.0, 35.0, 53.0, 76.0, 98.0, 163.0, 211.0, 381.0, 762.0, 4465.0, 135044.0, 3865770.0, 179856.0, 5125.0, 842.0, 381.0, 236.0, 148.0, 115.0, 82.0, 69.0, 42.0, 46.0, 33.0, 24.0, 13.0, 11.0, 7.0, 7.0, 16.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.90625, -54.13330078125, -52.3603515625, -50.58740234375, -48.814453125, -47.04150390625, -45.2685546875, -43.49560546875, -41.72265625, -39.94970703125, -38.1767578125, -36.40380859375, -34.630859375, -32.85791015625, -31.0849609375, -29.31201171875, -27.5390625, -25.76611328125, -23.9931640625, -22.22021484375, -20.447265625, -18.67431640625, -16.9013671875, -15.12841796875, -13.35546875, -11.58251953125, -9.8095703125, -8.03662109375, -6.263671875, -4.49072265625, -2.7177734375, -0.94482421875, 0.828125, 2.60107421875, 4.3740234375, 6.14697265625, 7.919921875, 9.69287109375, 11.4658203125, 13.23876953125, 15.01171875, 16.78466796875, 18.5576171875, 20.33056640625, 22.103515625, 23.87646484375, 25.6494140625, 27.42236328125, 29.1953125, 30.96826171875, 32.7412109375, 34.51416015625, 36.287109375, 38.06005859375, 39.8330078125, 41.60595703125, 43.37890625, 45.15185546875, 46.9248046875, 48.69775390625, 50.470703125, 52.24365234375, 54.0166015625, 55.78955078125, 57.5625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 9.0, 21.0, 32.0, 65.0, 81.0, 127.0, 143.0, 127.0, 129.0, 103.0, 74.0, 30.0, 22.0, 21.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.46642303466797, -32.75718688964844, -30.047954559326172, -27.338720321655273, -24.629486083984375, -21.920251846313477, -19.211017608642578, -16.50178337097168, -13.792549133300781, -11.083314895629883, -8.374080657958984, -5.664846420288086, -2.9556121826171875, -0.24637794494628906, 2.4628562927246094, 5.172090530395508, 7.881324768066406, 10.590559005737305, 13.299793243408203, 16.0090274810791, 18.71826171875, 21.4274959564209, 24.136730194091797, 26.845964431762695, 29.555198669433594, 32.264434814453125, 34.97366714477539, 37.682899475097656, 40.39213562011719, 43.10137176513672, 45.810604095458984, 48.51983642578125, 51.22906494140625, 53.93830108642578, 56.64753341674805, 59.35676574707031, 62.066001892089844, 64.77523803710938, 67.48446655273438, 70.1937026977539, 72.90293884277344, 75.61217498779297, 78.3214111328125, 81.0306396484375, 83.73987579345703, 86.44911193847656, 89.15834045410156, 91.8675765991211, 94.57681274414062, 97.28604888916016, 99.99528503417969, 102.70451354980469, 105.41374969482422, 108.12298583984375, 110.83221435546875, 113.54145050048828, 116.25068664550781, 118.95992279052734, 121.66915893554688, 124.37838745117188, 127.0876235961914, 129.79685974121094, 132.50608825683594, 135.21533203125, 137.924560546875]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 3.0, 3.0, 12.0, 9.0, 12.0, 13.0, 11.0, 19.0, 17.0, 11.0, 18.0, 18.0, 19.0, 28.0, 25.0, 38.0, 35.0, 40.0, 41.0, 40.0, 34.0, 45.0, 42.0, 44.0, 32.0, 35.0, 41.0, 40.0, 37.0, 30.0, 34.0, 33.0, 23.0, 23.0, 20.0, 13.0, 16.0, 10.0, 6.0, 6.0, 7.0, 6.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.507137298583984, -51.64177322387695, -49.77641296386719, -47.911048889160156, -46.045684814453125, -44.180320739746094, -42.31495666503906, -40.4495964050293, -38.584232330322266, -36.718868255615234, -34.85350799560547, -32.98814392089844, -31.122779846191406, -29.257415771484375, -27.392053604125977, -25.526691436767578, -23.661327362060547, -21.795963287353516, -19.930601119995117, -18.06523895263672, -16.199874877929688, -14.334511756896973, -12.469148635864258, -10.603785514831543, -8.738422393798828, -6.873059272766113, -5.007696151733398, -3.1423330307006836, -1.2769699096679688, 0.5883932113647461, 2.453756332397461, 4.319119453430176, 6.184478759765625, 8.04984188079834, 9.915205001831055, 11.78056812286377, 13.645931243896484, 15.5112943649292, 17.376657485961914, 19.242019653320312, 21.107383728027344, 22.972747802734375, 24.838109970092773, 26.703472137451172, 28.568836212158203, 30.434200286865234, 32.299560546875, 34.16492462158203, 36.03028869628906, 37.895652770996094, 39.761016845703125, 41.62637710571289, 43.49174118041992, 45.35710525512695, 47.22246551513672, 49.08782958984375, 50.95319366455078, 52.81855773925781, 54.683921813964844, 56.54928207397461, 58.41464614868164, 60.28001022338867, 62.14537048339844, 64.01073455810547, 65.8760986328125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 8.0, 11.0, 13.0, 19.0, 7.0, 18.0, 17.0, 17.0, 25.0, 27.0, 36.0, 32.0, 42.0, 42.0, 41.0, 52.0, 50.0, 48.0, 56.0, 46.0, 46.0, 52.0, 33.0, 33.0, 44.0, 29.0, 23.0, 19.0, 29.0, 17.0, 10.0, 14.0, 8.0, 16.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0546875, -8.7996826171875, -8.544677734375, -8.2896728515625, -8.03466796875, -7.7796630859375, -7.524658203125, -7.2696533203125, -7.0146484375, -6.7596435546875, -6.504638671875, -6.2496337890625, -5.99462890625, -5.7396240234375, -5.484619140625, -5.2296142578125, -4.974609375, -4.7196044921875, -4.464599609375, -4.2095947265625, -3.95458984375, -3.6995849609375, -3.444580078125, -3.1895751953125, -2.9345703125, -2.6795654296875, -2.424560546875, -2.1695556640625, -1.91455078125, -1.6595458984375, -1.404541015625, -1.1495361328125, -0.89453125, -0.6395263671875, -0.384521484375, -0.1295166015625, 0.12548828125, 0.3804931640625, 0.635498046875, 0.8905029296875, 1.1455078125, 1.4005126953125, 1.655517578125, 1.9105224609375, 2.16552734375, 2.4205322265625, 2.675537109375, 2.9305419921875, 3.185546875, 3.4405517578125, 3.695556640625, 3.9505615234375, 4.20556640625, 4.4605712890625, 4.715576171875, 4.9705810546875, 5.2255859375, 5.4805908203125, 5.735595703125, 5.9906005859375, 6.24560546875, 6.5006103515625, 6.755615234375, 7.0106201171875, 7.265625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 5.0, 9.0, 12.0, 9.0, 29.0, 36.0, 50.0, 78.0, 127.0, 169.0, 252.0, 373.0, 592.0, 938.0, 1552.0, 2823.0, 4715.0, 7784.0, 12150.0, 20798.0, 36177.0, 63750.0, 123448.0, 358420.0, 204683.0, 90564.0, 48796.0, 28231.0, 16629.0, 9947.0, 6202.0, 3733.0, 2126.0, 1251.0, 750.0, 431.0, 319.0, 208.0, 148.0, 72.0, 56.0, 36.0, 18.0, 12.0, 15.0, 8.0, 6.0, 6.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.876953125, -1.8196868896484375, -1.762420654296875, -1.7051544189453125, -1.64788818359375, -1.5906219482421875, -1.533355712890625, -1.4760894775390625, -1.4188232421875, -1.3615570068359375, -1.304290771484375, -1.2470245361328125, -1.18975830078125, -1.1324920654296875, -1.075225830078125, -1.0179595947265625, -0.960693359375, -0.9034271240234375, -0.846160888671875, -0.7888946533203125, -0.73162841796875, -0.6743621826171875, -0.617095947265625, -0.5598297119140625, -0.5025634765625, -0.4452972412109375, -0.388031005859375, -0.3307647705078125, -0.27349853515625, -0.2162322998046875, -0.158966064453125, -0.1016998291015625, -0.04443359375, 0.0128326416015625, 0.070098876953125, 0.1273651123046875, 0.18463134765625, 0.2418975830078125, 0.299163818359375, 0.3564300537109375, 0.4136962890625, 0.4709625244140625, 0.528228759765625, 0.5854949951171875, 0.64276123046875, 0.7000274658203125, 0.757293701171875, 0.8145599365234375, 0.871826171875, 0.9290924072265625, 0.986358642578125, 1.0436248779296875, 1.10089111328125, 1.1581573486328125, 1.215423583984375, 1.2726898193359375, 1.3299560546875, 1.3872222900390625, 1.444488525390625, 1.5017547607421875, 1.55902099609375, 1.6162872314453125, 1.673553466796875, 1.7308197021484375, 1.7880859375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 9.0, 14.0, 10.0, 14.0, 13.0, 15.0, 22.0, 24.0, 25.0, 20.0, 21.0, 29.0, 36.0, 39.0, 27.0, 42.0, 31.0, 48.0, 1055.0, 39.0, 33.0, 41.0, 42.0, 32.0, 17.0, 33.0, 36.0, 30.0, 25.0, 26.0, 26.0, 10.0, 23.0, 15.0, 17.0, 15.0, 11.0, 9.0, 8.0, 5.0, 6.0, 6.0, 1.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.30859375, -4.18035888671875, -4.0521240234375, -3.92388916015625, -3.795654296875, -3.66741943359375, -3.5391845703125, -3.41094970703125, -3.28271484375, -3.15447998046875, -3.0262451171875, -2.89801025390625, -2.769775390625, -2.64154052734375, -2.5133056640625, -2.38507080078125, -2.2568359375, -2.12860107421875, -2.0003662109375, -1.87213134765625, -1.743896484375, -1.61566162109375, -1.4874267578125, -1.35919189453125, -1.23095703125, -1.10272216796875, -0.9744873046875, -0.84625244140625, -0.718017578125, -0.58978271484375, -0.4615478515625, -0.33331298828125, -0.205078125, -0.07684326171875, 0.0513916015625, 0.17962646484375, 0.307861328125, 0.43609619140625, 0.5643310546875, 0.69256591796875, 0.82080078125, 0.94903564453125, 1.0772705078125, 1.20550537109375, 1.333740234375, 1.46197509765625, 1.5902099609375, 1.71844482421875, 1.8466796875, 1.97491455078125, 2.1031494140625, 2.23138427734375, 2.359619140625, 2.48785400390625, 2.6160888671875, 2.74432373046875, 2.87255859375, 3.00079345703125, 3.1290283203125, 3.25726318359375, 3.385498046875, 3.51373291015625, 3.6419677734375, 3.77020263671875, 3.8984375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 6.0, 13.0, 14.0, 19.0, 31.0, 54.0, 103.0, 132.0, 229.0, 344.0, 582.0, 834.0, 1346.0, 2055.0, 3193.0, 4899.0, 7459.0, 11496.0, 17988.0, 28092.0, 44378.0, 74265.0, 142722.0, 1388674.0, 158620.0, 80208.0, 47075.0, 29504.0, 18580.0, 11920.0, 7793.0, 5045.0, 3330.0, 2192.0, 1423.0, 912.0, 579.0, 370.0, 227.0, 151.0, 101.0, 60.0, 41.0, 28.0, 17.0, 6.0, 12.0, 2.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.5029296875, -1.4581451416015625, -1.413360595703125, -1.3685760498046875, -1.32379150390625, -1.2790069580078125, -1.234222412109375, -1.1894378662109375, -1.1446533203125, -1.0998687744140625, -1.055084228515625, -1.0102996826171875, -0.96551513671875, -0.9207305908203125, -0.875946044921875, -0.8311614990234375, -0.786376953125, -0.7415924072265625, -0.696807861328125, -0.6520233154296875, -0.60723876953125, -0.5624542236328125, -0.517669677734375, -0.4728851318359375, -0.4281005859375, -0.3833160400390625, -0.338531494140625, -0.2937469482421875, -0.24896240234375, -0.2041778564453125, -0.159393310546875, -0.1146087646484375, -0.06982421875, -0.0250396728515625, 0.019744873046875, 0.0645294189453125, 0.10931396484375, 0.1540985107421875, 0.198883056640625, 0.2436676025390625, 0.2884521484375, 0.3332366943359375, 0.378021240234375, 0.4228057861328125, 0.46759033203125, 0.5123748779296875, 0.557159423828125, 0.6019439697265625, 0.646728515625, 0.6915130615234375, 0.736297607421875, 0.7810821533203125, 0.82586669921875, 0.8706512451171875, 0.915435791015625, 0.9602203369140625, 1.0050048828125, 1.0497894287109375, 1.094573974609375, 1.1393585205078125, 1.18414306640625, 1.2289276123046875, 1.273712158203125, 1.3184967041015625, 1.36328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 11.0, 19.0, 26.0, 29.0, 41.0, 61.0, 85.0, 132.0, 164.0, 115.0, 72.0, 53.0, 40.0, 36.0, 18.0, 12.0, 13.0, 13.0, 5.0, 5.0, 5.0, 6.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013446807861328125, -0.0013044029474258423, -0.001264125108718872, -0.0012238472700119019, -0.0011835694313049316, -0.0011432915925979614, -0.0011030137538909912, -0.001062735915184021, -0.0010224580764770508, -0.0009821802377700806, -0.0009419023990631104, -0.0009016245603561401, -0.0008613467216491699, -0.0008210688829421997, -0.0007807910442352295, -0.0007405132055282593, -0.0007002353668212891, -0.0006599575281143188, -0.0006196796894073486, -0.0005794018507003784, -0.0005391240119934082, -0.000498846173286438, -0.0004585683345794678, -0.00041829049587249756, -0.00037801265716552734, -0.00033773481845855713, -0.0002974569797515869, -0.0002571791410446167, -0.00021690130233764648, -0.00017662346363067627, -0.00013634562492370605, -9.606778621673584e-05, -5.5789947509765625e-05, -1.551210880279541e-05, 2.4765729904174805e-05, 6.504356861114502e-05, 0.00010532140731811523, 0.00014559924602508545, 0.00018587708473205566, 0.00022615492343902588, 0.0002664327621459961, 0.0003067106008529663, 0.0003469884395599365, 0.00038726627826690674, 0.00042754411697387695, 0.00046782195568084717, 0.0005080997943878174, 0.0005483776330947876, 0.0005886554718017578, 0.000628933310508728, 0.0006692111492156982, 0.0007094889879226685, 0.0007497668266296387, 0.0007900446653366089, 0.0008303225040435791, 0.0008706003427505493, 0.0009108781814575195, 0.0009511560201644897, 0.00099143385887146, 0.0010317116975784302, 0.0010719895362854004, 0.0011122673749923706, 0.0011525452136993408, 0.001192823052406311, 0.0012331008911132812]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 3.0, 4.0, 5.0, 7.0, 7.0, 6.0, 9.0, 16.0, 17.0, 17.0, 36.0, 60.0, 75.0, 136.0, 261.0, 625.0, 26861.0, 1018202.0, 1345.0, 357.0, 176.0, 100.0, 68.0, 46.0, 31.0, 17.0, 16.0, 9.0, 7.0, 7.0, 4.0, 4.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0228424072265625, -0.02208709716796875, -0.021331787109375, -0.02057647705078125, -0.0198211669921875, -0.01906585693359375, -0.018310546875, -0.01755523681640625, -0.0167999267578125, -0.01604461669921875, -0.015289306640625, -0.01453399658203125, -0.0137786865234375, -0.01302337646484375, -0.01226806640625, -0.01151275634765625, -0.0107574462890625, -0.01000213623046875, -0.009246826171875, -0.00849151611328125, -0.0077362060546875, -0.00698089599609375, -0.0062255859375, -0.00547027587890625, -0.0047149658203125, -0.00395965576171875, -0.003204345703125, -0.00244903564453125, -0.0016937255859375, -0.00093841552734375, -0.00018310546875, 0.00057220458984375, 0.0013275146484375, 0.00208282470703125, 0.002838134765625, 0.00359344482421875, 0.0043487548828125, 0.00510406494140625, 0.005859375, 0.00661468505859375, 0.0073699951171875, 0.00812530517578125, 0.008880615234375, 0.00963592529296875, 0.0103912353515625, 0.01114654541015625, 0.01190185546875, 0.01265716552734375, 0.0134124755859375, 0.01416778564453125, 0.014923095703125, 0.01567840576171875, 0.0164337158203125, 0.01718902587890625, 0.0179443359375, 0.01869964599609375, 0.0194549560546875, 0.02021026611328125, 0.020965576171875, 0.02172088623046875, 0.0224761962890625, 0.02323150634765625, 0.02398681640625, 0.02474212646484375, 0.0254974365234375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 56.0, 149.0, 312.0, 316.0, 128.0, 37.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008222717442549765, -0.0007787694339640439, -0.0007352670654654503, -0.0006917647551745176, -0.0006482623866759241, -0.0006047600763849914, -0.0005612577078863978, -0.0005177553975954652, -0.00047425305820070207, -0.00043075071880593896, -0.00038724837941117585, -0.00034374604001641273, -0.0003002437297254801, -0.0002567413612268865, -0.00021323905093595386, -0.00016973671154119074, -0.00012623437214642763, -8.273203275166452e-05, -3.922970063285902e-05, 4.2726314859464765e-06, 4.777497088070959e-05, 9.12773102754727e-05, 0.00013477963511832058, 0.0001782819745130837, 0.0002217843139078468, 0.0002652866533026099, 0.00030878899269737303, 0.00035229133209213614, 0.0003957936423830688, 0.00043929601088166237, 0.000482798321172595, 0.0005263006314635277, 0.0005698030581697822, 0.0006133053684607148, 0.0006568077369593084, 0.000700310047250241, 0.0007438124157488346, 0.0007873147260397673, 0.0008308170363306999, 0.0008743194048292935, 0.0009178217733278871, 0.0009613240836188197, 0.0010048263939097524, 0.0010483288206160069, 0.0010918311309069395, 0.0011353334411978722, 0.0011788357514888048, 0.0012223380617797375, 0.0012658403720706701, 0.0013093426823616028, 0.0013528449926525354, 0.00139634741935879, 0.0014398497296497226, 0.0014833520399406552, 0.0015268543502315879, 0.0015703567769378424, 0.001613859087228775, 0.0016573613975197077, 0.0017008637078106403, 0.0017443661345168948, 0.0017878684448078275, 0.0018313707550987601, 0.0018748730653896928, 0.0019183754920959473, 0.00196187780238688]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 9.0, 5.0, 6.0, 11.0, 19.0, 15.0, 14.0, 18.0, 15.0, 23.0, 21.0, 40.0, 34.0, 36.0, 40.0, 35.0, 56.0, 38.0, 46.0, 45.0, 48.0, 39.0, 40.0, 32.0, 34.0, 25.0, 29.0, 30.0, 25.0, 24.0, 18.0, 31.0, 22.0, 11.0, 11.0, 9.0, 7.0, 20.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041043758392333984, -0.00039662234485149384, -0.00038280710577964783, -0.0003689918667078018, -0.0003551766276359558, -0.0003413613885641098, -0.0003275461494922638, -0.0003137309104204178, -0.0002999156713485718, -0.00028610043227672577, -0.00027228519320487976, -0.00025846995413303375, -0.00024465471506118774, -0.00023083947598934174, -0.00021702423691749573, -0.00020320899784564972, -0.0001893937587738037, -0.0001755785197019577, -0.0001617632806301117, -0.00014794804155826569, -0.00013413280248641968, -0.00012031756341457367, -0.00010650232434272766, -9.268708527088165e-05, -7.887184619903564e-05, -6.505660712718964e-05, -5.124136805534363e-05, -3.742612898349762e-05, -2.361088991165161e-05, -9.795650839805603e-06, 4.019588232040405e-06, 1.7834827303886414e-05, 3.165006637573242e-05, 4.546530544757843e-05, 5.928054451942444e-05, 7.309578359127045e-05, 8.691102266311646e-05, 0.00010072626173496246, 0.00011454150080680847, 0.00012835673987865448, 0.0001421719789505005, 0.0001559872180223465, 0.0001698024570941925, 0.0001836176961660385, 0.00019743293523788452, 0.00021124817430973053, 0.00022506341338157654, 0.00023887865245342255, 0.00025269389152526855, 0.00026650913059711456, 0.00028032436966896057, 0.0002941396087408066, 0.0003079548478126526, 0.0003217700868844986, 0.0003355853259563446, 0.0003494005650281906, 0.0003632158041000366, 0.00037703104317188263, 0.00039084628224372864, 0.00040466152131557465, 0.00041847676038742065, 0.00043229199945926666, 0.00044610723853111267, 0.0004599224776029587, 0.0004737377166748047]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 8.0, 11.0, 13.0, 19.0, 7.0, 18.0, 17.0, 17.0, 25.0, 27.0, 36.0, 32.0, 42.0, 42.0, 41.0, 52.0, 50.0, 48.0, 56.0, 46.0, 46.0, 52.0, 33.0, 33.0, 44.0, 29.0, 23.0, 19.0, 29.0, 17.0, 10.0, 14.0, 8.0, 16.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0546875, -8.7996826171875, -8.544677734375, -8.2896728515625, -8.03466796875, -7.7796630859375, -7.524658203125, -7.2696533203125, -7.0146484375, -6.7596435546875, -6.504638671875, -6.2496337890625, -5.99462890625, -5.7396240234375, -5.484619140625, -5.2296142578125, -4.974609375, -4.7196044921875, -4.464599609375, -4.2095947265625, -3.95458984375, -3.6995849609375, -3.444580078125, -3.1895751953125, -2.9345703125, -2.6795654296875, -2.424560546875, -2.1695556640625, -1.91455078125, -1.6595458984375, -1.404541015625, -1.1495361328125, -0.89453125, -0.6395263671875, -0.384521484375, -0.1295166015625, 0.12548828125, 0.3804931640625, 0.635498046875, 0.8905029296875, 1.1455078125, 1.4005126953125, 1.655517578125, 1.9105224609375, 2.16552734375, 2.4205322265625, 2.675537109375, 2.9305419921875, 3.185546875, 3.4405517578125, 3.695556640625, 3.9505615234375, 4.20556640625, 4.4605712890625, 4.715576171875, 4.9705810546875, 5.2255859375, 5.4805908203125, 5.735595703125, 5.9906005859375, 6.24560546875, 6.5006103515625, 6.755615234375, 7.0106201171875, 7.265625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 12.0, 15.0, 19.0, 32.0, 54.0, 70.0, 139.0, 225.0, 365.0, 543.0, 857.0, 1368.0, 2258.0, 3794.0, 6635.0, 12583.0, 30914.0, 116304.0, 577680.0, 212069.0, 45988.0, 16806.0, 8094.0, 4630.0, 2711.0, 1654.0, 1044.0, 613.0, 425.0, 225.0, 137.0, 99.0, 59.0, 48.0, 25.0, 16.0, 14.0, 18.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.77734375, -6.556396484375, -6.33544921875, -6.114501953125, -5.8935546875, -5.672607421875, -5.45166015625, -5.230712890625, -5.009765625, -4.788818359375, -4.56787109375, -4.346923828125, -4.1259765625, -3.905029296875, -3.68408203125, -3.463134765625, -3.2421875, -3.021240234375, -2.80029296875, -2.579345703125, -2.3583984375, -2.137451171875, -1.91650390625, -1.695556640625, -1.474609375, -1.253662109375, -1.03271484375, -0.811767578125, -0.5908203125, -0.369873046875, -0.14892578125, 0.072021484375, 0.29296875, 0.513916015625, 0.73486328125, 0.955810546875, 1.1767578125, 1.397705078125, 1.61865234375, 1.839599609375, 2.060546875, 2.281494140625, 2.50244140625, 2.723388671875, 2.9443359375, 3.165283203125, 3.38623046875, 3.607177734375, 3.828125, 4.049072265625, 4.27001953125, 4.490966796875, 4.7119140625, 4.932861328125, 5.15380859375, 5.374755859375, 5.595703125, 5.816650390625, 6.03759765625, 6.258544921875, 6.4794921875, 6.700439453125, 6.92138671875, 7.142333984375, 7.36328125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 5.0, 10.0, 13.0, 11.0, 14.0, 20.0, 27.0, 31.0, 31.0, 37.0, 60.0, 57.0, 48.0, 61.0, 145.0, 1797.0, 205.0, 66.0, 58.0, 43.0, 52.0, 37.0, 39.0, 39.0, 29.0, 25.0, 22.0, 13.0, 9.0, 6.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.546875, -29.580810546875, -28.61474609375, -27.648681640625, -26.6826171875, -25.716552734375, -24.75048828125, -23.784423828125, -22.818359375, -21.852294921875, -20.88623046875, -19.920166015625, -18.9541015625, -17.988037109375, -17.02197265625, -16.055908203125, -15.08984375, -14.123779296875, -13.15771484375, -12.191650390625, -11.2255859375, -10.259521484375, -9.29345703125, -8.327392578125, -7.361328125, -6.395263671875, -5.42919921875, -4.463134765625, -3.4970703125, -2.531005859375, -1.56494140625, -0.598876953125, 0.3671875, 1.333251953125, 2.29931640625, 3.265380859375, 4.2314453125, 5.197509765625, 6.16357421875, 7.129638671875, 8.095703125, 9.061767578125, 10.02783203125, 10.993896484375, 11.9599609375, 12.926025390625, 13.89208984375, 14.858154296875, 15.82421875, 16.790283203125, 17.75634765625, 18.722412109375, 19.6884765625, 20.654541015625, 21.62060546875, 22.586669921875, 23.552734375, 24.518798828125, 25.48486328125, 26.450927734375, 27.4169921875, 28.383056640625, 29.34912109375, 30.315185546875, 31.28125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 1.0, 3.0, 9.0, 5.0, 9.0, 9.0, 12.0, 19.0, 18.0, 29.0, 36.0, 48.0, 59.0, 79.0, 102.0, 218.0, 325.0, 636.0, 4004.0, 783229.0, 2350341.0, 4837.0, 668.0, 304.0, 202.0, 138.0, 87.0, 55.0, 49.0, 36.0, 30.0, 16.0, 20.0, 9.0, 15.0, 9.0, 8.0, 9.0, 5.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.46875, -53.78955078125, -52.1103515625, -50.43115234375, -48.751953125, -47.07275390625, -45.3935546875, -43.71435546875, -42.03515625, -40.35595703125, -38.6767578125, -36.99755859375, -35.318359375, -33.63916015625, -31.9599609375, -30.28076171875, -28.6015625, -26.92236328125, -25.2431640625, -23.56396484375, -21.884765625, -20.20556640625, -18.5263671875, -16.84716796875, -15.16796875, -13.48876953125, -11.8095703125, -10.13037109375, -8.451171875, -6.77197265625, -5.0927734375, -3.41357421875, -1.734375, -0.05517578125, 1.6240234375, 3.30322265625, 4.982421875, 6.66162109375, 8.3408203125, 10.02001953125, 11.69921875, 13.37841796875, 15.0576171875, 16.73681640625, 18.416015625, 20.09521484375, 21.7744140625, 23.45361328125, 25.1328125, 26.81201171875, 28.4912109375, 30.17041015625, 31.849609375, 33.52880859375, 35.2080078125, 36.88720703125, 38.56640625, 40.24560546875, 41.9248046875, 43.60400390625, 45.283203125, 46.96240234375, 48.6416015625, 50.32080078125, 52.0]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [224.0, 796.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8457670211792, -2.088886260986328, 8.667994499206543, 19.42487335205078, 30.18175506591797, 40.938636779785156, 51.69551467895508, 62.452396392822266, 73.20928192138672, 83.9661636352539, 94.7230453491211, 105.47991943359375, 116.23680114746094, 126.99368286132812, 137.7505645751953, 148.5074462890625, 159.2643280029297, 170.02120971679688, 180.77809143066406, 191.53497314453125, 202.29185485839844, 213.04873657226562, 223.80560302734375, 234.5625, 245.31936645507812, 256.07623291015625, 266.8331298828125, 277.5899963378906, 288.3468933105469, 299.103759765625, 309.86065673828125, 320.6175231933594, 331.3744201660156, 342.13128662109375, 352.88818359375, 363.6450500488281, 374.4019470214844, 385.1588134765625, 395.91571044921875, 406.6725769042969, 417.4294738769531, 428.18634033203125, 438.9432373046875, 449.7001037597656, 460.4570007324219, 471.2138671875, 481.97076416015625, 492.7276306152344, 503.4844970703125, 514.2413940429688, 524.9982299804688, 535.755126953125, 546.5120239257812, 557.2689208984375, 568.0257568359375, 578.7826538085938, 589.53955078125, 600.2964477539062, 611.0532836914062, 621.8101806640625, 632.5670776367188, 643.323974609375, 654.080810546875, 664.8377075195312, 675.5946044921875]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 7.0, 8.0, 8.0, 14.0, 8.0, 9.0, 14.0, 27.0, 26.0, 19.0, 20.0, 28.0, 34.0, 28.0, 35.0, 40.0, 32.0, 38.0, 45.0, 44.0, 42.0, 36.0, 32.0, 36.0, 41.0, 27.0, 33.0, 46.0, 32.0, 21.0, 22.0, 17.0, 26.0, 12.0, 10.0, 16.0, 8.0, 12.0, 10.0, 11.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-75.22618103027344, -72.8869400024414, -70.54769134521484, -68.20845031738281, -65.86920928955078, -63.529964447021484, -61.19071960449219, -58.851478576660156, -56.51223373413086, -54.17298889160156, -51.83374786376953, -49.494503021240234, -47.15525817871094, -44.816017150878906, -42.47677230834961, -40.13752746582031, -37.79828643798828, -35.459041595458984, -33.11980056762695, -30.780555725097656, -28.441312789916992, -26.102069854736328, -23.76282501220703, -21.423582077026367, -19.084339141845703, -16.74509620666504, -14.405852317810059, -12.066608428955078, -9.727365493774414, -7.38812255859375, -5.0488786697387695, -2.709634780883789, -0.37039947509765625, 1.968843936920166, 4.308087348937988, 6.6473307609558105, 8.986574172973633, 11.325817108154297, 13.665060997009277, 16.004304885864258, 18.343547821044922, 20.682790756225586, 23.02203369140625, 25.361278533935547, 27.70052146911621, 30.039764404296875, 32.37900924682617, 34.71825408935547, 37.0574951171875, 39.3967399597168, 41.73598098754883, 44.075225830078125, 46.414466857910156, 48.75371170043945, 51.09295654296875, 53.43219757080078, 55.77144241333008, 58.110687255859375, 60.449928283691406, 62.7891731262207, 65.12841796875, 67.46765899658203, 69.80690002441406, 72.14614868164062, 74.48538970947266]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 3.0, 4.0, 14.0, 14.0, 16.0, 12.0, 13.0, 15.0, 24.0, 19.0, 29.0, 32.0, 32.0, 41.0, 36.0, 43.0, 47.0, 43.0, 49.0, 43.0, 60.0, 41.0, 43.0, 44.0, 41.0, 31.0, 30.0, 29.0, 24.0, 21.0, 19.0, 18.0, 21.0, 6.0, 10.0, 6.0, 11.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.265625, -9.0142822265625, -8.762939453125, -8.5115966796875, -8.26025390625, -8.0089111328125, -7.757568359375, -7.5062255859375, -7.2548828125, -7.0035400390625, -6.752197265625, -6.5008544921875, -6.24951171875, -5.9981689453125, -5.746826171875, -5.4954833984375, -5.244140625, -4.9927978515625, -4.741455078125, -4.4901123046875, -4.23876953125, -3.9874267578125, -3.736083984375, -3.4847412109375, -3.2333984375, -2.9820556640625, -2.730712890625, -2.4793701171875, -2.22802734375, -1.9766845703125, -1.725341796875, -1.4739990234375, -1.22265625, -0.9713134765625, -0.719970703125, -0.4686279296875, -0.21728515625, 0.0340576171875, 0.285400390625, 0.5367431640625, 0.7880859375, 1.0394287109375, 1.290771484375, 1.5421142578125, 1.79345703125, 2.0447998046875, 2.296142578125, 2.5474853515625, 2.798828125, 3.0501708984375, 3.301513671875, 3.5528564453125, 3.80419921875, 4.0555419921875, 4.306884765625, 4.5582275390625, 4.8095703125, 5.0609130859375, 5.312255859375, 5.5635986328125, 5.81494140625, 6.0662841796875, 6.317626953125, 6.5689697265625, 6.8203125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 7.0, 5.0, 4.0, 10.0, 18.0, 21.0, 36.0, 36.0, 45.0, 70.0, 97.0, 123.0, 184.0, 315.0, 480.0, 856.0, 1596.0, 3098.0, 6613.0, 14881.0, 37300.0, 115209.0, 432411.0, 1213381.0, 1431430.0, 653372.0, 188037.0, 56045.0, 21296.0, 8583.0, 4016.0, 1965.0, 1104.0, 616.0, 357.0, 199.0, 142.0, 88.0, 78.0, 47.0, 38.0, 21.0, 15.0, 14.0, 8.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7734375, -8.5167236328125, -8.260009765625, -8.0032958984375, -7.74658203125, -7.4898681640625, -7.233154296875, -6.9764404296875, -6.7197265625, -6.4630126953125, -6.206298828125, -5.9495849609375, -5.69287109375, -5.4361572265625, -5.179443359375, -4.9227294921875, -4.666015625, -4.4093017578125, -4.152587890625, -3.8958740234375, -3.63916015625, -3.3824462890625, -3.125732421875, -2.8690185546875, -2.6123046875, -2.3555908203125, -2.098876953125, -1.8421630859375, -1.58544921875, -1.3287353515625, -1.072021484375, -0.8153076171875, -0.55859375, -0.3018798828125, -0.045166015625, 0.2115478515625, 0.46826171875, 0.7249755859375, 0.981689453125, 1.2384033203125, 1.4951171875, 1.7518310546875, 2.008544921875, 2.2652587890625, 2.52197265625, 2.7786865234375, 3.035400390625, 3.2921142578125, 3.548828125, 3.8055419921875, 4.062255859375, 4.3189697265625, 4.57568359375, 4.8323974609375, 5.089111328125, 5.3458251953125, 5.6025390625, 5.8592529296875, 6.115966796875, 6.3726806640625, 6.62939453125, 6.8861083984375, 7.142822265625, 7.3995361328125, 7.65625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 8.0, 9.0, 10.0, 19.0, 18.0, 16.0, 27.0, 38.0, 50.0, 57.0, 83.0, 138.0, 125.0, 192.0, 224.0, 329.0, 372.0, 401.0, 426.0, 340.0, 276.0, 218.0, 158.0, 122.0, 85.0, 81.0, 51.0, 44.0, 40.0, 29.0, 22.0, 23.0, 12.0, 8.0, 7.0, 3.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-18.1875, -17.690673828125, -17.19384765625, -16.697021484375, -16.2001953125, -15.703369140625, -15.20654296875, -14.709716796875, -14.212890625, -13.716064453125, -13.21923828125, -12.722412109375, -12.2255859375, -11.728759765625, -11.23193359375, -10.735107421875, -10.23828125, -9.741455078125, -9.24462890625, -8.747802734375, -8.2509765625, -7.754150390625, -7.25732421875, -6.760498046875, -6.263671875, -5.766845703125, -5.27001953125, -4.773193359375, -4.2763671875, -3.779541015625, -3.28271484375, -2.785888671875, -2.2890625, -1.792236328125, -1.29541015625, -0.798583984375, -0.3017578125, 0.195068359375, 0.69189453125, 1.188720703125, 1.685546875, 2.182373046875, 2.67919921875, 3.176025390625, 3.6728515625, 4.169677734375, 4.66650390625, 5.163330078125, 5.66015625, 6.156982421875, 6.65380859375, 7.150634765625, 7.6474609375, 8.144287109375, 8.64111328125, 9.137939453125, 9.634765625, 10.131591796875, 10.62841796875, 11.125244140625, 11.6220703125, 12.118896484375, 12.61572265625, 13.112548828125, 13.609375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 13.0, 7.0, 12.0, 9.0, 9.0, 18.0, 29.0, 31.0, 41.0, 66.0, 84.0, 103.0, 174.0, 284.0, 585.0, 2420.0, 139680.0, 3991696.0, 56220.0, 1657.0, 394.0, 240.0, 140.0, 91.0, 73.0, 58.0, 39.0, 27.0, 25.0, 10.0, 12.0, 15.0, 6.0, 5.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.9375, -71.724609375, -69.51171875, -67.298828125, -65.0859375, -62.873046875, -60.66015625, -58.447265625, -56.234375, -54.021484375, -51.80859375, -49.595703125, -47.3828125, -45.169921875, -42.95703125, -40.744140625, -38.53125, -36.318359375, -34.10546875, -31.892578125, -29.6796875, -27.466796875, -25.25390625, -23.041015625, -20.828125, -18.615234375, -16.40234375, -14.189453125, -11.9765625, -9.763671875, -7.55078125, -5.337890625, -3.125, -0.912109375, 1.30078125, 3.513671875, 5.7265625, 7.939453125, 10.15234375, 12.365234375, 14.578125, 16.791015625, 19.00390625, 21.216796875, 23.4296875, 25.642578125, 27.85546875, 30.068359375, 32.28125, 34.494140625, 36.70703125, 38.919921875, 41.1328125, 43.345703125, 45.55859375, 47.771484375, 49.984375, 52.197265625, 54.41015625, 56.623046875, 58.8359375, 61.048828125, 63.26171875, 65.474609375, 67.6875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 125.0, 410.0, 383.0, 82.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-404.25421142578125, -394.1183166503906, -383.982421875, -373.84649658203125, -363.7106018066406, -353.57470703125, -343.43878173828125, -333.3028869628906, -323.1669921875, -313.0310974121094, -302.89520263671875, -292.75927734375, -282.6233825683594, -272.48748779296875, -262.3515625, -252.21566772460938, -242.07977294921875, -231.94387817382812, -221.80796813964844, -211.67205810546875, -201.53616333007812, -191.4002685546875, -181.2643585205078, -171.12844848632812, -160.9925537109375, -150.85665893554688, -140.7207489013672, -130.5848388671875, -120.44894409179688, -110.31304168701172, -100.17713928222656, -90.0412368774414, -79.90534973144531, -69.76944732666016, -59.633544921875, -49.497642517089844, -39.36174011230469, -29.22583770751953, -19.089935302734375, -8.954032897949219, 1.1818695068359375, 11.317771911621094, 21.45367431640625, 31.589576721191406, 41.72547912597656, 51.86138153076172, 61.997283935546875, 72.13318634033203, 82.26908874511719, 92.40499114990234, 102.5408935546875, 112.67679595947266, 122.81269836425781, 132.9486083984375, 143.08450317382812, 153.22039794921875, 163.35630798339844, 173.49221801757812, 183.62811279296875, 193.76400756835938, 203.89991760253906, 214.03582763671875, 224.17172241210938, 234.3076171875, 244.4435272216797]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 5.0, 3.0, 7.0, 8.0, 7.0, 19.0, 21.0, 17.0, 21.0, 15.0, 22.0, 26.0, 27.0, 32.0, 21.0, 37.0, 37.0, 40.0, 45.0, 58.0, 45.0, 54.0, 47.0, 41.0, 37.0, 34.0, 31.0, 38.0, 22.0, 26.0, 20.0, 16.0, 22.0, 17.0, 18.0, 10.0, 13.0, 7.0, 5.0, 11.0, 5.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-65.22952270507812, -63.26201248168945, -61.29450607299805, -59.326995849609375, -57.35948944091797, -55.3919792175293, -53.424468994140625, -51.45696258544922, -49.48945236206055, -47.521942138671875, -45.55443572998047, -43.5869255065918, -41.619415283203125, -39.65190887451172, -37.68439865112305, -35.716888427734375, -33.74938201904297, -31.78187370300293, -29.81436538696289, -27.84685516357422, -25.87934684753418, -23.91183853149414, -21.94432830810547, -19.97681999206543, -18.00931167602539, -16.04180335998535, -14.074294090270996, -12.10678482055664, -10.139276504516602, -8.171768188476562, -6.204258918762207, -4.236749649047852, -2.269245147705078, -0.30173635482788086, 1.6657724380493164, 3.6332812309265137, 5.600790023803711, 7.56829833984375, 9.535807609558105, 11.503316879272461, 13.4708251953125, 15.438333511352539, 17.405841827392578, 19.37335205078125, 21.34086036682129, 23.308368682861328, 25.27587890625, 27.24338722229004, 29.210895538330078, 31.178403854370117, 33.145912170410156, 35.11342239379883, 37.0809326171875, 39.048439025878906, 41.01594924926758, 42.98345947265625, 44.950965881347656, 46.91847610473633, 48.885982513427734, 50.853492736816406, 52.82099914550781, 54.788509368896484, 56.756019592285156, 58.72352600097656, 60.691036224365234]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 2.0, 2.0, 20.0, 9.0, 15.0, 17.0, 22.0, 24.0, 24.0, 36.0, 24.0, 32.0, 32.0, 36.0, 48.0, 49.0, 43.0, 57.0, 52.0, 54.0, 46.0, 39.0, 37.0, 41.0, 38.0, 30.0, 28.0, 19.0, 25.0, 20.0, 20.0, 20.0, 6.0, 5.0, 8.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.640625, -9.371337890625, -9.10205078125, -8.832763671875, -8.5634765625, -8.294189453125, -8.02490234375, -7.755615234375, -7.486328125, -7.217041015625, -6.94775390625, -6.678466796875, -6.4091796875, -6.139892578125, -5.87060546875, -5.601318359375, -5.33203125, -5.062744140625, -4.79345703125, -4.524169921875, -4.2548828125, -3.985595703125, -3.71630859375, -3.447021484375, -3.177734375, -2.908447265625, -2.63916015625, -2.369873046875, -2.1005859375, -1.831298828125, -1.56201171875, -1.292724609375, -1.0234375, -0.754150390625, -0.48486328125, -0.215576171875, 0.0537109375, 0.322998046875, 0.59228515625, 0.861572265625, 1.130859375, 1.400146484375, 1.66943359375, 1.938720703125, 2.2080078125, 2.477294921875, 2.74658203125, 3.015869140625, 3.28515625, 3.554443359375, 3.82373046875, 4.093017578125, 4.3623046875, 4.631591796875, 4.90087890625, 5.170166015625, 5.439453125, 5.708740234375, 5.97802734375, 6.247314453125, 6.5166015625, 6.785888671875, 7.05517578125, 7.324462890625, 7.59375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 16.0, 18.0, 15.0, 34.0, 43.0, 57.0, 119.0, 175.0, 202.0, 357.0, 558.0, 950.0, 1422.0, 2366.0, 3841.0, 6596.0, 11038.0, 18891.0, 32396.0, 57789.0, 114325.0, 337809.0, 243039.0, 95974.0, 50350.0, 28641.0, 16730.0, 9897.0, 5755.0, 3540.0, 2078.0, 1228.0, 883.0, 493.0, 322.0, 177.0, 143.0, 103.0, 62.0, 35.0, 24.0, 16.0, 14.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.0625, -2.0016326904296875, -1.940765380859375, -1.8798980712890625, -1.81903076171875, -1.7581634521484375, -1.697296142578125, -1.6364288330078125, -1.5755615234375, -1.5146942138671875, -1.453826904296875, -1.3929595947265625, -1.33209228515625, -1.2712249755859375, -1.210357666015625, -1.1494903564453125, -1.088623046875, -1.0277557373046875, -0.966888427734375, -0.9060211181640625, -0.84515380859375, -0.7842864990234375, -0.723419189453125, -0.6625518798828125, -0.6016845703125, -0.5408172607421875, -0.479949951171875, -0.4190826416015625, -0.35821533203125, -0.2973480224609375, -0.236480712890625, -0.1756134033203125, -0.11474609375, -0.0538787841796875, 0.006988525390625, 0.0678558349609375, 0.12872314453125, 0.1895904541015625, 0.250457763671875, 0.3113250732421875, 0.3721923828125, 0.4330596923828125, 0.493927001953125, 0.5547943115234375, 0.61566162109375, 0.6765289306640625, 0.737396240234375, 0.7982635498046875, 0.859130859375, 0.9199981689453125, 0.980865478515625, 1.0417327880859375, 1.10260009765625, 1.1634674072265625, 1.224334716796875, 1.2852020263671875, 1.3460693359375, 1.4069366455078125, 1.467803955078125, 1.5286712646484375, 1.58953857421875, 1.6504058837890625, 1.711273193359375, 1.7721405029296875, 1.8330078125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 8.0, 7.0, 5.0, 5.0, 6.0, 5.0, 12.0, 16.0, 18.0, 19.0, 13.0, 21.0, 24.0, 34.0, 36.0, 20.0, 31.0, 45.0, 37.0, 46.0, 56.0, 1093.0, 46.0, 37.0, 50.0, 27.0, 41.0, 32.0, 31.0, 28.0, 34.0, 24.0, 17.0, 24.0, 11.0, 20.0, 19.0, 8.0, 6.0, 3.0, 5.0, 5.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.73651123046875, -4.5784912109375, -4.42047119140625, -4.262451171875, -4.10443115234375, -3.9464111328125, -3.78839111328125, -3.63037109375, -3.47235107421875, -3.3143310546875, -3.15631103515625, -2.998291015625, -2.84027099609375, -2.6822509765625, -2.52423095703125, -2.3662109375, -2.20819091796875, -2.0501708984375, -1.89215087890625, -1.734130859375, -1.57611083984375, -1.4180908203125, -1.26007080078125, -1.10205078125, -0.94403076171875, -0.7860107421875, -0.62799072265625, -0.469970703125, -0.31195068359375, -0.1539306640625, 0.00408935546875, 0.162109375, 0.32012939453125, 0.4781494140625, 0.63616943359375, 0.794189453125, 0.95220947265625, 1.1102294921875, 1.26824951171875, 1.42626953125, 1.58428955078125, 1.7423095703125, 1.90032958984375, 2.058349609375, 2.21636962890625, 2.3743896484375, 2.53240966796875, 2.6904296875, 2.84844970703125, 3.0064697265625, 3.16448974609375, 3.322509765625, 3.48052978515625, 3.6385498046875, 3.79656982421875, 3.95458984375, 4.11260986328125, 4.2706298828125, 4.42864990234375, 4.586669921875, 4.74468994140625, 4.9027099609375, 5.06072998046875, 5.21875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 11.0, 14.0, 22.0, 32.0, 58.0, 77.0, 138.0, 240.0, 356.0, 618.0, 968.0, 1581.0, 2434.0, 4115.0, 6380.0, 10655.0, 17724.0, 29846.0, 51122.0, 95705.0, 259550.0, 1374713.0, 104980.0, 55286.0, 31503.0, 18923.0, 11538.0, 7044.0, 4416.0, 2684.0, 1649.0, 1040.0, 650.0, 413.0, 250.0, 162.0, 91.0, 45.0, 38.0, 22.0, 12.0, 7.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7216796875, -1.666259765625, -1.61083984375, -1.555419921875, -1.5, -1.444580078125, -1.38916015625, -1.333740234375, -1.2783203125, -1.222900390625, -1.16748046875, -1.112060546875, -1.056640625, -1.001220703125, -0.94580078125, -0.890380859375, -0.8349609375, -0.779541015625, -0.72412109375, -0.668701171875, -0.61328125, -0.557861328125, -0.50244140625, -0.447021484375, -0.3916015625, -0.336181640625, -0.28076171875, -0.225341796875, -0.169921875, -0.114501953125, -0.05908203125, -0.003662109375, 0.0517578125, 0.107177734375, 0.16259765625, 0.218017578125, 0.2734375, 0.328857421875, 0.38427734375, 0.439697265625, 0.4951171875, 0.550537109375, 0.60595703125, 0.661376953125, 0.716796875, 0.772216796875, 0.82763671875, 0.883056640625, 0.9384765625, 0.993896484375, 1.04931640625, 1.104736328125, 1.16015625, 1.215576171875, 1.27099609375, 1.326416015625, 1.3818359375, 1.437255859375, 1.49267578125, 1.548095703125, 1.603515625, 1.658935546875, 1.71435546875, 1.769775390625, 1.8251953125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 13.0, 10.0, 18.0, 18.0, 25.0, 52.0, 71.0, 122.0, 174.0, 170.0, 105.0, 63.0, 35.0, 27.0, 27.0, 10.0, 12.0, 8.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.0017185211181640625, -0.0016783997416496277, -0.0016382783651351929, -0.001598156988620758, -0.0015580356121063232, -0.0015179142355918884, -0.0014777928590774536, -0.0014376714825630188, -0.001397550106048584, -0.0013574287295341492, -0.0013173073530197144, -0.0012771859765052795, -0.0012370645999908447, -0.00119694322347641, -0.001156821846961975, -0.0011167004704475403, -0.0010765790939331055, -0.0010364577174186707, -0.0009963363409042358, -0.000956214964389801, -0.0009160935878753662, -0.0008759722113609314, -0.0008358508348464966, -0.0007957294583320618, -0.000755608081817627, -0.0007154867053031921, -0.0006753653287887573, -0.0006352439522743225, -0.0005951225757598877, -0.0005550011992454529, -0.0005148798227310181, -0.00047475844621658325, -0.00043463706970214844, -0.0003945156931877136, -0.0003543943166732788, -0.000314272940158844, -0.0002741515636444092, -0.00023403018712997437, -0.00019390881061553955, -0.00015378743410110474, -0.00011366605758666992, -7.354468107223511e-05, -3.342330455780029e-05, 6.6980719566345215e-06, 4.6819448471069336e-05, 8.694082498550415e-05, 0.00012706220149993896, 0.00016718357801437378, 0.0002073049545288086, 0.0002474263310432434, 0.0002875477075576782, 0.00032766908407211304, 0.00036779046058654785, 0.00040791183710098267, 0.0004480332136154175, 0.0004881545901298523, 0.0005282759666442871, 0.0005683973431587219, 0.0006085187196731567, 0.0006486400961875916, 0.0006887614727020264, 0.0007288828492164612, 0.000769004225730896, 0.0008091256022453308, 0.0008492469787597656]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 10.0, 15.0, 23.0, 40.0, 71.0, 142.0, 365.0, 6065.0, 1040254.0, 1047.0, 235.0, 121.0, 58.0, 35.0, 17.0, 15.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0238494873046875, -0.02273106575012207, -0.02161264419555664, -0.02049422264099121, -0.01937580108642578, -0.01825737953186035, -0.017138957977294922, -0.016020536422729492, -0.014902114868164062, -0.013783693313598633, -0.012665271759033203, -0.011546850204467773, -0.010428428649902344, -0.009310007095336914, -0.008191585540771484, -0.007073163986206055, -0.005954742431640625, -0.004836320877075195, -0.0037178993225097656, -0.002599477767944336, -0.0014810562133789062, -0.00036263465881347656, 0.0007557868957519531, 0.0018742084503173828, 0.0029926300048828125, 0.004111051559448242, 0.005229473114013672, 0.0063478946685791016, 0.007466316223144531, 0.008584737777709961, 0.00970315933227539, 0.01082158088684082, 0.01194000244140625, 0.01305842399597168, 0.01417684555053711, 0.015295267105102539, 0.01641368865966797, 0.0175321102142334, 0.018650531768798828, 0.019768953323364258, 0.020887374877929688, 0.022005796432495117, 0.023124217987060547, 0.024242639541625977, 0.025361061096191406, 0.026479482650756836, 0.027597904205322266, 0.028716325759887695, 0.029834747314453125, 0.030953168869018555, 0.032071590423583984, 0.033190011978149414, 0.034308433532714844, 0.03542685508728027, 0.0365452766418457, 0.03766369819641113, 0.03878211975097656, 0.03990054130554199, 0.04101896286010742, 0.04213738441467285, 0.04325580596923828, 0.04437422752380371, 0.04549264907836914, 0.04661107063293457, 0.0477294921875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 166.0, 794.0, 55.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014830208383500576, -0.0013401660835370421, -0.0011973113287240267, -0.0010544565739110112, -0.0009116018190979958, -0.0007687470642849803, -0.0006258923094719648, -0.0004830375546589494, -0.0003401827998459339, -0.00019732804503291845, -5.447329021990299e-05, 8.838146459311247e-05, 0.00023123621940612793, 0.0003740909742191434, 0.0005169457290321589, 0.0006598004838451743, 0.0008026552386581898, 0.0009455099934712052, 0.0010883647482842207, 0.0012312195030972362, 0.0013740742579102516, 0.001516929012723267, 0.0016597837675362825, 0.001802638522349298, 0.0019454932771623135, 0.002088347915560007, 0.0022312027867883444, 0.0023740576580166817, 0.0025169122964143753, 0.002659766934812069, 0.0028026218060404062, 0.0029454766772687435, 0.0030883317813277245, 0.003231186419725418, 0.0033740412909537554, 0.0035168961621820927, 0.0036597508005797863, 0.00380260543897748, 0.003945460543036461, 0.0040883151814341545, 0.004231169819831848, 0.004374024458229542, 0.004516879096627235, 0.004659734200686216, 0.00480258883908391, 0.004945443477481604, 0.0050882985815405846, 0.005231153219938278, 0.005374007858335972, 0.0055168624967336655, 0.005659717135131359, 0.00580257223919034, 0.005945426877588034, 0.006088281515985727, 0.006231136620044708, 0.006373991258442402, 0.0065168458968400955, 0.006659700535237789, 0.006802555173635483, 0.006945410277694464, 0.007088264916092157, 0.007231119554489851, 0.007373974658548832, 0.007516829296946526, 0.007659683935344219]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 4.0, 7.0, 3.0, 9.0, 5.0, 9.0, 9.0, 10.0, 22.0, 15.0, 16.0, 16.0, 29.0, 36.0, 25.0, 20.0, 27.0, 27.0, 39.0, 37.0, 36.0, 42.0, 36.0, 46.0, 38.0, 41.0, 32.0, 36.0, 39.0, 27.0, 31.0, 35.0, 29.0, 18.0, 26.0, 13.0, 16.0, 11.0, 18.0, 19.0, 7.0, 6.0, 5.0, 5.0, 4.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.000371396541595459, -0.0003599422052502632, -0.00034848786890506744, -0.0003370335325598717, -0.0003255791962146759, -0.00031412485986948013, -0.00030267052352428436, -0.0002912161871790886, -0.0002797618508338928, -0.00026830751448869705, -0.0002568531781435013, -0.0002453988417983055, -0.00023394450545310974, -0.00022249016910791397, -0.0002110358327627182, -0.00019958149641752243, -0.00018812716007232666, -0.0001766728237271309, -0.00016521848738193512, -0.00015376415103673935, -0.00014230981469154358, -0.0001308554783463478, -0.00011940114200115204, -0.00010794680565595627, -9.64924693107605e-05, -8.503813296556473e-05, -7.358379662036896e-05, -6.212946027517319e-05, -5.067512392997742e-05, -3.922078758478165e-05, -2.7766451239585876e-05, -1.6312114894390106e-05, -4.857778549194336e-06, 6.596557796001434e-06, 1.8050894141197205e-05, 2.9505230486392975e-05, 4.0959566831588745e-05, 5.2413903176784515e-05, 6.386823952198029e-05, 7.532257586717606e-05, 8.677691221237183e-05, 9.82312485575676e-05, 0.00010968558490276337, 0.00012113992124795914, 0.0001325942575931549, 0.00014404859393835068, 0.00015550293028354645, 0.00016695726662874222, 0.000178411602973938, 0.00018986593931913376, 0.00020132027566432953, 0.0002127746120095253, 0.00022422894835472107, 0.00023568328469991684, 0.0002471376210451126, 0.0002585919573903084, 0.00027004629373550415, 0.0002815006300806999, 0.0002929549664258957, 0.00030440930277109146, 0.00031586363911628723, 0.000327317975461483, 0.00033877231180667877, 0.00035022664815187454, 0.0003616809844970703]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 2.0, 2.0, 20.0, 9.0, 15.0, 17.0, 22.0, 24.0, 24.0, 36.0, 24.0, 32.0, 32.0, 36.0, 48.0, 49.0, 43.0, 57.0, 52.0, 54.0, 46.0, 39.0, 37.0, 41.0, 38.0, 30.0, 28.0, 19.0, 25.0, 20.0, 20.0, 20.0, 6.0, 5.0, 8.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.640625, -9.371337890625, -9.10205078125, -8.832763671875, -8.5634765625, -8.294189453125, -8.02490234375, -7.755615234375, -7.486328125, -7.217041015625, -6.94775390625, -6.678466796875, -6.4091796875, -6.139892578125, -5.87060546875, -5.601318359375, -5.33203125, -5.062744140625, -4.79345703125, -4.524169921875, -4.2548828125, -3.985595703125, -3.71630859375, -3.447021484375, -3.177734375, -2.908447265625, -2.63916015625, -2.369873046875, -2.1005859375, -1.831298828125, -1.56201171875, -1.292724609375, -1.0234375, -0.754150390625, -0.48486328125, -0.215576171875, 0.0537109375, 0.322998046875, 0.59228515625, 0.861572265625, 1.130859375, 1.400146484375, 1.66943359375, 1.938720703125, 2.2080078125, 2.477294921875, 2.74658203125, 3.015869140625, 3.28515625, 3.554443359375, 3.82373046875, 4.093017578125, 4.3623046875, 4.631591796875, 4.90087890625, 5.170166015625, 5.439453125, 5.708740234375, 5.97802734375, 6.247314453125, 6.5166015625, 6.785888671875, 7.05517578125, 7.324462890625, 7.59375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 8.0, 19.0, 19.0, 24.0, 43.0, 72.0, 83.0, 127.0, 183.0, 328.0, 459.0, 794.0, 1415.0, 2581.0, 5179.0, 12004.0, 31910.0, 102741.0, 422847.0, 338739.0, 82008.0, 26299.0, 10428.0, 4663.0, 2358.0, 1284.0, 709.0, 434.0, 287.0, 145.0, 113.0, 78.0, 47.0, 36.0, 25.0, 16.0, 11.0, 12.0, 13.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.4296875, -6.2554931640625, -6.081298828125, -5.9071044921875, -5.73291015625, -5.5587158203125, -5.384521484375, -5.2103271484375, -5.0361328125, -4.8619384765625, -4.687744140625, -4.5135498046875, -4.33935546875, -4.1651611328125, -3.990966796875, -3.8167724609375, -3.642578125, -3.4683837890625, -3.294189453125, -3.1199951171875, -2.94580078125, -2.7716064453125, -2.597412109375, -2.4232177734375, -2.2490234375, -2.0748291015625, -1.900634765625, -1.7264404296875, -1.55224609375, -1.3780517578125, -1.203857421875, -1.0296630859375, -0.85546875, -0.6812744140625, -0.507080078125, -0.3328857421875, -0.15869140625, 0.0155029296875, 0.189697265625, 0.3638916015625, 0.5380859375, 0.7122802734375, 0.886474609375, 1.0606689453125, 1.23486328125, 1.4090576171875, 1.583251953125, 1.7574462890625, 1.931640625, 2.1058349609375, 2.280029296875, 2.4542236328125, 2.62841796875, 2.8026123046875, 2.976806640625, 3.1510009765625, 3.3251953125, 3.4993896484375, 3.673583984375, 3.8477783203125, 4.02197265625, 4.1961669921875, 4.370361328125, 4.5445556640625, 4.71875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 7.0, 10.0, 18.0, 17.0, 19.0, 19.0, 20.0, 40.0, 23.0, 27.0, 29.0, 44.0, 52.0, 54.0, 97.0, 428.0, 1530.0, 108.0, 61.0, 51.0, 45.0, 45.0, 43.0, 42.0, 40.0, 24.0, 28.0, 16.0, 11.0, 13.0, 14.0, 14.0, 18.0, 4.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.734375, -25.8740234375, -25.013671875, -24.1533203125, -23.29296875, -22.4326171875, -21.572265625, -20.7119140625, -19.8515625, -18.9912109375, -18.130859375, -17.2705078125, -16.41015625, -15.5498046875, -14.689453125, -13.8291015625, -12.96875, -12.1083984375, -11.248046875, -10.3876953125, -9.52734375, -8.6669921875, -7.806640625, -6.9462890625, -6.0859375, -5.2255859375, -4.365234375, -3.5048828125, -2.64453125, -1.7841796875, -0.923828125, -0.0634765625, 0.796875, 1.6572265625, 2.517578125, 3.3779296875, 4.23828125, 5.0986328125, 5.958984375, 6.8193359375, 7.6796875, 8.5400390625, 9.400390625, 10.2607421875, 11.12109375, 11.9814453125, 12.841796875, 13.7021484375, 14.5625, 15.4228515625, 16.283203125, 17.1435546875, 18.00390625, 18.8642578125, 19.724609375, 20.5849609375, 21.4453125, 22.3056640625, 23.166015625, 24.0263671875, 24.88671875, 25.7470703125, 26.607421875, 27.4677734375, 28.328125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 7.0, 10.0, 14.0, 17.0, 16.0, 23.0, 17.0, 25.0, 34.0, 51.0, 96.0, 107.0, 128.0, 190.0, 330.0, 554.0, 1839.0, 31445.0, 3092658.0, 15314.0, 1432.0, 479.0, 287.0, 179.0, 104.0, 79.0, 56.0, 41.0, 27.0, 26.0, 27.0, 22.0, 15.0, 11.0, 6.0, 8.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.5, -54.75732421875, -53.0146484375, -51.27197265625, -49.529296875, -47.78662109375, -46.0439453125, -44.30126953125, -42.55859375, -40.81591796875, -39.0732421875, -37.33056640625, -35.587890625, -33.84521484375, -32.1025390625, -30.35986328125, -28.6171875, -26.87451171875, -25.1318359375, -23.38916015625, -21.646484375, -19.90380859375, -18.1611328125, -16.41845703125, -14.67578125, -12.93310546875, -11.1904296875, -9.44775390625, -7.705078125, -5.96240234375, -4.2197265625, -2.47705078125, -0.734375, 1.00830078125, 2.7509765625, 4.49365234375, 6.236328125, 7.97900390625, 9.7216796875, 11.46435546875, 13.20703125, 14.94970703125, 16.6923828125, 18.43505859375, 20.177734375, 21.92041015625, 23.6630859375, 25.40576171875, 27.1484375, 28.89111328125, 30.6337890625, 32.37646484375, 34.119140625, 35.86181640625, 37.6044921875, 39.34716796875, 41.08984375, 42.83251953125, 44.5751953125, 46.31787109375, 48.060546875, 49.80322265625, 51.5458984375, 53.28857421875, 55.03125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [2.0, 4.0, 911.0, 105.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.955711364746094, -23.05750274658203, -10.159292221069336, 2.7389183044433594, 15.637126922607422, 28.53533935546875, 41.43354797363281, 54.331756591796875, 67.22996520996094, 80.128173828125, 93.02638244628906, 105.92459106445312, 118.82279968261719, 131.72100830078125, 144.61923217773438, 157.51742553710938, 170.4156494140625, 183.31385803222656, 196.21206665039062, 209.1102752685547, 222.00848388671875, 234.90670776367188, 247.80490112304688, 260.703125, 273.601318359375, 286.4995422363281, 299.3977355957031, 312.29595947265625, 325.19415283203125, 338.0923767089844, 350.9905700683594, 363.8887939453125, 376.7870178222656, 389.68524169921875, 402.58343505859375, 415.4816589355469, 428.3798522949219, 441.278076171875, 454.17626953125, 467.0744934082031, 479.9726867675781, 492.87091064453125, 505.76910400390625, 518.6672973632812, 531.5655517578125, 544.4637451171875, 557.3619384765625, 570.2601318359375, 583.1583862304688, 596.0565795898438, 608.954833984375, 621.85302734375, 634.751220703125, 647.6494140625, 660.5476684570312, 673.4458618164062, 686.3440551757812, 699.2422485351562, 712.1405029296875, 725.0386962890625, 737.9368896484375, 750.8350830078125, 763.7333374023438, 776.6315307617188, 789.5297241210938]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 9.0, 8.0, 8.0, 6.0, 19.0, 10.0, 15.0, 19.0, 24.0, 26.0, 23.0, 25.0, 37.0, 25.0, 33.0, 26.0, 32.0, 41.0, 38.0, 38.0, 49.0, 37.0, 46.0, 42.0, 47.0, 34.0, 32.0, 27.0, 20.0, 26.0, 19.0, 14.0, 18.0, 19.0, 15.0, 16.0, 14.0, 12.0, 10.0, 10.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-60.701507568359375, -58.80759048461914, -56.91366958618164, -55.019752502441406, -53.12583541870117, -51.23191833496094, -49.33799743652344, -47.4440803527832, -45.55016326904297, -43.656246185302734, -41.762325286865234, -39.868408203125, -37.974491119384766, -36.08057403564453, -34.18665313720703, -32.2927360534668, -30.398815155029297, -28.50489616394043, -26.610979080200195, -24.717060089111328, -22.823143005371094, -20.929224014282227, -19.03530502319336, -17.141387939453125, -15.247468948364258, -13.353550910949707, -11.459632873535156, -9.565713882446289, -7.671795845031738, -5.7778778076171875, -3.8839588165283203, -1.9900407791137695, -0.09612274169921875, 1.7977955341339111, 3.691713809967041, 5.58563232421875, 7.479550361633301, 9.373468399047852, 11.267387390136719, 13.16130542755127, 15.05522346496582, 16.949142456054688, 18.843059539794922, 20.73697853088379, 22.630897521972656, 24.52481460571289, 26.418733596801758, 28.312652587890625, 30.20656967163086, 32.100486755371094, 33.994407653808594, 35.88832473754883, 37.78224182128906, 39.67616271972656, 41.5700798034668, 43.46399688720703, 45.35791778564453, 47.251834869384766, 49.145755767822266, 51.0396728515625, 52.933589935302734, 54.82750701904297, 56.72142791748047, 58.6153450012207, 60.50926208496094]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 8.0, 9.0, 11.0, 10.0, 18.0, 15.0, 26.0, 36.0, 28.0, 20.0, 30.0, 31.0, 34.0, 36.0, 54.0, 41.0, 55.0, 49.0, 47.0, 54.0, 48.0, 36.0, 37.0, 40.0, 38.0, 25.0, 22.0, 24.0, 23.0, 18.0, 16.0, 17.0, 9.0, 11.0, 5.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.453125, -9.18597412109375, -8.9188232421875, -8.65167236328125, -8.384521484375, -8.11737060546875, -7.8502197265625, -7.58306884765625, -7.31591796875, -7.04876708984375, -6.7816162109375, -6.51446533203125, -6.247314453125, -5.98016357421875, -5.7130126953125, -5.44586181640625, -5.1787109375, -4.91156005859375, -4.6444091796875, -4.37725830078125, -4.110107421875, -3.84295654296875, -3.5758056640625, -3.30865478515625, -3.04150390625, -2.77435302734375, -2.5072021484375, -2.24005126953125, -1.972900390625, -1.70574951171875, -1.4385986328125, -1.17144775390625, -0.904296875, -0.63714599609375, -0.3699951171875, -0.10284423828125, 0.164306640625, 0.43145751953125, 0.6986083984375, 0.96575927734375, 1.23291015625, 1.50006103515625, 1.7672119140625, 2.03436279296875, 2.301513671875, 2.56866455078125, 2.8358154296875, 3.10296630859375, 3.3701171875, 3.63726806640625, 3.9044189453125, 4.17156982421875, 4.438720703125, 4.70587158203125, 4.9730224609375, 5.24017333984375, 5.50732421875, 5.77447509765625, 6.0416259765625, 6.30877685546875, 6.575927734375, 6.84307861328125, 7.1102294921875, 7.37738037109375, 7.64453125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 2.0, 7.0, 5.0, 23.0, 14.0, 19.0, 14.0, 23.0, 29.0, 30.0, 36.0, 51.0, 61.0, 110.0, 188.0, 480.0, 4397.0, 296822.0, 3837481.0, 51786.0, 1820.0, 318.0, 160.0, 84.0, 62.0, 50.0, 25.0, 31.0, 22.0, 19.0, 17.0, 17.0, 15.0, 16.0, 12.0, 9.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.8125, -44.478515625, -43.14453125, -41.810546875, -40.4765625, -39.142578125, -37.80859375, -36.474609375, -35.140625, -33.806640625, -32.47265625, -31.138671875, -29.8046875, -28.470703125, -27.13671875, -25.802734375, -24.46875, -23.134765625, -21.80078125, -20.466796875, -19.1328125, -17.798828125, -16.46484375, -15.130859375, -13.796875, -12.462890625, -11.12890625, -9.794921875, -8.4609375, -7.126953125, -5.79296875, -4.458984375, -3.125, -1.791015625, -0.45703125, 0.876953125, 2.2109375, 3.544921875, 4.87890625, 6.212890625, 7.546875, 8.880859375, 10.21484375, 11.548828125, 12.8828125, 14.216796875, 15.55078125, 16.884765625, 18.21875, 19.552734375, 20.88671875, 22.220703125, 23.5546875, 24.888671875, 26.22265625, 27.556640625, 28.890625, 30.224609375, 31.55859375, 32.892578125, 34.2265625, 35.560546875, 36.89453125, 38.228515625, 39.5625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 10.0, 6.0, 18.0, 13.0, 35.0, 47.0, 58.0, 93.0, 142.0, 233.0, 349.0, 507.0, 631.0, 602.0, 434.0, 307.0, 196.0, 154.0, 81.0, 59.0, 31.0, 26.0, 21.0, 9.0, 10.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.59375, -13.894287109375, -13.19482421875, -12.495361328125, -11.7958984375, -11.096435546875, -10.39697265625, -9.697509765625, -8.998046875, -8.298583984375, -7.59912109375, -6.899658203125, -6.2001953125, -5.500732421875, -4.80126953125, -4.101806640625, -3.40234375, -2.702880859375, -2.00341796875, -1.303955078125, -0.6044921875, 0.094970703125, 0.79443359375, 1.493896484375, 2.193359375, 2.892822265625, 3.59228515625, 4.291748046875, 4.9912109375, 5.690673828125, 6.39013671875, 7.089599609375, 7.7890625, 8.488525390625, 9.18798828125, 9.887451171875, 10.5869140625, 11.286376953125, 11.98583984375, 12.685302734375, 13.384765625, 14.084228515625, 14.78369140625, 15.483154296875, 16.1826171875, 16.882080078125, 17.58154296875, 18.281005859375, 18.98046875, 19.679931640625, 20.37939453125, 21.078857421875, 21.7783203125, 22.477783203125, 23.17724609375, 23.876708984375, 24.576171875, 25.275634765625, 25.97509765625, 26.674560546875, 27.3740234375, 28.073486328125, 28.77294921875, 29.472412109375, 30.171875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 15.0, 12.0, 29.0, 22.0, 50.0, 63.0, 99.0, 141.0, 202.0, 351.0, 634.0, 3377.0, 1576296.0, 2607100.0, 4154.0, 740.0, 343.0, 209.0, 128.0, 97.0, 56.0, 51.0, 25.0, 26.0, 17.0, 9.0, 9.0, 8.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-111.0625, -108.2880859375, -105.513671875, -102.7392578125, -99.96484375, -97.1904296875, -94.416015625, -91.6416015625, -88.8671875, -86.0927734375, -83.318359375, -80.5439453125, -77.76953125, -74.9951171875, -72.220703125, -69.4462890625, -66.671875, -63.8974609375, -61.123046875, -58.3486328125, -55.57421875, -52.7998046875, -50.025390625, -47.2509765625, -44.4765625, -41.7021484375, -38.927734375, -36.1533203125, -33.37890625, -30.6044921875, -27.830078125, -25.0556640625, -22.28125, -19.5068359375, -16.732421875, -13.9580078125, -11.18359375, -8.4091796875, -5.634765625, -2.8603515625, -0.0859375, 2.6884765625, 5.462890625, 8.2373046875, 11.01171875, 13.7861328125, 16.560546875, 19.3349609375, 22.109375, 24.8837890625, 27.658203125, 30.4326171875, 33.20703125, 35.9814453125, 38.755859375, 41.5302734375, 44.3046875, 47.0791015625, 49.853515625, 52.6279296875, 55.40234375, 58.1767578125, 60.951171875, 63.7255859375, 66.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 22.0, 163.0, 377.0, 352.0, 79.0, 20.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-331.5423889160156, -323.2313232421875, -314.92022705078125, -306.6091613769531, -298.298095703125, -289.98699951171875, -281.6759338378906, -273.3648376464844, -265.05377197265625, -256.7427062988281, -248.43161010742188, -240.12054443359375, -231.80946350097656, -223.49838256835938, -215.18731689453125, -206.87623596191406, -198.56515502929688, -190.2540740966797, -181.9429931640625, -173.63192749023438, -165.3208465576172, -157.009765625, -148.69869995117188, -140.3876190185547, -132.0765380859375, -123.76545715332031, -115.45438385009766, -107.143310546875, -98.83222961425781, -90.52114868164062, -82.21007537841797, -73.89900207519531, -65.587890625, -57.27681350708008, -48.965736389160156, -40.654659271240234, -32.34358215332031, -24.03250503540039, -15.721427917480469, -7.410350799560547, 0.900726318359375, 9.211803436279297, 17.52288055419922, 25.83395767211914, 34.14503479003906, 42.456111907958984, 50.767189025878906, 59.07826614379883, 67.38934326171875, 75.70042419433594, 84.0114974975586, 92.32257080078125, 100.63365173339844, 108.94473266601562, 117.25580596923828, 125.56687927246094, 133.87796020507812, 142.1890411376953, 150.5001220703125, 158.81118774414062, 167.1222686767578, 175.433349609375, 183.74441528320312, 192.0554962158203, 200.3665771484375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 6.0, 10.0, 12.0, 13.0, 22.0, 16.0, 17.0, 15.0, 30.0, 24.0, 41.0, 45.0, 37.0, 46.0, 56.0, 45.0, 49.0, 45.0, 54.0, 36.0, 38.0, 49.0, 27.0, 35.0, 33.0, 32.0, 33.0, 22.0, 16.0, 12.0, 12.0, 13.0, 16.0, 9.0, 9.0, 3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.607322692871094, -54.67772674560547, -52.748130798339844, -50.81853485107422, -48.888938903808594, -46.95934295654297, -45.029747009277344, -43.10015106201172, -41.170555114746094, -39.24095916748047, -37.311363220214844, -35.38176727294922, -33.452171325683594, -31.52257537841797, -29.592979431152344, -27.66338348388672, -25.733789443969727, -23.8041934967041, -21.874597549438477, -19.94500160217285, -18.015405654907227, -16.085811614990234, -14.156214714050293, -12.226618766784668, -10.297022819519043, -8.367426872253418, -6.437830924987793, -4.508235454559326, -2.578639507293701, -0.6490440368652344, 1.2805519104003906, 3.2101478576660156, 5.139743804931641, 7.069339752197266, 8.99893569946289, 10.928531646728516, 12.85812759399414, 14.78772258758545, 16.71731948852539, 18.646915435791016, 20.57651138305664, 22.506107330322266, 24.43570327758789, 26.365299224853516, 28.29489517211914, 30.224491119384766, 32.15408706665039, 34.083683013916016, 36.013275146484375, 37.94287109375, 39.872467041015625, 41.80206298828125, 43.731658935546875, 45.6612548828125, 47.590850830078125, 49.52044677734375, 51.450042724609375, 53.379638671875, 55.309234619140625, 57.23883056640625, 59.168426513671875, 61.0980224609375, 63.027618408203125, 64.95721435546875, 66.88681030273438]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 8.0, 5.0, 13.0, 22.0, 19.0, 34.0, 19.0, 46.0, 30.0, 36.0, 35.0, 38.0, 52.0, 36.0, 45.0, 45.0, 60.0, 45.0, 59.0, 40.0, 41.0, 38.0, 25.0, 36.0, 35.0, 24.0, 15.0, 17.0, 16.0, 9.0, 10.0, 7.0, 7.0, 6.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -9.01904296875, -8.7412109375, -8.46337890625, -8.185546875, -7.90771484375, -7.6298828125, -7.35205078125, -7.07421875, -6.79638671875, -6.5185546875, -6.24072265625, -5.962890625, -5.68505859375, -5.4072265625, -5.12939453125, -4.8515625, -4.57373046875, -4.2958984375, -4.01806640625, -3.740234375, -3.46240234375, -3.1845703125, -2.90673828125, -2.62890625, -2.35107421875, -2.0732421875, -1.79541015625, -1.517578125, -1.23974609375, -0.9619140625, -0.68408203125, -0.40625, -0.12841796875, 0.1494140625, 0.42724609375, 0.705078125, 0.98291015625, 1.2607421875, 1.53857421875, 1.81640625, 2.09423828125, 2.3720703125, 2.64990234375, 2.927734375, 3.20556640625, 3.4833984375, 3.76123046875, 4.0390625, 4.31689453125, 4.5947265625, 4.87255859375, 5.150390625, 5.42822265625, 5.7060546875, 5.98388671875, 6.26171875, 6.53955078125, 6.8173828125, 7.09521484375, 7.373046875, 7.65087890625, 7.9287109375, 8.20654296875, 8.484375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 10.0, 12.0, 22.0, 26.0, 40.0, 64.0, 77.0, 135.0, 194.0, 307.0, 465.0, 692.0, 1045.0, 1586.0, 2444.0, 3903.0, 6157.0, 9619.0, 15792.0, 25654.0, 42765.0, 75198.0, 149078.0, 346878.0, 166017.0, 81562.0, 45870.0, 27659.0, 16755.0, 10348.0, 6406.0, 4195.0, 2611.0, 1734.0, 1087.0, 717.0, 484.0, 328.0, 206.0, 121.0, 92.0, 55.0, 44.0, 28.0, 23.0, 18.0, 11.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.61151123046875, -1.5570068359375, -1.50250244140625, -1.447998046875, -1.39349365234375, -1.3389892578125, -1.28448486328125, -1.22998046875, -1.17547607421875, -1.1209716796875, -1.06646728515625, -1.011962890625, -0.95745849609375, -0.9029541015625, -0.84844970703125, -0.7939453125, -0.73944091796875, -0.6849365234375, -0.63043212890625, -0.575927734375, -0.52142333984375, -0.4669189453125, -0.41241455078125, -0.35791015625, -0.30340576171875, -0.2489013671875, -0.19439697265625, -0.139892578125, -0.08538818359375, -0.0308837890625, 0.02362060546875, 0.078125, 0.13262939453125, 0.1871337890625, 0.24163818359375, 0.296142578125, 0.35064697265625, 0.4051513671875, 0.45965576171875, 0.51416015625, 0.56866455078125, 0.6231689453125, 0.67767333984375, 0.732177734375, 0.78668212890625, 0.8411865234375, 0.89569091796875, 0.9501953125, 1.00469970703125, 1.0592041015625, 1.11370849609375, 1.168212890625, 1.22271728515625, 1.2772216796875, 1.33172607421875, 1.38623046875, 1.44073486328125, 1.4952392578125, 1.54974365234375, 1.604248046875, 1.65875244140625, 1.7132568359375, 1.76776123046875, 1.822265625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 6.0, 4.0, 2.0, 4.0, 6.0, 5.0, 3.0, 7.0, 9.0, 4.0, 14.0, 23.0, 20.0, 15.0, 26.0, 22.0, 26.0, 30.0, 26.0, 43.0, 28.0, 35.0, 42.0, 52.0, 38.0, 1058.0, 37.0, 41.0, 24.0, 32.0, 33.0, 43.0, 27.0, 25.0, 27.0, 29.0, 18.0, 22.0, 20.0, 18.0, 17.0, 9.0, 13.0, 10.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.939453125, -3.799835205078125, -3.66021728515625, -3.520599365234375, -3.3809814453125, -3.241363525390625, -3.10174560546875, -2.962127685546875, -2.822509765625, -2.682891845703125, -2.54327392578125, -2.403656005859375, -2.2640380859375, -2.124420166015625, -1.98480224609375, -1.845184326171875, -1.70556640625, -1.565948486328125, -1.42633056640625, -1.286712646484375, -1.1470947265625, -1.007476806640625, -0.86785888671875, -0.728240966796875, -0.588623046875, -0.449005126953125, -0.30938720703125, -0.169769287109375, -0.0301513671875, 0.109466552734375, 0.24908447265625, 0.388702392578125, 0.5283203125, 0.667938232421875, 0.80755615234375, 0.947174072265625, 1.0867919921875, 1.226409912109375, 1.36602783203125, 1.505645751953125, 1.645263671875, 1.784881591796875, 1.92449951171875, 2.064117431640625, 2.2037353515625, 2.343353271484375, 2.48297119140625, 2.622589111328125, 2.76220703125, 2.901824951171875, 3.04144287109375, 3.181060791015625, 3.3206787109375, 3.460296630859375, 3.59991455078125, 3.739532470703125, 3.879150390625, 4.018768310546875, 4.15838623046875, 4.298004150390625, 4.4376220703125, 4.577239990234375, 4.71685791015625, 4.856475830078125, 4.99609375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 8.0, 7.0, 6.0, 14.0, 16.0, 33.0, 49.0, 94.0, 111.0, 202.0, 290.0, 444.0, 650.0, 1006.0, 1543.0, 2337.0, 3361.0, 5174.0, 7901.0, 12382.0, 19287.0, 30501.0, 49869.0, 86439.0, 181123.0, 1386280.0, 128012.0, 68848.0, 40864.0, 24824.0, 15853.0, 10095.0, 6677.0, 4425.0, 2758.0, 1897.0, 1218.0, 878.0, 568.0, 404.0, 245.0, 151.0, 109.0, 59.0, 43.0, 29.0, 22.0, 8.0, 11.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3348846435546875, -1.285980224609375, -1.2370758056640625, -1.18817138671875, -1.1392669677734375, -1.090362548828125, -1.0414581298828125, -0.9925537109375, -0.9436492919921875, -0.894744873046875, -0.8458404541015625, -0.79693603515625, -0.7480316162109375, -0.699127197265625, -0.6502227783203125, -0.601318359375, -0.5524139404296875, -0.503509521484375, -0.4546051025390625, -0.40570068359375, -0.3567962646484375, -0.307891845703125, -0.2589874267578125, -0.2100830078125, -0.1611785888671875, -0.112274169921875, -0.0633697509765625, -0.01446533203125, 0.0344390869140625, 0.083343505859375, 0.1322479248046875, 0.18115234375, 0.2300567626953125, 0.278961181640625, 0.3278656005859375, 0.37677001953125, 0.4256744384765625, 0.474578857421875, 0.5234832763671875, 0.5723876953125, 0.6212921142578125, 0.670196533203125, 0.7191009521484375, 0.76800537109375, 0.8169097900390625, 0.865814208984375, 0.9147186279296875, 0.963623046875, 1.0125274658203125, 1.061431884765625, 1.1103363037109375, 1.15924072265625, 1.2081451416015625, 1.257049560546875, 1.3059539794921875, 1.3548583984375, 1.4037628173828125, 1.452667236328125, 1.5015716552734375, 1.55047607421875, 1.5993804931640625, 1.648284912109375, 1.6971893310546875, 1.74609375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 14.0, 12.0, 13.0, 35.0, 31.0, 82.0, 119.0, 173.0, 166.0, 118.0, 80.0, 44.0, 27.0, 18.0, 16.0, 10.0, 3.0, 3.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010900497436523438, -0.001048162579536438, -0.0010062754154205322, -0.0009643882513046265, -0.0009225010871887207, -0.0008806139230728149, -0.0008387267589569092, -0.0007968395948410034, -0.0007549524307250977, -0.0007130652666091919, -0.0006711781024932861, -0.0006292909383773804, -0.0005874037742614746, -0.0005455166101455688, -0.0005036294460296631, -0.0004617422819137573, -0.00041985511779785156, -0.0003779679536819458, -0.00033608078956604004, -0.0002941936254501343, -0.0002523064613342285, -0.00021041929721832275, -0.000168532133102417, -0.00012664496898651123, -8.475780487060547e-05, -4.287064075469971e-05, -9.834766387939453e-07, 4.0903687477111816e-05, 8.279085159301758e-05, 0.00012467801570892334, 0.0001665651798248291, 0.00020845234394073486, 0.0002503395080566406, 0.0002922266721725464, 0.00033411383628845215, 0.0003760010004043579, 0.00041788816452026367, 0.00045977532863616943, 0.0005016624927520752, 0.000543549656867981, 0.0005854368209838867, 0.0006273239850997925, 0.0006692111492156982, 0.000711098313331604, 0.0007529854774475098, 0.0007948726415634155, 0.0008367598056793213, 0.000878646969795227, 0.0009205341339111328, 0.0009624212980270386, 0.0010043084621429443, 0.00104619562625885, 0.0010880827903747559, 0.0011299699544906616, 0.0011718571186065674, 0.0012137442827224731, 0.001255631446838379, 0.0012975186109542847, 0.0013394057750701904, 0.0013812929391860962, 0.001423180103302002, 0.0014650672674179077, 0.0015069544315338135, 0.0015488415956497192, 0.001590728759765625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 3.0, 15.0, 15.0, 21.0, 50.0, 80.0, 153.0, 419.0, 11112.0, 1035065.0, 1096.0, 223.0, 114.0, 54.0, 32.0, 22.0, 13.0, 8.0, 16.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.034423828125, -0.033524274826049805, -0.03262472152709961, -0.031725168228149414, -0.03082561492919922, -0.029926061630249023, -0.029026508331298828, -0.028126955032348633, -0.027227401733398438, -0.026327848434448242, -0.025428295135498047, -0.02452874183654785, -0.023629188537597656, -0.02272963523864746, -0.021830081939697266, -0.02093052864074707, -0.020030975341796875, -0.01913142204284668, -0.018231868743896484, -0.01733231544494629, -0.016432762145996094, -0.015533208847045898, -0.014633655548095703, -0.013734102249145508, -0.012834548950195312, -0.011934995651245117, -0.011035442352294922, -0.010135889053344727, -0.009236335754394531, -0.008336782455444336, -0.007437229156494141, -0.006537675857543945, -0.00563812255859375, -0.004738569259643555, -0.0038390159606933594, -0.002939462661743164, -0.0020399093627929688, -0.0011403560638427734, -0.00024080276489257812, 0.0006587505340576172, 0.0015583038330078125, 0.002457857131958008, 0.003357410430908203, 0.0042569637298583984, 0.005156517028808594, 0.006056070327758789, 0.006955623626708984, 0.00785517692565918, 0.008754730224609375, 0.00965428352355957, 0.010553836822509766, 0.011453390121459961, 0.012352943420410156, 0.013252496719360352, 0.014152050018310547, 0.015051603317260742, 0.015951156616210938, 0.016850709915161133, 0.017750263214111328, 0.018649816513061523, 0.01954936981201172, 0.020448923110961914, 0.02134847640991211, 0.022248029708862305, 0.0231475830078125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 17.0, 25.0, 64.0, 126.0, 196.0, 204.0, 169.0, 101.0, 51.0, 27.0, 18.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009930555243045092, -0.0009690666338428855, -0.0009450777433812618, -0.0009210888529196382, -0.0008970999624580145, -0.0008731110719963908, -0.0008491221815347672, -0.0008251332910731435, -0.0008011444006115198, -0.0007771555101498961, -0.0007531666196882725, -0.0007291777292266488, -0.0007051888387650251, -0.0006811999483034015, -0.0006572110578417778, -0.0006332221673801541, -0.0006092333351261914, -0.0005852444446645677, -0.000561255554202944, -0.0005372666637413204, -0.0005132777732796967, -0.000489288882818073, -0.0004653000214602798, -0.00044131113099865615, -0.0004173222405370325, -0.0003933333500754088, -0.00036934445961378515, -0.00034535559825599194, -0.00032136670779436827, -0.0002973778173327446, -0.00027338892687112093, -0.00024940003640949726, -0.0002254111459478736, -0.00020142225548624992, -0.00017743336502462626, -0.00015344448911491781, -0.00012945559865329415, -0.00010546670819167048, -8.147783228196204e-05, -5.748894182033837e-05, -3.35000513587147e-05, -9.511164535069838e-06, 1.4477722288575023e-05, 3.846660547424108e-05, 6.245549593586475e-05, 8.644438639748842e-05, 0.00011043326230719686, 0.00013442215276882052, 0.0001584110432304442, 0.00018239993369206786, 0.00020638882415369153, 0.00023037770006339997, 0.00025436660507693887, 0.00027835549553856254, 0.00030234435689635575, 0.0003263332473579794, 0.0003503221378196031, 0.00037431102828122675, 0.0003982999187428504, 0.00042228878010064363, 0.0004462776705622673, 0.00047026656102389097, 0.0004942554514855146, 0.0005182443419471383, 0.000542233232408762]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 9.0, 10.0, 13.0, 18.0, 17.0, 21.0, 26.0, 15.0, 24.0, 20.0, 22.0, 22.0, 22.0, 34.0, 31.0, 39.0, 25.0, 36.0, 31.0, 23.0, 29.0, 33.0, 39.0, 34.0, 41.0, 23.0, 30.0, 25.0, 24.0, 28.0, 35.0, 18.0, 19.0, 24.0, 20.0, 13.0, 21.0, 18.0, 10.0, 10.0, 11.0, 6.0, 9.0, 7.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033909082412719727, -0.0003283778205513954, -0.00031766481697559357, -0.0003069518133997917, -0.00029623880982398987, -0.000285525806248188, -0.00027481280267238617, -0.0002640997990965843, -0.00025338679552078247, -0.00024267379194498062, -0.00023196078836917877, -0.00022124778479337692, -0.00021053478121757507, -0.00019982177764177322, -0.00018910877406597137, -0.00017839577049016953, -0.00016768276691436768, -0.00015696976333856583, -0.00014625675976276398, -0.00013554375618696213, -0.00012483075261116028, -0.00011411774903535843, -0.00010340474545955658, -9.269174188375473e-05, -8.197873830795288e-05, -7.126573473215103e-05, -6.055273115634918e-05, -4.983972758054733e-05, -3.9126724004745483e-05, -2.8413720428943634e-05, -1.7700716853141785e-05, -6.987713277339935e-06, 3.725290298461914e-06, 1.4438293874263763e-05, 2.5151297450065613e-05, 3.586430102586746e-05, 4.657730460166931e-05, 5.729030817747116e-05, 6.800331175327301e-05, 7.871631532907486e-05, 8.942931890487671e-05, 0.00010014232248067856, 0.00011085532605648041, 0.00012156832963228226, 0.0001322813332080841, 0.00014299433678388596, 0.0001537073403596878, 0.00016442034393548965, 0.0001751333475112915, 0.00018584635108709335, 0.0001965593546628952, 0.00020727235823869705, 0.0002179853618144989, 0.00022869836539030075, 0.0002394113689661026, 0.00025012437254190445, 0.0002608373761177063, 0.00027155037969350815, 0.00028226338326931, 0.00029297638684511185, 0.0003036893904209137, 0.00031440239399671555, 0.0003251153975725174, 0.00033582840114831924, 0.0003465414047241211]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 8.0, 5.0, 13.0, 22.0, 19.0, 34.0, 19.0, 46.0, 30.0, 36.0, 35.0, 38.0, 52.0, 36.0, 45.0, 45.0, 60.0, 45.0, 59.0, 40.0, 41.0, 38.0, 25.0, 36.0, 35.0, 24.0, 15.0, 17.0, 16.0, 9.0, 10.0, 7.0, 7.0, 6.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -9.01904296875, -8.7412109375, -8.46337890625, -8.185546875, -7.90771484375, -7.6298828125, -7.35205078125, -7.07421875, -6.79638671875, -6.5185546875, -6.24072265625, -5.962890625, -5.68505859375, -5.4072265625, -5.12939453125, -4.8515625, -4.57373046875, -4.2958984375, -4.01806640625, -3.740234375, -3.46240234375, -3.1845703125, -2.90673828125, -2.62890625, -2.35107421875, -2.0732421875, -1.79541015625, -1.517578125, -1.23974609375, -0.9619140625, -0.68408203125, -0.40625, -0.12841796875, 0.1494140625, 0.42724609375, 0.705078125, 0.98291015625, 1.2607421875, 1.53857421875, 1.81640625, 2.09423828125, 2.3720703125, 2.64990234375, 2.927734375, 3.20556640625, 3.4833984375, 3.76123046875, 4.0390625, 4.31689453125, 4.5947265625, 4.87255859375, 5.150390625, 5.42822265625, 5.7060546875, 5.98388671875, 6.26171875, 6.53955078125, 6.8173828125, 7.09521484375, 7.373046875, 7.65087890625, 7.9287109375, 8.20654296875, 8.484375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 6.0, 15.0, 25.0, 41.0, 58.0, 81.0, 121.0, 177.0, 268.0, 452.0, 716.0, 1148.0, 1976.0, 3271.0, 5675.0, 11212.0, 23642.0, 60479.0, 177267.0, 449741.0, 194423.0, 65877.0, 25736.0, 11505.0, 5984.0, 3419.0, 1916.0, 1215.0, 736.0, 478.0, 301.0, 198.0, 139.0, 96.0, 58.0, 27.0, 25.0, 21.0, 14.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.11993408203125, -3.9703369140625, -3.82073974609375, -3.671142578125, -3.52154541015625, -3.3719482421875, -3.22235107421875, -3.07275390625, -2.92315673828125, -2.7735595703125, -2.62396240234375, -2.474365234375, -2.32476806640625, -2.1751708984375, -2.02557373046875, -1.8759765625, -1.72637939453125, -1.5767822265625, -1.42718505859375, -1.277587890625, -1.12799072265625, -0.9783935546875, -0.82879638671875, -0.67919921875, -0.52960205078125, -0.3800048828125, -0.23040771484375, -0.080810546875, 0.06878662109375, 0.2183837890625, 0.36798095703125, 0.517578125, 0.66717529296875, 0.8167724609375, 0.96636962890625, 1.115966796875, 1.26556396484375, 1.4151611328125, 1.56475830078125, 1.71435546875, 1.86395263671875, 2.0135498046875, 2.16314697265625, 2.312744140625, 2.46234130859375, 2.6119384765625, 2.76153564453125, 2.9111328125, 3.06072998046875, 3.2103271484375, 3.35992431640625, 3.509521484375, 3.65911865234375, 3.8087158203125, 3.95831298828125, 4.10791015625, 4.25750732421875, 4.4071044921875, 4.55670166015625, 4.706298828125, 4.85589599609375, 5.0054931640625, 5.15509033203125, 5.3046875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 7.0, 6.0, 1.0, 2.0, 5.0, 5.0, 9.0, 11.0, 11.0, 15.0, 15.0, 18.0, 21.0, 24.0, 43.0, 28.0, 30.0, 41.0, 49.0, 64.0, 82.0, 185.0, 1692.0, 182.0, 90.0, 63.0, 41.0, 50.0, 34.0, 22.0, 37.0, 33.0, 31.0, 19.0, 17.0, 6.0, 19.0, 14.0, 3.0, 7.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-32.9375, -31.9833984375, -31.029296875, -30.0751953125, -29.12109375, -28.1669921875, -27.212890625, -26.2587890625, -25.3046875, -24.3505859375, -23.396484375, -22.4423828125, -21.48828125, -20.5341796875, -19.580078125, -18.6259765625, -17.671875, -16.7177734375, -15.763671875, -14.8095703125, -13.85546875, -12.9013671875, -11.947265625, -10.9931640625, -10.0390625, -9.0849609375, -8.130859375, -7.1767578125, -6.22265625, -5.2685546875, -4.314453125, -3.3603515625, -2.40625, -1.4521484375, -0.498046875, 0.4560546875, 1.41015625, 2.3642578125, 3.318359375, 4.2724609375, 5.2265625, 6.1806640625, 7.134765625, 8.0888671875, 9.04296875, 9.9970703125, 10.951171875, 11.9052734375, 12.859375, 13.8134765625, 14.767578125, 15.7216796875, 16.67578125, 17.6298828125, 18.583984375, 19.5380859375, 20.4921875, 21.4462890625, 22.400390625, 23.3544921875, 24.30859375, 25.2626953125, 26.216796875, 27.1708984375, 28.125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 10.0, 26.0, 48.0, 96.0, 247.0, 636.0, 19605.0, 3123184.0, 1285.0, 296.0, 138.0, 62.0, 25.0, 25.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-168.25, -162.28125, -156.3125, -150.34375, -144.375, -138.40625, -132.4375, -126.46875, -120.5, -114.53125, -108.5625, -102.59375, -96.625, -90.65625, -84.6875, -78.71875, -72.75, -66.78125, -60.8125, -54.84375, -48.875, -42.90625, -36.9375, -30.96875, -25.0, -19.03125, -13.0625, -7.09375, -1.125, 4.84375, 10.8125, 16.78125, 22.75, 28.71875, 34.6875, 40.65625, 46.625, 52.59375, 58.5625, 64.53125, 70.5, 76.46875, 82.4375, 88.40625, 94.375, 100.34375, 106.3125, 112.28125, 118.25, 124.21875, 130.1875, 136.15625, 142.125, 148.09375, 154.0625, 160.03125, 166.0, 171.96875, 177.9375, 183.90625, 189.875, 195.84375, 201.8125, 207.78125, 213.75]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 316.0, 704.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.2321014404297, -149.2974853515625, -112.36286926269531, -75.42825317382812, -38.49363708496094, -1.55902099609375, 35.37559509277344, 72.31019592285156, 109.24482727050781, 146.179443359375, 183.1140594482422, 220.04867553710938, 256.9832763671875, 293.91790771484375, 330.8525390625, 367.787109375, 404.72174072265625, 441.6563720703125, 478.5909729003906, 515.5255737304688, 552.460205078125, 589.3948364257812, 626.3294677734375, 663.2640380859375, 700.1986694335938, 737.13330078125, 774.06787109375, 811.0025024414062, 847.9371337890625, 884.8717651367188, 921.806396484375, 958.740966796875, 995.675537109375, 1032.610107421875, 1069.5447998046875, 1106.4793701171875, 1143.4140625, 1180.3486328125, 1217.283203125, 1254.2177734375, 1291.1524658203125, 1328.0870361328125, 1365.021728515625, 1401.956298828125, 1438.890869140625, 1475.8255615234375, 1512.7601318359375, 1549.69482421875, 1586.62939453125, 1623.56396484375, 1660.4986572265625, 1697.4332275390625, 1734.367919921875, 1771.302490234375, 1808.237060546875, 1845.171630859375, 1882.1063232421875, 1919.0408935546875, 1955.9755859375, 1992.91015625, 2029.8447265625, 2066.779296875, 2103.714111328125, 2140.648681640625, 2177.583251953125]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 11.0, 7.0, 8.0, 14.0, 14.0, 10.0, 17.0, 27.0, 24.0, 25.0, 40.0, 33.0, 33.0, 37.0, 45.0, 53.0, 39.0, 54.0, 51.0, 54.0, 41.0, 50.0, 38.0, 47.0, 27.0, 35.0, 28.0, 18.0, 31.0, 18.0, 13.0, 15.0, 12.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.19775390625, -83.11909484863281, -80.04043579101562, -76.96177673339844, -73.88311767578125, -70.80445861816406, -67.72579956054688, -64.64714050292969, -61.5684814453125, -58.48982238769531, -55.411163330078125, -52.33250427246094, -49.25384521484375, -46.17518615722656, -43.096527099609375, -40.01786804199219, -36.939208984375, -33.86054992675781, -30.781890869140625, -27.703231811523438, -24.62457275390625, -21.545913696289062, -18.467254638671875, -15.388595581054688, -12.3099365234375, -9.231277465820312, -6.152618408203125, -3.0739593505859375, 0.00469970703125, 3.0833587646484375, 6.162017822265625, 9.240676879882812, 12.3193359375, 15.397994995117188, 18.476654052734375, 21.555313110351562, 24.63397216796875, 27.712631225585938, 30.791290283203125, 33.86994934082031, 36.9486083984375, 40.02726745605469, 43.105926513671875, 46.18458557128906, 49.26324462890625, 52.34190368652344, 55.420562744140625, 58.49922180175781, 61.577880859375, 64.65653991699219, 67.73519897460938, 70.81385803222656, 73.89251708984375, 76.97117614746094, 80.04983520507812, 83.12849426269531, 86.2071533203125, 89.28581237792969, 92.36447143554688, 95.44313049316406, 98.52178955078125, 101.60044860839844, 104.67910766601562, 107.75776672363281, 110.83642578125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 8.0, 8.0, 13.0, 16.0, 26.0, 23.0, 30.0, 26.0, 29.0, 29.0, 42.0, 44.0, 39.0, 48.0, 42.0, 37.0, 38.0, 59.0, 49.0, 47.0, 39.0, 45.0, 31.0, 37.0, 29.0, 27.0, 21.0, 21.0, 17.0, 13.0, 13.0, 10.0, 9.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.923828125, -8.63671875, -8.349609375, -8.0625, -7.775390625, -7.48828125, -7.201171875, -6.9140625, -6.626953125, -6.33984375, -6.052734375, -5.765625, -5.478515625, -5.19140625, -4.904296875, -4.6171875, -4.330078125, -4.04296875, -3.755859375, -3.46875, -3.181640625, -2.89453125, -2.607421875, -2.3203125, -2.033203125, -1.74609375, -1.458984375, -1.171875, -0.884765625, -0.59765625, -0.310546875, -0.0234375, 0.263671875, 0.55078125, 0.837890625, 1.125, 1.412109375, 1.69921875, 1.986328125, 2.2734375, 2.560546875, 2.84765625, 3.134765625, 3.421875, 3.708984375, 3.99609375, 4.283203125, 4.5703125, 4.857421875, 5.14453125, 5.431640625, 5.71875, 6.005859375, 6.29296875, 6.580078125, 6.8671875, 7.154296875, 7.44140625, 7.728515625, 8.015625, 8.302734375, 8.58984375, 8.876953125, 9.1640625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 6.0, 9.0, 15.0, 16.0, 28.0, 40.0, 38.0, 53.0, 62.0, 94.0, 125.0, 169.0, 265.0, 375.0, 636.0, 1084.0, 2019.0, 4151.0, 9560.0, 26259.0, 95991.0, 438045.0, 1328392.0, 1476786.0, 607795.0, 143311.0, 36637.0, 11966.0, 4939.0, 2322.0, 1156.0, 628.0, 392.0, 260.0, 171.0, 125.0, 86.0, 84.0, 48.0, 36.0, 28.0, 23.0, 15.0, 12.0, 11.0, 6.0, 2.0, 5.0, 1.0, 2.0], "bins": [-11.1875, -10.8861083984375, -10.584716796875, -10.2833251953125, -9.98193359375, -9.6805419921875, -9.379150390625, -9.0777587890625, -8.7763671875, -8.4749755859375, -8.173583984375, -7.8721923828125, -7.57080078125, -7.2694091796875, -6.968017578125, -6.6666259765625, -6.365234375, -6.0638427734375, -5.762451171875, -5.4610595703125, -5.15966796875, -4.8582763671875, -4.556884765625, -4.2554931640625, -3.9541015625, -3.6527099609375, -3.351318359375, -3.0499267578125, -2.74853515625, -2.4471435546875, -2.145751953125, -1.8443603515625, -1.54296875, -1.2415771484375, -0.940185546875, -0.6387939453125, -0.33740234375, -0.0360107421875, 0.265380859375, 0.5667724609375, 0.8681640625, 1.1695556640625, 1.470947265625, 1.7723388671875, 2.07373046875, 2.3751220703125, 2.676513671875, 2.9779052734375, 3.279296875, 3.5806884765625, 3.882080078125, 4.1834716796875, 4.48486328125, 4.7862548828125, 5.087646484375, 5.3890380859375, 5.6904296875, 5.9918212890625, 6.293212890625, 6.5946044921875, 6.89599609375, 7.1973876953125, 7.498779296875, 7.8001708984375, 8.1015625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 12.0, 16.0, 20.0, 35.0, 39.0, 64.0, 98.0, 123.0, 175.0, 277.0, 406.0, 503.0, 554.0, 473.0, 414.0, 275.0, 161.0, 120.0, 105.0, 57.0, 39.0, 30.0, 17.0, 18.0, 13.0, 1.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5078125, -12.8448486328125, -12.181884765625, -11.5189208984375, -10.85595703125, -10.1929931640625, -9.530029296875, -8.8670654296875, -8.2041015625, -7.5411376953125, -6.878173828125, -6.2152099609375, -5.55224609375, -4.8892822265625, -4.226318359375, -3.5633544921875, -2.900390625, -2.2374267578125, -1.574462890625, -0.9114990234375, -0.24853515625, 0.4144287109375, 1.077392578125, 1.7403564453125, 2.4033203125, 3.0662841796875, 3.729248046875, 4.3922119140625, 5.05517578125, 5.7181396484375, 6.381103515625, 7.0440673828125, 7.70703125, 8.3699951171875, 9.032958984375, 9.6959228515625, 10.35888671875, 11.0218505859375, 11.684814453125, 12.3477783203125, 13.0107421875, 13.6737060546875, 14.336669921875, 14.9996337890625, 15.66259765625, 16.3255615234375, 16.988525390625, 17.6514892578125, 18.314453125, 18.9774169921875, 19.640380859375, 20.3033447265625, 20.96630859375, 21.6292724609375, 22.292236328125, 22.9552001953125, 23.6181640625, 24.2811279296875, 24.944091796875, 25.6070556640625, 26.27001953125, 26.9329833984375, 27.595947265625, 28.2589111328125, 28.921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 7.0, 10.0, 12.0, 17.0, 30.0, 35.0, 40.0, 67.0, 72.0, 101.0, 116.0, 213.0, 403.0, 819.0, 6787.0, 2430382.0, 1747546.0, 5797.0, 800.0, 338.0, 207.0, 112.0, 92.0, 55.0, 52.0, 43.0, 28.0, 22.0, 14.0, 15.0, 5.0, 4.0, 7.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.75, -69.3564453125, -66.962890625, -64.5693359375, -62.17578125, -59.7822265625, -57.388671875, -54.9951171875, -52.6015625, -50.2080078125, -47.814453125, -45.4208984375, -43.02734375, -40.6337890625, -38.240234375, -35.8466796875, -33.453125, -31.0595703125, -28.666015625, -26.2724609375, -23.87890625, -21.4853515625, -19.091796875, -16.6982421875, -14.3046875, -11.9111328125, -9.517578125, -7.1240234375, -4.73046875, -2.3369140625, 0.056640625, 2.4501953125, 4.84375, 7.2373046875, 9.630859375, 12.0244140625, 14.41796875, 16.8115234375, 19.205078125, 21.5986328125, 23.9921875, 26.3857421875, 28.779296875, 31.1728515625, 33.56640625, 35.9599609375, 38.353515625, 40.7470703125, 43.140625, 45.5341796875, 47.927734375, 50.3212890625, 52.71484375, 55.1083984375, 57.501953125, 59.8955078125, 62.2890625, 64.6826171875, 67.076171875, 69.4697265625, 71.86328125, 74.2568359375, 76.650390625, 79.0439453125, 81.4375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 62.0, 268.0, 459.0, 176.0, 40.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.87384033203125, -149.67791748046875, -140.4819793701172, -131.2860565185547, -122.09012603759766, -112.89419555664062, -103.69827270507812, -94.5023422241211, -85.30641174316406, -76.11048126220703, -66.91455078125, -57.7186279296875, -48.52269744873047, -39.32676696777344, -30.130840301513672, -20.934913635253906, -11.738983154296875, -2.5430545806884766, 6.652873992919922, 15.84880256652832, 25.04473114013672, 34.24066162109375, 43.436588287353516, 52.63251495361328, 61.82844543457031, 71.02437591552734, 80.22030639648438, 89.41622924804688, 98.6121597290039, 107.80809020996094, 117.00401306152344, 126.19994354248047, 135.39584350585938, 144.59176635742188, 153.78770446777344, 162.98362731933594, 172.1795654296875, 181.37548828125, 190.5714111328125, 199.767333984375, 208.96327209472656, 218.15919494628906, 227.35513305664062, 236.55105590820312, 245.74697875976562, 254.9429168701172, 264.13885498046875, 273.33477783203125, 282.53070068359375, 291.72662353515625, 300.92254638671875, 310.1184997558594, 319.3144226074219, 328.5103454589844, 337.7062683105469, 346.9021911621094, 356.09814453125, 365.2940673828125, 374.489990234375, 383.6859436035156, 392.8818664550781, 402.0777893066406, 411.2737121582031, 420.4696350097656, 429.6655578613281]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 8.0, 7.0, 9.0, 11.0, 18.0, 13.0, 11.0, 16.0, 22.0, 28.0, 23.0, 27.0, 40.0, 35.0, 32.0, 45.0, 43.0, 42.0, 44.0, 38.0, 43.0, 59.0, 40.0, 37.0, 42.0, 37.0, 24.0, 20.0, 25.0, 29.0, 31.0, 22.0, 15.0, 8.0, 13.0, 5.0, 6.0, 3.0, 5.0, 7.0, 4.0, 2.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-66.602294921875, -64.64596557617188, -62.68964385986328, -60.733314514160156, -58.7769889831543, -56.82066345214844, -54.86433410644531, -52.90800857543945, -50.951683044433594, -48.995357513427734, -47.039031982421875, -45.08270263671875, -43.12637710571289, -41.17005157470703, -39.213722229003906, -37.25739669799805, -35.30107116699219, -33.34474563598633, -31.388418197631836, -29.432090759277344, -27.475765228271484, -25.519439697265625, -23.563112258911133, -21.60678482055664, -19.65045928955078, -17.694133758544922, -15.73780632019043, -13.781479835510254, -11.825153350830078, -9.868826866149902, -7.912500381469727, -5.956173896789551, -3.999847412109375, -2.043520927429199, -0.08719444274902344, 1.8691320419311523, 3.825458526611328, 5.781785011291504, 7.73811149597168, 9.694437980651855, 11.650764465332031, 13.607090950012207, 15.563417434692383, 17.519744873046875, 19.476070404052734, 21.432395935058594, 23.388723373413086, 25.345050811767578, 27.301376342773438, 29.257701873779297, 31.21402931213379, 33.17035675048828, 35.12668228149414, 37.0830078125, 39.039337158203125, 40.995662689208984, 42.951988220214844, 44.9083137512207, 46.86463928222656, 48.82096862792969, 50.77729415893555, 52.733619689941406, 54.68994903564453, 56.64627456665039, 58.60260009765625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 5.0, 11.0, 8.0, 14.0, 18.0, 11.0, 27.0, 25.0, 21.0, 34.0, 25.0, 37.0, 33.0, 52.0, 37.0, 49.0, 43.0, 41.0, 43.0, 46.0, 52.0, 52.0, 29.0, 39.0, 28.0, 25.0, 23.0, 24.0, 24.0, 29.0, 20.0, 13.0, 13.0, 10.0, 7.0, 6.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.625, -8.360107421875, -8.09521484375, -7.830322265625, -7.5654296875, -7.300537109375, -7.03564453125, -6.770751953125, -6.505859375, -6.240966796875, -5.97607421875, -5.711181640625, -5.4462890625, -5.181396484375, -4.91650390625, -4.651611328125, -4.38671875, -4.121826171875, -3.85693359375, -3.592041015625, -3.3271484375, -3.062255859375, -2.79736328125, -2.532470703125, -2.267578125, -2.002685546875, -1.73779296875, -1.472900390625, -1.2080078125, -0.943115234375, -0.67822265625, -0.413330078125, -0.1484375, 0.116455078125, 0.38134765625, 0.646240234375, 0.9111328125, 1.176025390625, 1.44091796875, 1.705810546875, 1.970703125, 2.235595703125, 2.50048828125, 2.765380859375, 3.0302734375, 3.295166015625, 3.56005859375, 3.824951171875, 4.08984375, 4.354736328125, 4.61962890625, 4.884521484375, 5.1494140625, 5.414306640625, 5.67919921875, 5.944091796875, 6.208984375, 6.473876953125, 6.73876953125, 7.003662109375, 7.2685546875, 7.533447265625, 7.79833984375, 8.063232421875, 8.328125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 13.0, 12.0, 19.0, 37.0, 47.0, 64.0, 86.0, 114.0, 190.0, 244.0, 367.0, 515.0, 761.0, 1143.0, 1611.0, 2316.0, 3482.0, 5157.0, 7838.0, 11922.0, 18005.0, 28217.0, 44286.0, 73482.0, 141944.0, 335841.0, 157991.0, 78775.0, 47113.0, 29774.0, 19354.0, 12491.0, 8218.0, 5539.0, 3767.0, 2519.0, 1663.0, 1157.0, 747.0, 536.0, 370.0, 224.0, 189.0, 131.0, 77.0, 62.0, 47.0, 32.0, 14.0, 12.0, 13.0, 11.0, 4.0, 4.0, 2.0, 1.0, 3.0], "bins": [-1.6357421875, -1.58551025390625, -1.5352783203125, -1.48504638671875, -1.434814453125, -1.38458251953125, -1.3343505859375, -1.28411865234375, -1.23388671875, -1.18365478515625, -1.1334228515625, -1.08319091796875, -1.032958984375, -0.98272705078125, -0.9324951171875, -0.88226318359375, -0.83203125, -0.78179931640625, -0.7315673828125, -0.68133544921875, -0.631103515625, -0.58087158203125, -0.5306396484375, -0.48040771484375, -0.43017578125, -0.37994384765625, -0.3297119140625, -0.27947998046875, -0.229248046875, -0.17901611328125, -0.1287841796875, -0.07855224609375, -0.0283203125, 0.02191162109375, 0.0721435546875, 0.12237548828125, 0.172607421875, 0.22283935546875, 0.2730712890625, 0.32330322265625, 0.37353515625, 0.42376708984375, 0.4739990234375, 0.52423095703125, 0.574462890625, 0.62469482421875, 0.6749267578125, 0.72515869140625, 0.775390625, 0.82562255859375, 0.8758544921875, 0.92608642578125, 0.976318359375, 1.02655029296875, 1.0767822265625, 1.12701416015625, 1.17724609375, 1.22747802734375, 1.2777099609375, 1.32794189453125, 1.378173828125, 1.42840576171875, 1.4786376953125, 1.52886962890625, 1.5791015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 2.0, 5.0, 10.0, 6.0, 9.0, 20.0, 19.0, 22.0, 13.0, 21.0, 24.0, 23.0, 27.0, 28.0, 32.0, 26.0, 22.0, 40.0, 38.0, 44.0, 38.0, 1063.0, 37.0, 45.0, 34.0, 38.0, 35.0, 29.0, 27.0, 24.0, 25.0, 27.0, 25.0, 19.0, 22.0, 22.0, 12.0, 11.0, 8.0, 5.0, 7.0, 5.0, 5.0, 9.0, 5.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0], "bins": [-4.87890625, -4.73431396484375, -4.5897216796875, -4.44512939453125, -4.300537109375, -4.15594482421875, -4.0113525390625, -3.86676025390625, -3.72216796875, -3.57757568359375, -3.4329833984375, -3.28839111328125, -3.143798828125, -2.99920654296875, -2.8546142578125, -2.71002197265625, -2.5654296875, -2.42083740234375, -2.2762451171875, -2.13165283203125, -1.987060546875, -1.84246826171875, -1.6978759765625, -1.55328369140625, -1.40869140625, -1.26409912109375, -1.1195068359375, -0.97491455078125, -0.830322265625, -0.68572998046875, -0.5411376953125, -0.39654541015625, -0.251953125, -0.10736083984375, 0.0372314453125, 0.18182373046875, 0.326416015625, 0.47100830078125, 0.6156005859375, 0.76019287109375, 0.90478515625, 1.04937744140625, 1.1939697265625, 1.33856201171875, 1.483154296875, 1.62774658203125, 1.7723388671875, 1.91693115234375, 2.0615234375, 2.20611572265625, 2.3507080078125, 2.49530029296875, 2.639892578125, 2.78448486328125, 2.9290771484375, 3.07366943359375, 3.21826171875, 3.36285400390625, 3.5074462890625, 3.65203857421875, 3.796630859375, 3.94122314453125, 4.0858154296875, 4.23040771484375, 4.375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 7.0, 16.0, 19.0, 26.0, 42.0, 63.0, 114.0, 173.0, 272.0, 378.0, 557.0, 868.0, 1263.0, 1869.0, 2845.0, 4454.0, 6903.0, 10584.0, 16053.0, 25357.0, 40764.0, 66920.0, 125091.0, 1383282.0, 184584.0, 86277.0, 50131.0, 31417.0, 20066.0, 12954.0, 8119.0, 5337.0, 3484.0, 2317.0, 1517.0, 1030.0, 671.0, 455.0, 271.0, 203.0, 140.0, 78.0, 63.0, 38.0, 18.0, 17.0, 9.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 4.0], "bins": [-1.7099609375, -1.6592559814453125, -1.608551025390625, -1.5578460693359375, -1.50714111328125, -1.4564361572265625, -1.405731201171875, -1.3550262451171875, -1.3043212890625, -1.2536163330078125, -1.202911376953125, -1.1522064208984375, -1.10150146484375, -1.0507965087890625, -1.000091552734375, -0.9493865966796875, -0.898681640625, -0.8479766845703125, -0.797271728515625, -0.7465667724609375, -0.69586181640625, -0.6451568603515625, -0.594451904296875, -0.5437469482421875, -0.4930419921875, -0.4423370361328125, -0.391632080078125, -0.3409271240234375, -0.29022216796875, -0.2395172119140625, -0.188812255859375, -0.1381072998046875, -0.08740234375, -0.0366973876953125, 0.014007568359375, 0.0647125244140625, 0.11541748046875, 0.1661224365234375, 0.216827392578125, 0.2675323486328125, 0.3182373046875, 0.3689422607421875, 0.419647216796875, 0.4703521728515625, 0.52105712890625, 0.5717620849609375, 0.622467041015625, 0.6731719970703125, 0.723876953125, 0.7745819091796875, 0.825286865234375, 0.8759918212890625, 0.92669677734375, 0.9774017333984375, 1.028106689453125, 1.0788116455078125, 1.1295166015625, 1.1802215576171875, 1.230926513671875, 1.2816314697265625, 1.33233642578125, 1.3830413818359375, 1.433746337890625, 1.4844512939453125, 1.53515625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 5.0, 7.0, 7.0, 9.0, 10.0, 17.0, 19.0, 20.0, 24.0, 26.0, 35.0, 41.0, 43.0, 54.0, 60.0, 79.0, 66.0, 62.0, 45.0, 51.0, 43.0, 37.0, 32.0, 35.0, 37.0, 31.0, 10.0, 8.0, 12.0, 14.0, 11.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00047898292541503906, -0.0004617162048816681, -0.0004444494843482971, -0.00042718276381492615, -0.0004099160432815552, -0.0003926493227481842, -0.00037538260221481323, -0.00035811588168144226, -0.0003408491611480713, -0.0003235824406147003, -0.00030631572008132935, -0.0002890489995479584, -0.0002717822790145874, -0.00025451555848121643, -0.00023724883794784546, -0.0002199821174144745, -0.00020271539688110352, -0.00018544867634773254, -0.00016818195581436157, -0.0001509152352809906, -0.00013364851474761963, -0.00011638179421424866, -9.911507368087769e-05, -8.184835314750671e-05, -6.458163261413574e-05, -4.731491208076477e-05, -3.00481915473938e-05, -1.2781471014022827e-05, 4.4852495193481445e-06, 2.1751970052719116e-05, 3.901869058609009e-05, 5.628541111946106e-05, 7.355213165283203e-05, 9.0818852186203e-05, 0.00010808557271957397, 0.00012535229325294495, 0.00014261901378631592, 0.0001598857343196869, 0.00017715245485305786, 0.00019441917538642883, 0.0002116858959197998, 0.00022895261645317078, 0.00024621933698654175, 0.0002634860575199127, 0.0002807527780532837, 0.00029801949858665466, 0.00031528621912002563, 0.0003325529396533966, 0.0003498196601867676, 0.00036708638072013855, 0.0003843531012535095, 0.0004016198217868805, 0.00041888654232025146, 0.00043615326285362244, 0.0004534199833869934, 0.0004706867039203644, 0.00048795342445373535, 0.0005052201449871063, 0.0005224868655204773, 0.0005397535860538483, 0.0005570203065872192, 0.0005742870271205902, 0.0005915537476539612, 0.0006088204681873322, 0.0006260871887207031]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 5.0, 5.0, 6.0, 7.0, 6.0, 9.0, 15.0, 17.0, 21.0, 28.0, 34.0, 39.0, 51.0, 56.0, 95.0, 142.0, 211.0, 648.0, 3340.0, 159975.0, 871849.0, 10102.0, 925.0, 323.0, 191.0, 111.0, 70.0, 60.0, 33.0, 31.0, 24.0, 26.0, 18.0, 12.0, 11.0, 6.0, 9.0, 7.0, 8.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.01233673095703125, -0.011964917182922363, -0.011593103408813477, -0.01122128963470459, -0.010849475860595703, -0.010477662086486816, -0.01010584831237793, -0.009734034538269043, -0.009362220764160156, -0.00899040699005127, -0.008618593215942383, -0.008246779441833496, -0.00787496566772461, -0.007503151893615723, -0.007131338119506836, -0.006759524345397949, -0.0063877105712890625, -0.006015896797180176, -0.005644083023071289, -0.005272269248962402, -0.004900455474853516, -0.004528641700744629, -0.004156827926635742, -0.0037850141525268555, -0.0034132003784179688, -0.003041386604309082, -0.0026695728302001953, -0.0022977590560913086, -0.0019259452819824219, -0.0015541315078735352, -0.0011823177337646484, -0.0008105039596557617, -0.000438690185546875, -6.687641143798828e-05, 0.00030493736267089844, 0.0006767511367797852, 0.0010485649108886719, 0.0014203786849975586, 0.0017921924591064453, 0.002164006233215332, 0.0025358200073242188, 0.0029076337814331055, 0.003279447555541992, 0.003651261329650879, 0.004023075103759766, 0.004394888877868652, 0.004766702651977539, 0.005138516426086426, 0.0055103302001953125, 0.005882143974304199, 0.006253957748413086, 0.006625771522521973, 0.006997585296630859, 0.007369399070739746, 0.007741212844848633, 0.00811302661895752, 0.008484840393066406, 0.008856654167175293, 0.00922846794128418, 0.009600281715393066, 0.009972095489501953, 0.01034390926361084, 0.010715723037719727, 0.011087536811828613, 0.0114593505859375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 14.0, 27.0, 58.0, 80.0, 112.0, 176.0, 172.0, 134.0, 104.0, 54.0, 33.0, 15.0, 13.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006888743955641985, -0.0006652384181506932, -0.0006416024407371879, -0.0006179664633236825, -0.0005943304859101772, -0.0005706945084966719, -0.0005470585310831666, -0.0005234226118773222, -0.000499786576256156, -0.00047615059884265065, -0.00045251462142914534, -0.00042887864401564, -0.0004052426666021347, -0.0003816066891886294, -0.00035797074087895453, -0.0003343347634654492, -0.00031069881515577435, -0.00028706283774226904, -0.0002634268603287637, -0.00023979089746717364, -0.00021615492005366832, -0.000192518942640163, -0.00016888297977857292, -0.0001452470023650676, -0.00012161102495156229, -9.797504753805697e-05, -7.433907740050927e-05, -5.0703107262961566e-05, -2.706712984945625e-05, -3.431152435950935e-06, 2.0204810425639153e-05, 4.384078783914447e-05, 6.747676525264978e-05, 9.11127426661551e-05, 0.0001147487128037028, 0.0001383846829412505, 0.00016202066035475582, 0.00018565663776826113, 0.00020929260062985122, 0.00023292857804335654, 0.00025656455545686185, 0.00028020053287036717, 0.0003038365102838725, 0.00032747245859354734, 0.00035110843600705266, 0.000374744413420558, 0.0003983803908340633, 0.0004220163682475686, 0.0004456523456610739, 0.00046928832307457924, 0.0004929243004880846, 0.0005165602779015899, 0.0005401962553150952, 0.0005638322327286005, 0.0005874681519344449, 0.0006111041875556111, 0.0006347401067614555, 0.0006583760841749609, 0.0006820120615884662, 0.0007056480390019715, 0.0007292840164154768, 0.0007529199938289821, 0.0007765559712424874, 0.0008001918904483318, 0.0008238279260694981]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 5.0, 11.0, 10.0, 13.0, 18.0, 21.0, 33.0, 25.0, 30.0, 25.0, 52.0, 34.0, 35.0, 50.0, 45.0, 48.0, 64.0, 30.0, 43.0, 39.0, 42.0, 43.0, 42.0, 33.0, 29.0, 27.0, 27.0, 26.0, 18.0, 10.0, 12.0, 9.0, 9.0, 8.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00031936168670654297, -0.0003092959523200989, -0.0002992302179336548, -0.0002891644835472107, -0.0002790987491607666, -0.0002690330147743225, -0.0002589672803878784, -0.0002489015460014343, -0.00023883581161499023, -0.00022877007722854614, -0.00021870434284210205, -0.00020863860845565796, -0.00019857287406921387, -0.00018850713968276978, -0.00017844140529632568, -0.0001683756709098816, -0.0001583099365234375, -0.0001482442021369934, -0.00013817846775054932, -0.00012811273336410522, -0.00011804699897766113, -0.00010798126459121704, -9.791553020477295e-05, -8.784979581832886e-05, -7.778406143188477e-05, -6.771832704544067e-05, -5.765259265899658e-05, -4.758685827255249e-05, -3.75211238861084e-05, -2.7455389499664307e-05, -1.7389655113220215e-05, -7.323920726776123e-06, 2.7418136596679688e-06, 1.280754804611206e-05, 2.2873282432556152e-05, 3.2939016819000244e-05, 4.3004751205444336e-05, 5.307048559188843e-05, 6.313621997833252e-05, 7.320195436477661e-05, 8.32676887512207e-05, 9.33334231376648e-05, 0.00010339915752410889, 0.00011346489191055298, 0.00012353062629699707, 0.00013359636068344116, 0.00014366209506988525, 0.00015372782945632935, 0.00016379356384277344, 0.00017385929822921753, 0.00018392503261566162, 0.0001939907670021057, 0.0002040565013885498, 0.0002141222357749939, 0.000224187970161438, 0.00023425370454788208, 0.00024431943893432617, 0.00025438517332077026, 0.00026445090770721436, 0.00027451664209365845, 0.00028458237648010254, 0.00029464811086654663, 0.0003047138452529907, 0.0003147795796394348, 0.0003248453140258789]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 5.0, 11.0, 8.0, 14.0, 18.0, 11.0, 27.0, 25.0, 21.0, 34.0, 25.0, 37.0, 33.0, 52.0, 37.0, 49.0, 43.0, 41.0, 43.0, 46.0, 52.0, 52.0, 29.0, 39.0, 28.0, 25.0, 23.0, 24.0, 24.0, 29.0, 20.0, 13.0, 13.0, 10.0, 7.0, 6.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.625, -8.360107421875, -8.09521484375, -7.830322265625, -7.5654296875, -7.300537109375, -7.03564453125, -6.770751953125, -6.505859375, -6.240966796875, -5.97607421875, -5.711181640625, -5.4462890625, -5.181396484375, -4.91650390625, -4.651611328125, -4.38671875, -4.121826171875, -3.85693359375, -3.592041015625, -3.3271484375, -3.062255859375, -2.79736328125, -2.532470703125, -2.267578125, -2.002685546875, -1.73779296875, -1.472900390625, -1.2080078125, -0.943115234375, -0.67822265625, -0.413330078125, -0.1484375, 0.116455078125, 0.38134765625, 0.646240234375, 0.9111328125, 1.176025390625, 1.44091796875, 1.705810546875, 1.970703125, 2.235595703125, 2.50048828125, 2.765380859375, 3.0302734375, 3.295166015625, 3.56005859375, 3.824951171875, 4.08984375, 4.354736328125, 4.61962890625, 4.884521484375, 5.1494140625, 5.414306640625, 5.67919921875, 5.944091796875, 6.208984375, 6.473876953125, 6.73876953125, 7.003662109375, 7.2685546875, 7.533447265625, 7.79833984375, 8.063232421875, 8.328125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 15.0, 7.0, 20.0, 25.0, 30.0, 34.0, 57.0, 65.0, 118.0, 155.0, 212.0, 344.0, 493.0, 763.0, 1341.0, 2223.0, 4015.0, 7298.0, 14455.0, 29375.0, 64820.0, 158527.0, 366716.0, 228598.0, 89522.0, 39021.0, 18656.0, 9458.0, 5062.0, 2753.0, 1610.0, 975.0, 593.0, 355.0, 247.0, 160.0, 123.0, 98.0, 54.0, 43.0, 30.0, 22.0, 21.0, 13.0, 12.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.9296875, -4.77886962890625, -4.6280517578125, -4.47723388671875, -4.326416015625, -4.17559814453125, -4.0247802734375, -3.87396240234375, -3.72314453125, -3.57232666015625, -3.4215087890625, -3.27069091796875, -3.119873046875, -2.96905517578125, -2.8182373046875, -2.66741943359375, -2.5166015625, -2.36578369140625, -2.2149658203125, -2.06414794921875, -1.913330078125, -1.76251220703125, -1.6116943359375, -1.46087646484375, -1.31005859375, -1.15924072265625, -1.0084228515625, -0.85760498046875, -0.706787109375, -0.55596923828125, -0.4051513671875, -0.25433349609375, -0.103515625, 0.04730224609375, 0.1981201171875, 0.34893798828125, 0.499755859375, 0.65057373046875, 0.8013916015625, 0.95220947265625, 1.10302734375, 1.25384521484375, 1.4046630859375, 1.55548095703125, 1.706298828125, 1.85711669921875, 2.0079345703125, 2.15875244140625, 2.3095703125, 2.46038818359375, 2.6112060546875, 2.76202392578125, 2.912841796875, 3.06365966796875, 3.2144775390625, 3.36529541015625, 3.51611328125, 3.66693115234375, 3.8177490234375, 3.96856689453125, 4.119384765625, 4.27020263671875, 4.4210205078125, 4.57183837890625, 4.72265625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 2.0, 16.0, 12.0, 9.0, 11.0, 17.0, 27.0, 31.0, 33.0, 39.0, 60.0, 48.0, 57.0, 108.0, 149.0, 1670.0, 231.0, 110.0, 60.0, 60.0, 41.0, 37.0, 39.0, 30.0, 34.0, 24.0, 20.0, 19.0, 10.0, 9.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.21875, -34.10595703125, -32.9931640625, -31.88037109375, -30.767578125, -29.65478515625, -28.5419921875, -27.42919921875, -26.31640625, -25.20361328125, -24.0908203125, -22.97802734375, -21.865234375, -20.75244140625, -19.6396484375, -18.52685546875, -17.4140625, -16.30126953125, -15.1884765625, -14.07568359375, -12.962890625, -11.85009765625, -10.7373046875, -9.62451171875, -8.51171875, -7.39892578125, -6.2861328125, -5.17333984375, -4.060546875, -2.94775390625, -1.8349609375, -0.72216796875, 0.390625, 1.50341796875, 2.6162109375, 3.72900390625, 4.841796875, 5.95458984375, 7.0673828125, 8.18017578125, 9.29296875, 10.40576171875, 11.5185546875, 12.63134765625, 13.744140625, 14.85693359375, 15.9697265625, 17.08251953125, 18.1953125, 19.30810546875, 20.4208984375, 21.53369140625, 22.646484375, 23.75927734375, 24.8720703125, 25.98486328125, 27.09765625, 28.21044921875, 29.3232421875, 30.43603515625, 31.548828125, 32.66162109375, 33.7744140625, 34.88720703125, 36.0]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 7.0, 3.0, 5.0, 11.0, 10.0, 12.0, 16.0, 24.0, 30.0, 41.0, 47.0, 82.0, 83.0, 130.0, 195.0, 272.0, 370.0, 1172.0, 22425.0, 3108880.0, 9768.0, 922.0, 348.0, 247.0, 192.0, 106.0, 76.0, 59.0, 46.0, 35.0, 18.0, 14.0, 17.0, 17.0, 8.0, 6.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.0625, -78.5615234375, -76.060546875, -73.5595703125, -71.05859375, -68.5576171875, -66.056640625, -63.5556640625, -61.0546875, -58.5537109375, -56.052734375, -53.5517578125, -51.05078125, -48.5498046875, -46.048828125, -43.5478515625, -41.046875, -38.5458984375, -36.044921875, -33.5439453125, -31.04296875, -28.5419921875, -26.041015625, -23.5400390625, -21.0390625, -18.5380859375, -16.037109375, -13.5361328125, -11.03515625, -8.5341796875, -6.033203125, -3.5322265625, -1.03125, 1.4697265625, 3.970703125, 6.4716796875, 8.97265625, 11.4736328125, 13.974609375, 16.4755859375, 18.9765625, 21.4775390625, 23.978515625, 26.4794921875, 28.98046875, 31.4814453125, 33.982421875, 36.4833984375, 38.984375, 41.4853515625, 43.986328125, 46.4873046875, 48.98828125, 51.4892578125, 53.990234375, 56.4912109375, 58.9921875, 61.4931640625, 63.994140625, 66.4951171875, 68.99609375, 71.4970703125, 73.998046875, 76.4990234375, 79.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 41.0, 398.0, 486.0, 83.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.95267486572266, -97.7256088256836, -93.49854278564453, -89.27147674560547, -85.0444107055664, -80.81734466552734, -76.59028625488281, -72.36322021484375, -68.13615417480469, -63.909088134765625, -59.68202209472656, -55.4549560546875, -51.22789001464844, -47.000823974609375, -42.77376174926758, -38.546695709228516, -34.31962585449219, -30.092559814453125, -25.865493774414062, -21.638429641723633, -17.41136360168457, -13.184297561645508, -8.957233428955078, -4.730167388916016, -0.5031013488769531, 3.723964214324951, 7.9510297775268555, 12.178094863891602, 16.405160903930664, 20.632226943969727, 24.859291076660156, 29.08635711669922, 33.31343078613281, 37.540496826171875, 41.76756286621094, 45.99462890625, 50.22169494628906, 54.448760986328125, 58.67582321166992, 62.902889251708984, 67.12995910644531, 71.35702514648438, 75.58409118652344, 79.8111572265625, 84.03822326660156, 88.26528930664062, 92.49235534667969, 96.71942138671875, 100.94647979736328, 105.17354583740234, 109.4006118774414, 113.62767791748047, 117.85474395751953, 122.0818099975586, 126.30886840820312, 130.5359344482422, 134.76300048828125, 138.9900665283203, 143.21713256835938, 147.44419860839844, 151.6712646484375, 155.89833068847656, 160.12539672851562, 164.3524627685547, 168.57952880859375]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 6.0, 3.0, 10.0, 11.0, 18.0, 7.0, 14.0, 21.0, 25.0, 22.0, 22.0, 39.0, 36.0, 33.0, 40.0, 35.0, 42.0, 44.0, 52.0, 53.0, 50.0, 48.0, 42.0, 33.0, 43.0, 38.0, 35.0, 25.0, 22.0, 20.0, 23.0, 16.0, 16.0, 10.0, 16.0, 8.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-92.94241333007812, -90.44367980957031, -87.94493865966797, -85.44620513916016, -82.94747161865234, -80.44873046875, -77.94999694824219, -75.45126342773438, -72.95252990722656, -70.45379638671875, -67.9550552368164, -65.4563217163086, -62.95758819580078, -60.4588508605957, -57.960113525390625, -55.46138000488281, -52.96263885498047, -50.46390151977539, -47.96516799926758, -45.4664306640625, -42.96769714355469, -40.46895980834961, -37.97022247314453, -35.47148895263672, -32.97275161743164, -30.474016189575195, -27.97528076171875, -25.476543426513672, -22.977807998657227, -20.47907257080078, -17.980335235595703, -15.481599807739258, -12.982872009277344, -10.484136581420898, -7.985400199890137, -5.486664295196533, -2.9879283905029297, -0.4891929626464844, 2.0095434188842773, 4.508279800415039, 7.007015228271484, 9.50575065612793, 12.004487037658691, 14.503223419189453, 17.0019588470459, 19.500694274902344, 21.999431610107422, 24.498167037963867, 26.996902465820312, 29.495637893676758, 31.994373321533203, 34.49311065673828, 36.991844177246094, 39.49058151245117, 41.98931884765625, 44.48805236816406, 46.98678970336914, 49.48552703857422, 51.98426055908203, 54.48299789428711, 56.98173522949219, 59.48046875, 61.97920608520508, 64.47794342041016, 66.97667694091797]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 9.0, 4.0, 5.0, 9.0, 10.0, 10.0, 18.0, 9.0, 19.0, 19.0, 41.0, 33.0, 23.0, 29.0, 36.0, 39.0, 40.0, 51.0, 48.0, 34.0, 48.0, 49.0, 53.0, 51.0, 33.0, 42.0, 37.0, 16.0, 23.0, 25.0, 25.0, 23.0, 20.0, 14.0, 16.0, 11.0, 9.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.421875, -8.1495361328125, -7.877197265625, -7.6048583984375, -7.33251953125, -7.0601806640625, -6.787841796875, -6.5155029296875, -6.2431640625, -5.9708251953125, -5.698486328125, -5.4261474609375, -5.15380859375, -4.8814697265625, -4.609130859375, -4.3367919921875, -4.064453125, -3.7921142578125, -3.519775390625, -3.2474365234375, -2.97509765625, -2.7027587890625, -2.430419921875, -2.1580810546875, -1.8857421875, -1.6134033203125, -1.341064453125, -1.0687255859375, -0.79638671875, -0.5240478515625, -0.251708984375, 0.0206298828125, 0.29296875, 0.5653076171875, 0.837646484375, 1.1099853515625, 1.38232421875, 1.6546630859375, 1.927001953125, 2.1993408203125, 2.4716796875, 2.7440185546875, 3.016357421875, 3.2886962890625, 3.56103515625, 3.8333740234375, 4.105712890625, 4.3780517578125, 4.650390625, 4.9227294921875, 5.195068359375, 5.4674072265625, 5.73974609375, 6.0120849609375, 6.284423828125, 6.5567626953125, 6.8291015625, 7.1014404296875, 7.373779296875, 7.6461181640625, 7.91845703125, 8.1907958984375, 8.463134765625, 8.7354736328125, 9.0078125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 7.0, 6.0, 15.0, 8.0, 13.0, 12.0, 28.0, 21.0, 24.0, 19.0, 38.0, 54.0, 85.0, 142.0, 321.0, 898.0, 4431.0, 54312.0, 2814652.0, 1293250.0, 22189.0, 2430.0, 613.0, 259.0, 127.0, 58.0, 51.0, 41.0, 24.0, 20.0, 16.0, 15.0, 18.0, 18.0, 11.0, 13.0, 7.0, 7.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.4375, -31.41943359375, -30.4013671875, -29.38330078125, -28.365234375, -27.34716796875, -26.3291015625, -25.31103515625, -24.29296875, -23.27490234375, -22.2568359375, -21.23876953125, -20.220703125, -19.20263671875, -18.1845703125, -17.16650390625, -16.1484375, -15.13037109375, -14.1123046875, -13.09423828125, -12.076171875, -11.05810546875, -10.0400390625, -9.02197265625, -8.00390625, -6.98583984375, -5.9677734375, -4.94970703125, -3.931640625, -2.91357421875, -1.8955078125, -0.87744140625, 0.140625, 1.15869140625, 2.1767578125, 3.19482421875, 4.212890625, 5.23095703125, 6.2490234375, 7.26708984375, 8.28515625, 9.30322265625, 10.3212890625, 11.33935546875, 12.357421875, 13.37548828125, 14.3935546875, 15.41162109375, 16.4296875, 17.44775390625, 18.4658203125, 19.48388671875, 20.501953125, 21.52001953125, 22.5380859375, 23.55615234375, 24.57421875, 25.59228515625, 26.6103515625, 27.62841796875, 28.646484375, 29.66455078125, 30.6826171875, 31.70068359375, 32.71875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 9.0, 18.0, 12.0, 26.0, 38.0, 73.0, 111.0, 181.0, 233.0, 380.0, 494.0, 638.0, 623.0, 417.0, 257.0, 178.0, 129.0, 69.0, 65.0, 33.0, 28.0, 25.0, 9.0, 10.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.28125, -21.598876953125, -20.91650390625, -20.234130859375, -19.5517578125, -18.869384765625, -18.18701171875, -17.504638671875, -16.822265625, -16.139892578125, -15.45751953125, -14.775146484375, -14.0927734375, -13.410400390625, -12.72802734375, -12.045654296875, -11.36328125, -10.680908203125, -9.99853515625, -9.316162109375, -8.6337890625, -7.951416015625, -7.26904296875, -6.586669921875, -5.904296875, -5.221923828125, -4.53955078125, -3.857177734375, -3.1748046875, -2.492431640625, -1.81005859375, -1.127685546875, -0.4453125, 0.237060546875, 0.91943359375, 1.601806640625, 2.2841796875, 2.966552734375, 3.64892578125, 4.331298828125, 5.013671875, 5.696044921875, 6.37841796875, 7.060791015625, 7.7431640625, 8.425537109375, 9.10791015625, 9.790283203125, 10.47265625, 11.155029296875, 11.83740234375, 12.519775390625, 13.2021484375, 13.884521484375, 14.56689453125, 15.249267578125, 15.931640625, 16.614013671875, 17.29638671875, 17.978759765625, 18.6611328125, 19.343505859375, 20.02587890625, 20.708251953125, 21.390625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 9.0, 11.0, 7.0, 22.0, 19.0, 26.0, 31.0, 41.0, 59.0, 86.0, 88.0, 153.0, 250.0, 613.0, 1774.0, 51288.0, 4103532.0, 33340.0, 1593.0, 540.0, 265.0, 157.0, 89.0, 66.0, 50.0, 33.0, 27.0, 24.0, 18.0, 19.0, 5.0, 12.0, 10.0, 5.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.5, -68.896484375, -66.29296875, -63.689453125, -61.0859375, -58.482421875, -55.87890625, -53.275390625, -50.671875, -48.068359375, -45.46484375, -42.861328125, -40.2578125, -37.654296875, -35.05078125, -32.447265625, -29.84375, -27.240234375, -24.63671875, -22.033203125, -19.4296875, -16.826171875, -14.22265625, -11.619140625, -9.015625, -6.412109375, -3.80859375, -1.205078125, 1.3984375, 4.001953125, 6.60546875, 9.208984375, 11.8125, 14.416015625, 17.01953125, 19.623046875, 22.2265625, 24.830078125, 27.43359375, 30.037109375, 32.640625, 35.244140625, 37.84765625, 40.451171875, 43.0546875, 45.658203125, 48.26171875, 50.865234375, 53.46875, 56.072265625, 58.67578125, 61.279296875, 63.8828125, 66.486328125, 69.08984375, 71.693359375, 74.296875, 76.900390625, 79.50390625, 82.107421875, 84.7109375, 87.314453125, 89.91796875, 92.521484375, 95.125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 10.0, 14.0, 49.0, 112.0, 201.0, 239.0, 197.0, 106.0, 59.0, 23.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.20028686523438, -111.45030975341797, -106.70032501220703, -101.95034790039062, -97.20036315917969, -92.45038604736328, -87.70040893554688, -82.95042419433594, -78.20044708251953, -73.45046997070312, -68.70048522949219, -63.95050811767578, -59.20052719116211, -54.45054626464844, -49.70056915283203, -44.95058822631836, -40.20060729980469, -35.450626373291016, -30.700647354125977, -25.950668334960938, -21.200687408447266, -16.450706481933594, -11.700727462768555, -6.950748443603516, -2.2007675170898438, 2.5492124557495117, 7.299192428588867, 12.049172401428223, 16.799152374267578, 21.54913330078125, 26.29911231994629, 31.049091339111328, 35.79905700683594, 40.54903793334961, 45.29901885986328, 50.04899597167969, 54.79897689819336, 59.54895782470703, 64.29893493652344, 69.04891967773438, 73.79889678955078, 78.54887390136719, 83.29885864257812, 88.04883575439453, 92.79881286621094, 97.54879760742188, 102.29877471923828, 107.04875183105469, 111.79873657226562, 116.54871368408203, 121.29869842529297, 126.04867553710938, 130.7986602783203, 135.54864501953125, 140.29861450195312, 145.04859924316406, 149.798583984375, 154.54856872558594, 159.2985382080078, 164.04852294921875, 168.7985076904297, 173.54849243164062, 178.2984619140625, 183.04844665527344, 187.7984161376953]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 6.0, 8.0, 1.0, 10.0, 9.0, 14.0, 16.0, 25.0, 22.0, 18.0, 32.0, 30.0, 28.0, 37.0, 50.0, 40.0, 29.0, 40.0, 33.0, 50.0, 32.0, 38.0, 39.0, 36.0, 46.0, 41.0, 36.0, 26.0, 33.0, 20.0, 22.0, 25.0, 22.0, 12.0, 10.0, 10.0, 9.0, 10.0, 9.0, 6.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-60.53215026855469, -58.83130645751953, -57.13045883178711, -55.42961502075195, -53.72876739501953, -52.027923583984375, -50.32707977294922, -48.6262321472168, -46.925384521484375, -45.22454071044922, -43.5236930847168, -41.82284927368164, -40.12200164794922, -38.42115783691406, -36.720314025878906, -35.019466400146484, -33.31862258911133, -31.61777687072754, -29.91693115234375, -28.216087341308594, -26.515239715576172, -24.814395904541016, -23.113550186157227, -21.412704467773438, -19.71185874938965, -18.01101303100586, -16.31016731262207, -14.609322547912598, -12.908476829528809, -11.20763111114502, -9.506786346435547, -7.805940628051758, -6.105094909667969, -4.40424919128418, -2.703403949737549, -1.002558708190918, 0.6982870101928711, 2.39913272857666, 4.099977493286133, 5.800823211669922, 7.501668930053711, 9.2025146484375, 10.903360366821289, 12.604205131530762, 14.30505084991455, 16.005897521972656, 17.706741333007812, 19.4075870513916, 21.10843276977539, 22.80927848815918, 24.51012420654297, 26.210968017578125, 27.911815643310547, 29.612659454345703, 31.313505172729492, 33.01435089111328, 34.71519470214844, 36.416038513183594, 38.116886138916016, 39.81772994995117, 41.518577575683594, 43.21942138671875, 44.920265197753906, 46.62111282348633, 48.32196044921875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 12.0, 15.0, 16.0, 18.0, 30.0, 17.0, 24.0, 31.0, 33.0, 33.0, 50.0, 51.0, 46.0, 45.0, 42.0, 49.0, 42.0, 51.0, 36.0, 44.0, 45.0, 29.0, 28.0, 23.0, 27.0, 28.0, 22.0, 21.0, 11.0, 12.0, 8.0, 9.0, 6.0, 6.0, 1.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.82666015625, -8.5517578125, -8.27685546875, -8.001953125, -7.72705078125, -7.4521484375, -7.17724609375, -6.90234375, -6.62744140625, -6.3525390625, -6.07763671875, -5.802734375, -5.52783203125, -5.2529296875, -4.97802734375, -4.703125, -4.42822265625, -4.1533203125, -3.87841796875, -3.603515625, -3.32861328125, -3.0537109375, -2.77880859375, -2.50390625, -2.22900390625, -1.9541015625, -1.67919921875, -1.404296875, -1.12939453125, -0.8544921875, -0.57958984375, -0.3046875, -0.02978515625, 0.2451171875, 0.52001953125, 0.794921875, 1.06982421875, 1.3447265625, 1.61962890625, 1.89453125, 2.16943359375, 2.4443359375, 2.71923828125, 2.994140625, 3.26904296875, 3.5439453125, 3.81884765625, 4.09375, 4.36865234375, 4.6435546875, 4.91845703125, 5.193359375, 5.46826171875, 5.7431640625, 6.01806640625, 6.29296875, 6.56787109375, 6.8427734375, 7.11767578125, 7.392578125, 7.66748046875, 7.9423828125, 8.21728515625, 8.4921875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 7.0, 4.0, 11.0, 17.0, 35.0, 18.0, 54.0, 59.0, 123.0, 151.0, 241.0, 270.0, 430.0, 599.0, 936.0, 1304.0, 1851.0, 2824.0, 4222.0, 6166.0, 9151.0, 13940.0, 21420.0, 33268.0, 54226.0, 95795.0, 199928.0, 301358.0, 120694.0, 66041.0, 39244.0, 25071.0, 16212.0, 10742.0, 7005.0, 4874.0, 3283.0, 2161.0, 1474.0, 1036.0, 704.0, 463.0, 356.0, 232.0, 190.0, 128.0, 88.0, 51.0, 41.0, 17.0, 17.0, 15.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.59765625, -1.546417236328125, -1.49517822265625, -1.443939208984375, -1.3927001953125, -1.341461181640625, -1.29022216796875, -1.238983154296875, -1.187744140625, -1.136505126953125, -1.08526611328125, -1.034027099609375, -0.9827880859375, -0.931549072265625, -0.88031005859375, -0.829071044921875, -0.77783203125, -0.726593017578125, -0.67535400390625, -0.624114990234375, -0.5728759765625, -0.521636962890625, -0.47039794921875, -0.419158935546875, -0.367919921875, -0.316680908203125, -0.26544189453125, -0.214202880859375, -0.1629638671875, -0.111724853515625, -0.06048583984375, -0.009246826171875, 0.0419921875, 0.093231201171875, 0.14447021484375, 0.195709228515625, 0.2469482421875, 0.298187255859375, 0.34942626953125, 0.400665283203125, 0.451904296875, 0.503143310546875, 0.55438232421875, 0.605621337890625, 0.6568603515625, 0.708099365234375, 0.75933837890625, 0.810577392578125, 0.86181640625, 0.913055419921875, 0.96429443359375, 1.015533447265625, 1.0667724609375, 1.118011474609375, 1.16925048828125, 1.220489501953125, 1.271728515625, 1.322967529296875, 1.37420654296875, 1.425445556640625, 1.4766845703125, 1.527923583984375, 1.57916259765625, 1.630401611328125, 1.681640625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 6.0, 5.0, 6.0, 9.0, 7.0, 12.0, 11.0, 15.0, 17.0, 18.0, 21.0, 16.0, 20.0, 21.0, 22.0, 28.0, 33.0, 30.0, 41.0, 33.0, 40.0, 34.0, 47.0, 1068.0, 45.0, 36.0, 30.0, 46.0, 40.0, 23.0, 26.0, 31.0, 29.0, 25.0, 20.0, 20.0, 15.0, 10.0, 16.0, 7.0, 8.0, 11.0, 6.0, 5.0, 13.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.81640625, -4.6676025390625, -4.518798828125, -4.3699951171875, -4.22119140625, -4.0723876953125, -3.923583984375, -3.7747802734375, -3.6259765625, -3.4771728515625, -3.328369140625, -3.1795654296875, -3.03076171875, -2.8819580078125, -2.733154296875, -2.5843505859375, -2.435546875, -2.2867431640625, -2.137939453125, -1.9891357421875, -1.84033203125, -1.6915283203125, -1.542724609375, -1.3939208984375, -1.2451171875, -1.0963134765625, -0.947509765625, -0.7987060546875, -0.64990234375, -0.5010986328125, -0.352294921875, -0.2034912109375, -0.0546875, 0.0941162109375, 0.242919921875, 0.3917236328125, 0.54052734375, 0.6893310546875, 0.838134765625, 0.9869384765625, 1.1357421875, 1.2845458984375, 1.433349609375, 1.5821533203125, 1.73095703125, 1.8797607421875, 2.028564453125, 2.1773681640625, 2.326171875, 2.4749755859375, 2.623779296875, 2.7725830078125, 2.92138671875, 3.0701904296875, 3.218994140625, 3.3677978515625, 3.5166015625, 3.6654052734375, 3.814208984375, 3.9630126953125, 4.11181640625, 4.2606201171875, 4.409423828125, 4.5582275390625, 4.70703125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 15.0, 14.0, 24.0, 37.0, 67.0, 89.0, 146.0, 238.0, 356.0, 553.0, 932.0, 1372.0, 2047.0, 3187.0, 4883.0, 7448.0, 11632.0, 17934.0, 28411.0, 46984.0, 81636.0, 166082.0, 1406982.0, 133579.0, 70184.0, 40540.0, 25594.0, 16101.0, 10361.0, 6752.0, 4574.0, 2955.0, 1932.0, 1278.0, 784.0, 508.0, 336.0, 207.0, 136.0, 87.0, 55.0, 36.0, 20.0, 17.0, 8.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.69140625, -1.63916015625, -1.5869140625, -1.53466796875, -1.482421875, -1.43017578125, -1.3779296875, -1.32568359375, -1.2734375, -1.22119140625, -1.1689453125, -1.11669921875, -1.064453125, -1.01220703125, -0.9599609375, -0.90771484375, -0.85546875, -0.80322265625, -0.7509765625, -0.69873046875, -0.646484375, -0.59423828125, -0.5419921875, -0.48974609375, -0.4375, -0.38525390625, -0.3330078125, -0.28076171875, -0.228515625, -0.17626953125, -0.1240234375, -0.07177734375, -0.01953125, 0.03271484375, 0.0849609375, 0.13720703125, 0.189453125, 0.24169921875, 0.2939453125, 0.34619140625, 0.3984375, 0.45068359375, 0.5029296875, 0.55517578125, 0.607421875, 0.65966796875, 0.7119140625, 0.76416015625, 0.81640625, 0.86865234375, 0.9208984375, 0.97314453125, 1.025390625, 1.07763671875, 1.1298828125, 1.18212890625, 1.234375, 1.28662109375, 1.3388671875, 1.39111328125, 1.443359375, 1.49560546875, 1.5478515625, 1.60009765625, 1.65234375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 4.0, 8.0, 6.0, 8.0, 9.0, 12.0, 11.0, 16.0, 23.0, 28.0, 29.0, 41.0, 62.0, 90.0, 104.0, 118.0, 93.0, 78.0, 62.0, 32.0, 41.0, 27.0, 22.0, 21.0, 7.0, 8.0, 9.0, 15.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011453628540039062, -0.0011076927185058594, -0.0010700225830078125, -0.0010323524475097656, -0.0009946823120117188, -0.0009570121765136719, -0.000919342041015625, -0.0008816719055175781, -0.0008440017700195312, -0.0008063316345214844, -0.0007686614990234375, -0.0007309913635253906, -0.0006933212280273438, -0.0006556510925292969, -0.00061798095703125, -0.0005803108215332031, -0.0005426406860351562, -0.0005049705505371094, -0.0004673004150390625, -0.0004296302795410156, -0.00039196014404296875, -0.0003542900085449219, -0.000316619873046875, -0.0002789497375488281, -0.00024127960205078125, -0.00020360946655273438, -0.0001659393310546875, -0.00012826919555664062, -9.059906005859375e-05, -5.2928924560546875e-05, -1.52587890625e-05, 2.2411346435546875e-05, 6.008148193359375e-05, 9.775161743164062e-05, 0.0001354217529296875, 0.00017309188842773438, 0.00021076202392578125, 0.0002484321594238281, 0.000286102294921875, 0.0003237724304199219, 0.00036144256591796875, 0.0003991127014160156, 0.0004367828369140625, 0.0004744529724121094, 0.0005121231079101562, 0.0005497932434082031, 0.00058746337890625, 0.0006251335144042969, 0.0006628036499023438, 0.0007004737854003906, 0.0007381439208984375, 0.0007758140563964844, 0.0008134841918945312, 0.0008511543273925781, 0.000888824462890625, 0.0009264945983886719, 0.0009641647338867188, 0.0010018348693847656, 0.0010395050048828125, 0.0010771751403808594, 0.0011148452758789062, 0.0011525154113769531, 0.001190185546875, 0.0012278556823730469, 0.0012655258178710938]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 5.0, 7.0, 8.0, 8.0, 10.0, 19.0, 11.0, 31.0, 36.0, 62.0, 64.0, 116.0, 262.0, 758.0, 89305.0, 955851.0, 1241.0, 301.0, 146.0, 89.0, 55.0, 30.0, 20.0, 20.0, 19.0, 5.0, 15.0, 12.0, 8.0, 5.0, 10.0, 5.0, 4.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0263824462890625, -0.025586366653442383, -0.024790287017822266, -0.02399420738220215, -0.02319812774658203, -0.022402048110961914, -0.021605968475341797, -0.02080988883972168, -0.020013809204101562, -0.019217729568481445, -0.018421649932861328, -0.01762557029724121, -0.016829490661621094, -0.016033411026000977, -0.01523733139038086, -0.014441251754760742, -0.013645172119140625, -0.012849092483520508, -0.01205301284790039, -0.011256933212280273, -0.010460853576660156, -0.009664773941040039, -0.008868694305419922, -0.008072614669799805, -0.0072765350341796875, -0.00648045539855957, -0.005684375762939453, -0.004888296127319336, -0.004092216491699219, -0.0032961368560791016, -0.0025000572204589844, -0.0017039775848388672, -0.00090789794921875, -0.00011181831359863281, 0.0006842613220214844, 0.0014803409576416016, 0.0022764205932617188, 0.003072500228881836, 0.003868579864501953, 0.00466465950012207, 0.0054607391357421875, 0.006256818771362305, 0.007052898406982422, 0.007848978042602539, 0.008645057678222656, 0.009441137313842773, 0.01023721694946289, 0.011033296585083008, 0.011829376220703125, 0.012625455856323242, 0.01342153549194336, 0.014217615127563477, 0.015013694763183594, 0.01580977439880371, 0.016605854034423828, 0.017401933670043945, 0.018198013305664062, 0.01899409294128418, 0.019790172576904297, 0.020586252212524414, 0.02138233184814453, 0.02217841148376465, 0.022974491119384766, 0.023770570755004883, 0.024566650390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 24.0, 146.0, 461.0, 313.0, 60.0, 11.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.003901917487382889, -0.0038279974833130836, -0.003754077712073922, -0.003680157708004117, -0.0036062379367649555, -0.0035323179326951504, -0.003458398161455989, -0.0033844781573861837, -0.0033105583861470222, -0.003236638382077217, -0.0031627186108380556, -0.0030887986067682505, -0.003014878835529089, -0.002940958831459284, -0.0028670390602201223, -0.002793119056150317, -0.0027191992849111557, -0.0026452792808413506, -0.002571359509602189, -0.002497439505532384, -0.0024235197342932224, -0.0023495997302234173, -0.002275679958984256, -0.0022017599549144506, -0.0021278399508446455, -0.0020539199467748404, -0.001980000175535679, -0.0019060802878811955, -0.0018321604002267122, -0.001758240512572229, -0.0016843206249177456, -0.0016104006208479404, -0.001536480849608779, -0.0014625609619542956, -0.0013886410742998123, -0.001314721186645329, -0.0012408012989908457, -0.0011668814113363624, -0.001092961523681879, -0.001019041519612074, -0.0009451216319575906, -0.0008712017443031073, -0.0007972818566486239, -0.0007233619689941406, -0.0006494420813396573, -0.000575522193685174, -0.0005016022478230298, -0.00042768236016854644, -0.0003537624725140631, -0.0002798425848595798, -0.00020592268265318125, -0.0001320027804467827, -5.808289279229939e-05, 1.583699486218393e-05, 8.97569116204977e-05, 0.00016367679927498102, 0.00023759668692946434, 0.00031151657458394766, 0.000385436462238431, 0.00045935637899674475, 0.0005332762375473976, 0.0006071961252018809, 0.0006811160710640252, 0.0007550359587185085, 0.0008289558463729918]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 2.0, 7.0, 5.0, 5.0, 9.0, 9.0, 9.0, 14.0, 11.0, 23.0, 13.0, 23.0, 20.0, 24.0, 23.0, 28.0, 32.0, 35.0, 34.0, 46.0, 32.0, 27.0, 36.0, 29.0, 32.0, 37.0, 40.0, 32.0, 33.0, 42.0, 35.0, 32.0, 25.0, 20.0, 24.0, 28.0, 19.0, 13.0, 12.0, 10.0, 13.0, 13.0, 13.0, 15.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004456043243408203, -0.0004318896681070328, -0.00041817501187324524, -0.0004044603556394577, -0.00039074569940567017, -0.00037703104317188263, -0.0003633163869380951, -0.00034960173070430756, -0.00033588707447052, -0.0003221724182367325, -0.00030845776200294495, -0.0002947431057691574, -0.0002810284495353699, -0.00026731379330158234, -0.0002535991370677948, -0.00023988448083400726, -0.00022616982460021973, -0.0002124551683664322, -0.00019874051213264465, -0.00018502585589885712, -0.00017131119966506958, -0.00015759654343128204, -0.0001438818871974945, -0.00013016723096370697, -0.00011645257472991943, -0.0001027379184961319, -8.902326226234436e-05, -7.530860602855682e-05, -6.159394979476929e-05, -4.787929356098175e-05, -3.4164637327194214e-05, -2.0449981093406677e-05, -6.735324859619141e-06, 6.979331374168396e-06, 2.0693987607955933e-05, 3.440864384174347e-05, 4.8123300075531006e-05, 6.183795630931854e-05, 7.555261254310608e-05, 8.926726877689362e-05, 0.00010298192501068115, 0.00011669658124446869, 0.00013041123747825623, 0.00014412589371204376, 0.0001578405499458313, 0.00017155520617961884, 0.00018526986241340637, 0.0001989845186471939, 0.00021269917488098145, 0.00022641383111476898, 0.00024012848734855652, 0.00025384314358234406, 0.0002675577998161316, 0.00028127245604991913, 0.00029498711228370667, 0.0003087017685174942, 0.00032241642475128174, 0.0003361310809850693, 0.0003498457372188568, 0.00036356039345264435, 0.0003772750496864319, 0.0003909897059202194, 0.00040470436215400696, 0.0004184190183877945, 0.00043213367462158203]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 12.0, 15.0, 16.0, 18.0, 30.0, 17.0, 24.0, 31.0, 33.0, 33.0, 50.0, 51.0, 46.0, 45.0, 42.0, 49.0, 42.0, 51.0, 36.0, 44.0, 45.0, 29.0, 28.0, 23.0, 27.0, 28.0, 22.0, 21.0, 11.0, 12.0, 8.0, 9.0, 6.0, 6.0, 1.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.82666015625, -8.5517578125, -8.27685546875, -8.001953125, -7.72705078125, -7.4521484375, -7.17724609375, -6.90234375, -6.62744140625, -6.3525390625, -6.07763671875, -5.802734375, -5.52783203125, -5.2529296875, -4.97802734375, -4.703125, -4.42822265625, -4.1533203125, -3.87841796875, -3.603515625, -3.32861328125, -3.0537109375, -2.77880859375, -2.50390625, -2.22900390625, -1.9541015625, -1.67919921875, -1.404296875, -1.12939453125, -0.8544921875, -0.57958984375, -0.3046875, -0.02978515625, 0.2451171875, 0.52001953125, 0.794921875, 1.06982421875, 1.3447265625, 1.61962890625, 1.89453125, 2.16943359375, 2.4443359375, 2.71923828125, 2.994140625, 3.26904296875, 3.5439453125, 3.81884765625, 4.09375, 4.36865234375, 4.6435546875, 4.91845703125, 5.193359375, 5.46826171875, 5.7431640625, 6.01806640625, 6.29296875, 6.56787109375, 6.8427734375, 7.11767578125, 7.392578125, 7.66748046875, 7.9423828125, 8.21728515625, 8.4921875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 14.0, 18.0, 21.0, 25.0, 38.0, 46.0, 54.0, 84.0, 111.0, 142.0, 197.0, 279.0, 409.0, 603.0, 952.0, 1648.0, 3275.0, 6843.0, 16496.0, 48316.0, 191344.0, 563776.0, 146884.0, 39644.0, 14140.0, 6004.0, 2734.0, 1587.0, 918.0, 593.0, 384.0, 253.0, 188.0, 116.0, 105.0, 76.0, 40.0, 40.0, 25.0, 29.0, 20.0, 21.0, 13.0, 11.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.7520751953125, -7.488525390625, -7.2249755859375, -6.96142578125, -6.6978759765625, -6.434326171875, -6.1707763671875, -5.9072265625, -5.6436767578125, -5.380126953125, -5.1165771484375, -4.85302734375, -4.5894775390625, -4.325927734375, -4.0623779296875, -3.798828125, -3.5352783203125, -3.271728515625, -3.0081787109375, -2.74462890625, -2.4810791015625, -2.217529296875, -1.9539794921875, -1.6904296875, -1.4268798828125, -1.163330078125, -0.8997802734375, -0.63623046875, -0.3726806640625, -0.109130859375, 0.1544189453125, 0.41796875, 0.6815185546875, 0.945068359375, 1.2086181640625, 1.47216796875, 1.7357177734375, 1.999267578125, 2.2628173828125, 2.5263671875, 2.7899169921875, 3.053466796875, 3.3170166015625, 3.58056640625, 3.8441162109375, 4.107666015625, 4.3712158203125, 4.634765625, 4.8983154296875, 5.161865234375, 5.4254150390625, 5.68896484375, 5.9525146484375, 6.216064453125, 6.4796142578125, 6.7431640625, 7.0067138671875, 7.270263671875, 7.5338134765625, 7.79736328125, 8.0609130859375, 8.324462890625, 8.5880126953125, 8.8515625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 11.0, 12.0, 19.0, 13.0, 14.0, 23.0, 24.0, 25.0, 32.0, 23.0, 35.0, 37.0, 36.0, 56.0, 53.0, 102.0, 321.0, 1590.0, 129.0, 57.0, 53.0, 43.0, 49.0, 34.0, 34.0, 33.0, 30.0, 27.0, 26.0, 14.0, 15.0, 16.0, 11.0, 8.0, 7.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.484375, -26.631103515625, -25.77783203125, -24.924560546875, -24.0712890625, -23.218017578125, -22.36474609375, -21.511474609375, -20.658203125, -19.804931640625, -18.95166015625, -18.098388671875, -17.2451171875, -16.391845703125, -15.53857421875, -14.685302734375, -13.83203125, -12.978759765625, -12.12548828125, -11.272216796875, -10.4189453125, -9.565673828125, -8.71240234375, -7.859130859375, -7.005859375, -6.152587890625, -5.29931640625, -4.446044921875, -3.5927734375, -2.739501953125, -1.88623046875, -1.032958984375, -0.1796875, 0.673583984375, 1.52685546875, 2.380126953125, 3.2333984375, 4.086669921875, 4.93994140625, 5.793212890625, 6.646484375, 7.499755859375, 8.35302734375, 9.206298828125, 10.0595703125, 10.912841796875, 11.76611328125, 12.619384765625, 13.47265625, 14.325927734375, 15.17919921875, 16.032470703125, 16.8857421875, 17.739013671875, 18.59228515625, 19.445556640625, 20.298828125, 21.152099609375, 22.00537109375, 22.858642578125, 23.7119140625, 24.565185546875, 25.41845703125, 26.271728515625, 27.125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 18.0, 23.0, 33.0, 52.0, 70.0, 98.0, 137.0, 212.0, 394.0, 924.0, 14797.0, 3116991.0, 10101.0, 836.0, 374.0, 218.0, 130.0, 69.0, 72.0, 36.0, 40.0, 17.0, 12.0, 10.0, 10.0, 3.0, 5.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.5, -98.466796875, -95.43359375, -92.400390625, -89.3671875, -86.333984375, -83.30078125, -80.267578125, -77.234375, -74.201171875, -71.16796875, -68.134765625, -65.1015625, -62.068359375, -59.03515625, -56.001953125, -52.96875, -49.935546875, -46.90234375, -43.869140625, -40.8359375, -37.802734375, -34.76953125, -31.736328125, -28.703125, -25.669921875, -22.63671875, -19.603515625, -16.5703125, -13.537109375, -10.50390625, -7.470703125, -4.4375, -1.404296875, 1.62890625, 4.662109375, 7.6953125, 10.728515625, 13.76171875, 16.794921875, 19.828125, 22.861328125, 25.89453125, 28.927734375, 31.9609375, 34.994140625, 38.02734375, 41.060546875, 44.09375, 47.126953125, 50.16015625, 53.193359375, 56.2265625, 59.259765625, 62.29296875, 65.326171875, 68.359375, 71.392578125, 74.42578125, 77.458984375, 80.4921875, 83.525390625, 86.55859375, 89.591796875, 92.625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 4.0, 844.0, 169.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.942787170410156, -38.25898742675781, -17.575191497802734, 3.1086044311523438, 23.792404174804688, 44.47620391845703, 65.15999603271484, 85.84380340576172, 106.52759552001953, 127.21139526367188, 147.8951873779297, 168.5789794921875, 189.26278686523438, 209.94659423828125, 230.63037109375, 251.31417846679688, 271.99798583984375, 292.6817932128906, 313.3655700683594, 334.04937744140625, 354.7331848144531, 375.4169921875, 396.10076904296875, 416.7845764160156, 437.4683532714844, 458.15216064453125, 478.8359375, 499.5197448730469, 520.2035522460938, 540.8873291015625, 561.5711669921875, 582.2549438476562, 602.9387817382812, 623.62255859375, 644.306396484375, 664.9901733398438, 685.6739501953125, 706.3577880859375, 727.0415649414062, 747.725341796875, 768.4091796875, 789.0929565429688, 809.7767944335938, 830.4605712890625, 851.1443481445312, 871.8281860351562, 892.511962890625, 913.19580078125, 933.8795166015625, 954.5632934570312, 975.2471313476562, 995.930908203125, 1016.6146850585938, 1037.2984619140625, 1057.9822998046875, 1078.6661376953125, 1099.3499755859375, 1120.0338134765625, 1140.717529296875, 1161.4013671875, 1182.085205078125, 1202.7689208984375, 1223.4527587890625, 1244.1365966796875, 1264.8203125]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 8.0, 3.0, 5.0, 3.0, 6.0, 11.0, 13.0, 12.0, 13.0, 11.0, 24.0, 22.0, 23.0, 21.0, 29.0, 22.0, 35.0, 34.0, 41.0, 28.0, 33.0, 33.0, 43.0, 38.0, 34.0, 50.0, 35.0, 27.0, 42.0, 25.0, 33.0, 34.0, 25.0, 23.0, 23.0, 19.0, 14.0, 18.0, 21.0, 11.0, 13.0, 8.0, 11.0, 9.0, 10.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-73.85661315917969, -71.62713623046875, -69.39766693115234, -67.1681900024414, -64.938720703125, -62.70924377441406, -60.47977066040039, -58.25029754638672, -56.02082443237305, -53.791351318359375, -51.5618782043457, -49.33240509033203, -47.102928161621094, -44.87345886230469, -42.64398193359375, -40.41450881958008, -38.185035705566406, -35.955562591552734, -33.72608947753906, -31.496614456176758, -29.267141342163086, -27.037668228149414, -24.80819320678711, -22.578720092773438, -20.349246978759766, -18.119773864746094, -15.890299797058105, -13.660825729370117, -11.431352615356445, -9.201879501342773, -6.972405433654785, -4.742931365966797, -2.513458251953125, -0.2839846611022949, 1.9454889297485352, 4.174962520599365, 6.404436111450195, 8.633909225463867, 10.863383293151855, 13.092857360839844, 15.322330474853516, 17.551803588867188, 19.78127670288086, 22.010751724243164, 24.240224838256836, 26.469697952270508, 28.699172973632812, 30.928646087646484, 33.158119201660156, 35.38759231567383, 37.6170654296875, 39.84653854370117, 42.076011657714844, 44.30548858642578, 46.53496170043945, 48.764434814453125, 50.9939079284668, 53.22338104248047, 55.45285415649414, 57.68232727050781, 59.91180419921875, 62.141273498535156, 64.3707504272461, 66.6002197265625, 68.82969665527344]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 10.0, 9.0, 12.0, 18.0, 21.0, 12.0, 26.0, 29.0, 27.0, 35.0, 31.0, 34.0, 43.0, 44.0, 37.0, 40.0, 55.0, 45.0, 50.0, 39.0, 30.0, 35.0, 45.0, 44.0, 35.0, 20.0, 15.0, 26.0, 23.0, 14.0, 11.0, 14.0, 23.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.6640625, -9.378662109375, -9.09326171875, -8.807861328125, -8.5224609375, -8.237060546875, -7.95166015625, -7.666259765625, -7.380859375, -7.095458984375, -6.81005859375, -6.524658203125, -6.2392578125, -5.953857421875, -5.66845703125, -5.383056640625, -5.09765625, -4.812255859375, -4.52685546875, -4.241455078125, -3.9560546875, -3.670654296875, -3.38525390625, -3.099853515625, -2.814453125, -2.529052734375, -2.24365234375, -1.958251953125, -1.6728515625, -1.387451171875, -1.10205078125, -0.816650390625, -0.53125, -0.245849609375, 0.03955078125, 0.324951171875, 0.6103515625, 0.895751953125, 1.18115234375, 1.466552734375, 1.751953125, 2.037353515625, 2.32275390625, 2.608154296875, 2.8935546875, 3.178955078125, 3.46435546875, 3.749755859375, 4.03515625, 4.320556640625, 4.60595703125, 4.891357421875, 5.1767578125, 5.462158203125, 5.74755859375, 6.032958984375, 6.318359375, 6.603759765625, 6.88916015625, 7.174560546875, 7.4599609375, 7.745361328125, 8.03076171875, 8.316162109375, 8.6015625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 4.0, 8.0, 8.0, 10.0, 13.0, 20.0, 21.0, 19.0, 20.0, 27.0, 14.0, 36.0, 42.0, 62.0, 131.0, 398.0, 1856.0, 14284.0, 609306.0, 3428000.0, 132196.0, 6167.0, 989.0, 266.0, 86.0, 47.0, 37.0, 34.0, 28.0, 12.0, 23.0, 19.0, 15.0, 13.0, 12.0, 14.0, 11.0, 8.0, 3.0, 7.0, 0.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.4375, -33.404296875, -32.37109375, -31.337890625, -30.3046875, -29.271484375, -28.23828125, -27.205078125, -26.171875, -25.138671875, -24.10546875, -23.072265625, -22.0390625, -21.005859375, -19.97265625, -18.939453125, -17.90625, -16.873046875, -15.83984375, -14.806640625, -13.7734375, -12.740234375, -11.70703125, -10.673828125, -9.640625, -8.607421875, -7.57421875, -6.541015625, -5.5078125, -4.474609375, -3.44140625, -2.408203125, -1.375, -0.341796875, 0.69140625, 1.724609375, 2.7578125, 3.791015625, 4.82421875, 5.857421875, 6.890625, 7.923828125, 8.95703125, 9.990234375, 11.0234375, 12.056640625, 13.08984375, 14.123046875, 15.15625, 16.189453125, 17.22265625, 18.255859375, 19.2890625, 20.322265625, 21.35546875, 22.388671875, 23.421875, 24.455078125, 25.48828125, 26.521484375, 27.5546875, 28.587890625, 29.62109375, 30.654296875, 31.6875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 8.0, 19.0, 17.0, 40.0, 42.0, 58.0, 80.0, 150.0, 208.0, 315.0, 438.0, 552.0, 598.0, 472.0, 325.0, 218.0, 166.0, 108.0, 76.0, 43.0, 39.0, 28.0, 23.0, 9.0, 7.0, 8.0, 7.0, 5.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8828125, -14.2381591796875, -13.593505859375, -12.9488525390625, -12.30419921875, -11.6595458984375, -11.014892578125, -10.3702392578125, -9.7255859375, -9.0809326171875, -8.436279296875, -7.7916259765625, -7.14697265625, -6.5023193359375, -5.857666015625, -5.2130126953125, -4.568359375, -3.9237060546875, -3.279052734375, -2.6343994140625, -1.98974609375, -1.3450927734375, -0.700439453125, -0.0557861328125, 0.5888671875, 1.2335205078125, 1.878173828125, 2.5228271484375, 3.16748046875, 3.8121337890625, 4.456787109375, 5.1014404296875, 5.74609375, 6.3907470703125, 7.035400390625, 7.6800537109375, 8.32470703125, 8.9693603515625, 9.614013671875, 10.2586669921875, 10.9033203125, 11.5479736328125, 12.192626953125, 12.8372802734375, 13.48193359375, 14.1265869140625, 14.771240234375, 15.4158935546875, 16.060546875, 16.7052001953125, 17.349853515625, 17.9945068359375, 18.63916015625, 19.2838134765625, 19.928466796875, 20.5731201171875, 21.2177734375, 21.8624267578125, 22.507080078125, 23.1517333984375, 23.79638671875, 24.4410400390625, 25.085693359375, 25.7303466796875, 26.375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 13.0, 28.0, 37.0, 52.0, 54.0, 64.0, 97.0, 127.0, 161.0, 226.0, 370.0, 744.0, 5992.0, 3396733.0, 784485.0, 3307.0, 655.0, 338.0, 204.0, 156.0, 113.0, 86.0, 52.0, 44.0, 32.0, 23.0, 19.0, 16.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.9375, -94.2373046875, -91.537109375, -88.8369140625, -86.13671875, -83.4365234375, -80.736328125, -78.0361328125, -75.3359375, -72.6357421875, -69.935546875, -67.2353515625, -64.53515625, -61.8349609375, -59.134765625, -56.4345703125, -53.734375, -51.0341796875, -48.333984375, -45.6337890625, -42.93359375, -40.2333984375, -37.533203125, -34.8330078125, -32.1328125, -29.4326171875, -26.732421875, -24.0322265625, -21.33203125, -18.6318359375, -15.931640625, -13.2314453125, -10.53125, -7.8310546875, -5.130859375, -2.4306640625, 0.26953125, 2.9697265625, 5.669921875, 8.3701171875, 11.0703125, 13.7705078125, 16.470703125, 19.1708984375, 21.87109375, 24.5712890625, 27.271484375, 29.9716796875, 32.671875, 35.3720703125, 38.072265625, 40.7724609375, 43.47265625, 46.1728515625, 48.873046875, 51.5732421875, 54.2734375, 56.9736328125, 59.673828125, 62.3740234375, 65.07421875, 67.7744140625, 70.474609375, 73.1748046875, 75.875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 49.0, 289.0, 485.0, 164.0, 23.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-274.226806640625, -264.1585388183594, -254.0902557373047, -244.02198791503906, -233.95370483398438, -223.88543701171875, -213.81716918945312, -203.74888610839844, -193.68060302734375, -183.61233520507812, -173.54405212402344, -163.4757843017578, -153.40750122070312, -143.3392333984375, -133.27096557617188, -123.20268249511719, -113.13441467285156, -103.0661392211914, -92.99786376953125, -82.92959594726562, -72.86131286621094, -62.79304122924805, -52.724769592285156, -42.656494140625, -32.588218688964844, -22.519943237304688, -12.451669692993164, -2.3833961486816406, 7.684879302978516, 17.753154754638672, 27.821426391601562, 37.88970184326172, 47.957977294921875, 58.02625274658203, 68.09452819824219, 78.16279602050781, 88.2310791015625, 98.29934692382812, 108.36762237548828, 118.43589782714844, 128.50418090820312, 138.57244873046875, 148.64073181152344, 158.70899963378906, 168.77728271484375, 178.84555053710938, 188.913818359375, 198.9821014404297, 209.0503692626953, 219.11863708496094, 229.18692016601562, 239.25518798828125, 249.32347106933594, 259.3917541503906, 269.46002197265625, 279.5282897949219, 289.5965576171875, 299.6648254394531, 309.73309326171875, 319.8013916015625, 329.8696594238281, 339.93792724609375, 350.0061950683594, 360.074462890625, 370.14276123046875]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 5.0, 12.0, 13.0, 8.0, 13.0, 12.0, 15.0, 28.0, 13.0, 19.0, 19.0, 34.0, 27.0, 37.0, 33.0, 26.0, 33.0, 38.0, 35.0, 53.0, 35.0, 42.0, 35.0, 39.0, 33.0, 35.0, 39.0, 42.0, 24.0, 24.0, 19.0, 19.0, 27.0, 11.0, 11.0, 20.0, 11.0, 5.0, 12.0, 7.0, 9.0, 4.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-61.08891296386719, -59.38489532470703, -57.680877685546875, -55.976863861083984, -54.27284622192383, -52.56882858276367, -50.86481475830078, -49.160797119140625, -47.45677947998047, -45.75276184082031, -44.048744201660156, -42.344730377197266, -40.64071273803711, -38.93669509887695, -37.23268127441406, -35.528663635253906, -33.82464599609375, -32.120628356933594, -30.41661262512207, -28.712596893310547, -27.00857925415039, -25.304561614990234, -23.60054588317871, -21.896530151367188, -20.19251251220703, -18.488494873046875, -16.78447914123535, -15.080462455749512, -13.376445770263672, -11.672429084777832, -9.968412399291992, -8.264395713806152, -6.5603790283203125, -4.856362342834473, -3.152345657348633, -1.448328971862793, 0.2556877136230469, 1.9597043991088867, 3.6637210845947266, 5.367737770080566, 7.071754455566406, 8.775771141052246, 10.479787826538086, 12.183804512023926, 13.887821197509766, 15.591837882995605, 17.295854568481445, 18.99987030029297, 20.703887939453125, 22.40790557861328, 24.111921310424805, 25.815937042236328, 27.519954681396484, 29.22397232055664, 30.927988052368164, 32.63200378417969, 34.336021423339844, 36.0400390625, 37.744056701660156, 39.44807052612305, 41.1520881652832, 42.85610580444336, 44.56011962890625, 46.264137268066406, 47.96815490722656]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 5.0, 0.0, 7.0, 4.0, 13.0, 9.0, 9.0, 18.0, 13.0, 19.0, 18.0, 20.0, 33.0, 37.0, 39.0, 42.0, 50.0, 46.0, 46.0, 54.0, 50.0, 45.0, 47.0, 48.0, 36.0, 34.0, 44.0, 34.0, 24.0, 24.0, 20.0, 16.0, 16.0, 14.0, 12.0, 19.0, 6.0, 8.0, 6.0, 8.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.52392578125, -8.2353515625, -7.94677734375, -7.658203125, -7.36962890625, -7.0810546875, -6.79248046875, -6.50390625, -6.21533203125, -5.9267578125, -5.63818359375, -5.349609375, -5.06103515625, -4.7724609375, -4.48388671875, -4.1953125, -3.90673828125, -3.6181640625, -3.32958984375, -3.041015625, -2.75244140625, -2.4638671875, -2.17529296875, -1.88671875, -1.59814453125, -1.3095703125, -1.02099609375, -0.732421875, -0.44384765625, -0.1552734375, 0.13330078125, 0.421875, 0.71044921875, 0.9990234375, 1.28759765625, 1.576171875, 1.86474609375, 2.1533203125, 2.44189453125, 2.73046875, 3.01904296875, 3.3076171875, 3.59619140625, 3.884765625, 4.17333984375, 4.4619140625, 4.75048828125, 5.0390625, 5.32763671875, 5.6162109375, 5.90478515625, 6.193359375, 6.48193359375, 6.7705078125, 7.05908203125, 7.34765625, 7.63623046875, 7.9248046875, 8.21337890625, 8.501953125, 8.79052734375, 9.0791015625, 9.36767578125, 9.65625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 11.0, 9.0, 28.0, 45.0, 61.0, 92.0, 111.0, 177.0, 242.0, 336.0, 560.0, 805.0, 1213.0, 1816.0, 2765.0, 4135.0, 6286.0, 9546.0, 15314.0, 25197.0, 42915.0, 78453.0, 167070.0, 376962.0, 142720.0, 69681.0, 38506.0, 22874.0, 14177.0, 8991.0, 5916.0, 3776.0, 2530.0, 1741.0, 1150.0, 782.0, 521.0, 381.0, 231.0, 159.0, 94.0, 59.0, 33.0, 22.0, 19.0, 16.0, 9.0, 10.0, 8.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.03515625, -1.9742431640625, -1.913330078125, -1.8524169921875, -1.79150390625, -1.7305908203125, -1.669677734375, -1.6087646484375, -1.5478515625, -1.4869384765625, -1.426025390625, -1.3651123046875, -1.30419921875, -1.2432861328125, -1.182373046875, -1.1214599609375, -1.060546875, -0.9996337890625, -0.938720703125, -0.8778076171875, -0.81689453125, -0.7559814453125, -0.695068359375, -0.6341552734375, -0.5732421875, -0.5123291015625, -0.451416015625, -0.3905029296875, -0.32958984375, -0.2686767578125, -0.207763671875, -0.1468505859375, -0.0859375, -0.0250244140625, 0.035888671875, 0.0968017578125, 0.15771484375, 0.2186279296875, 0.279541015625, 0.3404541015625, 0.4013671875, 0.4622802734375, 0.523193359375, 0.5841064453125, 0.64501953125, 0.7059326171875, 0.766845703125, 0.8277587890625, 0.888671875, 0.9495849609375, 1.010498046875, 1.0714111328125, 1.13232421875, 1.1932373046875, 1.254150390625, 1.3150634765625, 1.3759765625, 1.4368896484375, 1.497802734375, 1.5587158203125, 1.61962890625, 1.6805419921875, 1.741455078125, 1.8023681640625, 1.86328125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 6.0, 8.0, 4.0, 14.0, 12.0, 7.0, 19.0, 15.0, 24.0, 17.0, 24.0, 30.0, 35.0, 34.0, 38.0, 37.0, 36.0, 44.0, 47.0, 1065.0, 30.0, 45.0, 39.0, 48.0, 36.0, 38.0, 27.0, 34.0, 33.0, 26.0, 19.0, 27.0, 14.0, 20.0, 17.0, 19.0, 8.0, 9.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.00390625, -4.83563232421875, -4.6673583984375, -4.49908447265625, -4.330810546875, -4.16253662109375, -3.9942626953125, -3.82598876953125, -3.65771484375, -3.48944091796875, -3.3211669921875, -3.15289306640625, -2.984619140625, -2.81634521484375, -2.6480712890625, -2.47979736328125, -2.3115234375, -2.14324951171875, -1.9749755859375, -1.80670166015625, -1.638427734375, -1.47015380859375, -1.3018798828125, -1.13360595703125, -0.96533203125, -0.79705810546875, -0.6287841796875, -0.46051025390625, -0.292236328125, -0.12396240234375, 0.0443115234375, 0.21258544921875, 0.380859375, 0.54913330078125, 0.7174072265625, 0.88568115234375, 1.053955078125, 1.22222900390625, 1.3905029296875, 1.55877685546875, 1.72705078125, 1.89532470703125, 2.0635986328125, 2.23187255859375, 2.400146484375, 2.56842041015625, 2.7366943359375, 2.90496826171875, 3.0732421875, 3.24151611328125, 3.4097900390625, 3.57806396484375, 3.746337890625, 3.91461181640625, 4.0828857421875, 4.25115966796875, 4.41943359375, 4.58770751953125, 4.7559814453125, 4.92425537109375, 5.092529296875, 5.26080322265625, 5.4290771484375, 5.59735107421875, 5.765625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 12.0, 14.0, 26.0, 28.0, 50.0, 81.0, 144.0, 175.0, 340.0, 498.0, 807.0, 1291.0, 2028.0, 3420.0, 5425.0, 8632.0, 14000.0, 23124.0, 38961.0, 66941.0, 130271.0, 1397237.0, 192089.0, 88660.0, 48924.0, 28814.0, 17128.0, 10573.0, 6552.0, 4102.0, 2537.0, 1608.0, 954.0, 622.0, 389.0, 226.0, 172.0, 109.0, 58.0, 46.0, 19.0, 20.0, 6.0, 8.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7421875, -1.683563232421875, -1.62493896484375, -1.566314697265625, -1.5076904296875, -1.449066162109375, -1.39044189453125, -1.331817626953125, -1.273193359375, -1.214569091796875, -1.15594482421875, -1.097320556640625, -1.0386962890625, -0.980072021484375, -0.92144775390625, -0.862823486328125, -0.80419921875, -0.745574951171875, -0.68695068359375, -0.628326416015625, -0.5697021484375, -0.511077880859375, -0.45245361328125, -0.393829345703125, -0.335205078125, -0.276580810546875, -0.21795654296875, -0.159332275390625, -0.1007080078125, -0.042083740234375, 0.01654052734375, 0.075164794921875, 0.1337890625, 0.192413330078125, 0.25103759765625, 0.309661865234375, 0.3682861328125, 0.426910400390625, 0.48553466796875, 0.544158935546875, 0.602783203125, 0.661407470703125, 0.72003173828125, 0.778656005859375, 0.8372802734375, 0.895904541015625, 0.95452880859375, 1.013153076171875, 1.07177734375, 1.130401611328125, 1.18902587890625, 1.247650146484375, 1.3062744140625, 1.364898681640625, 1.42352294921875, 1.482147216796875, 1.540771484375, 1.599395751953125, 1.65802001953125, 1.716644287109375, 1.7752685546875, 1.833892822265625, 1.89251708984375, 1.951141357421875, 2.009765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 6.0, 10.0, 6.0, 7.0, 8.0, 10.0, 14.0, 21.0, 23.0, 32.0, 58.0, 94.0, 94.0, 121.0, 91.0, 76.0, 78.0, 51.0, 49.0, 32.0, 24.0, 24.0, 20.0, 9.0, 5.0, 5.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0013866424560546875, -0.0013488829135894775, -0.0013111233711242676, -0.0012733638286590576, -0.0012356042861938477, -0.0011978447437286377, -0.0011600852012634277, -0.0011223256587982178, -0.0010845661163330078, -0.0010468065738677979, -0.0010090470314025879, -0.0009712874889373779, -0.000933527946472168, -0.000895768404006958, -0.000858008861541748, -0.0008202493190765381, -0.0007824897766113281, -0.0007447302341461182, -0.0007069706916809082, -0.0006692111492156982, -0.0006314516067504883, -0.0005936920642852783, -0.0005559325218200684, -0.0005181729793548584, -0.00048041343688964844, -0.0004426538944244385, -0.0004048943519592285, -0.00036713480949401855, -0.0003293752670288086, -0.00029161572456359863, -0.00025385618209838867, -0.0002160966396331787, -0.00017833709716796875, -0.0001405775547027588, -0.00010281801223754883, -6.505846977233887e-05, -2.7298927307128906e-05, 1.0460615158081055e-05, 4.8220157623291016e-05, 8.597970008850098e-05, 0.00012373924255371094, 0.0001614987850189209, 0.00019925832748413086, 0.00023701786994934082, 0.0002747774124145508, 0.00031253695487976074, 0.0003502964973449707, 0.00038805603981018066, 0.0004258155822753906, 0.0004635751247406006, 0.0005013346672058105, 0.0005390942096710205, 0.0005768537521362305, 0.0006146132946014404, 0.0006523728370666504, 0.0006901323795318604, 0.0007278919219970703, 0.0007656514644622803, 0.0008034110069274902, 0.0008411705493927002, 0.0008789300918579102, 0.0009166896343231201, 0.0009544491767883301, 0.00099220871925354, 0.00102996826171875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 3.0, 13.0, 17.0, 26.0, 30.0, 45.0, 77.0, 111.0, 245.0, 713.0, 272641.0, 773259.0, 795.0, 252.0, 104.0, 60.0, 38.0, 24.0, 16.0, 14.0, 7.0, 6.0, 10.0, 4.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027862548828125, -0.026935100555419922, -0.026007652282714844, -0.025080204010009766, -0.024152755737304688, -0.02322530746459961, -0.02229785919189453, -0.021370410919189453, -0.020442962646484375, -0.019515514373779297, -0.01858806610107422, -0.01766061782836914, -0.016733169555664062, -0.015805721282958984, -0.014878273010253906, -0.013950824737548828, -0.01302337646484375, -0.012095928192138672, -0.011168479919433594, -0.010241031646728516, -0.009313583374023438, -0.00838613510131836, -0.007458686828613281, -0.006531238555908203, -0.005603790283203125, -0.004676342010498047, -0.0037488937377929688, -0.0028214454650878906, -0.0018939971923828125, -0.0009665489196777344, -3.910064697265625e-05, 0.0008883476257324219, 0.0018157958984375, 0.002743244171142578, 0.0036706924438476562, 0.004598140716552734, 0.0055255889892578125, 0.006453037261962891, 0.007380485534667969, 0.008307933807373047, 0.009235382080078125, 0.010162830352783203, 0.011090278625488281, 0.01201772689819336, 0.012945175170898438, 0.013872623443603516, 0.014800071716308594, 0.015727519989013672, 0.01665496826171875, 0.017582416534423828, 0.018509864807128906, 0.019437313079833984, 0.020364761352539062, 0.02129220962524414, 0.02221965789794922, 0.023147106170654297, 0.024074554443359375, 0.025002002716064453, 0.02592945098876953, 0.02685689926147461, 0.027784347534179688, 0.028711795806884766, 0.029639244079589844, 0.030566692352294922, 0.031494140625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 16.0, 61.0, 275.0, 400.0, 205.0, 45.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002701913006603718, -0.002642368897795677, -0.0025828250218182802, -0.0025232809130102396, -0.0024637370370328426, -0.002404192928224802, -0.0023446488194167614, -0.0022851049434393644, -0.002225560834631324, -0.002166016725823283, -0.0021064728498458862, -0.0020469287410378456, -0.0019873848650604486, -0.001927840756252408, -0.0018682967638596892, -0.0018087527714669704, -0.0017492087790742517, -0.0016896647866815329, -0.001630120794288814, -0.0015705768018960953, -0.0015110326930880547, -0.0014514887006953359, -0.001391944708302617, -0.0013324007159098983, -0.0012728567235171795, -0.0012133127311244607, -0.001153768738731742, -0.0010942246299237013, -0.0010346806375309825, -0.0009751366451382637, -0.0009155926527455449, -0.0008560486603528261, -0.0007965045515447855, -0.0007369605591520667, -0.000677416508551687, -0.0006178725161589682, -0.0005583284655585885, -0.0004987844731658697, -0.0004392404807731509, -0.00037969645927660167, -0.0003201524377800524, -0.0002606084162835032, -0.00020106440933886915, -0.00014152040239423513, -8.197638089768589e-05, -2.2432359401136637e-05, 3.7111632991582155e-05, 9.66556544881314e-05, 0.00015619967598468065, 0.0002157436974812299, 0.00027528771897777915, 0.00033483171137049794, 0.0003943757328670472, 0.00045391975436359644, 0.0005134637467563152, 0.000573007739149034, 0.0006325517897494137, 0.0006920957821421325, 0.0007516398327425122, 0.000811183825135231, 0.0008707278175279498, 0.0009302718681283295, 0.0009898159187287092, 0.001049359911121428, 0.0011089039035141468]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 1.0, 0.0, 2.0, 2.0, 11.0, 6.0, 14.0, 9.0, 17.0, 15.0, 13.0, 20.0, 25.0, 31.0, 30.0, 22.0, 26.0, 44.0, 27.0, 37.0, 28.0, 38.0, 42.0, 35.0, 33.0, 44.0, 31.0, 43.0, 34.0, 31.0, 34.0, 35.0, 30.0, 37.0, 16.0, 27.0, 20.0, 18.0, 6.0, 12.0, 9.0, 8.0, 7.0, 11.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0004884600639343262, -0.00047395192086696625, -0.0004594437777996063, -0.0004449356347322464, -0.0004304274916648865, -0.00041591934859752655, -0.0004014112055301666, -0.0003869030624628067, -0.0003723949193954468, -0.00035788677632808685, -0.00034337863326072693, -0.000328870490193367, -0.0003143623471260071, -0.00029985420405864716, -0.00028534606099128723, -0.0002708379179239273, -0.0002563297748565674, -0.00024182163178920746, -0.00022731348872184753, -0.0002128053456544876, -0.00019829720258712769, -0.00018378905951976776, -0.00016928091645240784, -0.0001547727733850479, -0.000140264630317688, -0.00012575648725032806, -0.00011124834418296814, -9.674020111560822e-05, -8.223205804824829e-05, -6.772391498088837e-05, -5.321577191352844e-05, -3.870762884616852e-05, -2.4199485778808594e-05, -9.69134271144867e-06, 4.816800355911255e-06, 1.932494342327118e-05, 3.3833086490631104e-05, 4.834122955799103e-05, 6.284937262535095e-05, 7.735751569271088e-05, 9.18656587600708e-05, 0.00010637380182743073, 0.00012088194489479065, 0.00013539008796215057, 0.0001498982310295105, 0.00016440637409687042, 0.00017891451716423035, 0.00019342266023159027, 0.0002079308032989502, 0.00022243894636631012, 0.00023694708943367004, 0.00025145523250102997, 0.0002659633755683899, 0.0002804715186357498, 0.00029497966170310974, 0.00030948780477046967, 0.0003239959478378296, 0.0003385040909051895, 0.00035301223397254944, 0.00036752037703990936, 0.0003820285201072693, 0.0003965366631746292, 0.00041104480624198914, 0.00042555294930934906, 0.000440061092376709]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 5.0, 0.0, 7.0, 4.0, 13.0, 9.0, 9.0, 18.0, 13.0, 19.0, 18.0, 20.0, 33.0, 37.0, 39.0, 42.0, 50.0, 46.0, 46.0, 54.0, 50.0, 44.0, 48.0, 48.0, 36.0, 34.0, 44.0, 34.0, 24.0, 24.0, 20.0, 16.0, 16.0, 14.0, 12.0, 19.0, 6.0, 8.0, 6.0, 8.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.52392578125, -8.2353515625, -7.94677734375, -7.658203125, -7.36962890625, -7.0810546875, -6.79248046875, -6.50390625, -6.21533203125, -5.9267578125, -5.63818359375, -5.349609375, -5.06103515625, -4.7724609375, -4.48388671875, -4.1953125, -3.90673828125, -3.6181640625, -3.32958984375, -3.041015625, -2.75244140625, -2.4638671875, -2.17529296875, -1.88671875, -1.59814453125, -1.3095703125, -1.02099609375, -0.732421875, -0.44384765625, -0.1552734375, 0.13330078125, 0.421875, 0.71044921875, 0.9990234375, 1.28759765625, 1.576171875, 1.86474609375, 2.1533203125, 2.44189453125, 2.73046875, 3.01904296875, 3.3076171875, 3.59619140625, 3.884765625, 4.17333984375, 4.4619140625, 4.75048828125, 5.0390625, 5.32763671875, 5.6162109375, 5.90478515625, 6.193359375, 6.48193359375, 6.7705078125, 7.05908203125, 7.34765625, 7.63623046875, 7.9248046875, 8.21337890625, 8.501953125, 8.79052734375, 9.0791015625, 9.36767578125, 9.65625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 17.0, 30.0, 31.0, 40.0, 63.0, 87.0, 136.0, 161.0, 280.0, 429.0, 597.0, 918.0, 1485.0, 2268.0, 3760.0, 6193.0, 11508.0, 23422.0, 58024.0, 177746.0, 451814.0, 193228.0, 62210.0, 25011.0, 11912.0, 6425.0, 3935.0, 2439.0, 1527.0, 926.0, 584.0, 429.0, 306.0, 175.0, 139.0, 88.0, 66.0, 38.0, 26.0, 27.0, 13.0, 10.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.95703125, -5.76812744140625, -5.5792236328125, -5.39031982421875, -5.201416015625, -5.01251220703125, -4.8236083984375, -4.63470458984375, -4.44580078125, -4.25689697265625, -4.0679931640625, -3.87908935546875, -3.690185546875, -3.50128173828125, -3.3123779296875, -3.12347412109375, -2.9345703125, -2.74566650390625, -2.5567626953125, -2.36785888671875, -2.178955078125, -1.99005126953125, -1.8011474609375, -1.61224365234375, -1.42333984375, -1.23443603515625, -1.0455322265625, -0.85662841796875, -0.667724609375, -0.47882080078125, -0.2899169921875, -0.10101318359375, 0.087890625, 0.27679443359375, 0.4656982421875, 0.65460205078125, 0.843505859375, 1.03240966796875, 1.2213134765625, 1.41021728515625, 1.59912109375, 1.78802490234375, 1.9769287109375, 2.16583251953125, 2.354736328125, 2.54364013671875, 2.7325439453125, 2.92144775390625, 3.1103515625, 3.29925537109375, 3.4881591796875, 3.67706298828125, 3.865966796875, 4.05487060546875, 4.2437744140625, 4.43267822265625, 4.62158203125, 4.81048583984375, 4.9993896484375, 5.18829345703125, 5.377197265625, 5.56610107421875, 5.7550048828125, 5.94390869140625, 6.1328125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 11.0, 11.0, 9.0, 9.0, 14.0, 9.0, 13.0, 18.0, 26.0, 21.0, 28.0, 37.0, 39.0, 45.0, 59.0, 59.0, 96.0, 193.0, 1627.0, 188.0, 94.0, 58.0, 49.0, 44.0, 31.0, 27.0, 29.0, 42.0, 18.0, 27.0, 21.0, 15.0, 10.0, 13.0, 15.0, 5.0, 6.0, 6.0, 2.0, 8.0, 6.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.84375, -22.014404296875, -21.18505859375, -20.355712890625, -19.5263671875, -18.697021484375, -17.86767578125, -17.038330078125, -16.208984375, -15.379638671875, -14.55029296875, -13.720947265625, -12.8916015625, -12.062255859375, -11.23291015625, -10.403564453125, -9.57421875, -8.744873046875, -7.91552734375, -7.086181640625, -6.2568359375, -5.427490234375, -4.59814453125, -3.768798828125, -2.939453125, -2.110107421875, -1.28076171875, -0.451416015625, 0.3779296875, 1.207275390625, 2.03662109375, 2.865966796875, 3.6953125, 4.524658203125, 5.35400390625, 6.183349609375, 7.0126953125, 7.842041015625, 8.67138671875, 9.500732421875, 10.330078125, 11.159423828125, 11.98876953125, 12.818115234375, 13.6474609375, 14.476806640625, 15.30615234375, 16.135498046875, 16.96484375, 17.794189453125, 18.62353515625, 19.452880859375, 20.2822265625, 21.111572265625, 21.94091796875, 22.770263671875, 23.599609375, 24.428955078125, 25.25830078125, 26.087646484375, 26.9169921875, 27.746337890625, 28.57568359375, 29.405029296875, 30.234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 7.0, 6.0, 10.0, 11.0, 33.0, 34.0, 56.0, 107.0, 191.0, 340.0, 698.0, 9046.0, 3130135.0, 3801.0, 573.0, 273.0, 150.0, 84.0, 58.0, 43.0, 15.0, 11.0, 8.0, 6.0, 2.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.625, -114.296875, -109.96875, -105.640625, -101.3125, -96.984375, -92.65625, -88.328125, -84.0, -79.671875, -75.34375, -71.015625, -66.6875, -62.359375, -58.03125, -53.703125, -49.375, -45.046875, -40.71875, -36.390625, -32.0625, -27.734375, -23.40625, -19.078125, -14.75, -10.421875, -6.09375, -1.765625, 2.5625, 6.890625, 11.21875, 15.546875, 19.875, 24.203125, 28.53125, 32.859375, 37.1875, 41.515625, 45.84375, 50.171875, 54.5, 58.828125, 63.15625, 67.484375, 71.8125, 76.140625, 80.46875, 84.796875, 89.125, 93.453125, 97.78125, 102.109375, 106.4375, 110.765625, 115.09375, 119.421875, 123.75, 128.078125, 132.40625, 136.734375, 141.0625, 145.390625, 149.71875, 154.046875, 158.375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 21.0, 596.0, 388.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.87799072265625, -26.14935302734375, -19.42071533203125, -12.692075729370117, -5.963438034057617, 0.7652015686035156, 7.493839263916016, 14.222476959228516, 20.951114654541016, 27.679752349853516, 34.408390045166016, 41.13703155517578, 47.86566925048828, 54.59430694580078, 61.32294464111328, 68.05158233642578, 74.78022003173828, 81.50885772705078, 88.23749542236328, 94.96613311767578, 101.69477081298828, 108.42341613769531, 115.15205383300781, 121.88069152832031, 128.6093292236328, 135.3379669189453, 142.0666046142578, 148.7952423095703, 155.5238800048828, 162.2525177001953, 168.9811553955078, 175.7097930908203, 182.4384307861328, 189.1670684814453, 195.8957061767578, 202.6243438720703, 209.3529815673828, 216.0816192626953, 222.8102569580078, 229.5388946533203, 236.2675323486328, 242.9961700439453, 249.7248077392578, 256.4534606933594, 263.1820983886719, 269.9107360839844, 276.6393737792969, 283.3680114746094, 290.0966491699219, 296.8252868652344, 303.5539245605469, 310.2825622558594, 317.0111999511719, 323.7398376464844, 330.4684753417969, 337.1971130371094, 343.9257507324219, 350.6543884277344, 357.3830261230469, 364.1116638183594, 370.8403015136719, 377.5689392089844, 384.2975769042969, 391.0262145996094, 397.7548522949219]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 8.0, 4.0, 7.0, 3.0, 7.0, 14.0, 9.0, 11.0, 13.0, 13.0, 15.0, 27.0, 27.0, 34.0, 36.0, 35.0, 31.0, 47.0, 39.0, 50.0, 40.0, 47.0, 40.0, 32.0, 35.0, 37.0, 42.0, 32.0, 33.0, 30.0, 33.0, 35.0, 23.0, 17.0, 14.0, 12.0, 10.0, 17.0, 4.0, 9.0, 7.0, 5.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.1217041015625, -70.91011047363281, -68.6985092163086, -66.4869155883789, -64.27532196044922, -62.063724517822266, -59.85212707519531, -57.640533447265625, -55.42893600463867, -53.21733856201172, -51.00574493408203, -48.79414749145508, -46.582550048828125, -44.37095642089844, -42.159358978271484, -39.94776153564453, -37.736167907714844, -35.52457046508789, -33.3129768371582, -31.10137939453125, -28.88978385925293, -26.67818832397461, -24.466590881347656, -22.254995346069336, -20.043399810791016, -17.831804275512695, -15.620207786560059, -13.408611297607422, -11.197015762329102, -8.985420227050781, -6.7738237380981445, -4.562227249145508, -2.3506240844726562, -0.13902807235717773, 2.072567939758301, 4.284163951873779, 6.495759963989258, 8.707355499267578, 10.918951988220215, 13.130548477172852, 15.342144012451172, 17.553739547729492, 19.765335083007812, 21.976932525634766, 24.188528060913086, 26.400123596191406, 28.61172103881836, 30.82331657409668, 33.034912109375, 35.24650955200195, 37.45810317993164, 39.669700622558594, 41.88129425048828, 44.092891693115234, 46.30448913574219, 48.516082763671875, 50.72768020629883, 52.93927764892578, 55.15087127685547, 57.36246871948242, 59.574066162109375, 61.78565979003906, 63.997257232666016, 66.20885467529297, 68.42044830322266]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 16.0, 5.0, 16.0, 11.0, 12.0, 24.0, 14.0, 18.0, 30.0, 25.0, 34.0, 50.0, 38.0, 44.0, 60.0, 55.0, 39.0, 55.0, 44.0, 38.0, 48.0, 34.0, 41.0, 34.0, 36.0, 23.0, 25.0, 20.0, 16.0, 15.0, 13.0, 18.0, 8.0, 6.0, 4.0, 8.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.78369140625, -8.4814453125, -8.17919921875, -7.876953125, -7.57470703125, -7.2724609375, -6.97021484375, -6.66796875, -6.36572265625, -6.0634765625, -5.76123046875, -5.458984375, -5.15673828125, -4.8544921875, -4.55224609375, -4.25, -3.94775390625, -3.6455078125, -3.34326171875, -3.041015625, -2.73876953125, -2.4365234375, -2.13427734375, -1.83203125, -1.52978515625, -1.2275390625, -0.92529296875, -0.623046875, -0.32080078125, -0.0185546875, 0.28369140625, 0.5859375, 0.88818359375, 1.1904296875, 1.49267578125, 1.794921875, 2.09716796875, 2.3994140625, 2.70166015625, 3.00390625, 3.30615234375, 3.6083984375, 3.91064453125, 4.212890625, 4.51513671875, 4.8173828125, 5.11962890625, 5.421875, 5.72412109375, 6.0263671875, 6.32861328125, 6.630859375, 6.93310546875, 7.2353515625, 7.53759765625, 7.83984375, 8.14208984375, 8.4443359375, 8.74658203125, 9.048828125, 9.35107421875, 9.6533203125, 9.95556640625, 10.2578125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 9.0, 8.0, 15.0, 13.0, 15.0, 17.0, 27.0, 31.0, 51.0, 54.0, 95.0, 174.0, 374.0, 960.0, 3224.0, 17711.0, 297652.0, 2971328.0, 857773.0, 37111.0, 5190.0, 1328.0, 491.0, 206.0, 131.0, 63.0, 52.0, 36.0, 25.0, 16.0, 17.0, 18.0, 9.0, 8.0, 7.0, 7.0, 9.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.484375, -22.74267578125, -22.0009765625, -21.25927734375, -20.517578125, -19.77587890625, -19.0341796875, -18.29248046875, -17.55078125, -16.80908203125, -16.0673828125, -15.32568359375, -14.583984375, -13.84228515625, -13.1005859375, -12.35888671875, -11.6171875, -10.87548828125, -10.1337890625, -9.39208984375, -8.650390625, -7.90869140625, -7.1669921875, -6.42529296875, -5.68359375, -4.94189453125, -4.2001953125, -3.45849609375, -2.716796875, -1.97509765625, -1.2333984375, -0.49169921875, 0.25, 0.99169921875, 1.7333984375, 2.47509765625, 3.216796875, 3.95849609375, 4.7001953125, 5.44189453125, 6.18359375, 6.92529296875, 7.6669921875, 8.40869140625, 9.150390625, 9.89208984375, 10.6337890625, 11.37548828125, 12.1171875, 12.85888671875, 13.6005859375, 14.34228515625, 15.083984375, 15.82568359375, 16.5673828125, 17.30908203125, 18.05078125, 18.79248046875, 19.5341796875, 20.27587890625, 21.017578125, 21.75927734375, 22.5009765625, 23.24267578125, 23.984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 11.0, 16.0, 17.0, 19.0, 18.0, 37.0, 36.0, 47.0, 76.0, 95.0, 146.0, 205.0, 226.0, 331.0, 453.0, 500.0, 471.0, 324.0, 273.0, 195.0, 148.0, 116.0, 78.0, 58.0, 35.0, 48.0, 29.0, 11.0, 14.0, 5.0, 6.0, 2.0, 4.0, 1.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.765625, -16.252197265625, -15.73876953125, -15.225341796875, -14.7119140625, -14.198486328125, -13.68505859375, -13.171630859375, -12.658203125, -12.144775390625, -11.63134765625, -11.117919921875, -10.6044921875, -10.091064453125, -9.57763671875, -9.064208984375, -8.55078125, -8.037353515625, -7.52392578125, -7.010498046875, -6.4970703125, -5.983642578125, -5.47021484375, -4.956787109375, -4.443359375, -3.929931640625, -3.41650390625, -2.903076171875, -2.3896484375, -1.876220703125, -1.36279296875, -0.849365234375, -0.3359375, 0.177490234375, 0.69091796875, 1.204345703125, 1.7177734375, 2.231201171875, 2.74462890625, 3.258056640625, 3.771484375, 4.284912109375, 4.79833984375, 5.311767578125, 5.8251953125, 6.338623046875, 6.85205078125, 7.365478515625, 7.87890625, 8.392333984375, 8.90576171875, 9.419189453125, 9.9326171875, 10.446044921875, 10.95947265625, 11.472900390625, 11.986328125, 12.499755859375, 13.01318359375, 13.526611328125, 14.0400390625, 14.553466796875, 15.06689453125, 15.580322265625, 16.09375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 2.0, 10.0, 9.0, 14.0, 5.0, 14.0, 24.0, 14.0, 26.0, 33.0, 44.0, 58.0, 78.0, 84.0, 108.0, 141.0, 159.0, 208.0, 335.0, 734.0, 4489.0, 388171.0, 3774647.0, 21808.0, 1273.0, 512.0, 294.0, 213.0, 128.0, 128.0, 109.0, 79.0, 63.0, 59.0, 37.0, 37.0, 35.0, 13.0, 23.0, 11.0, 15.0, 5.0, 8.0, 3.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-69.5, -67.408203125, -65.31640625, -63.224609375, -61.1328125, -59.041015625, -56.94921875, -54.857421875, -52.765625, -50.673828125, -48.58203125, -46.490234375, -44.3984375, -42.306640625, -40.21484375, -38.123046875, -36.03125, -33.939453125, -31.84765625, -29.755859375, -27.6640625, -25.572265625, -23.48046875, -21.388671875, -19.296875, -17.205078125, -15.11328125, -13.021484375, -10.9296875, -8.837890625, -6.74609375, -4.654296875, -2.5625, -0.470703125, 1.62109375, 3.712890625, 5.8046875, 7.896484375, 9.98828125, 12.080078125, 14.171875, 16.263671875, 18.35546875, 20.447265625, 22.5390625, 24.630859375, 26.72265625, 28.814453125, 30.90625, 32.998046875, 35.08984375, 37.181640625, 39.2734375, 41.365234375, 43.45703125, 45.548828125, 47.640625, 49.732421875, 51.82421875, 53.916015625, 56.0078125, 58.099609375, 60.19140625, 62.283203125, 64.375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 12.0, 26.0, 24.0, 42.0, 51.0, 76.0, 85.0, 115.0, 97.0, 116.0, 87.0, 72.0, 61.0, 30.0, 28.0, 30.0, 13.0, 9.0, 10.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-61.30390548706055, -59.600975036621094, -57.89804458618164, -56.19511413574219, -54.492183685302734, -52.78925323486328, -51.08631896972656, -49.38338851928711, -47.680458068847656, -45.9775276184082, -44.27459716796875, -42.5716667175293, -40.868736267089844, -39.165802001953125, -37.46287536621094, -35.75994110107422, -34.05701446533203, -32.35408401489258, -30.651153564453125, -28.948223114013672, -27.245290756225586, -25.542360305786133, -23.83942985534668, -22.136497497558594, -20.43356704711914, -18.730636596679688, -17.027706146240234, -15.324774742126465, -13.621843338012695, -11.918912887573242, -10.215982437133789, -8.51305103302002, -6.81011962890625, -5.107188701629639, -3.4042580127716064, -1.7013273239135742, 0.0016036033630371094, 1.7045345306396484, 3.4074649810791016, 5.110396385192871, 6.813326835632324, 8.516257286071777, 10.219188690185547, 11.922119140625, 13.625049591064453, 15.327980995178223, 17.03091049194336, 18.733842849731445, 20.4367733001709, 22.13970375061035, 23.842634201049805, 25.54556655883789, 27.248497009277344, 28.951427459716797, 30.65435791015625, 32.3572883605957, 34.060218811035156, 35.76314926147461, 37.46607971191406, 39.169010162353516, 40.87194061279297, 42.57487487792969, 44.277801513671875, 45.980735778808594, 47.68366622924805]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 5.0, 3.0, 3.0, 8.0, 8.0, 9.0, 12.0, 17.0, 16.0, 17.0, 25.0, 20.0, 24.0, 31.0, 26.0, 30.0, 31.0, 39.0, 47.0, 38.0, 25.0, 44.0, 39.0, 39.0, 43.0, 41.0, 34.0, 37.0, 29.0, 31.0, 33.0, 28.0, 23.0, 19.0, 13.0, 17.0, 17.0, 18.0, 13.0, 9.0, 9.0, 3.0, 5.0, 6.0, 2.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-46.829139709472656, -45.19583511352539, -43.562530517578125, -41.92922592163086, -40.295921325683594, -38.66261672973633, -37.02931213378906, -35.3960075378418, -33.76270294189453, -32.129398345947266, -30.49609375, -28.862789154052734, -27.22948455810547, -25.596179962158203, -23.962875366210938, -22.329570770263672, -20.696264266967773, -19.062959671020508, -17.429655075073242, -15.796350479125977, -14.163045883178711, -12.529740333557129, -10.896435737609863, -9.263131141662598, -7.629826545715332, -5.996521949768066, -4.363217353820801, -2.729912281036377, -1.0966076850891113, 0.5366973876953125, 2.170001983642578, 3.8033065795898438, 5.436611175537109, 7.069915771484375, 8.70322036743164, 10.336524963378906, 11.969829559326172, 13.603135108947754, 15.23643970489502, 16.86974334716797, 18.503047943115234, 20.1363525390625, 21.769657135009766, 23.40296173095703, 25.036266326904297, 26.669570922851562, 28.302875518798828, 29.936180114746094, 31.569486618041992, 33.20279312133789, 34.836097717285156, 36.46940231323242, 38.10270690917969, 39.73601150512695, 41.36931610107422, 43.002620697021484, 44.63592529296875, 46.269229888916016, 47.90253448486328, 49.53583908081055, 51.16914367675781, 52.80244827270508, 54.435752868652344, 56.06905746459961, 57.702362060546875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 11.0, 9.0, 12.0, 21.0, 16.0, 23.0, 22.0, 25.0, 32.0, 38.0, 31.0, 45.0, 44.0, 51.0, 40.0, 37.0, 61.0, 51.0, 46.0, 46.0, 44.0, 36.0, 39.0, 20.0, 30.0, 26.0, 20.0, 17.0, 18.0, 17.0, 18.0, 9.0, 3.0, 9.0, 6.0, 1.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.6884765625, -8.400390625, -8.1123046875, -7.82421875, -7.5361328125, -7.248046875, -6.9599609375, -6.671875, -6.3837890625, -6.095703125, -5.8076171875, -5.51953125, -5.2314453125, -4.943359375, -4.6552734375, -4.3671875, -4.0791015625, -3.791015625, -3.5029296875, -3.21484375, -2.9267578125, -2.638671875, -2.3505859375, -2.0625, -1.7744140625, -1.486328125, -1.1982421875, -0.91015625, -0.6220703125, -0.333984375, -0.0458984375, 0.2421875, 0.5302734375, 0.818359375, 1.1064453125, 1.39453125, 1.6826171875, 1.970703125, 2.2587890625, 2.546875, 2.8349609375, 3.123046875, 3.4111328125, 3.69921875, 3.9873046875, 4.275390625, 4.5634765625, 4.8515625, 5.1396484375, 5.427734375, 5.7158203125, 6.00390625, 6.2919921875, 6.580078125, 6.8681640625, 7.15625, 7.4443359375, 7.732421875, 8.0205078125, 8.30859375, 8.5966796875, 8.884765625, 9.1728515625, 9.4609375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 10.0, 9.0, 18.0, 26.0, 38.0, 43.0, 69.0, 86.0, 132.0, 198.0, 253.0, 420.0, 624.0, 860.0, 1370.0, 2085.0, 3277.0, 5191.0, 8250.0, 13367.0, 22017.0, 37347.0, 67428.0, 140900.0, 372828.0, 180964.0, 80789.0, 43560.0, 25227.0, 15139.0, 9435.0, 5861.0, 3636.0, 2392.0, 1530.0, 992.0, 728.0, 417.0, 340.0, 218.0, 142.0, 106.0, 70.0, 41.0, 29.0, 23.0, 28.0, 12.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.947265625, -1.885711669921875, -1.82415771484375, -1.762603759765625, -1.7010498046875, -1.639495849609375, -1.57794189453125, -1.516387939453125, -1.454833984375, -1.393280029296875, -1.33172607421875, -1.270172119140625, -1.2086181640625, -1.147064208984375, -1.08551025390625, -1.023956298828125, -0.96240234375, -0.900848388671875, -0.83929443359375, -0.777740478515625, -0.7161865234375, -0.654632568359375, -0.59307861328125, -0.531524658203125, -0.469970703125, -0.408416748046875, -0.34686279296875, -0.285308837890625, -0.2237548828125, -0.162200927734375, -0.10064697265625, -0.039093017578125, 0.0224609375, 0.084014892578125, 0.14556884765625, 0.207122802734375, 0.2686767578125, 0.330230712890625, 0.39178466796875, 0.453338623046875, 0.514892578125, 0.576446533203125, 0.63800048828125, 0.699554443359375, 0.7611083984375, 0.822662353515625, 0.88421630859375, 0.945770263671875, 1.00732421875, 1.068878173828125, 1.13043212890625, 1.191986083984375, 1.2535400390625, 1.315093994140625, 1.37664794921875, 1.438201904296875, 1.499755859375, 1.561309814453125, 1.62286376953125, 1.684417724609375, 1.7459716796875, 1.807525634765625, 1.86907958984375, 1.930633544921875, 1.9921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 9.0, 8.0, 6.0, 12.0, 14.0, 12.0, 16.0, 13.0, 19.0, 22.0, 23.0, 27.0, 20.0, 37.0, 33.0, 27.0, 33.0, 41.0, 38.0, 44.0, 1068.0, 36.0, 48.0, 31.0, 36.0, 37.0, 31.0, 32.0, 33.0, 21.0, 28.0, 29.0, 25.0, 19.0, 11.0, 12.0, 11.0, 11.0, 13.0, 7.0, 6.0, 2.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.06640625, -4.90777587890625, -4.7491455078125, -4.59051513671875, -4.431884765625, -4.27325439453125, -4.1146240234375, -3.95599365234375, -3.79736328125, -3.63873291015625, -3.4801025390625, -3.32147216796875, -3.162841796875, -3.00421142578125, -2.8455810546875, -2.68695068359375, -2.5283203125, -2.36968994140625, -2.2110595703125, -2.05242919921875, -1.893798828125, -1.73516845703125, -1.5765380859375, -1.41790771484375, -1.25927734375, -1.10064697265625, -0.9420166015625, -0.78338623046875, -0.624755859375, -0.46612548828125, -0.3074951171875, -0.14886474609375, 0.009765625, 0.16839599609375, 0.3270263671875, 0.48565673828125, 0.644287109375, 0.80291748046875, 0.9615478515625, 1.12017822265625, 1.27880859375, 1.43743896484375, 1.5960693359375, 1.75469970703125, 1.913330078125, 2.07196044921875, 2.2305908203125, 2.38922119140625, 2.5478515625, 2.70648193359375, 2.8651123046875, 3.02374267578125, 3.182373046875, 3.34100341796875, 3.4996337890625, 3.65826416015625, 3.81689453125, 3.97552490234375, 4.1341552734375, 4.29278564453125, 4.451416015625, 4.61004638671875, 4.7686767578125, 4.92730712890625, 5.0859375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 7.0, 10.0, 10.0, 20.0, 28.0, 43.0, 88.0, 126.0, 177.0, 290.0, 430.0, 679.0, 1008.0, 1536.0, 2377.0, 3621.0, 5406.0, 8418.0, 13189.0, 20738.0, 33595.0, 55756.0, 98523.0, 242613.0, 1342575.0, 107821.0, 59945.0, 35683.0, 22529.0, 14069.0, 9033.0, 5745.0, 3780.0, 2521.0, 1624.0, 1122.0, 720.0, 444.0, 304.0, 181.0, 136.0, 85.0, 49.0, 29.0, 15.0, 16.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.78125, -1.7257080078125, -1.670166015625, -1.6146240234375, -1.55908203125, -1.5035400390625, -1.447998046875, -1.3924560546875, -1.3369140625, -1.2813720703125, -1.225830078125, -1.1702880859375, -1.11474609375, -1.0592041015625, -1.003662109375, -0.9481201171875, -0.892578125, -0.8370361328125, -0.781494140625, -0.7259521484375, -0.67041015625, -0.6148681640625, -0.559326171875, -0.5037841796875, -0.4482421875, -0.3927001953125, -0.337158203125, -0.2816162109375, -0.22607421875, -0.1705322265625, -0.114990234375, -0.0594482421875, -0.00390625, 0.0516357421875, 0.107177734375, 0.1627197265625, 0.21826171875, 0.2738037109375, 0.329345703125, 0.3848876953125, 0.4404296875, 0.4959716796875, 0.551513671875, 0.6070556640625, 0.66259765625, 0.7181396484375, 0.773681640625, 0.8292236328125, 0.884765625, 0.9403076171875, 0.995849609375, 1.0513916015625, 1.10693359375, 1.1624755859375, 1.218017578125, 1.2735595703125, 1.3291015625, 1.3846435546875, 1.440185546875, 1.4957275390625, 1.55126953125, 1.6068115234375, 1.662353515625, 1.7178955078125, 1.7734375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 4.0, 5.0, 5.0, 9.0, 7.0, 7.0, 13.0, 11.0, 17.0, 19.0, 36.0, 25.0, 37.0, 47.0, 74.0, 84.0, 69.0, 84.0, 83.0, 65.0, 49.0, 47.0, 30.0, 27.0, 23.0, 21.0, 16.0, 13.0, 11.0, 9.0, 13.0, 11.0, 5.0, 7.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0011539459228515625, -0.0011247247457504272, -0.001095503568649292, -0.0010662823915481567, -0.0010370612144470215, -0.0010078400373458862, -0.000978618860244751, -0.0009493976831436157, -0.0009201765060424805, -0.0008909553289413452, -0.00086173415184021, -0.0008325129747390747, -0.0008032917976379395, -0.0007740706205368042, -0.0007448494434356689, -0.0007156282663345337, -0.0006864070892333984, -0.0006571859121322632, -0.0006279647350311279, -0.0005987435579299927, -0.0005695223808288574, -0.0005403012037277222, -0.0005110800266265869, -0.00048185884952545166, -0.0004526376724243164, -0.00042341649532318115, -0.0003941953182220459, -0.00036497414112091064, -0.0003357529640197754, -0.00030653178691864014, -0.0002773106098175049, -0.00024808943271636963, -0.00021886825561523438, -0.00018964707851409912, -0.00016042590141296387, -0.0001312047243118286, -0.00010198354721069336, -7.27623701095581e-05, -4.354119300842285e-05, -1.4320015907287598e-05, 1.4901161193847656e-05, 4.412233829498291e-05, 7.334351539611816e-05, 0.00010256469249725342, 0.00013178586959838867, 0.00016100704669952393, 0.00019022822380065918, 0.00021944940090179443, 0.0002486705780029297, 0.00027789175510406494, 0.0003071129322052002, 0.00033633410930633545, 0.0003655552864074707, 0.00039477646350860596, 0.0004239976406097412, 0.00045321881771087646, 0.0004824399948120117, 0.000511661171913147, 0.0005408823490142822, 0.0005701035261154175, 0.0005993247032165527, 0.000628545880317688, 0.0006577670574188232, 0.0006869882345199585, 0.0007162094116210938]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 3.0, 7.0, 13.0, 20.0, 10.0, 17.0, 25.0, 31.0, 41.0, 49.0, 74.0, 139.0, 274.0, 956.0, 246177.0, 798636.0, 1231.0, 332.0, 139.0, 110.0, 63.0, 54.0, 29.0, 19.0, 16.0, 11.0, 13.0, 11.0, 9.0, 8.0, 6.0, 6.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017669677734375, -0.01696467399597168, -0.01625967025756836, -0.015554666519165039, -0.014849662780761719, -0.014144659042358398, -0.013439655303955078, -0.012734651565551758, -0.012029647827148438, -0.011324644088745117, -0.010619640350341797, -0.009914636611938477, -0.009209632873535156, -0.008504629135131836, -0.007799625396728516, -0.007094621658325195, -0.006389617919921875, -0.005684614181518555, -0.004979610443115234, -0.004274606704711914, -0.0035696029663085938, -0.0028645992279052734, -0.002159595489501953, -0.0014545917510986328, -0.0007495880126953125, -4.458427429199219e-05, 0.0006604194641113281, 0.0013654232025146484, 0.0020704269409179688, 0.002775430679321289, 0.0034804344177246094, 0.00418543815612793, 0.00489044189453125, 0.00559544563293457, 0.006300449371337891, 0.007005453109741211, 0.007710456848144531, 0.008415460586547852, 0.009120464324951172, 0.009825468063354492, 0.010530471801757812, 0.011235475540161133, 0.011940479278564453, 0.012645483016967773, 0.013350486755371094, 0.014055490493774414, 0.014760494232177734, 0.015465497970581055, 0.016170501708984375, 0.016875505447387695, 0.017580509185791016, 0.018285512924194336, 0.018990516662597656, 0.019695520401000977, 0.020400524139404297, 0.021105527877807617, 0.021810531616210938, 0.022515535354614258, 0.023220539093017578, 0.0239255428314209, 0.02463054656982422, 0.02533555030822754, 0.02604055404663086, 0.02674555778503418, 0.0274505615234375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 18.0, 81.0, 267.0, 405.0, 179.0, 50.0, 12.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024106139317154884, -0.0023536216467618942, -0.0022966293618083, -0.0022396373096853495, -0.0021826450247317553, -0.002125652739778161, -0.002068660454824567, -0.0020116684027016163, -0.001954676117748022, -0.0018976838327944279, -0.0018406916642561555, -0.0017836993793025613, -0.001726707210764289, -0.0016697149258106947, -0.0016127226408571005, -0.001555730472318828, -0.001498738187365234, -0.0014417459024116397, -0.0013847537338733673, -0.001327761448919773, -0.0012707692803815007, -0.0012137769954279065, -0.0011567848268896341, -0.00109979254193604, -0.0010428002569824457, -0.0009858079720288515, -0.0009288158034905791, -0.0008718235185369849, -0.0008148313499987125, -0.0007578390650451183, -0.000700846838299185, -0.0006438546115532517, -0.0005868623265996575, -0.0005298700998537242, -0.00047287787310779095, -0.0004158856172580272, -0.0003588933905120939, -0.0003019011637661606, -0.00024490890791639686, -0.00018791668117046356, -0.00013092445442453027, -7.393222040263936e-05, -1.693998638074845e-05, 4.005225491710007e-05, 9.704448166303337e-05, 0.00015403670840896666, 0.0002110289642587304, 0.0002680211910046637, 0.000325013417750597, 0.0003820056444965303, 0.0004389978712424636, 0.0004959901561960578, 0.0005529823247343302, 0.0006099746096879244, 0.0006669668364338577, 0.000723959063179791, 0.0007809512899257243, 0.0008379435166716576, 0.0008949357434175909, 0.0009519279701635242, 0.0010089202551171184, 0.0010659124236553907, 0.001122904708608985, 0.0011798969935625792, 0.0012368891621008515]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 7.0, 9.0, 9.0, 9.0, 15.0, 19.0, 15.0, 20.0, 23.0, 30.0, 46.0, 33.0, 38.0, 34.0, 43.0, 44.0, 47.0, 50.0, 39.0, 50.0, 25.0, 51.0, 36.0, 42.0, 35.0, 31.0, 34.0, 14.0, 35.0, 21.0, 12.0, 17.0, 19.0, 7.0, 10.0, 6.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00048023462295532227, -0.0004647737368941307, -0.00044931285083293915, -0.0004338519647717476, -0.00041839107871055603, -0.00040293019264936447, -0.0003874693065881729, -0.00037200842052698135, -0.0003565475344657898, -0.00034108664840459824, -0.0003256257623434067, -0.0003101648762822151, -0.00029470399022102356, -0.000279243104159832, -0.00026378221809864044, -0.0002483213320374489, -0.00023286044597625732, -0.00021739955991506577, -0.0002019386738538742, -0.00018647778779268265, -0.0001710169017314911, -0.00015555601567029953, -0.00014009512960910797, -0.0001246342435479164, -0.00010917335748672485, -9.37124714255333e-05, -7.825158536434174e-05, -6.279069930315018e-05, -4.732981324195862e-05, -3.186892718076706e-05, -1.64080411195755e-05, -9.471550583839417e-07, 1.4513731002807617e-05, 2.9974617063999176e-05, 4.5435503125190735e-05, 6.0896389186382294e-05, 7.635727524757385e-05, 9.181816130876541e-05, 0.00010727904736995697, 0.00012273993343114853, 0.0001382008194923401, 0.00015366170555353165, 0.0001691225916147232, 0.00018458347767591476, 0.00020004436373710632, 0.00021550524979829788, 0.00023096613585948944, 0.000246427021920681, 0.00026188790798187256, 0.0002773487940430641, 0.0002928096801042557, 0.00030827056616544724, 0.0003237314522266388, 0.00033919233828783035, 0.0003546532243490219, 0.00037011411041021347, 0.00038557499647140503, 0.0004010358825325966, 0.00041649676859378815, 0.0004319576546549797, 0.00044741854071617126, 0.0004628794267773628, 0.0004783403128385544, 0.0004938011988997459, 0.0005092620849609375]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 11.0, 9.0, 12.0, 21.0, 16.0, 23.0, 22.0, 25.0, 32.0, 38.0, 31.0, 45.0, 44.0, 51.0, 40.0, 37.0, 61.0, 51.0, 46.0, 46.0, 44.0, 36.0, 38.0, 21.0, 30.0, 26.0, 20.0, 17.0, 18.0, 17.0, 18.0, 9.0, 3.0, 9.0, 6.0, 1.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.6884765625, -8.400390625, -8.1123046875, -7.82421875, -7.5361328125, -7.248046875, -6.9599609375, -6.671875, -6.3837890625, -6.095703125, -5.8076171875, -5.51953125, -5.2314453125, -4.943359375, -4.6552734375, -4.3671875, -4.0791015625, -3.791015625, -3.5029296875, -3.21484375, -2.9267578125, -2.638671875, -2.3505859375, -2.0625, -1.7744140625, -1.486328125, -1.1982421875, -0.91015625, -0.6220703125, -0.333984375, -0.0458984375, 0.2421875, 0.5302734375, 0.818359375, 1.1064453125, 1.39453125, 1.6826171875, 1.970703125, 2.2587890625, 2.546875, 2.8349609375, 3.123046875, 3.4111328125, 3.69921875, 3.9873046875, 4.275390625, 4.5634765625, 4.8515625, 5.1396484375, 5.427734375, 5.7158203125, 6.00390625, 6.2919921875, 6.580078125, 6.8681640625, 7.15625, 7.4443359375, 7.732421875, 8.0205078125, 8.30859375, 8.5966796875, 8.884765625, 9.1728515625, 9.4609375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 8.0, 12.0, 14.0, 21.0, 27.0, 44.0, 49.0, 64.0, 113.0, 166.0, 267.0, 480.0, 948.0, 2032.0, 4921.0, 13195.0, 46688.0, 297749.0, 572376.0, 78261.0, 19147.0, 6601.0, 2661.0, 1181.0, 599.0, 315.0, 187.0, 125.0, 76.0, 58.0, 46.0, 32.0, 29.0, 15.0, 8.0, 10.0, 7.0, 3.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.40869140625, -8.1298828125, -7.85107421875, -7.572265625, -7.29345703125, -7.0146484375, -6.73583984375, -6.45703125, -6.17822265625, -5.8994140625, -5.62060546875, -5.341796875, -5.06298828125, -4.7841796875, -4.50537109375, -4.2265625, -3.94775390625, -3.6689453125, -3.39013671875, -3.111328125, -2.83251953125, -2.5537109375, -2.27490234375, -1.99609375, -1.71728515625, -1.4384765625, -1.15966796875, -0.880859375, -0.60205078125, -0.3232421875, -0.04443359375, 0.234375, 0.51318359375, 0.7919921875, 1.07080078125, 1.349609375, 1.62841796875, 1.9072265625, 2.18603515625, 2.46484375, 2.74365234375, 3.0224609375, 3.30126953125, 3.580078125, 3.85888671875, 4.1376953125, 4.41650390625, 4.6953125, 4.97412109375, 5.2529296875, 5.53173828125, 5.810546875, 6.08935546875, 6.3681640625, 6.64697265625, 6.92578125, 7.20458984375, 7.4833984375, 7.76220703125, 8.041015625, 8.31982421875, 8.5986328125, 8.87744140625, 9.15625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 1.0, 7.0, 8.0, 13.0, 7.0, 16.0, 11.0, 15.0, 25.0, 17.0, 32.0, 39.0, 28.0, 29.0, 33.0, 39.0, 59.0, 45.0, 56.0, 246.0, 1741.0, 122.0, 54.0, 53.0, 49.0, 27.0, 37.0, 31.0, 31.0, 18.0, 25.0, 28.0, 15.0, 13.0, 19.0, 17.0, 8.0, 8.0, 10.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.640625, -25.842529296875, -25.04443359375, -24.246337890625, -23.4482421875, -22.650146484375, -21.85205078125, -21.053955078125, -20.255859375, -19.457763671875, -18.65966796875, -17.861572265625, -17.0634765625, -16.265380859375, -15.46728515625, -14.669189453125, -13.87109375, -13.072998046875, -12.27490234375, -11.476806640625, -10.6787109375, -9.880615234375, -9.08251953125, -8.284423828125, -7.486328125, -6.688232421875, -5.89013671875, -5.092041015625, -4.2939453125, -3.495849609375, -2.69775390625, -1.899658203125, -1.1015625, -0.303466796875, 0.49462890625, 1.292724609375, 2.0908203125, 2.888916015625, 3.68701171875, 4.485107421875, 5.283203125, 6.081298828125, 6.87939453125, 7.677490234375, 8.4755859375, 9.273681640625, 10.07177734375, 10.869873046875, 11.66796875, 12.466064453125, 13.26416015625, 14.062255859375, 14.8603515625, 15.658447265625, 16.45654296875, 17.254638671875, 18.052734375, 18.850830078125, 19.64892578125, 20.447021484375, 21.2451171875, 22.043212890625, 22.84130859375, 23.639404296875, 24.4375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 0.0, 5.0, 5.0, 12.0, 12.0, 11.0, 21.0, 27.0, 32.0, 27.0, 48.0, 65.0, 85.0, 136.0, 182.0, 251.0, 455.0, 1572.0, 37211.0, 3096944.0, 6536.0, 818.0, 360.0, 261.0, 158.0, 99.0, 88.0, 72.0, 43.0, 40.0, 23.0, 21.0, 21.0, 15.0, 14.0, 9.0, 4.0, 6.0, 4.0, 5.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.5625, -51.525390625, -49.48828125, -47.451171875, -45.4140625, -43.376953125, -41.33984375, -39.302734375, -37.265625, -35.228515625, -33.19140625, -31.154296875, -29.1171875, -27.080078125, -25.04296875, -23.005859375, -20.96875, -18.931640625, -16.89453125, -14.857421875, -12.8203125, -10.783203125, -8.74609375, -6.708984375, -4.671875, -2.634765625, -0.59765625, 1.439453125, 3.4765625, 5.513671875, 7.55078125, 9.587890625, 11.625, 13.662109375, 15.69921875, 17.736328125, 19.7734375, 21.810546875, 23.84765625, 25.884765625, 27.921875, 29.958984375, 31.99609375, 34.033203125, 36.0703125, 38.107421875, 40.14453125, 42.181640625, 44.21875, 46.255859375, 48.29296875, 50.330078125, 52.3671875, 54.404296875, 56.44140625, 58.478515625, 60.515625, 62.552734375, 64.58984375, 66.626953125, 68.6640625, 70.701171875, 72.73828125, 74.775390625, 76.8125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 786.0, 218.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.787872314453125, -41.64041519165039, -35.49296188354492, -29.345504760742188, -23.198049545288086, -17.050594329833984, -10.90313720703125, -4.755683898925781, 1.3917732238769531, 7.539228916168213, 13.686684608459473, 19.83414077758789, 25.981595993041992, 32.129051208496094, 38.27650833129883, 44.4239616394043, 50.57141876220703, 56.718875885009766, 62.866329193115234, 69.01378631591797, 75.16123962402344, 81.30870056152344, 87.4561538696289, 93.60360717773438, 99.75106811523438, 105.89852142333984, 112.04598236083984, 118.19343566894531, 124.34088897705078, 130.48834228515625, 136.63580322265625, 142.78326416015625, 148.9307098388672, 155.0781707763672, 161.22561645507812, 167.37307739257812, 173.52053833007812, 179.66798400878906, 185.81544494628906, 191.962890625, 198.1103515625, 204.2578125, 210.40525817871094, 216.55271911621094, 222.70018005371094, 228.84762573242188, 234.99508666992188, 241.14254760742188, 247.29000854492188, 253.43746948242188, 259.5849304199219, 265.73236083984375, 271.87982177734375, 278.02728271484375, 284.17474365234375, 290.32220458984375, 296.4696350097656, 302.6170959472656, 308.7645568847656, 314.9119873046875, 321.0594482421875, 327.2069091796875, 333.3543701171875, 339.5018310546875, 345.6492919921875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 9.0, 7.0, 12.0, 8.0, 13.0, 23.0, 26.0, 24.0, 32.0, 30.0, 36.0, 34.0, 34.0, 42.0, 36.0, 51.0, 48.0, 45.0, 44.0, 49.0, 44.0, 38.0, 47.0, 43.0, 41.0, 29.0, 24.0, 22.0, 23.0, 19.0, 11.0, 10.0, 11.0, 3.0, 13.0, 4.0, 2.0, 10.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-76.33177185058594, -74.00592803955078, -71.6800765991211, -69.35423278808594, -67.02838134765625, -64.7025375366211, -62.37669372558594, -60.050846099853516, -57.724998474121094, -55.39915084838867, -53.07330322265625, -50.747459411621094, -48.42161178588867, -46.09576416015625, -43.769920349121094, -41.44407272338867, -39.11822509765625, -36.79237747192383, -34.466529846191406, -32.14068603515625, -29.814838409423828, -27.488990783691406, -25.163145065307617, -22.837299346923828, -20.511451721191406, -18.185604095458984, -15.859758377075195, -13.53391170501709, -11.208065032958984, -8.882218360900879, -6.556371688842773, -4.230525970458984, -1.9046783447265625, 0.42116832733154297, 2.7470149993896484, 5.072861671447754, 7.398708343505859, 9.724555015563965, 12.05040168762207, 14.37624740600586, 16.70209503173828, 19.027942657470703, 21.353788375854492, 23.67963409423828, 26.005481719970703, 28.331329345703125, 30.657175064086914, 32.9830207824707, 35.308868408203125, 37.63471603393555, 39.96056365966797, 42.286407470703125, 44.61225509643555, 46.93810272216797, 49.263946533203125, 51.58979415893555, 53.91564178466797, 56.24148941040039, 58.56733703613281, 60.89318084716797, 63.21902847290039, 65.54487609863281, 67.87071990966797, 70.19656372070312, 72.52241516113281]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 3.0, 6.0, 8.0, 12.0, 14.0, 13.0, 19.0, 21.0, 22.0, 22.0, 24.0, 31.0, 38.0, 37.0, 45.0, 43.0, 48.0, 50.0, 43.0, 53.0, 46.0, 55.0, 39.0, 39.0, 33.0, 37.0, 32.0, 18.0, 25.0, 20.0, 20.0, 16.0, 17.0, 11.0, 7.0, 9.0, 5.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.2890625, -8.9967041015625, -8.704345703125, -8.4119873046875, -8.11962890625, -7.8272705078125, -7.534912109375, -7.2425537109375, -6.9501953125, -6.6578369140625, -6.365478515625, -6.0731201171875, -5.78076171875, -5.4884033203125, -5.196044921875, -4.9036865234375, -4.611328125, -4.3189697265625, -4.026611328125, -3.7342529296875, -3.44189453125, -3.1495361328125, -2.857177734375, -2.5648193359375, -2.2724609375, -1.9801025390625, -1.687744140625, -1.3953857421875, -1.10302734375, -0.8106689453125, -0.518310546875, -0.2259521484375, 0.06640625, 0.3587646484375, 0.651123046875, 0.9434814453125, 1.23583984375, 1.5281982421875, 1.820556640625, 2.1129150390625, 2.4052734375, 2.6976318359375, 2.989990234375, 3.2823486328125, 3.57470703125, 3.8670654296875, 4.159423828125, 4.4517822265625, 4.744140625, 5.0364990234375, 5.328857421875, 5.6212158203125, 5.91357421875, 6.2059326171875, 6.498291015625, 6.7906494140625, 7.0830078125, 7.3753662109375, 7.667724609375, 7.9600830078125, 8.25244140625, 8.5447998046875, 8.837158203125, 9.1295166015625, 9.421875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 7.0, 5.0, 5.0, 2.0, 9.0, 13.0, 12.0, 15.0, 31.0, 39.0, 41.0, 47.0, 38.0, 69.0, 102.0, 184.0, 345.0, 715.0, 1935.0, 7772.0, 63203.0, 1385514.0, 2544028.0, 171491.0, 13701.0, 2891.0, 915.0, 409.0, 205.0, 146.0, 87.0, 59.0, 46.0, 47.0, 30.0, 25.0, 15.0, 21.0, 16.0, 9.0, 10.0, 5.0, 5.0, 6.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-24.0625, -23.3369140625, -22.611328125, -21.8857421875, -21.16015625, -20.4345703125, -19.708984375, -18.9833984375, -18.2578125, -17.5322265625, -16.806640625, -16.0810546875, -15.35546875, -14.6298828125, -13.904296875, -13.1787109375, -12.453125, -11.7275390625, -11.001953125, -10.2763671875, -9.55078125, -8.8251953125, -8.099609375, -7.3740234375, -6.6484375, -5.9228515625, -5.197265625, -4.4716796875, -3.74609375, -3.0205078125, -2.294921875, -1.5693359375, -0.84375, -0.1181640625, 0.607421875, 1.3330078125, 2.05859375, 2.7841796875, 3.509765625, 4.2353515625, 4.9609375, 5.6865234375, 6.412109375, 7.1376953125, 7.86328125, 8.5888671875, 9.314453125, 10.0400390625, 10.765625, 11.4912109375, 12.216796875, 12.9423828125, 13.66796875, 14.3935546875, 15.119140625, 15.8447265625, 16.5703125, 17.2958984375, 18.021484375, 18.7470703125, 19.47265625, 20.1982421875, 20.923828125, 21.6494140625, 22.375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 26.0, 33.0, 44.0, 40.0, 63.0, 101.0, 117.0, 189.0, 259.0, 384.0, 483.0, 510.0, 491.0, 379.0, 248.0, 181.0, 130.0, 119.0, 70.0, 48.0, 44.0, 28.0, 19.0, 14.0, 7.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2265625, -14.6729736328125, -14.119384765625, -13.5657958984375, -13.01220703125, -12.4586181640625, -11.905029296875, -11.3514404296875, -10.7978515625, -10.2442626953125, -9.690673828125, -9.1370849609375, -8.58349609375, -8.0299072265625, -7.476318359375, -6.9227294921875, -6.369140625, -5.8155517578125, -5.261962890625, -4.7083740234375, -4.15478515625, -3.6011962890625, -3.047607421875, -2.4940185546875, -1.9404296875, -1.3868408203125, -0.833251953125, -0.2796630859375, 0.27392578125, 0.8275146484375, 1.381103515625, 1.9346923828125, 2.48828125, 3.0418701171875, 3.595458984375, 4.1490478515625, 4.70263671875, 5.2562255859375, 5.809814453125, 6.3634033203125, 6.9169921875, 7.4705810546875, 8.024169921875, 8.5777587890625, 9.13134765625, 9.6849365234375, 10.238525390625, 10.7921142578125, 11.345703125, 11.8992919921875, 12.452880859375, 13.0064697265625, 13.56005859375, 14.1136474609375, 14.667236328125, 15.2208251953125, 15.7744140625, 16.3280029296875, 16.881591796875, 17.4351806640625, 17.98876953125, 18.5423583984375, 19.095947265625, 19.6495361328125, 20.203125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 12.0, 12.0, 11.0, 26.0, 30.0, 41.0, 51.0, 78.0, 103.0, 118.0, 150.0, 200.0, 262.0, 419.0, 1222.0, 34341.0, 4117412.0, 37035.0, 1279.0, 415.0, 254.0, 188.0, 132.0, 110.0, 99.0, 65.0, 55.0, 50.0, 21.0, 29.0, 15.0, 14.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-107.8125, -105.0126953125, -102.212890625, -99.4130859375, -96.61328125, -93.8134765625, -91.013671875, -88.2138671875, -85.4140625, -82.6142578125, -79.814453125, -77.0146484375, -74.21484375, -71.4150390625, -68.615234375, -65.8154296875, -63.015625, -60.2158203125, -57.416015625, -54.6162109375, -51.81640625, -49.0166015625, -46.216796875, -43.4169921875, -40.6171875, -37.8173828125, -35.017578125, -32.2177734375, -29.41796875, -26.6181640625, -23.818359375, -21.0185546875, -18.21875, -15.4189453125, -12.619140625, -9.8193359375, -7.01953125, -4.2197265625, -1.419921875, 1.3798828125, 4.1796875, 6.9794921875, 9.779296875, 12.5791015625, 15.37890625, 18.1787109375, 20.978515625, 23.7783203125, 26.578125, 29.3779296875, 32.177734375, 34.9775390625, 37.77734375, 40.5771484375, 43.376953125, 46.1767578125, 48.9765625, 51.7763671875, 54.576171875, 57.3759765625, 60.17578125, 62.9755859375, 65.775390625, 68.5751953125, 71.375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 112.0, 674.0, 219.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.99546813964844, -82.35614776611328, -67.71682739257812, -53.0775032043457, -38.43818283081055, -23.798858642578125, -9.159538269042969, 5.4797821044921875, 20.119102478027344, 34.7584228515625, 49.397743225097656, 64.03706359863281, 78.6763916015625, 93.31571197509766, 107.95503234863281, 122.59435272216797, 137.23367309570312, 151.8730010986328, 166.51231384277344, 181.15164184570312, 195.79095458984375, 210.43028259277344, 225.06961059570312, 239.70892333984375, 254.34823608398438, 268.987548828125, 283.62689208984375, 298.2662048339844, 312.905517578125, 327.54486083984375, 342.1841735839844, 356.823486328125, 371.4627990722656, 386.10211181640625, 400.741455078125, 415.3807678222656, 430.02008056640625, 444.659423828125, 459.2987365722656, 473.93804931640625, 488.5773620605469, 503.2166748046875, 517.8560180664062, 532.4953002929688, 547.1346435546875, 561.7739868164062, 576.4132690429688, 591.0526123046875, 605.6919555664062, 620.331298828125, 634.9705810546875, 649.6099243164062, 664.249267578125, 678.8885498046875, 693.5278930664062, 708.167236328125, 722.8065185546875, 737.4458618164062, 752.0851440429688, 766.7244873046875, 781.3638305664062, 796.0031127929688, 810.6424560546875, 825.28173828125, 839.9210815429688]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 6.0, 7.0, 7.0, 16.0, 8.0, 15.0, 17.0, 20.0, 22.0, 30.0, 27.0, 33.0, 33.0, 33.0, 40.0, 44.0, 49.0, 50.0, 49.0, 48.0, 53.0, 34.0, 53.0, 38.0, 44.0, 34.0, 41.0, 25.0, 23.0, 22.0, 17.0, 14.0, 7.0, 15.0, 7.0, 9.0, 3.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.69015502929688, -66.78227233886719, -64.8743896484375, -62.96651077270508, -61.058631896972656, -59.15074920654297, -57.24287033081055, -55.33498764038086, -53.42710876464844, -51.51922607421875, -49.61134719848633, -47.70346450805664, -45.79558563232422, -43.88770294189453, -41.97982406616211, -40.07194137573242, -38.1640625, -36.25617980957031, -34.34830093383789, -32.4404182434082, -30.53253936767578, -28.624656677246094, -26.716777801513672, -24.808895111083984, -22.901012420654297, -20.993131637573242, -19.085250854492188, -17.177370071411133, -15.269489288330078, -13.361607551574707, -11.453726768493652, -9.545845985412598, -7.637966156005859, -5.730085372924805, -3.822204351425171, -1.914323329925537, -0.006442546844482422, 1.9014387130737305, 3.809319496154785, 5.71720027923584, 7.6250810623168945, 9.53296184539795, 11.440842628479004, 13.348724365234375, 15.25660514831543, 17.164485931396484, 19.07236671447754, 20.980247497558594, 22.88812828063965, 24.796009063720703, 26.703889846801758, 28.611770629882812, 30.519651412963867, 32.42753219604492, 34.33541488647461, 36.24329376220703, 38.15117645263672, 40.059059143066406, 41.96693801879883, 43.874820709228516, 45.78269958496094, 47.690582275390625, 49.59846115112305, 51.506343841552734, 53.414222717285156]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 0.0, 2.0, 9.0, 4.0, 11.0, 6.0, 11.0, 11.0, 14.0, 18.0, 16.0, 29.0, 19.0, 31.0, 34.0, 42.0, 26.0, 42.0, 38.0, 32.0, 36.0, 48.0, 49.0, 51.0, 56.0, 35.0, 35.0, 31.0, 31.0, 41.0, 38.0, 18.0, 18.0, 17.0, 19.0, 12.0, 19.0, 5.0, 11.0, 10.0, 3.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.9609375, -8.6903076171875, -8.419677734375, -8.1490478515625, -7.87841796875, -7.6077880859375, -7.337158203125, -7.0665283203125, -6.7958984375, -6.5252685546875, -6.254638671875, -5.9840087890625, -5.71337890625, -5.4427490234375, -5.172119140625, -4.9014892578125, -4.630859375, -4.3602294921875, -4.089599609375, -3.8189697265625, -3.54833984375, -3.2777099609375, -3.007080078125, -2.7364501953125, -2.4658203125, -2.1951904296875, -1.924560546875, -1.6539306640625, -1.38330078125, -1.1126708984375, -0.842041015625, -0.5714111328125, -0.30078125, -0.0301513671875, 0.240478515625, 0.5111083984375, 0.78173828125, 1.0523681640625, 1.322998046875, 1.5936279296875, 1.8642578125, 2.1348876953125, 2.405517578125, 2.6761474609375, 2.94677734375, 3.2174072265625, 3.488037109375, 3.7586669921875, 4.029296875, 4.2999267578125, 4.570556640625, 4.8411865234375, 5.11181640625, 5.3824462890625, 5.653076171875, 5.9237060546875, 6.1943359375, 6.4649658203125, 6.735595703125, 7.0062255859375, 7.27685546875, 7.5474853515625, 7.818115234375, 8.0887451171875, 8.359375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 5.0, 8.0, 3.0, 11.0, 21.0, 28.0, 39.0, 51.0, 81.0, 99.0, 159.0, 216.0, 272.0, 427.0, 618.0, 915.0, 1306.0, 1922.0, 2805.0, 4234.0, 6286.0, 9861.0, 15112.0, 23762.0, 39084.0, 66038.0, 120133.0, 311423.0, 204175.0, 94602.0, 54126.0, 32567.0, 20067.0, 12905.0, 8292.0, 5462.0, 3634.0, 2466.0, 1653.0, 1109.0, 783.0, 541.0, 384.0, 262.0, 171.0, 139.0, 94.0, 65.0, 55.0, 23.0, 18.0, 18.0, 15.0, 8.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.7275390625, -1.671478271484375, -1.61541748046875, -1.559356689453125, -1.5032958984375, -1.447235107421875, -1.39117431640625, -1.335113525390625, -1.279052734375, -1.222991943359375, -1.16693115234375, -1.110870361328125, -1.0548095703125, -0.998748779296875, -0.94268798828125, -0.886627197265625, -0.83056640625, -0.774505615234375, -0.71844482421875, -0.662384033203125, -0.6063232421875, -0.550262451171875, -0.49420166015625, -0.438140869140625, -0.382080078125, -0.326019287109375, -0.26995849609375, -0.213897705078125, -0.1578369140625, -0.101776123046875, -0.04571533203125, 0.010345458984375, 0.06640625, 0.122467041015625, 0.17852783203125, 0.234588623046875, 0.2906494140625, 0.346710205078125, 0.40277099609375, 0.458831787109375, 0.514892578125, 0.570953369140625, 0.62701416015625, 0.683074951171875, 0.7391357421875, 0.795196533203125, 0.85125732421875, 0.907318115234375, 0.96337890625, 1.019439697265625, 1.07550048828125, 1.131561279296875, 1.1876220703125, 1.243682861328125, 1.29974365234375, 1.355804443359375, 1.411865234375, 1.467926025390625, 1.52398681640625, 1.580047607421875, 1.6361083984375, 1.692169189453125, 1.74822998046875, 1.804290771484375, 1.8603515625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 7.0, 8.0, 9.0, 9.0, 16.0, 18.0, 19.0, 20.0, 26.0, 36.0, 30.0, 28.0, 36.0, 36.0, 35.0, 30.0, 52.0, 31.0, 32.0, 1075.0, 46.0, 38.0, 32.0, 35.0, 34.0, 40.0, 23.0, 28.0, 26.0, 22.0, 26.0, 18.0, 18.0, 16.0, 11.0, 13.0, 9.0, 6.0, 3.0, 5.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.41796875, -5.2490234375, -5.080078125, -4.9111328125, -4.7421875, -4.5732421875, -4.404296875, -4.2353515625, -4.06640625, -3.8974609375, -3.728515625, -3.5595703125, -3.390625, -3.2216796875, -3.052734375, -2.8837890625, -2.71484375, -2.5458984375, -2.376953125, -2.2080078125, -2.0390625, -1.8701171875, -1.701171875, -1.5322265625, -1.36328125, -1.1943359375, -1.025390625, -0.8564453125, -0.6875, -0.5185546875, -0.349609375, -0.1806640625, -0.01171875, 0.1572265625, 0.326171875, 0.4951171875, 0.6640625, 0.8330078125, 1.001953125, 1.1708984375, 1.33984375, 1.5087890625, 1.677734375, 1.8466796875, 2.015625, 2.1845703125, 2.353515625, 2.5224609375, 2.69140625, 2.8603515625, 3.029296875, 3.1982421875, 3.3671875, 3.5361328125, 3.705078125, 3.8740234375, 4.04296875, 4.2119140625, 4.380859375, 4.5498046875, 4.71875, 4.8876953125, 5.056640625, 5.2255859375, 5.39453125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 14.0, 14.0, 24.0, 43.0, 66.0, 104.0, 156.0, 229.0, 380.0, 540.0, 808.0, 1239.0, 1928.0, 2990.0, 4842.0, 7664.0, 12169.0, 19648.0, 32355.0, 54415.0, 97905.0, 232048.0, 1358051.0, 112993.0, 61740.0, 36462.0, 21932.0, 13422.0, 8479.0, 5141.0, 3292.0, 2100.0, 1338.0, 897.0, 588.0, 375.0, 248.0, 187.0, 117.0, 67.0, 44.0, 27.0, 18.0, 11.0, 7.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.8994140625, -1.8402557373046875, -1.781097412109375, -1.7219390869140625, -1.66278076171875, -1.6036224365234375, -1.544464111328125, -1.4853057861328125, -1.4261474609375, -1.3669891357421875, -1.307830810546875, -1.2486724853515625, -1.18951416015625, -1.1303558349609375, -1.071197509765625, -1.0120391845703125, -0.952880859375, -0.8937225341796875, -0.834564208984375, -0.7754058837890625, -0.71624755859375, -0.6570892333984375, -0.597930908203125, -0.5387725830078125, -0.4796142578125, -0.4204559326171875, -0.361297607421875, -0.3021392822265625, -0.24298095703125, -0.1838226318359375, -0.124664306640625, -0.0655059814453125, -0.00634765625, 0.0528106689453125, 0.111968994140625, 0.1711273193359375, 0.23028564453125, 0.2894439697265625, 0.348602294921875, 0.4077606201171875, 0.4669189453125, 0.5260772705078125, 0.585235595703125, 0.6443939208984375, 0.70355224609375, 0.7627105712890625, 0.821868896484375, 0.8810272216796875, 0.940185546875, 0.9993438720703125, 1.058502197265625, 1.1176605224609375, 1.17681884765625, 1.2359771728515625, 1.295135498046875, 1.3542938232421875, 1.4134521484375, 1.4726104736328125, 1.531768798828125, 1.5909271240234375, 1.65008544921875, 1.7092437744140625, 1.768402099609375, 1.8275604248046875, 1.88671875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 8.0, 10.0, 13.0, 16.0, 20.0, 21.0, 27.0, 29.0, 33.0, 49.0, 82.0, 91.0, 113.0, 74.0, 65.0, 80.0, 53.0, 43.0, 32.0, 35.0, 19.0, 14.0, 10.0, 7.0, 7.0, 2.0, 3.0, 5.0, 6.0, 2.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011472702026367188, -0.001113101840019226, -0.0010789334774017334, -0.0010447651147842407, -0.001010596752166748, -0.0009764283895492554, -0.0009422600269317627, -0.00090809166431427, -0.0008739233016967773, -0.0008397549390792847, -0.000805586576461792, -0.0007714182138442993, -0.0007372498512268066, -0.000703081488609314, -0.0006689131259918213, -0.0006347447633743286, -0.0006005764007568359, -0.0005664080381393433, -0.0005322396755218506, -0.0004980713129043579, -0.00046390295028686523, -0.00042973458766937256, -0.0003955662250518799, -0.0003613978624343872, -0.00032722949981689453, -0.00029306113719940186, -0.0002588927745819092, -0.0002247244119644165, -0.00019055604934692383, -0.00015638768672943115, -0.00012221932411193848, -8.80509614944458e-05, -5.3882598876953125e-05, -1.971423625946045e-05, 1.4454126358032227e-05, 4.86224889755249e-05, 8.279085159301758e-05, 0.00011695921421051025, 0.00015112757682800293, 0.0001852959394454956, 0.00021946430206298828, 0.00025363266468048096, 0.00028780102729797363, 0.0003219693899154663, 0.000356137752532959, 0.00039030611515045166, 0.00042447447776794434, 0.000458642840385437, 0.0004928112030029297, 0.0005269795656204224, 0.000561147928237915, 0.0005953162908554077, 0.0006294846534729004, 0.0006636530160903931, 0.0006978213787078857, 0.0007319897413253784, 0.0007661581039428711, 0.0008003264665603638, 0.0008344948291778564, 0.0008686631917953491, 0.0009028315544128418, 0.0009369999170303345, 0.0009711682796478271, 0.0010053366422653198, 0.0010395050048828125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 3.0, 4.0, 11.0, 7.0, 15.0, 9.0, 19.0, 32.0, 38.0, 53.0, 105.0, 175.0, 428.0, 4763.0, 1039942.0, 2188.0, 329.0, 141.0, 67.0, 49.0, 39.0, 26.0, 22.0, 18.0, 12.0, 14.0, 5.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0268707275390625, -0.025987625122070312, -0.025104522705078125, -0.024221420288085938, -0.02333831787109375, -0.022455215454101562, -0.021572113037109375, -0.020689010620117188, -0.019805908203125, -0.018922805786132812, -0.018039703369140625, -0.017156600952148438, -0.01627349853515625, -0.015390396118164062, -0.014507293701171875, -0.013624191284179688, -0.0127410888671875, -0.011857986450195312, -0.010974884033203125, -0.010091781616210938, -0.00920867919921875, -0.008325576782226562, -0.007442474365234375, -0.0065593719482421875, -0.00567626953125, -0.0047931671142578125, -0.003910064697265625, -0.0030269622802734375, -0.00214385986328125, -0.0012607574462890625, -0.000377655029296875, 0.0005054473876953125, 0.0013885498046875, 0.0022716522216796875, 0.003154754638671875, 0.0040378570556640625, 0.00492095947265625, 0.0058040618896484375, 0.006687164306640625, 0.0075702667236328125, 0.008453369140625, 0.009336471557617188, 0.010219573974609375, 0.011102676391601562, 0.01198577880859375, 0.012868881225585938, 0.013751983642578125, 0.014635086059570312, 0.0155181884765625, 0.016401290893554688, 0.017284393310546875, 0.018167495727539062, 0.01905059814453125, 0.019933700561523438, 0.020816802978515625, 0.021699905395507812, 0.0225830078125, 0.023466110229492188, 0.024349212646484375, 0.025232315063476562, 0.02611541748046875, 0.026998519897460938, 0.027881622314453125, 0.028764724731445312, 0.0296478271484375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 103.0, 371.0, 373.0, 135.0, 21.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003414158010855317, -0.003351028775796294, -0.0032878993079066277, -0.0032247700728476048, -0.003161640837788582, -0.0030985113698989153, -0.0030353821348398924, -0.0029722528997808695, -0.002909123431891203, -0.00284599419683218, -0.0027828647289425135, -0.0027197354938834906, -0.0026566062588244677, -0.002593476790934801, -0.002530347555875778, -0.0024672183208167553, -0.0024040890857577324, -0.0023409598506987095, -0.002277830382809043, -0.00221470114775002, -0.002151571912690997, -0.0020884424448013306, -0.0020253132097423077, -0.0019621839746832848, -0.0018990545067936182, -0.0018359251553192735, -0.0017727959202602506, -0.0017096665687859058, -0.001646537217311561, -0.0015834078658372164, -0.0015202786307781935, -0.0014571492793038487, -0.0013940201606601477, -0.001330890809185803, -0.00126776157412678, -0.0012046322226524353, -0.0011415028711780906, -0.0010783735197037458, -0.001015244284644723, -0.0009521149331703782, -0.0008889855816960335, -0.0008258562884293497, -0.0007627269369550049, -0.0006995976436883211, -0.0006364682922139764, -0.0005733389989472926, -0.0005102097056806087, -0.0004470803833100945, -0.0003839510609395802, -0.00032082173856906593, -0.00025769241619855165, -0.00019456312293186784, -0.00013143380056135356, -6.830447819083929e-05, -5.175184924155474e-06, 5.79541374463588e-05, 0.00012108345981687307, 0.00018421278218738735, 0.0002473421045579016, 0.00031047139782458544, 0.0003736007201950997, 0.000436730042565614, 0.0004998593358322978, 0.0005629886873066425, 0.0006261179805733263]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 5.0, 10.0, 9.0, 7.0, 5.0, 10.0, 14.0, 20.0, 21.0, 25.0, 21.0, 26.0, 33.0, 41.0, 29.0, 29.0, 38.0, 40.0, 39.0, 45.0, 30.0, 35.0, 37.0, 20.0, 46.0, 35.0, 35.0, 41.0, 32.0, 29.0, 37.0, 23.0, 17.0, 15.0, 15.0, 10.0, 14.0, 13.0, 10.0, 9.0, 8.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00045734643936157227, -0.0004432797431945801, -0.0004292130470275879, -0.0004151463508605957, -0.0004010796546936035, -0.00038701295852661133, -0.00037294626235961914, -0.00035887956619262695, -0.00034481287002563477, -0.0003307461738586426, -0.0003166794776916504, -0.0003026127815246582, -0.000288546085357666, -0.00027447938919067383, -0.00026041269302368164, -0.00024634599685668945, -0.00023227930068969727, -0.00021821260452270508, -0.0002041459083557129, -0.0001900792121887207, -0.00017601251602172852, -0.00016194581985473633, -0.00014787912368774414, -0.00013381242752075195, -0.00011974573135375977, -0.00010567903518676758, -9.161233901977539e-05, -7.75456428527832e-05, -6.347894668579102e-05, -4.941225051879883e-05, -3.534555435180664e-05, -2.1278858184814453e-05, -7.212162017822266e-06, 6.854534149169922e-06, 2.092123031616211e-05, 3.49879264831543e-05, 4.9054622650146484e-05, 6.312131881713867e-05, 7.718801498413086e-05, 9.125471115112305e-05, 0.00010532140731811523, 0.00011938810348510742, 0.0001334547996520996, 0.0001475214958190918, 0.00016158819198608398, 0.00017565488815307617, 0.00018972158432006836, 0.00020378828048706055, 0.00021785497665405273, 0.00023192167282104492, 0.0002459883689880371, 0.0002600550651550293, 0.0002741217613220215, 0.00028818845748901367, 0.00030225515365600586, 0.00031632184982299805, 0.00033038854598999023, 0.0003444552421569824, 0.0003585219383239746, 0.0003725886344909668, 0.000386655330657959, 0.00040072202682495117, 0.00041478872299194336, 0.00042885541915893555, 0.00044292211532592773]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 0.0, 2.0, 9.0, 4.0, 11.0, 6.0, 11.0, 11.0, 14.0, 18.0, 16.0, 29.0, 19.0, 31.0, 34.0, 42.0, 26.0, 42.0, 38.0, 32.0, 36.0, 48.0, 49.0, 51.0, 56.0, 35.0, 35.0, 31.0, 31.0, 41.0, 38.0, 18.0, 18.0, 17.0, 19.0, 12.0, 19.0, 5.0, 11.0, 10.0, 3.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.9609375, -8.6903076171875, -8.419677734375, -8.1490478515625, -7.87841796875, -7.6077880859375, -7.337158203125, -7.0665283203125, -6.7958984375, -6.5252685546875, -6.254638671875, -5.9840087890625, -5.71337890625, -5.4427490234375, -5.172119140625, -4.9014892578125, -4.630859375, -4.3602294921875, -4.089599609375, -3.8189697265625, -3.54833984375, -3.2777099609375, -3.007080078125, -2.7364501953125, -2.4658203125, -2.1951904296875, -1.924560546875, -1.6539306640625, -1.38330078125, -1.1126708984375, -0.842041015625, -0.5714111328125, -0.30078125, -0.0301513671875, 0.240478515625, 0.5111083984375, 0.78173828125, 1.0523681640625, 1.322998046875, 1.5936279296875, 1.8642578125, 2.1348876953125, 2.405517578125, 2.6761474609375, 2.94677734375, 3.2174072265625, 3.488037109375, 3.7586669921875, 4.029296875, 4.2999267578125, 4.570556640625, 4.8411865234375, 5.11181640625, 5.3824462890625, 5.653076171875, 5.9237060546875, 6.1943359375, 6.4649658203125, 6.735595703125, 7.0062255859375, 7.27685546875, 7.5474853515625, 7.818115234375, 8.0887451171875, 8.359375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 5.0, 20.0, 15.0, 28.0, 35.0, 34.0, 79.0, 129.0, 177.0, 304.0, 479.0, 726.0, 1169.0, 2043.0, 3571.0, 6729.0, 13155.0, 27606.0, 63905.0, 162403.0, 382888.0, 225175.0, 86341.0, 36036.0, 16551.0, 8291.0, 4307.0, 2435.0, 1445.0, 909.0, 580.0, 350.0, 203.0, 154.0, 90.0, 59.0, 35.0, 32.0, 19.0, 9.0, 8.0, 7.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.6953125, -5.53997802734375, -5.3846435546875, -5.22930908203125, -5.073974609375, -4.91864013671875, -4.7633056640625, -4.60797119140625, -4.45263671875, -4.29730224609375, -4.1419677734375, -3.98663330078125, -3.831298828125, -3.67596435546875, -3.5206298828125, -3.36529541015625, -3.2099609375, -3.05462646484375, -2.8992919921875, -2.74395751953125, -2.588623046875, -2.43328857421875, -2.2779541015625, -2.12261962890625, -1.96728515625, -1.81195068359375, -1.6566162109375, -1.50128173828125, -1.345947265625, -1.19061279296875, -1.0352783203125, -0.87994384765625, -0.724609375, -0.56927490234375, -0.4139404296875, -0.25860595703125, -0.103271484375, 0.05206298828125, 0.2073974609375, 0.36273193359375, 0.51806640625, 0.67340087890625, 0.8287353515625, 0.98406982421875, 1.139404296875, 1.29473876953125, 1.4500732421875, 1.60540771484375, 1.7607421875, 1.91607666015625, 2.0714111328125, 2.22674560546875, 2.382080078125, 2.53741455078125, 2.6927490234375, 2.84808349609375, 3.00341796875, 3.15875244140625, 3.3140869140625, 3.46942138671875, 3.624755859375, 3.78009033203125, 3.9354248046875, 4.09075927734375, 4.24609375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 11.0, 10.0, 9.0, 12.0, 14.0, 14.0, 22.0, 23.0, 19.0, 26.0, 29.0, 36.0, 44.0, 38.0, 50.0, 77.0, 287.0, 1703.0, 167.0, 56.0, 51.0, 57.0, 39.0, 37.0, 37.0, 36.0, 26.0, 28.0, 18.0, 8.0, 13.0, 10.0, 13.0, 13.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.765625, -25.819580078125, -24.87353515625, -23.927490234375, -22.9814453125, -22.035400390625, -21.08935546875, -20.143310546875, -19.197265625, -18.251220703125, -17.30517578125, -16.359130859375, -15.4130859375, -14.467041015625, -13.52099609375, -12.574951171875, -11.62890625, -10.682861328125, -9.73681640625, -8.790771484375, -7.8447265625, -6.898681640625, -5.95263671875, -5.006591796875, -4.060546875, -3.114501953125, -2.16845703125, -1.222412109375, -0.2763671875, 0.669677734375, 1.61572265625, 2.561767578125, 3.5078125, 4.453857421875, 5.39990234375, 6.345947265625, 7.2919921875, 8.238037109375, 9.18408203125, 10.130126953125, 11.076171875, 12.022216796875, 12.96826171875, 13.914306640625, 14.8603515625, 15.806396484375, 16.75244140625, 17.698486328125, 18.64453125, 19.590576171875, 20.53662109375, 21.482666015625, 22.4287109375, 23.374755859375, 24.32080078125, 25.266845703125, 26.212890625, 27.158935546875, 28.10498046875, 29.051025390625, 29.9970703125, 30.943115234375, 31.88916015625, 32.835205078125, 33.78125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 9.0, 11.0, 16.0, 13.0, 15.0, 25.0, 34.0, 31.0, 61.0, 74.0, 100.0, 131.0, 194.0, 250.0, 406.0, 1159.0, 46636.0, 3089858.0, 4992.0, 582.0, 315.0, 175.0, 128.0, 117.0, 92.0, 66.0, 47.0, 36.0, 26.0, 23.0, 20.0, 18.0, 9.0, 9.0, 11.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-77.375, -75.1826171875, -72.990234375, -70.7978515625, -68.60546875, -66.4130859375, -64.220703125, -62.0283203125, -59.8359375, -57.6435546875, -55.451171875, -53.2587890625, -51.06640625, -48.8740234375, -46.681640625, -44.4892578125, -42.296875, -40.1044921875, -37.912109375, -35.7197265625, -33.52734375, -31.3349609375, -29.142578125, -26.9501953125, -24.7578125, -22.5654296875, -20.373046875, -18.1806640625, -15.98828125, -13.7958984375, -11.603515625, -9.4111328125, -7.21875, -5.0263671875, -2.833984375, -0.6416015625, 1.55078125, 3.7431640625, 5.935546875, 8.1279296875, 10.3203125, 12.5126953125, 14.705078125, 16.8974609375, 19.08984375, 21.2822265625, 23.474609375, 25.6669921875, 27.859375, 30.0517578125, 32.244140625, 34.4365234375, 36.62890625, 38.8212890625, 41.013671875, 43.2060546875, 45.3984375, 47.5908203125, 49.783203125, 51.9755859375, 54.16796875, 56.3603515625, 58.552734375, 60.7451171875, 62.9375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 22.0, 515.0, 465.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.35816764831543, -19.481565475463867, -14.604963302612305, -9.728361129760742, -4.85175895690918, 0.024843215942382812, 4.901445388793945, 9.778047561645508, 14.65464973449707, 19.531251907348633, 24.407854080200195, 29.284456253051758, 34.16105651855469, 39.03765869140625, 43.91426086425781, 48.790863037109375, 53.66746520996094, 58.5440673828125, 63.42066955566406, 68.29727172851562, 73.17387390136719, 78.05047607421875, 82.92707824707031, 87.80368041992188, 92.68028259277344, 97.556884765625, 102.43348693847656, 107.31008911132812, 112.18669128417969, 117.06329345703125, 121.93989562988281, 126.81649780273438, 131.693115234375, 136.56971740722656, 141.44631958007812, 146.3229217529297, 151.19952392578125, 156.0761260986328, 160.95272827148438, 165.82933044433594, 170.7059326171875, 175.58253479003906, 180.45913696289062, 185.3357391357422, 190.21234130859375, 195.0889434814453, 199.96554565429688, 204.84214782714844, 209.71875, 214.59535217285156, 219.47195434570312, 224.3485565185547, 229.22515869140625, 234.1017608642578, 238.97836303710938, 243.85496520996094, 248.7315673828125, 253.60816955566406, 258.4847717285156, 263.36138916015625, 268.23797607421875, 273.11456298828125, 277.9911804199219, 282.8677978515625, 287.744384765625]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 9.0, 7.0, 5.0, 8.0, 16.0, 8.0, 21.0, 20.0, 26.0, 15.0, 13.0, 37.0, 34.0, 48.0, 27.0, 41.0, 36.0, 25.0, 40.0, 46.0, 36.0, 50.0, 38.0, 38.0, 37.0, 44.0, 35.0, 30.0, 32.0, 28.0, 27.0, 19.0, 23.0, 13.0, 16.0, 18.0, 6.0, 5.0, 7.0, 5.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.71034240722656, -58.72969055175781, -56.74903869628906, -54.76838684082031, -52.7877311706543, -50.80707931518555, -48.8264274597168, -46.84577560424805, -44.8651237487793, -42.88447189331055, -40.9038200378418, -38.92316436767578, -36.94251251220703, -34.96186065673828, -32.98120880126953, -31.00055694580078, -29.0199031829834, -27.03925132751465, -25.058597564697266, -23.077945709228516, -21.097293853759766, -19.116641998291016, -17.135988235473633, -15.155336380004883, -13.174683570861816, -11.19403076171875, -9.21337890625, -7.232726097106934, -5.252073764801025, -3.271421432495117, -1.2907686233520508, 0.6898832321166992, 2.6705360412597656, 4.651188373565674, 6.631840705871582, 8.612493515014648, 10.593145370483398, 12.573798179626465, 14.554450988769531, 16.53510284423828, 18.51575469970703, 20.49640655517578, 22.477060317993164, 24.457712173461914, 26.438364028930664, 28.419017791748047, 30.399669647216797, 32.38032150268555, 34.36097717285156, 36.34162902832031, 38.32228088378906, 40.30293273925781, 42.28358840942383, 44.26424026489258, 46.24489212036133, 48.22554397583008, 50.20619583129883, 52.18684768676758, 54.16749954223633, 56.148155212402344, 58.128807067871094, 60.109458923339844, 62.090110778808594, 64.07076263427734, 66.0514144897461]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 5.0, 4.0, 10.0, 7.0, 6.0, 14.0, 5.0, 14.0, 17.0, 16.0, 29.0, 26.0, 29.0, 27.0, 41.0, 37.0, 32.0, 31.0, 40.0, 31.0, 27.0, 54.0, 59.0, 51.0, 39.0, 39.0, 36.0, 35.0, 27.0, 27.0, 28.0, 31.0, 19.0, 21.0, 11.0, 13.0, 10.0, 12.0, 9.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.328125, -9.0570068359375, -8.785888671875, -8.5147705078125, -8.24365234375, -7.9725341796875, -7.701416015625, -7.4302978515625, -7.1591796875, -6.8880615234375, -6.616943359375, -6.3458251953125, -6.07470703125, -5.8035888671875, -5.532470703125, -5.2613525390625, -4.990234375, -4.7191162109375, -4.447998046875, -4.1768798828125, -3.90576171875, -3.6346435546875, -3.363525390625, -3.0924072265625, -2.8212890625, -2.5501708984375, -2.279052734375, -2.0079345703125, -1.73681640625, -1.4656982421875, -1.194580078125, -0.9234619140625, -0.65234375, -0.3812255859375, -0.110107421875, 0.1610107421875, 0.43212890625, 0.7032470703125, 0.974365234375, 1.2454833984375, 1.5166015625, 1.7877197265625, 2.058837890625, 2.3299560546875, 2.60107421875, 2.8721923828125, 3.143310546875, 3.4144287109375, 3.685546875, 3.9566650390625, 4.227783203125, 4.4989013671875, 4.77001953125, 5.0411376953125, 5.312255859375, 5.5833740234375, 5.8544921875, 6.1256103515625, 6.396728515625, 6.6678466796875, 6.93896484375, 7.2100830078125, 7.481201171875, 7.7523193359375, 8.0234375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 10.0, 6.0, 7.0, 11.0, 11.0, 18.0, 14.0, 16.0, 25.0, 35.0, 39.0, 41.0, 80.0, 115.0, 234.0, 535.0, 1578.0, 6813.0, 72936.0, 2532796.0, 1532437.0, 39319.0, 4839.0, 1307.0, 439.0, 229.0, 96.0, 65.0, 42.0, 33.0, 25.0, 20.0, 15.0, 16.0, 13.0, 5.0, 12.0, 5.0, 10.0, 6.0, 8.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-31.234375, -30.33935546875, -29.4443359375, -28.54931640625, -27.654296875, -26.75927734375, -25.8642578125, -24.96923828125, -24.07421875, -23.17919921875, -22.2841796875, -21.38916015625, -20.494140625, -19.59912109375, -18.7041015625, -17.80908203125, -16.9140625, -16.01904296875, -15.1240234375, -14.22900390625, -13.333984375, -12.43896484375, -11.5439453125, -10.64892578125, -9.75390625, -8.85888671875, -7.9638671875, -7.06884765625, -6.173828125, -5.27880859375, -4.3837890625, -3.48876953125, -2.59375, -1.69873046875, -0.8037109375, 0.09130859375, 0.986328125, 1.88134765625, 2.7763671875, 3.67138671875, 4.56640625, 5.46142578125, 6.3564453125, 7.25146484375, 8.146484375, 9.04150390625, 9.9365234375, 10.83154296875, 11.7265625, 12.62158203125, 13.5166015625, 14.41162109375, 15.306640625, 16.20166015625, 17.0966796875, 17.99169921875, 18.88671875, 19.78173828125, 20.6767578125, 21.57177734375, 22.466796875, 23.36181640625, 24.2568359375, 25.15185546875, 26.046875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 8.0, 13.0, 26.0, 24.0, 36.0, 38.0, 52.0, 73.0, 118.0, 130.0, 185.0, 248.0, 336.0, 444.0, 468.0, 478.0, 312.0, 258.0, 183.0, 150.0, 103.0, 87.0, 70.0, 52.0, 40.0, 22.0, 21.0, 19.0, 14.0, 16.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.984375, -13.510986328125, -13.03759765625, -12.564208984375, -12.0908203125, -11.617431640625, -11.14404296875, -10.670654296875, -10.197265625, -9.723876953125, -9.25048828125, -8.777099609375, -8.3037109375, -7.830322265625, -7.35693359375, -6.883544921875, -6.41015625, -5.936767578125, -5.46337890625, -4.989990234375, -4.5166015625, -4.043212890625, -3.56982421875, -3.096435546875, -2.623046875, -2.149658203125, -1.67626953125, -1.202880859375, -0.7294921875, -0.256103515625, 0.21728515625, 0.690673828125, 1.1640625, 1.637451171875, 2.11083984375, 2.584228515625, 3.0576171875, 3.531005859375, 4.00439453125, 4.477783203125, 4.951171875, 5.424560546875, 5.89794921875, 6.371337890625, 6.8447265625, 7.318115234375, 7.79150390625, 8.264892578125, 8.73828125, 9.211669921875, 9.68505859375, 10.158447265625, 10.6318359375, 11.105224609375, 11.57861328125, 12.052001953125, 12.525390625, 12.998779296875, 13.47216796875, 13.945556640625, 14.4189453125, 14.892333984375, 15.36572265625, 15.839111328125, 16.3125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 3.0, 9.0, 5.0, 15.0, 12.0, 17.0, 20.0, 47.0, 50.0, 53.0, 47.0, 93.0, 114.0, 122.0, 164.0, 201.0, 290.0, 411.0, 1342.0, 37682.0, 4084989.0, 65278.0, 1656.0, 449.0, 312.0, 197.0, 145.0, 116.0, 107.0, 75.0, 60.0, 38.0, 37.0, 33.0, 29.0, 12.0, 12.0, 9.0, 9.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.8125, -87.2861328125, -84.759765625, -82.2333984375, -79.70703125, -77.1806640625, -74.654296875, -72.1279296875, -69.6015625, -67.0751953125, -64.548828125, -62.0224609375, -59.49609375, -56.9697265625, -54.443359375, -51.9169921875, -49.390625, -46.8642578125, -44.337890625, -41.8115234375, -39.28515625, -36.7587890625, -34.232421875, -31.7060546875, -29.1796875, -26.6533203125, -24.126953125, -21.6005859375, -19.07421875, -16.5478515625, -14.021484375, -11.4951171875, -8.96875, -6.4423828125, -3.916015625, -1.3896484375, 1.13671875, 3.6630859375, 6.189453125, 8.7158203125, 11.2421875, 13.7685546875, 16.294921875, 18.8212890625, 21.34765625, 23.8740234375, 26.400390625, 28.9267578125, 31.453125, 33.9794921875, 36.505859375, 39.0322265625, 41.55859375, 44.0849609375, 46.611328125, 49.1376953125, 51.6640625, 54.1904296875, 56.716796875, 59.2431640625, 61.76953125, 64.2958984375, 66.822265625, 69.3486328125, 71.875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 66.0, 278.0, 447.0, 188.0, 30.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.51374053955078, -62.92089080810547, -55.32804489135742, -47.735198974609375, -40.14234924316406, -32.54949951171875, -24.956653594970703, -17.363807678222656, -9.770957946777344, -2.178110122680664, 5.414737701416016, 13.007585525512695, 20.600433349609375, 28.193283081054688, 35.786128997802734, 43.37897491455078, 50.971824645996094, 58.564674377441406, 66.15751647949219, 73.7503662109375, 81.34321594238281, 88.93606567382812, 96.52891540527344, 104.12175750732422, 111.71460723876953, 119.30745697021484, 126.90029907226562, 134.49314880371094, 142.08599853515625, 149.67884826660156, 157.27169799804688, 164.86453247070312, 172.4573974609375, 180.0502471923828, 187.64309692382812, 195.23594665527344, 202.82879638671875, 210.421630859375, 218.0144805908203, 225.60733032226562, 233.20018005371094, 240.79302978515625, 248.38587951660156, 255.97872924804688, 263.5715637207031, 271.1644287109375, 278.75726318359375, 286.35009765625, 293.9429626464844, 301.5357971191406, 309.128662109375, 316.72149658203125, 324.3143615722656, 331.9071960449219, 339.50006103515625, 347.0928955078125, 354.68572998046875, 362.278564453125, 369.8714294433594, 377.4642639160156, 385.05712890625, 392.64996337890625, 400.2428283691406, 407.8356628417969, 415.42852783203125]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 4.0, 12.0, 9.0, 9.0, 14.0, 12.0, 14.0, 30.0, 15.0, 23.0, 33.0, 37.0, 37.0, 40.0, 40.0, 47.0, 37.0, 42.0, 34.0, 39.0, 32.0, 28.0, 42.0, 28.0, 40.0, 38.0, 29.0, 31.0, 26.0, 21.0, 30.0, 12.0, 21.0, 9.0, 19.0, 9.0, 7.0, 10.0, 6.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-48.150299072265625, -46.565155029296875, -44.98001480102539, -43.394874572753906, -41.809730529785156, -40.224586486816406, -38.63944625854492, -37.05430603027344, -35.46916198730469, -33.88401794433594, -32.29887771606445, -30.713735580444336, -29.12859344482422, -27.5434513092041, -25.958309173583984, -24.373167037963867, -22.78802490234375, -21.202882766723633, -19.617740631103516, -18.0325984954834, -16.44745635986328, -14.862314224243164, -13.277172088623047, -11.69202995300293, -10.106887817382812, -8.521745681762695, -6.936603546142578, -5.351461410522461, -3.7663192749023438, -2.1811771392822266, -0.5960350036621094, 0.9891071319580078, 2.574249267578125, 4.159391403198242, 5.744533538818359, 7.329675674438477, 8.914817810058594, 10.499959945678711, 12.085102081298828, 13.670244216918945, 15.255386352539062, 16.84052848815918, 18.425670623779297, 20.010812759399414, 21.59595489501953, 23.18109703063965, 24.766239166259766, 26.351381301879883, 27.9365234375, 29.521665573120117, 31.106807708740234, 32.69194793701172, 34.27709197998047, 35.86223602294922, 37.4473762512207, 39.03251647949219, 40.61766052246094, 42.20280456542969, 43.78794479370117, 45.373085021972656, 46.958229064941406, 48.543373107910156, 50.12851333618164, 51.713653564453125, 53.298797607421875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 6.0, 9.0, 6.0, 8.0, 9.0, 7.0, 15.0, 11.0, 23.0, 15.0, 20.0, 35.0, 19.0, 17.0, 28.0, 37.0, 31.0, 42.0, 31.0, 29.0, 54.0, 52.0, 30.0, 36.0, 45.0, 34.0, 41.0, 36.0, 35.0, 33.0, 29.0, 30.0, 23.0, 17.0, 13.0, 11.0, 11.0, 13.0, 11.0, 7.0, 9.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.140625, -7.8858642578125, -7.631103515625, -7.3763427734375, -7.12158203125, -6.8668212890625, -6.612060546875, -6.3572998046875, -6.1025390625, -5.8477783203125, -5.593017578125, -5.3382568359375, -5.08349609375, -4.8287353515625, -4.573974609375, -4.3192138671875, -4.064453125, -3.8096923828125, -3.554931640625, -3.3001708984375, -3.04541015625, -2.7906494140625, -2.535888671875, -2.2811279296875, -2.0263671875, -1.7716064453125, -1.516845703125, -1.2620849609375, -1.00732421875, -0.7525634765625, -0.497802734375, -0.2430419921875, 0.01171875, 0.2664794921875, 0.521240234375, 0.7760009765625, 1.03076171875, 1.2855224609375, 1.540283203125, 1.7950439453125, 2.0498046875, 2.3045654296875, 2.559326171875, 2.8140869140625, 3.06884765625, 3.3236083984375, 3.578369140625, 3.8331298828125, 4.087890625, 4.3426513671875, 4.597412109375, 4.8521728515625, 5.10693359375, 5.3616943359375, 5.616455078125, 5.8712158203125, 6.1259765625, 6.3807373046875, 6.635498046875, 6.8902587890625, 7.14501953125, 7.3997802734375, 7.654541015625, 7.9093017578125, 8.1640625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 10.0, 16.0, 19.0, 29.0, 51.0, 67.0, 76.0, 93.0, 136.0, 212.0, 297.0, 398.0, 513.0, 691.0, 958.0, 1374.0, 1985.0, 2589.0, 3720.0, 5329.0, 7517.0, 10778.0, 15736.0, 23843.0, 36419.0, 58869.0, 102515.0, 240046.0, 254520.0, 104484.0, 60507.0, 37075.0, 24172.0, 16086.0, 11110.0, 7481.0, 5467.0, 3767.0, 2683.0, 1901.0, 1367.0, 974.0, 726.0, 529.0, 400.0, 308.0, 210.0, 144.0, 99.0, 75.0, 63.0, 45.0, 27.0, 25.0, 13.0, 11.0, 7.0, 3.0, 0.0, 2.0], "bins": [-1.5576171875, -1.50897216796875, -1.4603271484375, -1.41168212890625, -1.363037109375, -1.31439208984375, -1.2657470703125, -1.21710205078125, -1.16845703125, -1.11981201171875, -1.0711669921875, -1.02252197265625, -0.973876953125, -0.92523193359375, -0.8765869140625, -0.82794189453125, -0.779296875, -0.73065185546875, -0.6820068359375, -0.63336181640625, -0.584716796875, -0.53607177734375, -0.4874267578125, -0.43878173828125, -0.39013671875, -0.34149169921875, -0.2928466796875, -0.24420166015625, -0.195556640625, -0.14691162109375, -0.0982666015625, -0.04962158203125, -0.0009765625, 0.04766845703125, 0.0963134765625, 0.14495849609375, 0.193603515625, 0.24224853515625, 0.2908935546875, 0.33953857421875, 0.38818359375, 0.43682861328125, 0.4854736328125, 0.53411865234375, 0.582763671875, 0.63140869140625, 0.6800537109375, 0.72869873046875, 0.77734375, 0.82598876953125, 0.8746337890625, 0.92327880859375, 0.971923828125, 1.02056884765625, 1.0692138671875, 1.11785888671875, 1.16650390625, 1.21514892578125, 1.2637939453125, 1.31243896484375, 1.361083984375, 1.40972900390625, 1.4583740234375, 1.50701904296875, 1.5556640625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 9.0, 17.0, 17.0, 29.0, 19.0, 22.0, 34.0, 25.0, 27.0, 39.0, 40.0, 44.0, 39.0, 49.0, 44.0, 1079.0, 37.0, 45.0, 40.0, 34.0, 38.0, 27.0, 38.0, 30.0, 28.0, 25.0, 24.0, 16.0, 15.0, 18.0, 14.0, 14.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.296875, -6.11444091796875, -5.9320068359375, -5.74957275390625, -5.567138671875, -5.38470458984375, -5.2022705078125, -5.01983642578125, -4.83740234375, -4.65496826171875, -4.4725341796875, -4.29010009765625, -4.107666015625, -3.92523193359375, -3.7427978515625, -3.56036376953125, -3.3779296875, -3.19549560546875, -3.0130615234375, -2.83062744140625, -2.648193359375, -2.46575927734375, -2.2833251953125, -2.10089111328125, -1.91845703125, -1.73602294921875, -1.5535888671875, -1.37115478515625, -1.188720703125, -1.00628662109375, -0.8238525390625, -0.64141845703125, -0.458984375, -0.27655029296875, -0.0941162109375, 0.08831787109375, 0.270751953125, 0.45318603515625, 0.6356201171875, 0.81805419921875, 1.00048828125, 1.18292236328125, 1.3653564453125, 1.54779052734375, 1.730224609375, 1.91265869140625, 2.0950927734375, 2.27752685546875, 2.4599609375, 2.64239501953125, 2.8248291015625, 3.00726318359375, 3.189697265625, 3.37213134765625, 3.5545654296875, 3.73699951171875, 3.91943359375, 4.10186767578125, 4.2843017578125, 4.46673583984375, 4.649169921875, 4.83160400390625, 5.0140380859375, 5.19647216796875, 5.37890625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 16.0, 20.0, 30.0, 54.0, 83.0, 112.0, 210.0, 309.0, 447.0, 709.0, 1125.0, 1926.0, 3151.0, 5217.0, 8647.0, 14430.0, 23797.0, 40985.0, 73058.0, 148535.0, 1430355.0, 160841.0, 77014.0, 43249.0, 24992.0, 14726.0, 8983.0, 5529.0, 3286.0, 1965.0, 1206.0, 759.0, 453.0, 311.0, 226.0, 136.0, 84.0, 51.0, 36.0, 23.0, 15.0, 11.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.1953125, -2.1317596435546875, -2.068206787109375, -2.0046539306640625, -1.94110107421875, -1.8775482177734375, -1.813995361328125, -1.7504425048828125, -1.6868896484375, -1.6233367919921875, -1.559783935546875, -1.4962310791015625, -1.43267822265625, -1.3691253662109375, -1.305572509765625, -1.2420196533203125, -1.178466796875, -1.1149139404296875, -1.051361083984375, -0.9878082275390625, -0.92425537109375, -0.8607025146484375, -0.797149658203125, -0.7335968017578125, -0.6700439453125, -0.6064910888671875, -0.542938232421875, -0.4793853759765625, -0.41583251953125, -0.3522796630859375, -0.288726806640625, -0.2251739501953125, -0.16162109375, -0.0980682373046875, -0.034515380859375, 0.0290374755859375, 0.09259033203125, 0.1561431884765625, 0.219696044921875, 0.2832489013671875, 0.3468017578125, 0.4103546142578125, 0.473907470703125, 0.5374603271484375, 0.60101318359375, 0.6645660400390625, 0.728118896484375, 0.7916717529296875, 0.855224609375, 0.9187774658203125, 0.982330322265625, 1.0458831787109375, 1.10943603515625, 1.1729888916015625, 1.236541748046875, 1.3000946044921875, 1.3636474609375, 1.4272003173828125, 1.490753173828125, 1.5543060302734375, 1.61785888671875, 1.6814117431640625, 1.744964599609375, 1.8085174560546875, 1.8720703125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 10.0, 10.0, 8.0, 11.0, 9.0, 17.0, 22.0, 29.0, 34.0, 30.0, 50.0, 75.0, 74.0, 100.0, 81.0, 77.0, 81.0, 63.0, 42.0, 43.0, 26.0, 22.0, 15.0, 9.0, 22.0, 8.0, 10.0, 3.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008649826049804688, -0.0008322298526763916, -0.0007994771003723145, -0.0007667243480682373, -0.0007339715957641602, -0.000701218843460083, -0.0006684660911560059, -0.0006357133388519287, -0.0006029605865478516, -0.0005702078342437744, -0.0005374550819396973, -0.0005047023296356201, -0.00047194957733154297, -0.0004391968250274658, -0.00040644407272338867, -0.0003736913204193115, -0.0003409385681152344, -0.0003081858158111572, -0.0002754330635070801, -0.00024268031120300293, -0.00020992755889892578, -0.00017717480659484863, -0.00014442205429077148, -0.00011166930198669434, -7.891654968261719e-05, -4.616379737854004e-05, -1.341104507446289e-05, 1.9341707229614258e-05, 5.2094459533691406e-05, 8.484721183776855e-05, 0.0001175999641418457, 0.00015035271644592285, 0.00018310546875, 0.00021585822105407715, 0.0002486109733581543, 0.00028136372566223145, 0.0003141164779663086, 0.00034686923027038574, 0.0003796219825744629, 0.00041237473487854004, 0.0004451274871826172, 0.00047788023948669434, 0.0005106329917907715, 0.0005433857440948486, 0.0005761384963989258, 0.0006088912487030029, 0.0006416440010070801, 0.0006743967533111572, 0.0007071495056152344, 0.0007399022579193115, 0.0007726550102233887, 0.0008054077625274658, 0.000838160514831543, 0.0008709132671356201, 0.0009036660194396973, 0.0009364187717437744, 0.0009691715240478516, 0.0010019242763519287, 0.0010346770286560059, 0.001067429780960083, 0.0011001825332641602, 0.0011329352855682373, 0.0011656880378723145, 0.0011984407901763916, 0.0012311935424804688]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 14.0, 5.0, 13.0, 14.0, 23.0, 7.0, 25.0, 30.0, 51.0, 59.0, 76.0, 105.0, 227.0, 509.0, 5362.0, 1032509.0, 8283.0, 545.0, 220.0, 146.0, 76.0, 61.0, 34.0, 39.0, 25.0, 20.0, 15.0, 11.0, 12.0, 11.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.026123046875, -0.02542710304260254, -0.024731159210205078, -0.024035215377807617, -0.023339271545410156, -0.022643327713012695, -0.021947383880615234, -0.021251440048217773, -0.020555496215820312, -0.01985955238342285, -0.01916360855102539, -0.01846766471862793, -0.01777172088623047, -0.017075777053833008, -0.016379833221435547, -0.015683889389038086, -0.014987945556640625, -0.014292001724243164, -0.013596057891845703, -0.012900114059448242, -0.012204170227050781, -0.01150822639465332, -0.01081228256225586, -0.010116338729858398, -0.009420394897460938, -0.008724451065063477, -0.008028507232666016, -0.007332563400268555, -0.006636619567871094, -0.005940675735473633, -0.005244731903076172, -0.004548788070678711, -0.00385284423828125, -0.003156900405883789, -0.002460956573486328, -0.0017650127410888672, -0.0010690689086914062, -0.0003731250762939453, 0.0003228187561035156, 0.0010187625885009766, 0.0017147064208984375, 0.0024106502532958984, 0.0031065940856933594, 0.0038025379180908203, 0.004498481750488281, 0.005194425582885742, 0.005890369415283203, 0.006586313247680664, 0.007282257080078125, 0.007978200912475586, 0.008674144744873047, 0.009370088577270508, 0.010066032409667969, 0.01076197624206543, 0.01145792007446289, 0.012153863906860352, 0.012849807739257812, 0.013545751571655273, 0.014241695404052734, 0.014937639236450195, 0.015633583068847656, 0.016329526901245117, 0.017025470733642578, 0.01772141456604004, 0.0184173583984375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 36.0, 119.0, 280.0, 292.0, 189.0, 58.0, 20.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019203094998374581, -0.0018758170772343874, -0.0018313246546313167, -0.001786832232028246, -0.0017423396930098534, -0.0016978472704067826, -0.0016533548478037119, -0.0016088624252006412, -0.0015643700025975704, -0.0015198775799944997, -0.001475385157391429, -0.0014308926183730364, -0.0013864001957699656, -0.001341907773166895, -0.0012974153505638242, -0.0012529229279607534, -0.0012084303889423609, -0.0011639379663392901, -0.0011194455437362194, -0.0010749530047178268, -0.001030460582114756, -0.0009859681595116854, -0.0009414757369086146, -0.0008969833143055439, -0.0008524908334948123, -0.0008079984108917415, -0.0007635059300810099, -0.0007190135074779391, -0.0006745210848748684, -0.0006300286040641367, -0.000585536181461066, -0.0005410437006503344, -0.0004965513362549245, -0.00045205888454802334, -0.00040756643284112215, -0.0003630740102380514, -0.0003185815585311502, -0.00027408910682424903, -0.0002295966842211783, -0.0001851042325142771, -0.0001406117808073759, -9.611933637643233e-05, -5.162689194548875e-05, -7.134454790502787e-06, 3.7357996916398406e-05, 8.18504486232996e-05, 0.00012634287122637033, 0.00017083532293327153, 0.00021532777464017272, 0.0002598202263470739, 0.0003043126780539751, 0.00034880510065704584, 0.00039329755236394703, 0.0004377900040708482, 0.00048228242667391896, 0.0005267749074846506, 0.0005712673300877213, 0.0006157597526907921, 0.0006602522335015237, 0.0007047446561045945, 0.0007492371369153261, 0.0007937295595183969, 0.0008382219821214676, 0.0008827144047245383, 0.00092720688553527]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 5.0, 4.0, 11.0, 8.0, 10.0, 15.0, 12.0, 23.0, 22.0, 24.0, 26.0, 19.0, 36.0, 43.0, 28.0, 32.0, 34.0, 51.0, 35.0, 45.0, 53.0, 27.0, 39.0, 53.0, 39.0, 41.0, 41.0, 30.0, 24.0, 23.0, 22.0, 22.0, 12.0, 12.0, 13.0, 20.0, 10.0, 11.0, 2.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004221200942993164, -0.0004078652709722519, -0.0003936104476451874, -0.00037935562431812286, -0.00036510080099105835, -0.00035084597766399384, -0.0003365911543369293, -0.0003223363310098648, -0.0003080815076828003, -0.0002938266843557358, -0.00027957186102867126, -0.00026531703770160675, -0.00025106221437454224, -0.00023680739104747772, -0.0002225525677204132, -0.0002082977443933487, -0.00019404292106628418, -0.00017978809773921967, -0.00016553327441215515, -0.00015127845108509064, -0.00013702362775802612, -0.0001227688044309616, -0.0001085139811038971, -9.425915777683258e-05, -8.000433444976807e-05, -6.574951112270355e-05, -5.149468779563904e-05, -3.7239864468574524e-05, -2.298504114151001e-05, -8.730217814445496e-06, 5.5246055126190186e-06, 1.9779428839683533e-05, 3.403425216674805e-05, 4.828907549381256e-05, 6.254389882087708e-05, 7.679872214794159e-05, 9.10535454750061e-05, 0.00010530836880207062, 0.00011956319212913513, 0.00013381801545619965, 0.00014807283878326416, 0.00016232766211032867, 0.0001765824854373932, 0.0001908373087644577, 0.00020509213209152222, 0.00021934695541858673, 0.00023360177874565125, 0.00024785660207271576, 0.0002621114253997803, 0.0002763662487268448, 0.0002906210720539093, 0.0003048758953809738, 0.00031913071870803833, 0.00033338554203510284, 0.00034764036536216736, 0.00036189518868923187, 0.0003761500120162964, 0.0003904048353433609, 0.0004046596586704254, 0.00041891448199748993, 0.00043316930532455444, 0.00044742412865161896, 0.00046167895197868347, 0.000475933775305748, 0.0004901885986328125]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 6.0, 9.0, 6.0, 8.0, 9.0, 7.0, 15.0, 11.0, 23.0, 15.0, 20.0, 35.0, 19.0, 17.0, 28.0, 37.0, 31.0, 42.0, 31.0, 29.0, 54.0, 52.0, 30.0, 37.0, 44.0, 34.0, 41.0, 36.0, 35.0, 33.0, 29.0, 30.0, 23.0, 17.0, 13.0, 11.0, 11.0, 13.0, 11.0, 7.0, 9.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.140625, -7.8858642578125, -7.631103515625, -7.3763427734375, -7.12158203125, -6.8668212890625, -6.612060546875, -6.3572998046875, -6.1025390625, -5.8477783203125, -5.593017578125, -5.3382568359375, -5.08349609375, -4.8287353515625, -4.573974609375, -4.3192138671875, -4.064453125, -3.8096923828125, -3.554931640625, -3.3001708984375, -3.04541015625, -2.7906494140625, -2.535888671875, -2.2811279296875, -2.0263671875, -1.7716064453125, -1.516845703125, -1.2620849609375, -1.00732421875, -0.7525634765625, -0.497802734375, -0.2430419921875, 0.01171875, 0.2664794921875, 0.521240234375, 0.7760009765625, 1.03076171875, 1.2855224609375, 1.540283203125, 1.7950439453125, 2.0498046875, 2.3045654296875, 2.559326171875, 2.8140869140625, 3.06884765625, 3.3236083984375, 3.578369140625, 3.8331298828125, 4.087890625, 4.3426513671875, 4.597412109375, 4.8521728515625, 5.10693359375, 5.3616943359375, 5.616455078125, 5.8712158203125, 6.1259765625, 6.3807373046875, 6.635498046875, 6.8902587890625, 7.14501953125, 7.3997802734375, 7.654541015625, 7.9093017578125, 8.1640625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 9.0, 21.0, 15.0, 17.0, 24.0, 33.0, 53.0, 59.0, 86.0, 128.0, 168.0, 256.0, 450.0, 839.0, 2031.0, 5728.0, 17539.0, 59880.0, 229520.0, 526430.0, 145619.0, 39880.0, 12320.0, 4108.0, 1603.0, 649.0, 352.0, 199.0, 120.0, 94.0, 69.0, 61.0, 47.0, 25.0, 21.0, 19.0, 19.0, 5.0, 16.0, 9.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.6796875, -9.38037109375, -9.0810546875, -8.78173828125, -8.482421875, -8.18310546875, -7.8837890625, -7.58447265625, -7.28515625, -6.98583984375, -6.6865234375, -6.38720703125, -6.087890625, -5.78857421875, -5.4892578125, -5.18994140625, -4.890625, -4.59130859375, -4.2919921875, -3.99267578125, -3.693359375, -3.39404296875, -3.0947265625, -2.79541015625, -2.49609375, -2.19677734375, -1.8974609375, -1.59814453125, -1.298828125, -0.99951171875, -0.7001953125, -0.40087890625, -0.1015625, 0.19775390625, 0.4970703125, 0.79638671875, 1.095703125, 1.39501953125, 1.6943359375, 1.99365234375, 2.29296875, 2.59228515625, 2.8916015625, 3.19091796875, 3.490234375, 3.78955078125, 4.0888671875, 4.38818359375, 4.6875, 4.98681640625, 5.2861328125, 5.58544921875, 5.884765625, 6.18408203125, 6.4833984375, 6.78271484375, 7.08203125, 7.38134765625, 7.6806640625, 7.97998046875, 8.279296875, 8.57861328125, 8.8779296875, 9.17724609375, 9.4765625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 8.0, 5.0, 10.0, 14.0, 8.0, 17.0, 10.0, 25.0, 30.0, 29.0, 38.0, 34.0, 30.0, 36.0, 33.0, 47.0, 62.0, 107.0, 354.0, 1567.0, 117.0, 61.0, 53.0, 34.0, 40.0, 37.0, 38.0, 30.0, 21.0, 16.0, 23.0, 15.0, 13.0, 16.0, 13.0, 13.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.171875, -21.436279296875, -20.70068359375, -19.965087890625, -19.2294921875, -18.493896484375, -17.75830078125, -17.022705078125, -16.287109375, -15.551513671875, -14.81591796875, -14.080322265625, -13.3447265625, -12.609130859375, -11.87353515625, -11.137939453125, -10.40234375, -9.666748046875, -8.93115234375, -8.195556640625, -7.4599609375, -6.724365234375, -5.98876953125, -5.253173828125, -4.517578125, -3.781982421875, -3.04638671875, -2.310791015625, -1.5751953125, -0.839599609375, -0.10400390625, 0.631591796875, 1.3671875, 2.102783203125, 2.83837890625, 3.573974609375, 4.3095703125, 5.045166015625, 5.78076171875, 6.516357421875, 7.251953125, 7.987548828125, 8.72314453125, 9.458740234375, 10.1943359375, 10.929931640625, 11.66552734375, 12.401123046875, 13.13671875, 13.872314453125, 14.60791015625, 15.343505859375, 16.0791015625, 16.814697265625, 17.55029296875, 18.285888671875, 19.021484375, 19.757080078125, 20.49267578125, 21.228271484375, 21.9638671875, 22.699462890625, 23.43505859375, 24.170654296875, 24.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 6.0, 12.0, 15.0, 26.0, 50.0, 65.0, 102.0, 188.0, 321.0, 697.0, 10494.0, 3128856.0, 3476.0, 581.0, 306.0, 173.0, 119.0, 60.0, 58.0, 30.0, 17.0, 12.0, 13.0, 9.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-110.625, -107.3125, -104.0, -100.6875, -97.375, -94.0625, -90.75, -87.4375, -84.125, -80.8125, -77.5, -74.1875, -70.875, -67.5625, -64.25, -60.9375, -57.625, -54.3125, -51.0, -47.6875, -44.375, -41.0625, -37.75, -34.4375, -31.125, -27.8125, -24.5, -21.1875, -17.875, -14.5625, -11.25, -7.9375, -4.625, -1.3125, 2.0, 5.3125, 8.625, 11.9375, 15.25, 18.5625, 21.875, 25.1875, 28.5, 31.8125, 35.125, 38.4375, 41.75, 45.0625, 48.375, 51.6875, 55.0, 58.3125, 61.625, 64.9375, 68.25, 71.5625, 74.875, 78.1875, 81.5, 84.8125, 88.125, 91.4375, 94.75, 98.0625, 101.375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 126.0, 678.0, 201.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-257.965087890625, -253.48416137695312, -249.0032501220703, -244.5223388671875, -240.04141235351562, -235.56048583984375, -231.07957458496094, -226.59866333007812, -222.11773681640625, -217.63681030273438, -213.15589904785156, -208.67498779296875, -204.19406127929688, -199.713134765625, -195.2322235107422, -190.75131225585938, -186.2703857421875, -181.78945922851562, -177.3085479736328, -172.82763671875, -168.34671020507812, -163.86578369140625, -159.38487243652344, -154.90396118164062, -150.42303466796875, -145.94210815429688, -141.46119689941406, -136.98028564453125, -132.49935913085938, -128.0184326171875, -123.53752136230469, -119.05660247802734, -114.57566833496094, -110.0947494506836, -105.61383056640625, -101.1329116821289, -96.65199279785156, -92.17107391357422, -87.69015502929688, -83.20923614501953, -78.72831726074219, -74.24739837646484, -69.7664794921875, -65.28556060791016, -60.80464172363281, -56.32372283935547, -51.842803955078125, -47.36188507080078, -42.88096618652344, -38.400047302246094, -33.91912841796875, -29.438209533691406, -24.957290649414062, -20.47637176513672, -15.995452880859375, -11.514533996582031, -7.0336151123046875, -2.5526962280273438, 1.92822265625, 6.409141540527344, 10.890060424804688, 15.370979309082031, 19.851898193359375, 24.33281707763672, 28.813735961914062]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 4.0, 10.0, 14.0, 14.0, 18.0, 18.0, 31.0, 33.0, 23.0, 35.0, 30.0, 32.0, 34.0, 38.0, 37.0, 44.0, 42.0, 40.0, 49.0, 56.0, 44.0, 41.0, 42.0, 41.0, 32.0, 31.0, 23.0, 24.0, 17.0, 25.0, 15.0, 16.0, 16.0, 7.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.27882385253906, -59.11931228637695, -56.959800720214844, -54.800289154052734, -52.640777587890625, -50.48126983642578, -48.32175827026367, -46.16224670410156, -44.00273513793945, -41.843223571777344, -39.683712005615234, -37.524200439453125, -35.36469268798828, -33.205177307128906, -31.045669555664062, -28.886157989501953, -26.726646423339844, -24.567134857177734, -22.407623291015625, -20.24811363220215, -18.08860206604004, -15.92909049987793, -13.769579887390137, -11.610069274902344, -9.450557708740234, -7.291046619415283, -5.131535530090332, -2.972024440765381, -0.8125133514404297, 1.3469982147216797, 3.5065088272094727, 5.666019439697266, 7.825538635253906, 9.985050201416016, 12.144560813903809, 14.304071426391602, 16.46358299255371, 18.62309455871582, 20.782604217529297, 22.942115783691406, 25.101627349853516, 27.261138916015625, 29.420650482177734, 31.58016014099121, 33.73966979980469, 35.89918518066406, 38.058692932128906, 40.218204498291016, 42.377716064453125, 44.537227630615234, 46.696739196777344, 48.85625076293945, 51.01576232910156, 53.175270080566406, 55.334781646728516, 57.494293212890625, 59.653804779052734, 61.813316345214844, 63.97282791137695, 66.13233947753906, 68.2918472290039, 70.45136260986328, 72.61087036132812, 74.7703857421875, 76.92989349365234]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 11.0, 7.0, 15.0, 15.0, 13.0, 24.0, 11.0, 17.0, 33.0, 22.0, 21.0, 29.0, 23.0, 29.0, 36.0, 28.0, 35.0, 51.0, 51.0, 50.0, 34.0, 41.0, 38.0, 34.0, 46.0, 36.0, 33.0, 30.0, 27.0, 27.0, 17.0, 14.0, 10.0, 10.0, 17.0, 9.0, 6.0, 11.0, 10.0, 2.0, 3.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -8.0078125, -7.7421875, -7.4765625, -7.2109375, -6.9453125, -6.6796875, -6.4140625, -6.1484375, -5.8828125, -5.6171875, -5.3515625, -5.0859375, -4.8203125, -4.5546875, -4.2890625, -4.0234375, -3.7578125, -3.4921875, -3.2265625, -2.9609375, -2.6953125, -2.4296875, -2.1640625, -1.8984375, -1.6328125, -1.3671875, -1.1015625, -0.8359375, -0.5703125, -0.3046875, -0.0390625, 0.2265625, 0.4921875, 0.7578125, 1.0234375, 1.2890625, 1.5546875, 1.8203125, 2.0859375, 2.3515625, 2.6171875, 2.8828125, 3.1484375, 3.4140625, 3.6796875, 3.9453125, 4.2109375, 4.4765625, 4.7421875, 5.0078125, 5.2734375, 5.5390625, 5.8046875, 6.0703125, 6.3359375, 6.6015625, 6.8671875, 7.1328125, 7.3984375, 7.6640625, 7.9296875, 8.1953125, 8.4609375, 8.7265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 11.0, 13.0, 10.0, 10.0, 18.0, 23.0, 24.0, 36.0, 46.0, 46.0, 73.0, 104.0, 132.0, 216.0, 391.0, 968.0, 2640.0, 12344.0, 183779.0, 3147061.0, 809546.0, 29125.0, 4750.0, 1387.0, 621.0, 267.0, 163.0, 120.0, 80.0, 53.0, 25.0, 33.0, 32.0, 19.0, 17.0, 18.0, 8.0, 10.0, 6.0, 5.0, 11.0, 0.0, 7.0, 6.0, 1.0, 0.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-26.828125, -25.981689453125, -25.13525390625, -24.288818359375, -23.4423828125, -22.595947265625, -21.74951171875, -20.903076171875, -20.056640625, -19.210205078125, -18.36376953125, -17.517333984375, -16.6708984375, -15.824462890625, -14.97802734375, -14.131591796875, -13.28515625, -12.438720703125, -11.59228515625, -10.745849609375, -9.8994140625, -9.052978515625, -8.20654296875, -7.360107421875, -6.513671875, -5.667236328125, -4.82080078125, -3.974365234375, -3.1279296875, -2.281494140625, -1.43505859375, -0.588623046875, 0.2578125, 1.104248046875, 1.95068359375, 2.797119140625, 3.6435546875, 4.489990234375, 5.33642578125, 6.182861328125, 7.029296875, 7.875732421875, 8.72216796875, 9.568603515625, 10.4150390625, 11.261474609375, 12.10791015625, 12.954345703125, 13.80078125, 14.647216796875, 15.49365234375, 16.340087890625, 17.1865234375, 18.032958984375, 18.87939453125, 19.725830078125, 20.572265625, 21.418701171875, 22.26513671875, 23.111572265625, 23.9580078125, 24.804443359375, 25.65087890625, 26.497314453125, 27.34375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 6.0, 7.0, 10.0, 9.0, 22.0, 26.0, 39.0, 40.0, 65.0, 78.0, 102.0, 142.0, 203.0, 238.0, 321.0, 382.0, 448.0, 431.0, 349.0, 232.0, 218.0, 174.0, 108.0, 82.0, 80.0, 65.0, 43.0, 25.0, 31.0, 20.0, 10.0, 12.0, 6.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-15.203125, -14.76416015625, -14.3251953125, -13.88623046875, -13.447265625, -13.00830078125, -12.5693359375, -12.13037109375, -11.69140625, -11.25244140625, -10.8134765625, -10.37451171875, -9.935546875, -9.49658203125, -9.0576171875, -8.61865234375, -8.1796875, -7.74072265625, -7.3017578125, -6.86279296875, -6.423828125, -5.98486328125, -5.5458984375, -5.10693359375, -4.66796875, -4.22900390625, -3.7900390625, -3.35107421875, -2.912109375, -2.47314453125, -2.0341796875, -1.59521484375, -1.15625, -0.71728515625, -0.2783203125, 0.16064453125, 0.599609375, 1.03857421875, 1.4775390625, 1.91650390625, 2.35546875, 2.79443359375, 3.2333984375, 3.67236328125, 4.111328125, 4.55029296875, 4.9892578125, 5.42822265625, 5.8671875, 6.30615234375, 6.7451171875, 7.18408203125, 7.623046875, 8.06201171875, 8.5009765625, 8.93994140625, 9.37890625, 9.81787109375, 10.2568359375, 10.69580078125, 11.134765625, 11.57373046875, 12.0126953125, 12.45166015625, 12.890625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 2.0, 7.0, 9.0, 11.0, 10.0, 9.0, 10.0, 17.0, 25.0, 33.0, 53.0, 51.0, 71.0, 94.0, 109.0, 156.0, 161.0, 202.0, 291.0, 448.0, 1801.0, 53407.0, 4080822.0, 53009.0, 1783.0, 503.0, 267.0, 206.0, 153.0, 150.0, 84.0, 79.0, 67.0, 37.0, 33.0, 31.0, 20.0, 14.0, 13.0, 8.0, 11.0, 9.0, 4.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.4375, -67.779296875, -65.12109375, -62.462890625, -59.8046875, -57.146484375, -54.48828125, -51.830078125, -49.171875, -46.513671875, -43.85546875, -41.197265625, -38.5390625, -35.880859375, -33.22265625, -30.564453125, -27.90625, -25.248046875, -22.58984375, -19.931640625, -17.2734375, -14.615234375, -11.95703125, -9.298828125, -6.640625, -3.982421875, -1.32421875, 1.333984375, 3.9921875, 6.650390625, 9.30859375, 11.966796875, 14.625, 17.283203125, 19.94140625, 22.599609375, 25.2578125, 27.916015625, 30.57421875, 33.232421875, 35.890625, 38.548828125, 41.20703125, 43.865234375, 46.5234375, 49.181640625, 51.83984375, 54.498046875, 57.15625, 59.814453125, 62.47265625, 65.130859375, 67.7890625, 70.447265625, 73.10546875, 75.763671875, 78.421875, 81.080078125, 83.73828125, 86.396484375, 89.0546875, 91.712890625, 94.37109375, 97.029296875, 99.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 25.0, 167.0, 404.0, 324.0, 88.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-347.5029602050781, -339.74420166015625, -331.9854431152344, -324.2266845703125, -316.4679260253906, -308.70916748046875, -300.95037841796875, -293.1916198730469, -285.432861328125, -277.6741027832031, -269.91534423828125, -262.1565856933594, -254.39781188964844, -246.63905334472656, -238.8802947998047, -231.1215362548828, -223.36277770996094, -215.60401916503906, -207.8452606201172, -200.08648681640625, -192.32772827148438, -184.5689697265625, -176.81021118164062, -169.05145263671875, -161.29269409179688, -153.533935546875, -145.77517700195312, -138.01641845703125, -130.2576446533203, -122.49888610839844, -114.74012756347656, -106.98136901855469, -99.22259521484375, -91.46383666992188, -83.70507049560547, -75.9463119506836, -68.18754577636719, -60.42878723144531, -52.67002868652344, -44.9112663269043, -37.152503967285156, -29.393741607666016, -21.634981155395508, -13.876220703125, -6.117458343505859, 1.6413040161132812, 9.400062561035156, 17.158824920654297, 24.917587280273438, 32.67634963989258, 40.43511199951172, 48.193870544433594, 55.952632904052734, 63.711395263671875, 71.47015380859375, 79.22891235351562, 86.98767852783203, 94.7464370727539, 102.50520324707031, 110.26396179199219, 118.02272033691406, 125.78148651123047, 133.54025268554688, 141.29901123046875, 149.05776977539062]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 12.0, 8.0, 11.0, 11.0, 10.0, 18.0, 18.0, 23.0, 24.0, 43.0, 33.0, 35.0, 40.0, 32.0, 38.0, 35.0, 48.0, 40.0, 53.0, 43.0, 53.0, 54.0, 50.0, 35.0, 38.0, 24.0, 20.0, 23.0, 17.0, 23.0, 17.0, 10.0, 10.0, 15.0, 8.0, 4.0, 6.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.57706832885742, -44.775665283203125, -42.97426223754883, -41.17285919189453, -39.3714599609375, -37.5700569152832, -35.768653869628906, -33.96725082397461, -32.16584777832031, -30.364444732666016, -28.56304359436035, -26.761640548706055, -24.96023941040039, -23.158836364746094, -21.357433319091797, -19.5560302734375, -17.75463104248047, -15.953228950500488, -14.151826858520508, -12.350423812866211, -10.54902172088623, -8.74761962890625, -6.946216583251953, -5.144814491271973, -3.343412399291992, -1.5420100688934326, 0.25939226150512695, 2.0607948303222656, 3.862196922302246, 5.663599014282227, 7.465002059936523, 9.266404151916504, 11.06781005859375, 12.86921215057373, 14.670614242553711, 16.472017288208008, 18.273418426513672, 20.07482147216797, 21.876224517822266, 23.677627563476562, 25.479028701782227, 27.280431747436523, 29.081832885742188, 30.883235931396484, 32.68463897705078, 34.48603820800781, 36.287445068359375, 38.088844299316406, 39.8902473449707, 41.691650390625, 43.4930534362793, 45.294456481933594, 47.095855712890625, 48.89725875854492, 50.69866180419922, 52.500064849853516, 54.30146789550781, 56.10287094116211, 57.904273986816406, 59.70567321777344, 61.507076263427734, 63.30847930908203, 65.10987854003906, 66.91128540039062, 68.71268463134766]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 5.0, 9.0, 14.0, 13.0, 18.0, 20.0, 16.0, 24.0, 22.0, 26.0, 34.0, 35.0, 25.0, 29.0, 36.0, 41.0, 39.0, 43.0, 47.0, 43.0, 37.0, 36.0, 34.0, 35.0, 47.0, 38.0, 27.0, 36.0, 27.0, 25.0, 22.0, 17.0, 7.0, 10.0, 8.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.0546875, -9.7713623046875, -9.488037109375, -9.2047119140625, -8.92138671875, -8.6380615234375, -8.354736328125, -8.0714111328125, -7.7880859375, -7.5047607421875, -7.221435546875, -6.9381103515625, -6.65478515625, -6.3714599609375, -6.088134765625, -5.8048095703125, -5.521484375, -5.2381591796875, -4.954833984375, -4.6715087890625, -4.38818359375, -4.1048583984375, -3.821533203125, -3.5382080078125, -3.2548828125, -2.9715576171875, -2.688232421875, -2.4049072265625, -2.12158203125, -1.8382568359375, -1.554931640625, -1.2716064453125, -0.98828125, -0.7049560546875, -0.421630859375, -0.1383056640625, 0.14501953125, 0.4283447265625, 0.711669921875, 0.9949951171875, 1.2783203125, 1.5616455078125, 1.844970703125, 2.1282958984375, 2.41162109375, 2.6949462890625, 2.978271484375, 3.2615966796875, 3.544921875, 3.8282470703125, 4.111572265625, 4.3948974609375, 4.67822265625, 4.9615478515625, 5.244873046875, 5.5281982421875, 5.8115234375, 6.0948486328125, 6.378173828125, 6.6614990234375, 6.94482421875, 7.2281494140625, 7.511474609375, 7.7947998046875, 8.078125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 12.0, 15.0, 30.0, 39.0, 59.0, 88.0, 133.0, 206.0, 304.0, 420.0, 654.0, 981.0, 1398.0, 2199.0, 3310.0, 5129.0, 7745.0, 11858.0, 19228.0, 31014.0, 51745.0, 91756.0, 199099.0, 330774.0, 120636.0, 65328.0, 38884.0, 23582.0, 14838.0, 9351.0, 6026.0, 3798.0, 2607.0, 1794.0, 1154.0, 801.0, 512.0, 367.0, 230.0, 151.0, 100.0, 72.0, 42.0, 37.0, 16.0, 11.0, 12.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.966796875, -1.9057464599609375, -1.844696044921875, -1.7836456298828125, -1.72259521484375, -1.6615447998046875, -1.600494384765625, -1.5394439697265625, -1.4783935546875, -1.4173431396484375, -1.356292724609375, -1.2952423095703125, -1.23419189453125, -1.1731414794921875, -1.112091064453125, -1.0510406494140625, -0.989990234375, -0.9289398193359375, -0.867889404296875, -0.8068389892578125, -0.74578857421875, -0.6847381591796875, -0.623687744140625, -0.5626373291015625, -0.5015869140625, -0.4405364990234375, -0.379486083984375, -0.3184356689453125, -0.25738525390625, -0.1963348388671875, -0.135284423828125, -0.0742340087890625, -0.01318359375, 0.0478668212890625, 0.108917236328125, 0.1699676513671875, 0.23101806640625, 0.2920684814453125, 0.353118896484375, 0.4141693115234375, 0.4752197265625, 0.5362701416015625, 0.597320556640625, 0.6583709716796875, 0.71942138671875, 0.7804718017578125, 0.841522216796875, 0.9025726318359375, 0.963623046875, 1.0246734619140625, 1.085723876953125, 1.1467742919921875, 1.20782470703125, 1.2688751220703125, 1.329925537109375, 1.3909759521484375, 1.4520263671875, 1.5130767822265625, 1.574127197265625, 1.6351776123046875, 1.69622802734375, 1.7572784423828125, 1.818328857421875, 1.8793792724609375, 1.9404296875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 11.0, 4.0, 9.0, 13.0, 8.0, 15.0, 12.0, 15.0, 24.0, 24.0, 33.0, 30.0, 28.0, 37.0, 53.0, 40.0, 35.0, 38.0, 44.0, 1062.0, 50.0, 52.0, 52.0, 42.0, 27.0, 34.0, 40.0, 30.0, 28.0, 32.0, 22.0, 16.0, 9.0, 9.0, 9.0, 11.0, 12.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7421875, -6.5482177734375, -6.354248046875, -6.1602783203125, -5.96630859375, -5.7723388671875, -5.578369140625, -5.3843994140625, -5.1904296875, -4.9964599609375, -4.802490234375, -4.6085205078125, -4.41455078125, -4.2205810546875, -4.026611328125, -3.8326416015625, -3.638671875, -3.4447021484375, -3.250732421875, -3.0567626953125, -2.86279296875, -2.6688232421875, -2.474853515625, -2.2808837890625, -2.0869140625, -1.8929443359375, -1.698974609375, -1.5050048828125, -1.31103515625, -1.1170654296875, -0.923095703125, -0.7291259765625, -0.53515625, -0.3411865234375, -0.147216796875, 0.0467529296875, 0.24072265625, 0.4346923828125, 0.628662109375, 0.8226318359375, 1.0166015625, 1.2105712890625, 1.404541015625, 1.5985107421875, 1.79248046875, 1.9864501953125, 2.180419921875, 2.3743896484375, 2.568359375, 2.7623291015625, 2.956298828125, 3.1502685546875, 3.34423828125, 3.5382080078125, 3.732177734375, 3.9261474609375, 4.1201171875, 4.3140869140625, 4.508056640625, 4.7020263671875, 4.89599609375, 5.0899658203125, 5.283935546875, 5.4779052734375, 5.671875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 6.0, 19.0, 22.0, 33.0, 63.0, 74.0, 156.0, 240.0, 364.0, 630.0, 1094.0, 1851.0, 2825.0, 4544.0, 7542.0, 12800.0, 21926.0, 37959.0, 69245.0, 140094.0, 1426779.0, 179072.0, 82209.0, 44383.0, 25698.0, 14832.0, 8843.0, 5335.0, 3276.0, 2014.0, 1286.0, 757.0, 474.0, 250.0, 165.0, 93.0, 63.0, 42.0, 22.0, 20.0, 11.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.2855682373046875, -2.217620849609375, -2.1496734619140625, -2.08172607421875, -2.0137786865234375, -1.945831298828125, -1.8778839111328125, -1.8099365234375, -1.7419891357421875, -1.674041748046875, -1.6060943603515625, -1.53814697265625, -1.4701995849609375, -1.402252197265625, -1.3343048095703125, -1.266357421875, -1.1984100341796875, -1.130462646484375, -1.0625152587890625, -0.99456787109375, -0.9266204833984375, -0.858673095703125, -0.7907257080078125, -0.7227783203125, -0.6548309326171875, -0.586883544921875, -0.5189361572265625, -0.45098876953125, -0.3830413818359375, -0.315093994140625, -0.2471466064453125, -0.17919921875, -0.1112518310546875, -0.043304443359375, 0.0246429443359375, 0.09259033203125, 0.1605377197265625, 0.228485107421875, 0.2964324951171875, 0.3643798828125, 0.4323272705078125, 0.500274658203125, 0.5682220458984375, 0.63616943359375, 0.7041168212890625, 0.772064208984375, 0.8400115966796875, 0.907958984375, 0.9759063720703125, 1.043853759765625, 1.1118011474609375, 1.17974853515625, 1.2476959228515625, 1.315643310546875, 1.3835906982421875, 1.4515380859375, 1.5194854736328125, 1.587432861328125, 1.6553802490234375, 1.72332763671875, 1.7912750244140625, 1.859222412109375, 1.9271697998046875, 1.9951171875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 10.0, 4.0, 8.0, 10.0, 13.0, 7.0, 26.0, 16.0, 34.0, 34.0, 54.0, 80.0, 82.0, 111.0, 113.0, 94.0, 73.0, 47.0, 30.0, 35.0, 17.0, 15.0, 17.0, 5.0, 18.0, 7.0, 9.0, 7.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0009708404541015625, -0.0009403228759765625, -0.0009098052978515625, -0.0008792877197265625, -0.0008487701416015625, -0.0008182525634765625, -0.0007877349853515625, -0.0007572174072265625, -0.0007266998291015625, -0.0006961822509765625, -0.0006656646728515625, -0.0006351470947265625, -0.0006046295166015625, -0.0005741119384765625, -0.0005435943603515625, -0.0005130767822265625, -0.0004825592041015625, -0.0004520416259765625, -0.0004215240478515625, -0.0003910064697265625, -0.0003604888916015625, -0.0003299713134765625, -0.0002994537353515625, -0.0002689361572265625, -0.0002384185791015625, -0.0002079010009765625, -0.0001773834228515625, -0.0001468658447265625, -0.0001163482666015625, -8.58306884765625e-05, -5.53131103515625e-05, -2.47955322265625e-05, 5.7220458984375e-06, 3.62396240234375e-05, 6.67572021484375e-05, 9.72747802734375e-05, 0.0001277923583984375, 0.0001583099365234375, 0.0001888275146484375, 0.0002193450927734375, 0.0002498626708984375, 0.0002803802490234375, 0.0003108978271484375, 0.0003414154052734375, 0.0003719329833984375, 0.0004024505615234375, 0.0004329681396484375, 0.0004634857177734375, 0.0004940032958984375, 0.0005245208740234375, 0.0005550384521484375, 0.0005855560302734375, 0.0006160736083984375, 0.0006465911865234375, 0.0006771087646484375, 0.0007076263427734375, 0.0007381439208984375, 0.0007686614990234375, 0.0007991790771484375, 0.0008296966552734375, 0.0008602142333984375, 0.0008907318115234375, 0.0009212493896484375, 0.0009517669677734375, 0.0009822845458984375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 10.0, 13.0, 10.0, 10.0, 13.0, 14.0, 22.0, 33.0, 38.0, 56.0, 89.0, 122.0, 222.0, 615.0, 15836.0, 1027355.0, 3137.0, 399.0, 170.0, 118.0, 69.0, 43.0, 35.0, 27.0, 16.0, 11.0, 7.0, 17.0, 6.0, 3.0, 7.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0214691162109375, -0.020805835723876953, -0.020142555236816406, -0.01947927474975586, -0.018815994262695312, -0.018152713775634766, -0.01748943328857422, -0.016826152801513672, -0.016162872314453125, -0.015499591827392578, -0.014836311340332031, -0.014173030853271484, -0.013509750366210938, -0.01284646987915039, -0.012183189392089844, -0.011519908905029297, -0.01085662841796875, -0.010193347930908203, -0.009530067443847656, -0.00886678695678711, -0.008203506469726562, -0.007540225982666016, -0.006876945495605469, -0.006213665008544922, -0.005550384521484375, -0.004887104034423828, -0.004223823547363281, -0.0035605430603027344, -0.0028972625732421875, -0.0022339820861816406, -0.0015707015991210938, -0.0009074211120605469, -0.000244140625, 0.0004191398620605469, 0.0010824203491210938, 0.0017457008361816406, 0.0024089813232421875, 0.0030722618103027344, 0.0037355422973632812, 0.004398822784423828, 0.005062103271484375, 0.005725383758544922, 0.006388664245605469, 0.007051944732666016, 0.0077152252197265625, 0.00837850570678711, 0.009041786193847656, 0.009705066680908203, 0.01036834716796875, 0.011031627655029297, 0.011694908142089844, 0.01235818862915039, 0.013021469116210938, 0.013684749603271484, 0.014348030090332031, 0.015011310577392578, 0.015674591064453125, 0.016337871551513672, 0.01700115203857422, 0.017664432525634766, 0.018327713012695312, 0.01899099349975586, 0.019654273986816406, 0.020317554473876953, 0.0209808349609375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 24.0, 115.0, 267.0, 374.0, 167.0, 52.0, 11.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.002958074677735567, -0.0029054125770926476, -0.0028527502436190844, -0.002800088142976165, -0.0027474258095026016, -0.002694763708859682, -0.002642101375386119, -0.0025894392747431993, -0.002536776941269636, -0.0024841148406267166, -0.0024314525071531534, -0.002378790406510234, -0.0023261280730366707, -0.002273465972393751, -0.002220803638920188, -0.0021681415382772684, -0.002115479437634349, -0.0020628173369914293, -0.002010155003517866, -0.0019574929028749466, -0.0019048305694013834, -0.0018521684687584639, -0.0017995061352849007, -0.0017468440346419811, -0.001694181701168418, -0.0016415194841101766, -0.0015888572670519352, -0.0015361950499936938, -0.0014835328329354525, -0.001430870732292533, -0.0013782083988189697, -0.0013255462981760502, -0.0012728840811178088, -0.0012202218640595675, -0.001167559647001326, -0.0011148974299430847, -0.0010622352128848433, -0.001009572995826602, -0.0009569108369760215, -0.0009042486781254411, -0.0008515864028595388, -0.0007989241858012974, -0.0007462619687430561, -0.0006935998098924756, -0.0006409375928342342, -0.0005882753757759929, -0.0005356131587177515, -0.0004829509707633406, -0.0004302887537050992, -0.00037762653664685786, -0.00032496434869244695, -0.0002723021316342056, -0.00021963992912787944, -0.0001669777266215533, -0.00011431550956331193, -6.165332160890102e-05, -8.991104550659657e-06, 4.367110159364529e-05, 9.633330773795024e-05, 0.000148995517520234, 0.00020165772002656013, 0.00025431992253288627, 0.00030698213959112763, 0.00035964432754553854, 0.0004123065446037799]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 3.0, 8.0, 6.0, 14.0, 10.0, 12.0, 22.0, 15.0, 23.0, 29.0, 33.0, 36.0, 36.0, 34.0, 44.0, 39.0, 52.0, 41.0, 48.0, 42.0, 35.0, 47.0, 43.0, 40.0, 33.0, 28.0, 33.0, 28.0, 32.0, 21.0, 21.0, 13.0, 18.0, 8.0, 13.0, 4.0, 6.0, 4.0, 7.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042116641998291016, -0.000407366082072258, -0.00039356574416160583, -0.0003797654062509537, -0.0003659650683403015, -0.00035216473042964935, -0.0003383643925189972, -0.00032456405460834503, -0.00031076371669769287, -0.0002969633787870407, -0.00028316304087638855, -0.0002693627029657364, -0.00025556236505508423, -0.00024176202714443207, -0.0002279616892337799, -0.00021416135132312775, -0.00020036101341247559, -0.00018656067550182343, -0.00017276033759117126, -0.0001589599996805191, -0.00014515966176986694, -0.00013135932385921478, -0.00011755898594856262, -0.00010375864803791046, -8.99583101272583e-05, -7.615797221660614e-05, -6.235763430595398e-05, -4.855729639530182e-05, -3.475695848464966e-05, -2.0956620573997498e-05, -7.156282663345337e-06, 6.644055247306824e-06, 2.0444393157958984e-05, 3.4244731068611145e-05, 4.8045068979263306e-05, 6.184540688991547e-05, 7.564574480056763e-05, 8.944608271121979e-05, 0.00010324642062187195, 0.00011704675853252411, 0.00013084709644317627, 0.00014464743435382843, 0.0001584477722644806, 0.00017224811017513275, 0.0001860484480857849, 0.00019984878599643707, 0.00021364912390708923, 0.0002274494618177414, 0.00024124979972839355, 0.0002550501376390457, 0.0002688504755496979, 0.00028265081346035004, 0.0002964511513710022, 0.00031025148928165436, 0.0003240518271923065, 0.0003378521651029587, 0.00035165250301361084, 0.000365452840924263, 0.00037925317883491516, 0.0003930535167455673, 0.0004068538546562195, 0.00042065419256687164, 0.0004344545304775238, 0.00044825486838817596, 0.0004620552062988281]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 5.0, 9.0, 14.0, 13.0, 18.0, 20.0, 16.0, 24.0, 22.0, 26.0, 34.0, 35.0, 25.0, 29.0, 36.0, 41.0, 39.0, 43.0, 47.0, 43.0, 37.0, 36.0, 34.0, 35.0, 47.0, 38.0, 27.0, 36.0, 27.0, 25.0, 22.0, 17.0, 7.0, 10.0, 8.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.0546875, -9.7713623046875, -9.488037109375, -9.2047119140625, -8.92138671875, -8.6380615234375, -8.354736328125, -8.0714111328125, -7.7880859375, -7.5047607421875, -7.221435546875, -6.9381103515625, -6.65478515625, -6.3714599609375, -6.088134765625, -5.8048095703125, -5.521484375, -5.2381591796875, -4.954833984375, -4.6715087890625, -4.38818359375, -4.1048583984375, -3.821533203125, -3.5382080078125, -3.2548828125, -2.9715576171875, -2.688232421875, -2.4049072265625, -2.12158203125, -1.8382568359375, -1.554931640625, -1.2716064453125, -0.98828125, -0.7049560546875, -0.421630859375, -0.1383056640625, 0.14501953125, 0.4283447265625, 0.711669921875, 0.9949951171875, 1.2783203125, 1.5616455078125, 1.844970703125, 2.1282958984375, 2.41162109375, 2.6949462890625, 2.978271484375, 3.2615966796875, 3.544921875, 3.8282470703125, 4.111572265625, 4.3948974609375, 4.67822265625, 4.9615478515625, 5.244873046875, 5.5281982421875, 5.8115234375, 6.0948486328125, 6.378173828125, 6.6614990234375, 6.94482421875, 7.2281494140625, 7.511474609375, 7.7947998046875, 8.078125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 4.0, 9.0, 11.0, 13.0, 17.0, 27.0, 28.0, 36.0, 34.0, 61.0, 75.0, 109.0, 135.0, 245.0, 333.0, 665.0, 1423.0, 3895.0, 17873.0, 141884.0, 748014.0, 112120.0, 14988.0, 3502.0, 1245.0, 625.0, 387.0, 238.0, 143.0, 99.0, 77.0, 61.0, 43.0, 29.0, 22.0, 20.0, 12.0, 19.0, 4.0, 8.0, 3.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.546875, -18.023681640625, -17.50048828125, -16.977294921875, -16.4541015625, -15.930908203125, -15.40771484375, -14.884521484375, -14.361328125, -13.838134765625, -13.31494140625, -12.791748046875, -12.2685546875, -11.745361328125, -11.22216796875, -10.698974609375, -10.17578125, -9.652587890625, -9.12939453125, -8.606201171875, -8.0830078125, -7.559814453125, -7.03662109375, -6.513427734375, -5.990234375, -5.467041015625, -4.94384765625, -4.420654296875, -3.8974609375, -3.374267578125, -2.85107421875, -2.327880859375, -1.8046875, -1.281494140625, -0.75830078125, -0.235107421875, 0.2880859375, 0.811279296875, 1.33447265625, 1.857666015625, 2.380859375, 2.904052734375, 3.42724609375, 3.950439453125, 4.4736328125, 4.996826171875, 5.52001953125, 6.043212890625, 6.56640625, 7.089599609375, 7.61279296875, 8.135986328125, 8.6591796875, 9.182373046875, 9.70556640625, 10.228759765625, 10.751953125, 11.275146484375, 11.79833984375, 12.321533203125, 12.8447265625, 13.367919921875, 13.89111328125, 14.414306640625, 14.9375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 4.0, 7.0, 9.0, 7.0, 9.0, 18.0, 18.0, 24.0, 26.0, 28.0, 35.0, 38.0, 29.0, 42.0, 52.0, 64.0, 84.0, 240.0, 1632.0, 181.0, 75.0, 48.0, 49.0, 50.0, 34.0, 33.0, 39.0, 30.0, 25.0, 25.0, 20.0, 14.0, 12.0, 5.0, 9.0, 8.0, 7.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.84375, -24.96240234375, -24.0810546875, -23.19970703125, -22.318359375, -21.43701171875, -20.5556640625, -19.67431640625, -18.79296875, -17.91162109375, -17.0302734375, -16.14892578125, -15.267578125, -14.38623046875, -13.5048828125, -12.62353515625, -11.7421875, -10.86083984375, -9.9794921875, -9.09814453125, -8.216796875, -7.33544921875, -6.4541015625, -5.57275390625, -4.69140625, -3.81005859375, -2.9287109375, -2.04736328125, -1.166015625, -0.28466796875, 0.5966796875, 1.47802734375, 2.359375, 3.24072265625, 4.1220703125, 5.00341796875, 5.884765625, 6.76611328125, 7.6474609375, 8.52880859375, 9.41015625, 10.29150390625, 11.1728515625, 12.05419921875, 12.935546875, 13.81689453125, 14.6982421875, 15.57958984375, 16.4609375, 17.34228515625, 18.2236328125, 19.10498046875, 19.986328125, 20.86767578125, 21.7490234375, 22.63037109375, 23.51171875, 24.39306640625, 25.2744140625, 26.15576171875, 27.037109375, 27.91845703125, 28.7998046875, 29.68115234375, 30.5625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 7.0, 8.0, 11.0, 10.0, 12.0, 18.0, 21.0, 25.0, 28.0, 40.0, 53.0, 43.0, 78.0, 121.0, 191.0, 308.0, 768.0, 8611.0, 3112821.0, 20556.0, 966.0, 330.0, 192.0, 107.0, 96.0, 51.0, 50.0, 31.0, 32.0, 30.0, 23.0, 13.0, 8.0, 12.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-92.75, -90.068359375, -87.38671875, -84.705078125, -82.0234375, -79.341796875, -76.66015625, -73.978515625, -71.296875, -68.615234375, -65.93359375, -63.251953125, -60.5703125, -57.888671875, -55.20703125, -52.525390625, -49.84375, -47.162109375, -44.48046875, -41.798828125, -39.1171875, -36.435546875, -33.75390625, -31.072265625, -28.390625, -25.708984375, -23.02734375, -20.345703125, -17.6640625, -14.982421875, -12.30078125, -9.619140625, -6.9375, -4.255859375, -1.57421875, 1.107421875, 3.7890625, 6.470703125, 9.15234375, 11.833984375, 14.515625, 17.197265625, 19.87890625, 22.560546875, 25.2421875, 27.923828125, 30.60546875, 33.287109375, 35.96875, 38.650390625, 41.33203125, 44.013671875, 46.6953125, 49.376953125, 52.05859375, 54.740234375, 57.421875, 60.103515625, 62.78515625, 65.466796875, 68.1484375, 70.830078125, 73.51171875, 76.193359375, 78.875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 38.0, 288.0, 545.0, 134.0, 13.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.62013244628906, -151.75836181640625, -147.89659118652344, -144.03482055664062, -140.1730499267578, -136.311279296875, -132.4495086669922, -128.58773803710938, -124.72596740722656, -120.86419677734375, -117.00242614746094, -113.14065551757812, -109.27888488769531, -105.4171142578125, -101.55534362792969, -97.69357299804688, -93.83180236816406, -89.97003173828125, -86.10826110839844, -82.24649047851562, -78.38471984863281, -74.52294921875, -70.66117858886719, -66.79940795898438, -62.93763732910156, -59.07586669921875, -55.21409606933594, -51.352325439453125, -47.49055480957031, -43.6287841796875, -39.76701354980469, -35.905242919921875, -32.04346466064453, -28.18169403076172, -24.319923400878906, -20.458152770996094, -16.59638214111328, -12.734611511230469, -8.872840881347656, -5.011070251464844, -1.1492996215820312, 2.7124710083007812, 6.574241638183594, 10.436012268066406, 14.297782897949219, 18.15955352783203, 22.021324157714844, 25.883094787597656, 29.74486541748047, 33.60663604736328, 37.468406677246094, 41.330177307128906, 45.19194793701172, 49.05371856689453, 52.915489196777344, 56.777259826660156, 60.63903045654297, 64.50080108642578, 68.3625717163086, 72.2243423461914, 76.08611297607422, 79.94788360595703, 83.80965423583984, 87.67142486572266, 91.53319549560547]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 12.0, 8.0, 14.0, 20.0, 24.0, 16.0, 22.0, 31.0, 26.0, 34.0, 29.0, 36.0, 37.0, 43.0, 50.0, 41.0, 46.0, 41.0, 39.0, 40.0, 42.0, 36.0, 24.0, 45.0, 29.0, 22.0, 28.0, 25.0, 17.0, 17.0, 15.0, 12.0, 13.0, 13.0, 9.0, 9.0, 6.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.28752899169922, -77.75121307373047, -75.21489715576172, -72.67858123779297, -70.14226531982422, -67.60594940185547, -65.06963348388672, -62.53331756591797, -59.99700164794922, -57.46068572998047, -54.92436981201172, -52.38805389404297, -49.85173797607422, -47.31542205810547, -44.77910614013672, -42.24279022216797, -39.70647430419922, -37.17015838623047, -34.63384246826172, -32.09752655029297, -29.56121063232422, -27.02489471435547, -24.48857879638672, -21.95226287841797, -19.41594696044922, -16.87963104248047, -14.343315124511719, -11.806999206542969, -9.270683288574219, -6.734367370605469, -4.198051452636719, -1.6617355346679688, 0.8745803833007812, 3.4108963012695312, 5.947212219238281, 8.483528137207031, 11.019844055175781, 13.556159973144531, 16.09247589111328, 18.62879180908203, 21.16510772705078, 23.70142364501953, 26.23773956298828, 28.77405548095703, 31.31037139892578, 33.84668731689453, 36.38300323486328, 38.91931915283203, 41.45563507080078, 43.99195098876953, 46.52826690673828, 49.06458282470703, 51.60089874267578, 54.13721466064453, 56.67353057861328, 59.20984649658203, 61.74616241455078, 64.28247833251953, 66.81879425048828, 69.35511016845703, 71.89142608642578, 74.42774200439453, 76.96405792236328, 79.50037384033203, 82.03668975830078]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 5.0, 10.0, 9.0, 19.0, 14.0, 13.0, 17.0, 24.0, 23.0, 33.0, 22.0, 30.0, 31.0, 48.0, 39.0, 35.0, 37.0, 38.0, 49.0, 45.0, 38.0, 47.0, 40.0, 48.0, 40.0, 29.0, 26.0, 30.0, 35.0, 12.0, 22.0, 23.0, 10.0, 9.0, 6.0, 14.0, 2.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.9921875, -10.683837890625, -10.37548828125, -10.067138671875, -9.7587890625, -9.450439453125, -9.14208984375, -8.833740234375, -8.525390625, -8.217041015625, -7.90869140625, -7.600341796875, -7.2919921875, -6.983642578125, -6.67529296875, -6.366943359375, -6.05859375, -5.750244140625, -5.44189453125, -5.133544921875, -4.8251953125, -4.516845703125, -4.20849609375, -3.900146484375, -3.591796875, -3.283447265625, -2.97509765625, -2.666748046875, -2.3583984375, -2.050048828125, -1.74169921875, -1.433349609375, -1.125, -0.816650390625, -0.50830078125, -0.199951171875, 0.1083984375, 0.416748046875, 0.72509765625, 1.033447265625, 1.341796875, 1.650146484375, 1.95849609375, 2.266845703125, 2.5751953125, 2.883544921875, 3.19189453125, 3.500244140625, 3.80859375, 4.116943359375, 4.42529296875, 4.733642578125, 5.0419921875, 5.350341796875, 5.65869140625, 5.967041015625, 6.275390625, 6.583740234375, 6.89208984375, 7.200439453125, 7.5087890625, 7.817138671875, 8.12548828125, 8.433837890625, 8.7421875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 11.0, 6.0, 8.0, 12.0, 18.0, 16.0, 26.0, 65.0, 74.0, 83.0, 138.0, 211.0, 330.0, 590.0, 1118.0, 2107.0, 4494.0, 10586.0, 30032.0, 125737.0, 645829.0, 1747614.0, 1224016.0, 307265.0, 62213.0, 17958.0, 7062.0, 3128.0, 1508.0, 783.0, 451.0, 291.0, 154.0, 101.0, 80.0, 45.0, 39.0, 23.0, 22.0, 10.0, 4.0, 9.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0], "bins": [-15.078125, -14.66796875, -14.2578125, -13.84765625, -13.4375, -13.02734375, -12.6171875, -12.20703125, -11.796875, -11.38671875, -10.9765625, -10.56640625, -10.15625, -9.74609375, -9.3359375, -8.92578125, -8.515625, -8.10546875, -7.6953125, -7.28515625, -6.875, -6.46484375, -6.0546875, -5.64453125, -5.234375, -4.82421875, -4.4140625, -4.00390625, -3.59375, -3.18359375, -2.7734375, -2.36328125, -1.953125, -1.54296875, -1.1328125, -0.72265625, -0.3125, 0.09765625, 0.5078125, 0.91796875, 1.328125, 1.73828125, 2.1484375, 2.55859375, 2.96875, 3.37890625, 3.7890625, 4.19921875, 4.609375, 5.01953125, 5.4296875, 5.83984375, 6.25, 6.66015625, 7.0703125, 7.48046875, 7.890625, 8.30078125, 8.7109375, 9.12109375, 9.53125, 9.94140625, 10.3515625, 10.76171875, 11.171875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 7.0, 8.0, 5.0, 8.0, 9.0, 17.0, 13.0, 29.0, 27.0, 49.0, 82.0, 73.0, 98.0, 136.0, 163.0, 217.0, 287.0, 359.0, 426.0, 412.0, 364.0, 268.0, 232.0, 170.0, 165.0, 126.0, 87.0, 54.0, 39.0, 32.0, 33.0, 17.0, 11.0, 11.0, 11.0, 9.0, 7.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.1015625, -14.6002197265625, -14.098876953125, -13.5975341796875, -13.09619140625, -12.5948486328125, -12.093505859375, -11.5921630859375, -11.0908203125, -10.5894775390625, -10.088134765625, -9.5867919921875, -9.08544921875, -8.5841064453125, -8.082763671875, -7.5814208984375, -7.080078125, -6.5787353515625, -6.077392578125, -5.5760498046875, -5.07470703125, -4.5733642578125, -4.072021484375, -3.5706787109375, -3.0693359375, -2.5679931640625, -2.066650390625, -1.5653076171875, -1.06396484375, -0.5626220703125, -0.061279296875, 0.4400634765625, 0.94140625, 1.4427490234375, 1.944091796875, 2.4454345703125, 2.94677734375, 3.4481201171875, 3.949462890625, 4.4508056640625, 4.9521484375, 5.4534912109375, 5.954833984375, 6.4561767578125, 6.95751953125, 7.4588623046875, 7.960205078125, 8.4615478515625, 8.962890625, 9.4642333984375, 9.965576171875, 10.4669189453125, 10.96826171875, 11.4696044921875, 11.970947265625, 12.4722900390625, 12.9736328125, 13.4749755859375, 13.976318359375, 14.4776611328125, 14.97900390625, 15.4803466796875, 15.981689453125, 16.4830322265625, 16.984375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 2.0, 8.0, 9.0, 22.0, 22.0, 24.0, 27.0, 40.0, 52.0, 57.0, 78.0, 86.0, 110.0, 145.0, 181.0, 257.0, 325.0, 530.0, 1239.0, 10676.0, 1123397.0, 3034870.0, 18248.0, 1687.0, 603.0, 346.0, 252.0, 198.0, 153.0, 140.0, 95.0, 86.0, 77.0, 57.0, 44.0, 28.0, 23.0, 24.0, 18.0, 14.0, 9.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-78.1875, -76.0791015625, -73.970703125, -71.8623046875, -69.75390625, -67.6455078125, -65.537109375, -63.4287109375, -61.3203125, -59.2119140625, -57.103515625, -54.9951171875, -52.88671875, -50.7783203125, -48.669921875, -46.5615234375, -44.453125, -42.3447265625, -40.236328125, -38.1279296875, -36.01953125, -33.9111328125, -31.802734375, -29.6943359375, -27.5859375, -25.4775390625, -23.369140625, -21.2607421875, -19.15234375, -17.0439453125, -14.935546875, -12.8271484375, -10.71875, -8.6103515625, -6.501953125, -4.3935546875, -2.28515625, -0.1767578125, 1.931640625, 4.0400390625, 6.1484375, 8.2568359375, 10.365234375, 12.4736328125, 14.58203125, 16.6904296875, 18.798828125, 20.9072265625, 23.015625, 25.1240234375, 27.232421875, 29.3408203125, 31.44921875, 33.5576171875, 35.666015625, 37.7744140625, 39.8828125, 41.9912109375, 44.099609375, 46.2080078125, 48.31640625, 50.4248046875, 52.533203125, 54.6416015625, 56.75]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 17.0, 981.0, 18.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-880.4454345703125, -848.4639892578125, -816.4825439453125, -784.5010375976562, -752.5195922851562, -720.5381469726562, -688.5567016601562, -656.5751953125, -624.59375, -592.6123046875, -560.630859375, -528.6493530273438, -496.66790771484375, -464.68646240234375, -432.70501708984375, -400.7235412597656, -368.7420959472656, -336.7606506347656, -304.7791748046875, -272.7977294921875, -240.81625366210938, -208.83480834960938, -176.8533477783203, -144.87188720703125, -112.89042663574219, -80.90896606445312, -48.92750930786133, -16.94605255126953, 15.035408020019531, 47.01686096191406, 78.99832153320312, 110.97978210449219, 142.96124267578125, 174.9427032470703, 206.92416381835938, 238.90560913085938, 270.8870849609375, 302.8685302734375, 334.8499755859375, 366.8314514160156, 398.81292724609375, 430.79437255859375, 462.7758483886719, 494.7572937011719, 526.73876953125, 558.72021484375, 590.70166015625, 622.68310546875, 654.66455078125, 686.64599609375, 718.62744140625, 750.6089477539062, 782.5903930664062, 814.5718383789062, 846.5532836914062, 878.5347900390625, 910.5162353515625, 942.4976806640625, 974.4791259765625, 1006.4606323242188, 1038.4420166015625, 1070.423583984375, 1102.405029296875, 1134.386474609375, 1166.367919921875]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 2.0, 8.0, 8.0, 6.0, 11.0, 18.0, 18.0, 22.0, 31.0, 31.0, 25.0, 33.0, 51.0, 42.0, 47.0, 49.0, 48.0, 46.0, 53.0, 42.0, 62.0, 50.0, 38.0, 35.0, 43.0, 39.0, 22.0, 20.0, 21.0, 15.0, 15.0, 11.0, 8.0, 2.0, 8.0, 4.0, 3.0, 8.0, 2.0, 1.0, 0.0, 1.0], "bins": [-84.360107421875, -82.2020034790039, -80.04390716552734, -77.88580322265625, -75.72770690917969, -73.5696029663086, -71.4114990234375, -69.25340270996094, -67.09529876708984, -64.93719482421875, -62.77909851074219, -60.620994567871094, -58.462894439697266, -56.30479431152344, -54.146690368652344, -51.988590240478516, -49.83049011230469, -47.67238998413086, -45.51428985595703, -43.35618591308594, -41.19808578491211, -39.03998565673828, -36.88188171386719, -34.72378158569336, -32.56568145751953, -30.407581329345703, -28.249479293823242, -26.09137725830078, -23.933277130126953, -21.775177001953125, -19.617074966430664, -17.458972930908203, -15.300872802734375, -13.14277172088623, -10.984670639038086, -8.826569557189941, -6.668468475341797, -4.510367393493652, -2.352266311645508, -0.19416522979736328, 1.9639358520507812, 4.122036933898926, 6.28013801574707, 8.438239097595215, 10.59634017944336, 12.754441261291504, 14.912542343139648, 17.07064437866211, 19.228744506835938, 21.386844635009766, 23.544946670532227, 25.703048706054688, 27.861148834228516, 30.019248962402344, 32.17735290527344, 34.335453033447266, 36.493553161621094, 38.65165328979492, 40.80975341796875, 42.967857360839844, 45.12595748901367, 47.2840576171875, 49.442161560058594, 51.60026168823242, 53.75836181640625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 13.0, 8.0, 5.0, 6.0, 16.0, 15.0, 16.0, 21.0, 29.0, 31.0, 22.0, 29.0, 33.0, 40.0, 33.0, 28.0, 48.0, 36.0, 47.0, 42.0, 40.0, 43.0, 38.0, 50.0, 33.0, 49.0, 29.0, 32.0, 29.0, 25.0, 26.0, 13.0, 18.0, 10.0, 11.0, 5.0, 4.0, 6.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-11.078125, -10.772705078125, -10.46728515625, -10.161865234375, -9.8564453125, -9.551025390625, -9.24560546875, -8.940185546875, -8.634765625, -8.329345703125, -8.02392578125, -7.718505859375, -7.4130859375, -7.107666015625, -6.80224609375, -6.496826171875, -6.19140625, -5.885986328125, -5.58056640625, -5.275146484375, -4.9697265625, -4.664306640625, -4.35888671875, -4.053466796875, -3.748046875, -3.442626953125, -3.13720703125, -2.831787109375, -2.5263671875, -2.220947265625, -1.91552734375, -1.610107421875, -1.3046875, -0.999267578125, -0.69384765625, -0.388427734375, -0.0830078125, 0.222412109375, 0.52783203125, 0.833251953125, 1.138671875, 1.444091796875, 1.74951171875, 2.054931640625, 2.3603515625, 2.665771484375, 2.97119140625, 3.276611328125, 3.58203125, 3.887451171875, 4.19287109375, 4.498291015625, 4.8037109375, 5.109130859375, 5.41455078125, 5.719970703125, 6.025390625, 6.330810546875, 6.63623046875, 6.941650390625, 7.2470703125, 7.552490234375, 7.85791015625, 8.163330078125, 8.46875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 10.0, 15.0, 21.0, 36.0, 43.0, 98.0, 127.0, 168.0, 305.0, 401.0, 692.0, 1011.0, 1497.0, 2378.0, 3820.0, 5857.0, 9563.0, 15313.0, 25372.0, 42361.0, 75272.0, 149650.0, 339873.0, 172018.0, 83804.0, 46329.0, 27701.0, 16669.0, 10232.0, 6335.0, 4236.0, 2537.0, 1685.0, 1095.0, 677.0, 473.0, 308.0, 208.0, 136.0, 65.0, 65.0, 34.0, 22.0, 16.0, 13.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.123046875, -2.057891845703125, -1.99273681640625, -1.927581787109375, -1.8624267578125, -1.797271728515625, -1.73211669921875, -1.666961669921875, -1.601806640625, -1.536651611328125, -1.47149658203125, -1.406341552734375, -1.3411865234375, -1.276031494140625, -1.21087646484375, -1.145721435546875, -1.08056640625, -1.015411376953125, -0.95025634765625, -0.885101318359375, -0.8199462890625, -0.754791259765625, -0.68963623046875, -0.624481201171875, -0.559326171875, -0.494171142578125, -0.42901611328125, -0.363861083984375, -0.2987060546875, -0.233551025390625, -0.16839599609375, -0.103240966796875, -0.0380859375, 0.027069091796875, 0.09222412109375, 0.157379150390625, 0.2225341796875, 0.287689208984375, 0.35284423828125, 0.417999267578125, 0.483154296875, 0.548309326171875, 0.61346435546875, 0.678619384765625, 0.7437744140625, 0.808929443359375, 0.87408447265625, 0.939239501953125, 1.00439453125, 1.069549560546875, 1.13470458984375, 1.199859619140625, 1.2650146484375, 1.330169677734375, 1.39532470703125, 1.460479736328125, 1.525634765625, 1.590789794921875, 1.65594482421875, 1.721099853515625, 1.7862548828125, 1.851409912109375, 1.91656494140625, 1.981719970703125, 2.046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 5.0, 12.0, 9.0, 16.0, 16.0, 9.0, 32.0, 21.0, 25.0, 37.0, 31.0, 29.0, 34.0, 42.0, 32.0, 29.0, 47.0, 1067.0, 47.0, 52.0, 40.0, 36.0, 30.0, 34.0, 33.0, 35.0, 29.0, 30.0, 20.0, 23.0, 22.0, 23.0, 15.0, 14.0, 11.0, 9.0, 6.0, 7.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.453125, -6.25665283203125, -6.0601806640625, -5.86370849609375, -5.667236328125, -5.47076416015625, -5.2742919921875, -5.07781982421875, -4.88134765625, -4.68487548828125, -4.4884033203125, -4.29193115234375, -4.095458984375, -3.89898681640625, -3.7025146484375, -3.50604248046875, -3.3095703125, -3.11309814453125, -2.9166259765625, -2.72015380859375, -2.523681640625, -2.32720947265625, -2.1307373046875, -1.93426513671875, -1.73779296875, -1.54132080078125, -1.3448486328125, -1.14837646484375, -0.951904296875, -0.75543212890625, -0.5589599609375, -0.36248779296875, -0.166015625, 0.03045654296875, 0.2269287109375, 0.42340087890625, 0.619873046875, 0.81634521484375, 1.0128173828125, 1.20928955078125, 1.40576171875, 1.60223388671875, 1.7987060546875, 1.99517822265625, 2.191650390625, 2.38812255859375, 2.5845947265625, 2.78106689453125, 2.9775390625, 3.17401123046875, 3.3704833984375, 3.56695556640625, 3.763427734375, 3.95989990234375, 4.1563720703125, 4.35284423828125, 4.54931640625, 4.74578857421875, 4.9422607421875, 5.13873291015625, 5.335205078125, 5.53167724609375, 5.7281494140625, 5.92462158203125, 6.12109375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 9.0, 17.0, 27.0, 42.0, 68.0, 97.0, 162.0, 260.0, 364.0, 627.0, 1003.0, 1711.0, 2729.0, 4520.0, 7289.0, 12031.0, 19923.0, 33013.0, 55605.0, 100376.0, 254222.0, 1347820.0, 107807.0, 59600.0, 34757.0, 20546.0, 12533.0, 7735.0, 4754.0, 2875.0, 1707.0, 1089.0, 665.0, 410.0, 272.0, 158.0, 113.0, 69.0, 41.0, 35.0, 20.0, 13.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.26953125, -2.20086669921875, -2.1322021484375, -2.06353759765625, -1.994873046875, -1.92620849609375, -1.8575439453125, -1.78887939453125, -1.72021484375, -1.65155029296875, -1.5828857421875, -1.51422119140625, -1.445556640625, -1.37689208984375, -1.3082275390625, -1.23956298828125, -1.1708984375, -1.10223388671875, -1.0335693359375, -0.96490478515625, -0.896240234375, -0.82757568359375, -0.7589111328125, -0.69024658203125, -0.62158203125, -0.55291748046875, -0.4842529296875, -0.41558837890625, -0.346923828125, -0.27825927734375, -0.2095947265625, -0.14093017578125, -0.072265625, -0.00360107421875, 0.0650634765625, 0.13372802734375, 0.202392578125, 0.27105712890625, 0.3397216796875, 0.40838623046875, 0.47705078125, 0.54571533203125, 0.6143798828125, 0.68304443359375, 0.751708984375, 0.82037353515625, 0.8890380859375, 0.95770263671875, 1.0263671875, 1.09503173828125, 1.1636962890625, 1.23236083984375, 1.301025390625, 1.36968994140625, 1.4383544921875, 1.50701904296875, 1.57568359375, 1.64434814453125, 1.7130126953125, 1.78167724609375, 1.850341796875, 1.91900634765625, 1.9876708984375, 2.05633544921875, 2.125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 6.0, 4.0, 10.0, 8.0, 11.0, 13.0, 20.0, 24.0, 21.0, 44.0, 67.0, 73.0, 74.0, 95.0, 100.0, 76.0, 77.0, 59.0, 47.0, 27.0, 27.0, 22.0, 12.0, 11.0, 9.0, 7.0, 10.0, 6.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0010318756103515625, -0.0009996891021728516, -0.0009675025939941406, -0.0009353160858154297, -0.0009031295776367188, -0.0008709430694580078, -0.0008387565612792969, -0.0008065700531005859, -0.000774383544921875, -0.0007421970367431641, -0.0007100105285644531, -0.0006778240203857422, -0.0006456375122070312, -0.0006134510040283203, -0.0005812644958496094, -0.0005490779876708984, -0.0005168914794921875, -0.00048470497131347656, -0.0004525184631347656, -0.0004203319549560547, -0.00038814544677734375, -0.0003559589385986328, -0.0003237724304199219, -0.00029158592224121094, -0.0002593994140625, -0.00022721290588378906, -0.00019502639770507812, -0.0001628398895263672, -0.00013065338134765625, -9.846687316894531e-05, -6.628036499023438e-05, -3.409385681152344e-05, -1.9073486328125e-06, 3.0279159545898438e-05, 6.246566772460938e-05, 9.465217590332031e-05, 0.00012683868408203125, 0.0001590251922607422, 0.00019121170043945312, 0.00022339820861816406, 0.000255584716796875, 0.00028777122497558594, 0.0003199577331542969, 0.0003521442413330078, 0.00038433074951171875, 0.0004165172576904297, 0.0004487037658691406, 0.00048089027404785156, 0.0005130767822265625, 0.0005452632904052734, 0.0005774497985839844, 0.0006096363067626953, 0.0006418228149414062, 0.0006740093231201172, 0.0007061958312988281, 0.0007383823394775391, 0.00077056884765625, 0.0008027553558349609, 0.0008349418640136719, 0.0008671283721923828, 0.0008993148803710938, 0.0009315013885498047, 0.0009636878967285156, 0.0009958744049072266, 0.0010280609130859375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 0.0, 3.0, 4.0, 3.0, 9.0, 10.0, 13.0, 8.0, 18.0, 12.0, 21.0, 33.0, 44.0, 54.0, 93.0, 145.0, 234.0, 595.0, 11942.0, 1029262.0, 4823.0, 511.0, 235.0, 142.0, 85.0, 55.0, 41.0, 28.0, 22.0, 17.0, 19.0, 10.0, 7.0, 7.0, 9.0, 7.0, 7.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.020263671875, -0.019575119018554688, -0.018886566162109375, -0.018198013305664062, -0.01750946044921875, -0.016820907592773438, -0.016132354736328125, -0.015443801879882812, -0.0147552490234375, -0.014066696166992188, -0.013378143310546875, -0.012689590454101562, -0.01200103759765625, -0.011312484741210938, -0.010623931884765625, -0.009935379028320312, -0.009246826171875, -0.008558273315429688, -0.007869720458984375, -0.0071811676025390625, -0.00649261474609375, -0.0058040618896484375, -0.005115509033203125, -0.0044269561767578125, -0.0037384033203125, -0.0030498504638671875, -0.002361297607421875, -0.0016727447509765625, -0.00098419189453125, -0.0002956390380859375, 0.000392913818359375, 0.0010814666748046875, 0.00177001953125, 0.0024585723876953125, 0.003147125244140625, 0.0038356781005859375, 0.00452423095703125, 0.0052127838134765625, 0.005901336669921875, 0.0065898895263671875, 0.0072784423828125, 0.007966995239257812, 0.008655548095703125, 0.009344100952148438, 0.01003265380859375, 0.010721206665039062, 0.011409759521484375, 0.012098312377929688, 0.012786865234375, 0.013475418090820312, 0.014163970947265625, 0.014852523803710938, 0.01554107666015625, 0.016229629516601562, 0.016918182373046875, 0.017606735229492188, 0.0182952880859375, 0.018983840942382812, 0.019672393798828125, 0.020360946655273438, 0.02104949951171875, 0.021738052368164062, 0.022426605224609375, 0.023115158081054688, 0.0238037109375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 170.0, 683.0, 145.0, 10.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004098684526979923, -0.0039830864407122135, -0.00386748812161386, -0.0037518900353461504, -0.0036362919490784407, -0.0035206936299800873, -0.0034050955437123775, -0.003289497457444668, -0.003173899371176958, -0.0030583012849092484, -0.002942702965810895, -0.0028271048795431852, -0.0027115067932754755, -0.002595908474177122, -0.0024803103879094124, -0.0023647123016417027, -0.0022491139825433493, -0.0021335158962756395, -0.002017917577177286, -0.0019023194909095764, -0.0017867214046418667, -0.0016711232019588351, -0.0015555249992758036, -0.0014399269130080938, -0.0013243287103250623, -0.0012087305076420307, -0.001093132421374321, -0.0009775342186912894, -0.0008619360742159188, -0.0007463379297405481, -0.0006307397270575166, -0.0005151415825821459, -0.0003995434381067753, -0.00028394529363140464, -0.00016834712005220354, -5.2748946473002434e-05, 6.284919800236821e-05, 0.00017844734247773886, 0.0002940455451607704, 0.00040964368963614106, 0.0005252418341115117, 0.0006408399785868824, 0.000756438123062253, 0.0008720363257452846, 0.0009876345284283161, 0.0011032326146960258, 0.0012188308173790574, 0.001334429020062089, 0.0014500271063297987, 0.0015656253090128303, 0.00168122339528054, 0.0017968215979635715, 0.0019124196842312813, 0.002028017770498991, 0.0021436160895973444, 0.002259214175865054, 0.0023748124949634075, 0.0024904105812311172, 0.0026060089003294706, 0.0027216069865971804, 0.00283720507286489, 0.0029528033919632435, 0.003068401478230953, 0.003183999564498663, 0.0032995976507663727]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 3.0, 0.0, 4.0, 4.0, 7.0, 7.0, 2.0, 13.0, 17.0, 9.0, 16.0, 16.0, 26.0, 21.0, 34.0, 31.0, 35.0, 31.0, 39.0, 31.0, 47.0, 46.0, 48.0, 44.0, 40.0, 27.0, 35.0, 34.0, 36.0, 39.0, 35.0, 31.0, 35.0, 29.0, 20.0, 21.0, 23.0, 16.0, 13.0, 15.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00040471553802490234, -0.00038951169699430466, -0.00037430785596370697, -0.0003591040149331093, -0.0003439001739025116, -0.0003286963328719139, -0.0003134924918413162, -0.00029828865081071854, -0.00028308480978012085, -0.00026788096874952316, -0.0002526771277189255, -0.0002374732866883278, -0.0002222694456577301, -0.00020706560462713242, -0.00019186176359653473, -0.00017665792256593704, -0.00016145408153533936, -0.00014625024050474167, -0.00013104639947414398, -0.0001158425584435463, -0.00010063871741294861, -8.543487638235092e-05, -7.023103535175323e-05, -5.502719432115555e-05, -3.982335329055786e-05, -2.4619512259960175e-05, -9.415671229362488e-06, 5.788169801235199e-06, 2.0992010831832886e-05, 3.619585186243057e-05, 5.139969289302826e-05, 6.660353392362595e-05, 8.180737495422363e-05, 9.701121598482132e-05, 0.000112215057015419, 0.0001274188980460167, 0.00014262273907661438, 0.00015782658010721207, 0.00017303042113780975, 0.00018823426216840744, 0.00020343810319900513, 0.00021864194422960281, 0.0002338457852602005, 0.0002490496262907982, 0.0002642534673213959, 0.00027945730835199356, 0.00029466114938259125, 0.00030986499041318893, 0.0003250688314437866, 0.0003402726724743843, 0.000355476513504982, 0.0003706803545355797, 0.00038588419556617737, 0.00040108803659677505, 0.00041629187762737274, 0.00043149571865797043, 0.0004466995596885681, 0.0004619034007191658, 0.0004771072417497635, 0.0004923110827803612, 0.0005075149238109589, 0.0005227187648415565, 0.0005379226058721542, 0.0005531264469027519, 0.0005683302879333496]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 13.0, 8.0, 5.0, 6.0, 16.0, 15.0, 16.0, 21.0, 29.0, 31.0, 22.0, 29.0, 33.0, 40.0, 33.0, 28.0, 48.0, 36.0, 47.0, 42.0, 40.0, 43.0, 38.0, 50.0, 33.0, 49.0, 29.0, 32.0, 29.0, 25.0, 26.0, 13.0, 18.0, 10.0, 11.0, 5.0, 4.0, 6.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-11.078125, -10.772705078125, -10.46728515625, -10.161865234375, -9.8564453125, -9.551025390625, -9.24560546875, -8.940185546875, -8.634765625, -8.329345703125, -8.02392578125, -7.718505859375, -7.4130859375, -7.107666015625, -6.80224609375, -6.496826171875, -6.19140625, -5.885986328125, -5.58056640625, -5.275146484375, -4.9697265625, -4.664306640625, -4.35888671875, -4.053466796875, -3.748046875, -3.442626953125, -3.13720703125, -2.831787109375, -2.5263671875, -2.220947265625, -1.91552734375, -1.610107421875, -1.3046875, -0.999267578125, -0.69384765625, -0.388427734375, -0.0830078125, 0.222412109375, 0.52783203125, 0.833251953125, 1.138671875, 1.444091796875, 1.74951171875, 2.054931640625, 2.3603515625, 2.665771484375, 2.97119140625, 3.276611328125, 3.58203125, 3.887451171875, 4.19287109375, 4.498291015625, 4.8037109375, 5.109130859375, 5.41455078125, 5.719970703125, 6.025390625, 6.330810546875, 6.63623046875, 6.941650390625, 7.2470703125, 7.552490234375, 7.85791015625, 8.163330078125, 8.46875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 14.0, 17.0, 23.0, 22.0, 37.0, 52.0, 85.0, 105.0, 176.0, 280.0, 488.0, 782.0, 1594.0, 2937.0, 6448.0, 13636.0, 31802.0, 79646.0, 237871.0, 409657.0, 161299.0, 56759.0, 23757.0, 10537.0, 5066.0, 2492.0, 1258.0, 703.0, 361.0, 207.0, 139.0, 88.0, 57.0, 42.0, 33.0, 20.0, 12.0, 10.0, 7.0, 12.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0], "bins": [-9.8359375, -9.57244873046875, -9.3089599609375, -9.04547119140625, -8.781982421875, -8.51849365234375, -8.2550048828125, -7.99151611328125, -7.72802734375, -7.46453857421875, -7.2010498046875, -6.93756103515625, -6.674072265625, -6.41058349609375, -6.1470947265625, -5.88360595703125, -5.6201171875, -5.35662841796875, -5.0931396484375, -4.82965087890625, -4.566162109375, -4.30267333984375, -4.0391845703125, -3.77569580078125, -3.51220703125, -3.24871826171875, -2.9852294921875, -2.72174072265625, -2.458251953125, -2.19476318359375, -1.9312744140625, -1.66778564453125, -1.404296875, -1.14080810546875, -0.8773193359375, -0.61383056640625, -0.350341796875, -0.08685302734375, 0.1766357421875, 0.44012451171875, 0.70361328125, 0.96710205078125, 1.2305908203125, 1.49407958984375, 1.757568359375, 2.02105712890625, 2.2845458984375, 2.54803466796875, 2.8115234375, 3.07501220703125, 3.3385009765625, 3.60198974609375, 3.865478515625, 4.12896728515625, 4.3924560546875, 4.65594482421875, 4.91943359375, 5.18292236328125, 5.4464111328125, 5.70989990234375, 5.973388671875, 6.23687744140625, 6.5003662109375, 6.76385498046875, 7.02734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 6.0, 1.0, 4.0, 6.0, 11.0, 10.0, 15.0, 12.0, 18.0, 29.0, 25.0, 40.0, 27.0, 46.0, 34.0, 48.0, 49.0, 62.0, 93.0, 285.0, 1562.0, 173.0, 84.0, 56.0, 53.0, 38.0, 38.0, 29.0, 28.0, 31.0, 23.0, 22.0, 23.0, 11.0, 10.0, 14.0, 7.0, 5.0, 8.0, 7.0, 3.0, 0.0, 3.0, 0.0, 6.0, 0.0, 0.0, 2.0], "bins": [-32.3125, -31.4208984375, -30.529296875, -29.6376953125, -28.74609375, -27.8544921875, -26.962890625, -26.0712890625, -25.1796875, -24.2880859375, -23.396484375, -22.5048828125, -21.61328125, -20.7216796875, -19.830078125, -18.9384765625, -18.046875, -17.1552734375, -16.263671875, -15.3720703125, -14.48046875, -13.5888671875, -12.697265625, -11.8056640625, -10.9140625, -10.0224609375, -9.130859375, -8.2392578125, -7.34765625, -6.4560546875, -5.564453125, -4.6728515625, -3.78125, -2.8896484375, -1.998046875, -1.1064453125, -0.21484375, 0.6767578125, 1.568359375, 2.4599609375, 3.3515625, 4.2431640625, 5.134765625, 6.0263671875, 6.91796875, 7.8095703125, 8.701171875, 9.5927734375, 10.484375, 11.3759765625, 12.267578125, 13.1591796875, 14.05078125, 14.9423828125, 15.833984375, 16.7255859375, 17.6171875, 18.5087890625, 19.400390625, 20.2919921875, 21.18359375, 22.0751953125, 22.966796875, 23.8583984375, 24.75]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 1.0, 5.0, 4.0, 8.0, 8.0, 12.0, 16.0, 16.0, 15.0, 25.0, 30.0, 40.0, 53.0, 68.0, 90.0, 114.0, 161.0, 225.0, 368.0, 631.0, 2419.0, 55151.0, 3017170.0, 64690.0, 2526.0, 636.0, 364.0, 229.0, 147.0, 114.0, 74.0, 69.0, 55.0, 46.0, 28.0, 29.0, 17.0, 10.0, 10.0, 10.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.21875, -40.73828125, -39.2578125, -37.77734375, -36.296875, -34.81640625, -33.3359375, -31.85546875, -30.375, -28.89453125, -27.4140625, -25.93359375, -24.453125, -22.97265625, -21.4921875, -20.01171875, -18.53125, -17.05078125, -15.5703125, -14.08984375, -12.609375, -11.12890625, -9.6484375, -8.16796875, -6.6875, -5.20703125, -3.7265625, -2.24609375, -0.765625, 0.71484375, 2.1953125, 3.67578125, 5.15625, 6.63671875, 8.1171875, 9.59765625, 11.078125, 12.55859375, 14.0390625, 15.51953125, 17.0, 18.48046875, 19.9609375, 21.44140625, 22.921875, 24.40234375, 25.8828125, 27.36328125, 28.84375, 30.32421875, 31.8046875, 33.28515625, 34.765625, 36.24609375, 37.7265625, 39.20703125, 40.6875, 42.16796875, 43.6484375, 45.12890625, 46.609375, 48.08984375, 49.5703125, 51.05078125, 52.53125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 281.0, 736.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-564.71337890625, -555.0004272460938, -545.2874145507812, -535.574462890625, -525.8614501953125, -516.1484985351562, -506.4355163574219, -496.7225341796875, -487.00958251953125, -477.2966003417969, -467.5836181640625, -457.87066650390625, -448.1576843261719, -438.4447021484375, -428.7317199707031, -419.01873779296875, -409.3057861328125, -399.5928039550781, -389.87982177734375, -380.1668701171875, -370.4538879394531, -360.74090576171875, -351.0279235839844, -341.31494140625, -331.6019592285156, -321.88897705078125, -312.1759948730469, -302.4630432128906, -292.75006103515625, -283.0370788574219, -273.3240966796875, -263.61114501953125, -253.89816284179688, -244.1851806640625, -234.4722137451172, -224.7592315673828, -215.0462646484375, -205.33328247070312, -195.62030029296875, -185.90733337402344, -176.19435119628906, -166.4813690185547, -156.76840209960938, -147.055419921875, -137.3424530029297, -127.62947082519531, -117.91649627685547, -108.20352172851562, -98.49054718017578, -88.77757263183594, -79.0645980834961, -69.35162353515625, -59.63864517211914, -49.9256706237793, -40.21269226074219, -30.499717712402344, -20.7867431640625, -11.07376766204834, -1.3607921600341797, 8.352184295654297, 18.06515884399414, 27.778133392333984, 37.491111755371094, 47.20408630371094, 56.91706085205078]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 7.0, 7.0, 9.0, 20.0, 12.0, 19.0, 17.0, 16.0, 29.0, 23.0, 23.0, 20.0, 34.0, 27.0, 40.0, 45.0, 55.0, 39.0, 51.0, 45.0, 45.0, 37.0, 31.0, 38.0, 48.0, 34.0, 20.0, 37.0, 16.0, 22.0, 23.0, 12.0, 17.0, 14.0, 12.0, 8.0, 6.0, 7.0, 7.0, 6.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-67.30718994140625, -65.1917953491211, -63.07639694213867, -60.96099853515625, -58.845603942871094, -56.73020553588867, -54.61480712890625, -52.499412536621094, -50.38401794433594, -48.268619537353516, -46.15322494506836, -44.03782653808594, -41.92243194580078, -39.80703353881836, -37.69163513183594, -35.57624053955078, -33.46084213256836, -31.34544563293457, -29.23004913330078, -27.11465072631836, -24.999256134033203, -22.88385772705078, -20.768461227416992, -18.653064727783203, -16.537668228149414, -14.422271728515625, -12.306875228881836, -10.19147777557373, -8.076081275939941, -5.960684776306152, -3.845287322998047, -1.7298908233642578, 0.38550567626953125, 2.5009024143218994, 4.616299152374268, 6.731696128845215, 8.847092628479004, 10.962489128112793, 13.077886581420898, 15.193283081054688, 17.308679580688477, 19.424076080322266, 21.539472579956055, 23.654869079589844, 25.770267486572266, 27.885662078857422, 30.001060485839844, 32.116455078125, 34.23185348510742, 36.347251892089844, 38.462646484375, 40.57804489135742, 42.69343948364258, 44.808837890625, 46.924232482910156, 49.03963088989258, 51.155029296875, 53.27042770385742, 55.38582229614258, 57.501220703125, 59.616615295410156, 61.73201370239258, 63.847412109375, 65.96280670166016, 68.07820129394531]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 7.0, 4.0, 9.0, 14.0, 13.0, 16.0, 22.0, 33.0, 22.0, 26.0, 33.0, 30.0, 28.0, 35.0, 31.0, 37.0, 52.0, 51.0, 36.0, 54.0, 46.0, 39.0, 45.0, 34.0, 38.0, 39.0, 26.0, 38.0, 26.0, 13.0, 16.0, 9.0, 9.0, 17.0, 8.0, 7.0, 6.0, 9.0, 3.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.8515625, -10.5380859375, -10.224609375, -9.9111328125, -9.59765625, -9.2841796875, -8.970703125, -8.6572265625, -8.34375, -8.0302734375, -7.716796875, -7.4033203125, -7.08984375, -6.7763671875, -6.462890625, -6.1494140625, -5.8359375, -5.5224609375, -5.208984375, -4.8955078125, -4.58203125, -4.2685546875, -3.955078125, -3.6416015625, -3.328125, -3.0146484375, -2.701171875, -2.3876953125, -2.07421875, -1.7607421875, -1.447265625, -1.1337890625, -0.8203125, -0.5068359375, -0.193359375, 0.1201171875, 0.43359375, 0.7470703125, 1.060546875, 1.3740234375, 1.6875, 2.0009765625, 2.314453125, 2.6279296875, 2.94140625, 3.2548828125, 3.568359375, 3.8818359375, 4.1953125, 4.5087890625, 4.822265625, 5.1357421875, 5.44921875, 5.7626953125, 6.076171875, 6.3896484375, 6.703125, 7.0166015625, 7.330078125, 7.6435546875, 7.95703125, 8.2705078125, 8.583984375, 8.8974609375, 9.2109375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 3.0, 4.0, 14.0, 11.0, 12.0, 12.0, 13.0, 19.0, 30.0, 31.0, 38.0, 45.0, 50.0, 71.0, 126.0, 296.0, 971.0, 3579.0, 20060.0, 411543.0, 3487713.0, 249290.0, 15418.0, 3187.0, 942.0, 310.0, 133.0, 83.0, 56.0, 29.0, 30.0, 29.0, 28.0, 19.0, 23.0, 8.0, 12.0, 11.0, 7.0, 5.0, 7.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-35.96875, -34.92431640625, -33.8798828125, -32.83544921875, -31.791015625, -30.74658203125, -29.7021484375, -28.65771484375, -27.61328125, -26.56884765625, -25.5244140625, -24.47998046875, -23.435546875, -22.39111328125, -21.3466796875, -20.30224609375, -19.2578125, -18.21337890625, -17.1689453125, -16.12451171875, -15.080078125, -14.03564453125, -12.9912109375, -11.94677734375, -10.90234375, -9.85791015625, -8.8134765625, -7.76904296875, -6.724609375, -5.68017578125, -4.6357421875, -3.59130859375, -2.546875, -1.50244140625, -0.4580078125, 0.58642578125, 1.630859375, 2.67529296875, 3.7197265625, 4.76416015625, 5.80859375, 6.85302734375, 7.8974609375, 8.94189453125, 9.986328125, 11.03076171875, 12.0751953125, 13.11962890625, 14.1640625, 15.20849609375, 16.2529296875, 17.29736328125, 18.341796875, 19.38623046875, 20.4306640625, 21.47509765625, 22.51953125, 23.56396484375, 24.6083984375, 25.65283203125, 26.697265625, 27.74169921875, 28.7861328125, 29.83056640625, 30.875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 9.0, 7.0, 7.0, 20.0, 23.0, 42.0, 55.0, 53.0, 79.0, 120.0, 164.0, 221.0, 299.0, 474.0, 519.0, 524.0, 415.0, 279.0, 208.0, 139.0, 115.0, 100.0, 51.0, 53.0, 30.0, 17.0, 9.0, 13.0, 8.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -17.975830078125, -17.37353515625, -16.771240234375, -16.1689453125, -15.566650390625, -14.96435546875, -14.362060546875, -13.759765625, -13.157470703125, -12.55517578125, -11.952880859375, -11.3505859375, -10.748291015625, -10.14599609375, -9.543701171875, -8.94140625, -8.339111328125, -7.73681640625, -7.134521484375, -6.5322265625, -5.929931640625, -5.32763671875, -4.725341796875, -4.123046875, -3.520751953125, -2.91845703125, -2.316162109375, -1.7138671875, -1.111572265625, -0.50927734375, 0.093017578125, 0.6953125, 1.297607421875, 1.89990234375, 2.502197265625, 3.1044921875, 3.706787109375, 4.30908203125, 4.911376953125, 5.513671875, 6.115966796875, 6.71826171875, 7.320556640625, 7.9228515625, 8.525146484375, 9.12744140625, 9.729736328125, 10.33203125, 10.934326171875, 11.53662109375, 12.138916015625, 12.7412109375, 13.343505859375, 13.94580078125, 14.548095703125, 15.150390625, 15.752685546875, 16.35498046875, 16.957275390625, 17.5595703125, 18.161865234375, 18.76416015625, 19.366455078125, 19.96875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 8.0, 14.0, 16.0, 27.0, 33.0, 56.0, 47.0, 81.0, 97.0, 144.0, 169.0, 221.0, 363.0, 821.0, 5185.0, 370223.0, 3794390.0, 19452.0, 1389.0, 443.0, 250.0, 202.0, 150.0, 116.0, 72.0, 74.0, 51.0, 40.0, 36.0, 23.0, 19.0, 10.0, 9.0, 10.0, 8.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.1875, -79.466796875, -76.74609375, -74.025390625, -71.3046875, -68.583984375, -65.86328125, -63.142578125, -60.421875, -57.701171875, -54.98046875, -52.259765625, -49.5390625, -46.818359375, -44.09765625, -41.376953125, -38.65625, -35.935546875, -33.21484375, -30.494140625, -27.7734375, -25.052734375, -22.33203125, -19.611328125, -16.890625, -14.169921875, -11.44921875, -8.728515625, -6.0078125, -3.287109375, -0.56640625, 2.154296875, 4.875, 7.595703125, 10.31640625, 13.037109375, 15.7578125, 18.478515625, 21.19921875, 23.919921875, 26.640625, 29.361328125, 32.08203125, 34.802734375, 37.5234375, 40.244140625, 42.96484375, 45.685546875, 48.40625, 51.126953125, 53.84765625, 56.568359375, 59.2890625, 62.009765625, 64.73046875, 67.451171875, 70.171875, 72.892578125, 75.61328125, 78.333984375, 81.0546875, 83.775390625, 86.49609375, 89.216796875, 91.9375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 133.0, 698.0, 182.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-600.0150146484375, -585.2247314453125, -570.4343872070312, -555.64404296875, -540.853759765625, -526.0634765625, -511.27313232421875, -496.4828186035156, -481.6925048828125, -466.9021911621094, -452.11187744140625, -437.3215637207031, -422.53125, -407.7409362792969, -392.95062255859375, -378.1603088378906, -363.3699951171875, -348.5796813964844, -333.78936767578125, -318.9990539550781, -304.208740234375, -289.4184265136719, -274.62811279296875, -259.8377990722656, -245.0474853515625, -230.25717163085938, -215.46685791015625, -200.67654418945312, -185.88623046875, -171.09591674804688, -156.30560302734375, -141.51528930664062, -126.7249755859375, -111.93466186523438, -97.14434814453125, -82.35403442382812, -67.563720703125, -52.773406982421875, -37.98309326171875, -23.192779541015625, -8.4024658203125, 6.387847900390625, 21.17816162109375, 35.968475341796875, 50.7587890625, 65.54910278320312, 80.33941650390625, 95.12973022460938, 109.9200439453125, 124.71035766601562, 139.50067138671875, 154.29098510742188, 169.081298828125, 183.87161254882812, 198.66192626953125, 213.45223999023438, 228.2425537109375, 243.03286743164062, 257.82318115234375, 272.6134948730469, 287.40380859375, 302.1941223144531, 316.98443603515625, 331.7747497558594, 346.5650634765625]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 6.0, 7.0, 8.0, 15.0, 12.0, 15.0, 16.0, 20.0, 31.0, 27.0, 24.0, 20.0, 36.0, 37.0, 32.0, 41.0, 54.0, 39.0, 45.0, 43.0, 42.0, 46.0, 37.0, 25.0, 39.0, 33.0, 36.0, 25.0, 28.0, 23.0, 22.0, 15.0, 17.0, 12.0, 10.0, 12.0, 3.0, 5.0, 5.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.37525177001953, -49.582191467285156, -47.78913116455078, -45.99606704711914, -44.203006744384766, -42.40994644165039, -40.616886138916016, -38.823822021484375, -37.03076171875, -35.237701416015625, -33.44464111328125, -31.651578903198242, -29.858516693115234, -28.06545639038086, -26.272396087646484, -24.479333877563477, -22.6862735748291, -20.893213272094727, -19.10015106201172, -17.307090759277344, -15.514028549194336, -13.720968246459961, -11.92790699005127, -10.134845733642578, -8.341784477233887, -6.548723220825195, -4.755661964416504, -2.9626011848449707, -1.1695399284362793, 0.6235208511352539, 2.4165821075439453, 4.209643363952637, 6.002704620361328, 7.7957658767700195, 9.588827133178711, 11.381887435913086, 13.174949645996094, 14.968009948730469, 16.761070251464844, 18.55413246154785, 20.34719467163086, 22.140254974365234, 23.933317184448242, 25.726377487182617, 27.519439697265625, 29.3125, 31.105560302734375, 32.89862060546875, 34.691680908203125, 36.4847412109375, 38.277801513671875, 40.070865631103516, 41.86392593383789, 43.656986236572266, 45.45004653930664, 47.24311065673828, 49.036170959472656, 50.82923126220703, 52.622291564941406, 54.41535568237305, 56.20841598510742, 58.0014762878418, 59.79453659057617, 61.58760070800781, 63.38066101074219]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 11.0, 7.0, 12.0, 17.0, 16.0, 20.0, 15.0, 31.0, 25.0, 28.0, 28.0, 33.0, 34.0, 48.0, 38.0, 37.0, 47.0, 51.0, 41.0, 40.0, 36.0, 47.0, 47.0, 36.0, 34.0, 32.0, 29.0, 25.0, 17.0, 20.0, 17.0, 9.0, 18.0, 9.0, 11.0, 8.0, 8.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-11.1796875, -10.8505859375, -10.521484375, -10.1923828125, -9.86328125, -9.5341796875, -9.205078125, -8.8759765625, -8.546875, -8.2177734375, -7.888671875, -7.5595703125, -7.23046875, -6.9013671875, -6.572265625, -6.2431640625, -5.9140625, -5.5849609375, -5.255859375, -4.9267578125, -4.59765625, -4.2685546875, -3.939453125, -3.6103515625, -3.28125, -2.9521484375, -2.623046875, -2.2939453125, -1.96484375, -1.6357421875, -1.306640625, -0.9775390625, -0.6484375, -0.3193359375, 0.009765625, 0.3388671875, 0.66796875, 0.9970703125, 1.326171875, 1.6552734375, 1.984375, 2.3134765625, 2.642578125, 2.9716796875, 3.30078125, 3.6298828125, 3.958984375, 4.2880859375, 4.6171875, 4.9462890625, 5.275390625, 5.6044921875, 5.93359375, 6.2626953125, 6.591796875, 6.9208984375, 7.25, 7.5791015625, 7.908203125, 8.2373046875, 8.56640625, 8.8955078125, 9.224609375, 9.5537109375, 9.8828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 9.0, 11.0, 10.0, 15.0, 31.0, 35.0, 42.0, 75.0, 97.0, 148.0, 227.0, 283.0, 452.0, 662.0, 939.0, 1415.0, 1964.0, 2983.0, 4498.0, 6547.0, 9925.0, 15053.0, 22466.0, 36003.0, 58980.0, 103168.0, 242869.0, 264925.0, 106871.0, 61187.0, 36988.0, 23455.0, 15155.0, 9952.0, 6705.0, 4657.0, 3116.0, 2066.0, 1483.0, 968.0, 649.0, 467.0, 311.0, 225.0, 153.0, 96.0, 70.0, 41.0, 34.0, 28.0, 20.0, 15.0, 10.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8701171875, -1.8078460693359375, -1.745574951171875, -1.6833038330078125, -1.62103271484375, -1.5587615966796875, -1.496490478515625, -1.4342193603515625, -1.3719482421875, -1.3096771240234375, -1.247406005859375, -1.1851348876953125, -1.12286376953125, -1.0605926513671875, -0.998321533203125, -0.9360504150390625, -0.873779296875, -0.8115081787109375, -0.749237060546875, -0.6869659423828125, -0.62469482421875, -0.5624237060546875, -0.500152587890625, -0.4378814697265625, -0.3756103515625, -0.3133392333984375, -0.251068115234375, -0.1887969970703125, -0.12652587890625, -0.0642547607421875, -0.001983642578125, 0.0602874755859375, 0.12255859375, 0.1848297119140625, 0.247100830078125, 0.3093719482421875, 0.37164306640625, 0.4339141845703125, 0.496185302734375, 0.5584564208984375, 0.6207275390625, 0.6829986572265625, 0.745269775390625, 0.8075408935546875, 0.86981201171875, 0.9320831298828125, 0.994354248046875, 1.0566253662109375, 1.118896484375, 1.1811676025390625, 1.243438720703125, 1.3057098388671875, 1.36798095703125, 1.4302520751953125, 1.492523193359375, 1.5547943115234375, 1.6170654296875, 1.6793365478515625, 1.741607666015625, 1.8038787841796875, 1.86614990234375, 1.9284210205078125, 1.990692138671875, 2.0529632568359375, 2.115234375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 10.0, 4.0, 4.0, 9.0, 6.0, 10.0, 20.0, 20.0, 18.0, 10.0, 29.0, 36.0, 31.0, 29.0, 35.0, 36.0, 43.0, 48.0, 42.0, 33.0, 1066.0, 47.0, 32.0, 43.0, 35.0, 24.0, 38.0, 30.0, 29.0, 32.0, 27.0, 27.0, 19.0, 20.0, 6.0, 14.0, 13.0, 12.0, 4.0, 13.0, 6.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.4609375, -6.25592041015625, -6.0509033203125, -5.84588623046875, -5.640869140625, -5.43585205078125, -5.2308349609375, -5.02581787109375, -4.82080078125, -4.61578369140625, -4.4107666015625, -4.20574951171875, -4.000732421875, -3.79571533203125, -3.5906982421875, -3.38568115234375, -3.1806640625, -2.97564697265625, -2.7706298828125, -2.56561279296875, -2.360595703125, -2.15557861328125, -1.9505615234375, -1.74554443359375, -1.54052734375, -1.33551025390625, -1.1304931640625, -0.92547607421875, -0.720458984375, -0.51544189453125, -0.3104248046875, -0.10540771484375, 0.099609375, 0.30462646484375, 0.5096435546875, 0.71466064453125, 0.919677734375, 1.12469482421875, 1.3297119140625, 1.53472900390625, 1.73974609375, 1.94476318359375, 2.1497802734375, 2.35479736328125, 2.559814453125, 2.76483154296875, 2.9698486328125, 3.17486572265625, 3.3798828125, 3.58489990234375, 3.7899169921875, 3.99493408203125, 4.199951171875, 4.40496826171875, 4.6099853515625, 4.81500244140625, 5.02001953125, 5.22503662109375, 5.4300537109375, 5.63507080078125, 5.840087890625, 6.04510498046875, 6.2501220703125, 6.45513916015625, 6.66015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 12.0, 26.0, 26.0, 36.0, 79.0, 98.0, 174.0, 297.0, 419.0, 634.0, 1062.0, 1615.0, 2606.0, 3961.0, 6098.0, 10089.0, 16131.0, 26733.0, 44371.0, 78720.0, 158578.0, 1412048.0, 148537.0, 75077.0, 42707.0, 25381.0, 15466.0, 9494.0, 6138.0, 3723.0, 2417.0, 1527.0, 1071.0, 661.0, 404.0, 240.0, 163.0, 117.0, 73.0, 44.0, 27.0, 21.0, 6.0, 8.0, 1.0, 6.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.26953125, -2.1973876953125, -2.125244140625, -2.0531005859375, -1.98095703125, -1.9088134765625, -1.836669921875, -1.7645263671875, -1.6923828125, -1.6202392578125, -1.548095703125, -1.4759521484375, -1.40380859375, -1.3316650390625, -1.259521484375, -1.1873779296875, -1.115234375, -1.0430908203125, -0.970947265625, -0.8988037109375, -0.82666015625, -0.7545166015625, -0.682373046875, -0.6102294921875, -0.5380859375, -0.4659423828125, -0.393798828125, -0.3216552734375, -0.24951171875, -0.1773681640625, -0.105224609375, -0.0330810546875, 0.0390625, 0.1112060546875, 0.183349609375, 0.2554931640625, 0.32763671875, 0.3997802734375, 0.471923828125, 0.5440673828125, 0.6162109375, 0.6883544921875, 0.760498046875, 0.8326416015625, 0.90478515625, 0.9769287109375, 1.049072265625, 1.1212158203125, 1.193359375, 1.2655029296875, 1.337646484375, 1.4097900390625, 1.48193359375, 1.5540771484375, 1.626220703125, 1.6983642578125, 1.7705078125, 1.8426513671875, 1.914794921875, 1.9869384765625, 2.05908203125, 2.1312255859375, 2.203369140625, 2.2755126953125, 2.34765625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 5.0, 12.0, 16.0, 14.0, 12.0, 24.0, 52.0, 52.0, 46.0, 94.0, 112.0, 126.0, 110.0, 84.0, 44.0, 41.0, 28.0, 26.0, 19.0, 17.0, 13.0, 9.0, 4.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012569427490234375, -0.0012155324220657349, -0.0011741220951080322, -0.0011327117681503296, -0.001091301441192627, -0.0010498911142349243, -0.0010084807872772217, -0.000967070460319519, -0.0009256601333618164, -0.0008842498064041138, -0.0008428394794464111, -0.0008014291524887085, -0.0007600188255310059, -0.0007186084985733032, -0.0006771981716156006, -0.000635787844657898, -0.0005943775177001953, -0.0005529671907424927, -0.00051155686378479, -0.0004701465368270874, -0.00042873620986938477, -0.00038732588291168213, -0.0003459155559539795, -0.00030450522899627686, -0.0002630949020385742, -0.00022168457508087158, -0.00018027424812316895, -0.0001388639211654663, -9.745359420776367e-05, -5.6043267250061035e-05, -1.4632940292358398e-05, 2.6777386665344238e-05, 6.818771362304688e-05, 0.00010959804058074951, 0.00015100836753845215, 0.00019241869449615479, 0.00023382902145385742, 0.00027523934841156006, 0.0003166496753692627, 0.00035806000232696533, 0.00039947032928466797, 0.0004408806562423706, 0.00048229098320007324, 0.0005237013101577759, 0.0005651116371154785, 0.0006065219640731812, 0.0006479322910308838, 0.0006893426179885864, 0.0007307529449462891, 0.0007721632719039917, 0.0008135735988616943, 0.000854983925819397, 0.0008963942527770996, 0.0009378045797348022, 0.0009792149066925049, 0.0010206252336502075, 0.0010620355606079102, 0.0011034458875656128, 0.0011448562145233154, 0.001186266541481018, 0.0012276768684387207, 0.0012690871953964233, 0.001310497522354126, 0.0013519078493118286, 0.0013933181762695312]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 7.0, 12.0, 6.0, 17.0, 33.0, 29.0, 45.0, 59.0, 99.0, 163.0, 294.0, 1143.0, 935199.0, 109973.0, 695.0, 262.0, 150.0, 100.0, 60.0, 53.0, 27.0, 33.0, 19.0, 7.0, 7.0, 14.0, 5.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03204345703125, -0.031174659729003906, -0.030305862426757812, -0.02943706512451172, -0.028568267822265625, -0.02769947052001953, -0.026830673217773438, -0.025961875915527344, -0.02509307861328125, -0.024224281311035156, -0.023355484008789062, -0.02248668670654297, -0.021617889404296875, -0.02074909210205078, -0.019880294799804688, -0.019011497497558594, -0.0181427001953125, -0.017273902893066406, -0.016405105590820312, -0.015536308288574219, -0.014667510986328125, -0.013798713684082031, -0.012929916381835938, -0.012061119079589844, -0.01119232177734375, -0.010323524475097656, -0.009454727172851562, -0.008585929870605469, -0.007717132568359375, -0.006848335266113281, -0.0059795379638671875, -0.005110740661621094, -0.004241943359375, -0.0033731460571289062, -0.0025043487548828125, -0.0016355514526367188, -0.000766754150390625, 0.00010204315185546875, 0.0009708404541015625, 0.0018396377563476562, 0.00270843505859375, 0.0035772323608398438, 0.0044460296630859375, 0.005314826965332031, 0.006183624267578125, 0.007052421569824219, 0.007921218872070312, 0.008790016174316406, 0.0096588134765625, 0.010527610778808594, 0.011396408081054688, 0.012265205383300781, 0.013134002685546875, 0.014002799987792969, 0.014871597290039062, 0.015740394592285156, 0.01660919189453125, 0.017477989196777344, 0.018346786499023438, 0.01921558380126953, 0.020084381103515625, 0.02095317840576172, 0.021821975708007812, 0.022690773010253906, 0.0235595703125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 44.0, 333.0, 520.0, 101.0, 9.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00434431666508317, -0.00425597233697772, -0.004167628008872271, -0.004079283680766821, -0.003990939352661371, -0.003902594791725278, -0.0038142504636198282, -0.0037259061355143785, -0.0036375615745782852, -0.0035492172464728355, -0.003460872918367386, -0.003372528590261936, -0.003284184029325843, -0.003195839701220393, -0.0031074953731149435, -0.003019151045009494, -0.002930806716904044, -0.0028424623887985945, -0.002754118060693145, -0.0026657734997570515, -0.002577429171651602, -0.002489084843546152, -0.0024007405154407024, -0.0023123961873352528, -0.002224051859229803, -0.0021357075311243534, -0.0020473632030189037, -0.001959018874913454, -0.0018706743139773607, -0.001782329985871911, -0.0016939856577664614, -0.0016056413296610117, -0.001517297001555562, -0.0014289526734501123, -0.0013406082289293408, -0.0012522639008238912, -0.0011639194563031197, -0.00107557512819767, -0.0009872308000922203, -0.0008988864137791097, -0.0008105420274659991, -0.0007221976411528885, -0.000633853254839778, -0.0005455089267343283, -0.0004571645404212177, -0.0003688201541081071, -0.0002804758260026574, -0.00019213143968954682, -0.00010378705337643623, -1.5442681615240872e-05, 7.290169014595449e-05, 0.00016124604735523462, 0.0002495904336683452, 0.0003379348199814558, 0.0004262791480869055, 0.0005146235344000161, 0.0006029679207131267, 0.0006913123070262372, 0.0007796566933393478, 0.0008680010214447975, 0.0009563454077579081, 0.0010446897940710187, 0.0011330341221764684, 0.0012213785666972399, 0.0013097228948026896]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 14.0, 5.0, 9.0, 9.0, 14.0, 10.0, 16.0, 26.0, 23.0, 18.0, 36.0, 24.0, 30.0, 32.0, 46.0, 46.0, 28.0, 39.0, 41.0, 45.0, 57.0, 25.0, 31.0, 30.0, 40.0, 33.0, 25.0, 30.0, 19.0, 32.0, 21.0, 20.0, 18.0, 14.0, 15.0, 22.0, 11.0, 8.0, 3.0, 8.0, 4.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.0005609989166259766, -0.000545215792953968, -0.0005294326692819595, -0.000513649545609951, -0.0004978664219379425, -0.000482083298265934, -0.0004663001745939255, -0.00045051705092191696, -0.00043473392724990845, -0.00041895080357789993, -0.0004031676799058914, -0.0003873845562338829, -0.0003716014325618744, -0.0003558183088898659, -0.00034003518521785736, -0.00032425206154584885, -0.00030846893787384033, -0.0002926858142018318, -0.0002769026905298233, -0.0002611195668578148, -0.0002453364431858063, -0.00022955331951379776, -0.00021377019584178925, -0.00019798707216978073, -0.00018220394849777222, -0.0001664208248257637, -0.0001506377011537552, -0.00013485457748174667, -0.00011907145380973816, -0.00010328833013772964, -8.750520646572113e-05, -7.172208279371262e-05, -5.59389591217041e-05, -4.015583544969559e-05, -2.4372711777687073e-05, -8.589588105678558e-06, 7.193535566329956e-06, 2.297665923833847e-05, 3.8759782910346985e-05, 5.45429065823555e-05, 7.032603025436401e-05, 8.610915392637253e-05, 0.00010189227759838104, 0.00011767540127038956, 0.00013345852494239807, 0.00014924164861440659, 0.0001650247722864151, 0.00018080789595842361, 0.00019659101963043213, 0.00021237414330244064, 0.00022815726697444916, 0.00024394039064645767, 0.0002597235143184662, 0.0002755066379904747, 0.0002912897616624832, 0.00030707288533449173, 0.00032285600900650024, 0.00033863913267850876, 0.0003544222563505173, 0.0003702053800225258, 0.0003859885036945343, 0.0004017716273665428, 0.00041755475103855133, 0.00043333787471055984, 0.00044912099838256836]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 11.0, 7.0, 12.0, 17.0, 16.0, 20.0, 15.0, 31.0, 25.0, 28.0, 28.0, 33.0, 34.0, 48.0, 38.0, 37.0, 47.0, 51.0, 41.0, 40.0, 36.0, 47.0, 47.0, 36.0, 34.0, 32.0, 29.0, 25.0, 17.0, 20.0, 17.0, 9.0, 18.0, 9.0, 11.0, 8.0, 8.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-11.1796875, -10.8505859375, -10.521484375, -10.1923828125, -9.86328125, -9.5341796875, -9.205078125, -8.8759765625, -8.546875, -8.2177734375, -7.888671875, -7.5595703125, -7.23046875, -6.9013671875, -6.572265625, -6.2431640625, -5.9140625, -5.5849609375, -5.255859375, -4.9267578125, -4.59765625, -4.2685546875, -3.939453125, -3.6103515625, -3.28125, -2.9521484375, -2.623046875, -2.2939453125, -1.96484375, -1.6357421875, -1.306640625, -0.9775390625, -0.6484375, -0.3193359375, 0.009765625, 0.3388671875, 0.66796875, 0.9970703125, 1.326171875, 1.6552734375, 1.984375, 2.3134765625, 2.642578125, 2.9716796875, 3.30078125, 3.6298828125, 3.958984375, 4.2880859375, 4.6171875, 4.9462890625, 5.275390625, 5.6044921875, 5.93359375, 6.2626953125, 6.591796875, 6.9208984375, 7.25, 7.5791015625, 7.908203125, 8.2373046875, 8.56640625, 8.8955078125, 9.224609375, 9.5537109375, 9.8828125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 9.0, 10.0, 19.0, 22.0, 23.0, 31.0, 41.0, 59.0, 82.0, 94.0, 181.0, 273.0, 551.0, 1368.0, 3835.0, 14076.0, 94097.0, 752240.0, 154266.0, 19224.0, 4844.0, 1636.0, 639.0, 318.0, 178.0, 132.0, 65.0, 57.0, 37.0, 25.0, 24.0, 17.0, 23.0, 10.0, 14.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-21.671875, -21.02685546875, -20.3818359375, -19.73681640625, -19.091796875, -18.44677734375, -17.8017578125, -17.15673828125, -16.51171875, -15.86669921875, -15.2216796875, -14.57666015625, -13.931640625, -13.28662109375, -12.6416015625, -11.99658203125, -11.3515625, -10.70654296875, -10.0615234375, -9.41650390625, -8.771484375, -8.12646484375, -7.4814453125, -6.83642578125, -6.19140625, -5.54638671875, -4.9013671875, -4.25634765625, -3.611328125, -2.96630859375, -2.3212890625, -1.67626953125, -1.03125, -0.38623046875, 0.2587890625, 0.90380859375, 1.548828125, 2.19384765625, 2.8388671875, 3.48388671875, 4.12890625, 4.77392578125, 5.4189453125, 6.06396484375, 6.708984375, 7.35400390625, 7.9990234375, 8.64404296875, 9.2890625, 9.93408203125, 10.5791015625, 11.22412109375, 11.869140625, 12.51416015625, 13.1591796875, 13.80419921875, 14.44921875, 15.09423828125, 15.7392578125, 16.38427734375, 17.029296875, 17.67431640625, 18.3193359375, 18.96435546875, 19.609375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 1.0, 4.0, 3.0, 8.0, 4.0, 11.0, 9.0, 19.0, 17.0, 21.0, 26.0, 23.0, 34.0, 26.0, 37.0, 50.0, 58.0, 56.0, 138.0, 1558.0, 393.0, 88.0, 61.0, 54.0, 45.0, 43.0, 51.0, 30.0, 26.0, 38.0, 24.0, 21.0, 9.0, 7.0, 10.0, 10.0, 5.0, 6.0, 7.0, 4.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-35.15625, -34.175537109375, -33.19482421875, -32.214111328125, -31.2333984375, -30.252685546875, -29.27197265625, -28.291259765625, -27.310546875, -26.329833984375, -25.34912109375, -24.368408203125, -23.3876953125, -22.406982421875, -21.42626953125, -20.445556640625, -19.46484375, -18.484130859375, -17.50341796875, -16.522705078125, -15.5419921875, -14.561279296875, -13.58056640625, -12.599853515625, -11.619140625, -10.638427734375, -9.65771484375, -8.677001953125, -7.6962890625, -6.715576171875, -5.73486328125, -4.754150390625, -3.7734375, -2.792724609375, -1.81201171875, -0.831298828125, 0.1494140625, 1.130126953125, 2.11083984375, 3.091552734375, 4.072265625, 5.052978515625, 6.03369140625, 7.014404296875, 7.9951171875, 8.975830078125, 9.95654296875, 10.937255859375, 11.91796875, 12.898681640625, 13.87939453125, 14.860107421875, 15.8408203125, 16.821533203125, 17.80224609375, 18.782958984375, 19.763671875, 20.744384765625, 21.72509765625, 22.705810546875, 23.6865234375, 24.667236328125, 25.64794921875, 26.628662109375, 27.609375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 0.0, 8.0, 5.0, 7.0, 4.0, 6.0, 9.0, 11.0, 11.0, 8.0, 23.0, 27.0, 44.0, 44.0, 44.0, 79.0, 115.0, 135.0, 264.0, 510.0, 2363.0, 83835.0, 3046595.0, 9713.0, 926.0, 319.0, 164.0, 114.0, 71.0, 58.0, 38.0, 37.0, 30.0, 18.0, 19.0, 11.0, 13.0, 9.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.125, -61.8564453125, -59.587890625, -57.3193359375, -55.05078125, -52.7822265625, -50.513671875, -48.2451171875, -45.9765625, -43.7080078125, -41.439453125, -39.1708984375, -36.90234375, -34.6337890625, -32.365234375, -30.0966796875, -27.828125, -25.5595703125, -23.291015625, -21.0224609375, -18.75390625, -16.4853515625, -14.216796875, -11.9482421875, -9.6796875, -7.4111328125, -5.142578125, -2.8740234375, -0.60546875, 1.6630859375, 3.931640625, 6.2001953125, 8.46875, 10.7373046875, 13.005859375, 15.2744140625, 17.54296875, 19.8115234375, 22.080078125, 24.3486328125, 26.6171875, 28.8857421875, 31.154296875, 33.4228515625, 35.69140625, 37.9599609375, 40.228515625, 42.4970703125, 44.765625, 47.0341796875, 49.302734375, 51.5712890625, 53.83984375, 56.1083984375, 58.376953125, 60.6455078125, 62.9140625, 65.1826171875, 67.451171875, 69.7197265625, 71.98828125, 74.2568359375, 76.525390625, 78.7939453125, 81.0625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 11.0, 42.0, 136.0, 251.0, 283.0, 192.0, 74.0, 18.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-110.24053955078125, -108.04467010498047, -105.84880065917969, -103.65292358398438, -101.4570541381836, -99.26118469238281, -97.06531524658203, -94.86944580078125, -92.67357635498047, -90.47770690917969, -88.2818374633789, -86.08596801757812, -83.89009094238281, -81.69422149658203, -79.49835205078125, -77.30248260498047, -75.10661315917969, -72.9107437133789, -70.71487426757812, -68.51899719238281, -66.32312774658203, -64.12725830078125, -61.93138885498047, -59.73551940917969, -57.539642333984375, -55.343772888183594, -53.14789962768555, -50.952030181884766, -48.756160736083984, -46.56028747558594, -44.364418029785156, -42.168548583984375, -39.972679138183594, -37.77680969238281, -35.580936431884766, -33.385066986083984, -31.189197540283203, -28.99332618713379, -26.797454833984375, -24.601585388183594, -22.405715942382812, -20.2098445892334, -18.013975143432617, -15.818103790283203, -13.622233390808105, -11.426362991333008, -9.230491638183594, -7.034621238708496, -4.838750839233398, -2.6428802013397217, -0.4470095634460449, 1.748861312866211, 3.9447317123413086, 6.140602111816406, 8.33647346496582, 10.532343864440918, 12.728214263916016, 14.924084663391113, 17.11995506286621, 19.315826416015625, 21.511695861816406, 23.70756721496582, 25.903438568115234, 28.099308013916016, 30.29517936706543]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 2.0, 4.0, 7.0, 9.0, 5.0, 13.0, 12.0, 9.0, 12.0, 11.0, 14.0, 24.0, 19.0, 22.0, 32.0, 35.0, 45.0, 36.0, 28.0, 41.0, 33.0, 40.0, 43.0, 38.0, 46.0, 40.0, 48.0, 44.0, 35.0, 28.0, 31.0, 28.0, 22.0, 17.0, 20.0, 17.0, 15.0, 18.0, 12.0, 12.0, 8.0, 7.0, 8.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.76341247558594, -74.45433807373047, -72.145263671875, -69.836181640625, -67.52710723876953, -65.21803283691406, -62.908958435058594, -60.599884033203125, -58.29080581665039, -55.98173141479492, -53.67265319824219, -51.36357879638672, -49.05450439453125, -46.745426177978516, -44.43635177612305, -42.12727355957031, -39.818199157714844, -37.509124755859375, -35.20004653930664, -32.89097213745117, -30.58189582824707, -28.27281951904297, -25.9637451171875, -23.6546688079834, -21.345592498779297, -19.036516189575195, -16.727439880371094, -14.418365478515625, -12.109289169311523, -9.800212860107422, -7.491137504577637, -5.182062149047852, -2.8729934692382812, -0.5639176368713379, 1.7451581954956055, 4.054234027862549, 6.363309860229492, 8.672386169433594, 10.981461524963379, 13.290536880493164, 15.599613189697266, 17.908689498901367, 20.21776580810547, 22.526840209960938, 24.83591651916504, 27.14499282836914, 29.45406723022461, 31.76314353942871, 34.07221984863281, 36.38129425048828, 38.690372467041016, 40.999446868896484, 43.30852508544922, 45.61759948730469, 47.926673889160156, 50.235748291015625, 52.54482650756836, 54.85390090942383, 57.16297912597656, 59.47205352783203, 61.7811279296875, 64.0902099609375, 66.39928436279297, 68.70835876464844, 71.0174331665039]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 13.0, 13.0, 8.0, 25.0, 23.0, 21.0, 27.0, 32.0, 35.0, 43.0, 28.0, 38.0, 43.0, 50.0, 41.0, 42.0, 46.0, 43.0, 44.0, 55.0, 38.0, 31.0, 36.0, 35.0, 28.0, 25.0, 15.0, 22.0, 15.0, 17.0, 17.0, 2.0, 12.0, 10.0, 9.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5625, -11.21337890625, -10.8642578125, -10.51513671875, -10.166015625, -9.81689453125, -9.4677734375, -9.11865234375, -8.76953125, -8.42041015625, -8.0712890625, -7.72216796875, -7.373046875, -7.02392578125, -6.6748046875, -6.32568359375, -5.9765625, -5.62744140625, -5.2783203125, -4.92919921875, -4.580078125, -4.23095703125, -3.8818359375, -3.53271484375, -3.18359375, -2.83447265625, -2.4853515625, -2.13623046875, -1.787109375, -1.43798828125, -1.0888671875, -0.73974609375, -0.390625, -0.04150390625, 0.3076171875, 0.65673828125, 1.005859375, 1.35498046875, 1.7041015625, 2.05322265625, 2.40234375, 2.75146484375, 3.1005859375, 3.44970703125, 3.798828125, 4.14794921875, 4.4970703125, 4.84619140625, 5.1953125, 5.54443359375, 5.8935546875, 6.24267578125, 6.591796875, 6.94091796875, 7.2900390625, 7.63916015625, 7.98828125, 8.33740234375, 8.6865234375, 9.03564453125, 9.384765625, 9.73388671875, 10.0830078125, 10.43212890625, 10.78125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 12.0, 13.0, 17.0, 23.0, 19.0, 31.0, 23.0, 47.0, 58.0, 108.0, 249.0, 543.0, 1520.0, 5307.0, 30848.0, 664882.0, 3210650.0, 255650.0, 18451.0, 3689.0, 1126.0, 433.0, 211.0, 97.0, 60.0, 43.0, 24.0, 28.0, 15.0, 20.0, 15.0, 13.0, 10.0, 11.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.21875, -32.252197265625, -31.28564453125, -30.319091796875, -29.3525390625, -28.385986328125, -27.41943359375, -26.452880859375, -25.486328125, -24.519775390625, -23.55322265625, -22.586669921875, -21.6201171875, -20.653564453125, -19.68701171875, -18.720458984375, -17.75390625, -16.787353515625, -15.82080078125, -14.854248046875, -13.8876953125, -12.921142578125, -11.95458984375, -10.988037109375, -10.021484375, -9.054931640625, -8.08837890625, -7.121826171875, -6.1552734375, -5.188720703125, -4.22216796875, -3.255615234375, -2.2890625, -1.322509765625, -0.35595703125, 0.610595703125, 1.5771484375, 2.543701171875, 3.51025390625, 4.476806640625, 5.443359375, 6.409912109375, 7.37646484375, 8.343017578125, 9.3095703125, 10.276123046875, 11.24267578125, 12.209228515625, 13.17578125, 14.142333984375, 15.10888671875, 16.075439453125, 17.0419921875, 18.008544921875, 18.97509765625, 19.941650390625, 20.908203125, 21.874755859375, 22.84130859375, 23.807861328125, 24.7744140625, 25.740966796875, 26.70751953125, 27.674072265625, 28.640625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 9.0, 12.0, 22.0, 23.0, 34.0, 53.0, 80.0, 105.0, 146.0, 202.0, 278.0, 378.0, 514.0, 517.0, 453.0, 355.0, 242.0, 168.0, 138.0, 88.0, 62.0, 45.0, 40.0, 28.0, 19.0, 13.0, 8.0, 8.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7890625, -15.1878662109375, -14.586669921875, -13.9854736328125, -13.38427734375, -12.7830810546875, -12.181884765625, -11.5806884765625, -10.9794921875, -10.3782958984375, -9.777099609375, -9.1759033203125, -8.57470703125, -7.9735107421875, -7.372314453125, -6.7711181640625, -6.169921875, -5.5687255859375, -4.967529296875, -4.3663330078125, -3.76513671875, -3.1639404296875, -2.562744140625, -1.9615478515625, -1.3603515625, -0.7591552734375, -0.157958984375, 0.4432373046875, 1.04443359375, 1.6456298828125, 2.246826171875, 2.8480224609375, 3.44921875, 4.0504150390625, 4.651611328125, 5.2528076171875, 5.85400390625, 6.4552001953125, 7.056396484375, 7.6575927734375, 8.2587890625, 8.8599853515625, 9.461181640625, 10.0623779296875, 10.66357421875, 11.2647705078125, 11.865966796875, 12.4671630859375, 13.068359375, 13.6695556640625, 14.270751953125, 14.8719482421875, 15.47314453125, 16.0743408203125, 16.675537109375, 17.2767333984375, 17.8779296875, 18.4791259765625, 19.080322265625, 19.6815185546875, 20.28271484375, 20.8839111328125, 21.485107421875, 22.0863037109375, 22.6875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 7.0, 5.0, 14.0, 13.0, 19.0, 18.0, 26.0, 26.0, 39.0, 43.0, 67.0, 59.0, 117.0, 114.0, 170.0, 265.0, 412.0, 896.0, 4554.0, 77686.0, 3840390.0, 257392.0, 9058.0, 1333.0, 482.0, 259.0, 174.0, 147.0, 103.0, 80.0, 50.0, 49.0, 51.0, 40.0, 28.0, 25.0, 18.0, 14.0, 10.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-66.1875, -64.22021484375, -62.2529296875, -60.28564453125, -58.318359375, -56.35107421875, -54.3837890625, -52.41650390625, -50.44921875, -48.48193359375, -46.5146484375, -44.54736328125, -42.580078125, -40.61279296875, -38.6455078125, -36.67822265625, -34.7109375, -32.74365234375, -30.7763671875, -28.80908203125, -26.841796875, -24.87451171875, -22.9072265625, -20.93994140625, -18.97265625, -17.00537109375, -15.0380859375, -13.07080078125, -11.103515625, -9.13623046875, -7.1689453125, -5.20166015625, -3.234375, -1.26708984375, 0.7001953125, 2.66748046875, 4.634765625, 6.60205078125, 8.5693359375, 10.53662109375, 12.50390625, 14.47119140625, 16.4384765625, 18.40576171875, 20.373046875, 22.34033203125, 24.3076171875, 26.27490234375, 28.2421875, 30.20947265625, 32.1767578125, 34.14404296875, 36.111328125, 38.07861328125, 40.0458984375, 42.01318359375, 43.98046875, 45.94775390625, 47.9150390625, 49.88232421875, 51.849609375, 53.81689453125, 55.7841796875, 57.75146484375, 59.71875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 10.0, 30.0, 69.0, 145.0, 270.0, 248.0, 150.0, 59.0, 21.0, 12.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.48428344726562, -162.82244873046875, -158.1605987548828, -153.49876403808594, -148.8369140625, -144.17507934570312, -139.51324462890625, -134.85140991210938, -130.18955993652344, -125.52771759033203, -120.86587524414062, -116.20404052734375, -111.54219818115234, -106.88035583496094, -102.21852111816406, -97.55667877197266, -92.89483642578125, -88.23299407958984, -83.57115173339844, -78.90931701660156, -74.24747467041016, -69.58563232421875, -64.92379760742188, -60.26195526123047, -55.60011291503906, -50.938270568847656, -46.276432037353516, -41.614593505859375, -36.95275115966797, -32.29090881347656, -27.629070281982422, -22.96723175048828, -18.305404663085938, -13.643564224243164, -8.98172378540039, -4.319883346557617, 0.34195709228515625, 5.00379753112793, 9.665637969970703, 14.327476501464844, 18.98931884765625, 23.651159286499023, 28.312999725341797, 32.97483825683594, 37.636680603027344, 42.29852294921875, 46.96036148071289, 51.62220001220703, 56.28404235839844, 60.945884704589844, 65.60772705078125, 70.26956176757812, 74.93140411376953, 79.59324645996094, 84.25508117675781, 88.91692352294922, 93.57876586914062, 98.24060821533203, 102.90245056152344, 107.56428527832031, 112.22612762451172, 116.88796997070312, 121.5498046875, 126.2116470336914, 130.8734893798828]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 10.0, 11.0, 9.0, 14.0, 14.0, 6.0, 18.0, 28.0, 23.0, 18.0, 28.0, 35.0, 25.0, 40.0, 38.0, 43.0, 35.0, 36.0, 51.0, 40.0, 43.0, 43.0, 44.0, 35.0, 46.0, 32.0, 34.0, 31.0, 18.0, 23.0, 20.0, 15.0, 12.0, 16.0, 8.0, 15.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0], "bins": [-65.46153259277344, -63.687564849853516, -61.91359329223633, -60.139625549316406, -58.36565399169922, -56.5916862487793, -54.817718505859375, -53.04374694824219, -51.269779205322266, -49.495811462402344, -47.721839904785156, -45.947872161865234, -44.17390441894531, -42.399932861328125, -40.6259651184082, -38.85199737548828, -37.078025817871094, -35.30405807495117, -33.530086517333984, -31.756118774414062, -29.982149124145508, -28.208179473876953, -26.43421173095703, -24.660242080688477, -22.886272430419922, -21.112302780151367, -19.338333129882812, -17.56436538696289, -15.790395736694336, -14.016426086425781, -12.242457389831543, -10.468488693237305, -8.69451904296875, -6.9205498695373535, -5.146580696105957, -3.3726115226745605, -1.598642349243164, 0.17532730102539062, 1.949295997619629, 3.723264694213867, 5.497234344482422, 7.271203517913818, 9.045172691345215, 10.819141387939453, 12.593111038208008, 14.367080688476562, 16.141048431396484, 17.91501808166504, 19.688987731933594, 21.46295738220215, 23.236927032470703, 25.010894775390625, 26.78486442565918, 28.558834075927734, 30.332801818847656, 32.106773376464844, 33.880741119384766, 35.65470886230469, 37.428680419921875, 39.2026481628418, 40.97661590576172, 42.750587463378906, 44.52455520629883, 46.29852294921875, 48.07249450683594]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 13.0, 10.0, 12.0, 15.0, 17.0, 21.0, 15.0, 26.0, 26.0, 25.0, 42.0, 38.0, 35.0, 35.0, 36.0, 41.0, 42.0, 38.0, 34.0, 45.0, 44.0, 32.0, 32.0, 35.0, 29.0, 33.0, 26.0, 18.0, 28.0, 23.0, 31.0, 11.0, 14.0, 7.0, 8.0, 11.0, 6.0, 12.0, 1.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-10.6875, -10.37109375, -10.0546875, -9.73828125, -9.421875, -9.10546875, -8.7890625, -8.47265625, -8.15625, -7.83984375, -7.5234375, -7.20703125, -6.890625, -6.57421875, -6.2578125, -5.94140625, -5.625, -5.30859375, -4.9921875, -4.67578125, -4.359375, -4.04296875, -3.7265625, -3.41015625, -3.09375, -2.77734375, -2.4609375, -2.14453125, -1.828125, -1.51171875, -1.1953125, -0.87890625, -0.5625, -0.24609375, 0.0703125, 0.38671875, 0.703125, 1.01953125, 1.3359375, 1.65234375, 1.96875, 2.28515625, 2.6015625, 2.91796875, 3.234375, 3.55078125, 3.8671875, 4.18359375, 4.5, 4.81640625, 5.1328125, 5.44921875, 5.765625, 6.08203125, 6.3984375, 6.71484375, 7.03125, 7.34765625, 7.6640625, 7.98046875, 8.296875, 8.61328125, 8.9296875, 9.24609375, 9.5625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 7.0, 15.0, 26.0, 34.0, 50.0, 53.0, 103.0, 107.0, 200.0, 230.0, 340.0, 532.0, 646.0, 963.0, 1367.0, 1963.0, 2753.0, 4137.0, 6118.0, 8821.0, 13209.0, 20055.0, 31148.0, 48528.0, 78297.0, 139541.0, 311531.0, 148869.0, 82141.0, 50574.0, 32148.0, 20777.0, 13790.0, 9185.0, 6266.0, 4161.0, 2909.0, 2061.0, 1500.0, 963.0, 714.0, 512.0, 329.0, 264.0, 190.0, 115.0, 91.0, 57.0, 60.0, 26.0, 28.0, 12.0, 11.0, 11.0, 9.0, 1.0, 0.0, 3.0], "bins": [-2.044921875, -1.982086181640625, -1.91925048828125, -1.856414794921875, -1.7935791015625, -1.730743408203125, -1.66790771484375, -1.605072021484375, -1.542236328125, -1.479400634765625, -1.41656494140625, -1.353729248046875, -1.2908935546875, -1.228057861328125, -1.16522216796875, -1.102386474609375, -1.03955078125, -0.976715087890625, -0.91387939453125, -0.851043701171875, -0.7882080078125, -0.725372314453125, -0.66253662109375, -0.599700927734375, -0.536865234375, -0.474029541015625, -0.41119384765625, -0.348358154296875, -0.2855224609375, -0.222686767578125, -0.15985107421875, -0.097015380859375, -0.0341796875, 0.028656005859375, 0.09149169921875, 0.154327392578125, 0.2171630859375, 0.279998779296875, 0.34283447265625, 0.405670166015625, 0.468505859375, 0.531341552734375, 0.59417724609375, 0.657012939453125, 0.7198486328125, 0.782684326171875, 0.84552001953125, 0.908355712890625, 0.97119140625, 1.034027099609375, 1.09686279296875, 1.159698486328125, 1.2225341796875, 1.285369873046875, 1.34820556640625, 1.411041259765625, 1.473876953125, 1.536712646484375, 1.59954833984375, 1.662384033203125, 1.7252197265625, 1.788055419921875, 1.85089111328125, 1.913726806640625, 1.9765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 13.0, 14.0, 11.0, 16.0, 25.0, 27.0, 29.0, 30.0, 31.0, 32.0, 31.0, 36.0, 39.0, 35.0, 37.0, 36.0, 1066.0, 42.0, 48.0, 53.0, 43.0, 40.0, 39.0, 38.0, 32.0, 24.0, 32.0, 26.0, 18.0, 14.0, 11.0, 12.0, 6.0, 11.0, 6.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.34375, -8.1085205078125, -7.873291015625, -7.6380615234375, -7.40283203125, -7.1676025390625, -6.932373046875, -6.6971435546875, -6.4619140625, -6.2266845703125, -5.991455078125, -5.7562255859375, -5.52099609375, -5.2857666015625, -5.050537109375, -4.8153076171875, -4.580078125, -4.3448486328125, -4.109619140625, -3.8743896484375, -3.63916015625, -3.4039306640625, -3.168701171875, -2.9334716796875, -2.6982421875, -2.4630126953125, -2.227783203125, -1.9925537109375, -1.75732421875, -1.5220947265625, -1.286865234375, -1.0516357421875, -0.81640625, -0.5811767578125, -0.345947265625, -0.1107177734375, 0.12451171875, 0.3597412109375, 0.594970703125, 0.8302001953125, 1.0654296875, 1.3006591796875, 1.535888671875, 1.7711181640625, 2.00634765625, 2.2415771484375, 2.476806640625, 2.7120361328125, 2.947265625, 3.1824951171875, 3.417724609375, 3.6529541015625, 3.88818359375, 4.1234130859375, 4.358642578125, 4.5938720703125, 4.8291015625, 5.0643310546875, 5.299560546875, 5.5347900390625, 5.77001953125, 6.0052490234375, 6.240478515625, 6.4757080078125, 6.7109375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 14.0, 14.0, 25.0, 44.0, 63.0, 93.0, 131.0, 237.0, 377.0, 632.0, 1078.0, 1856.0, 3061.0, 5236.0, 8930.0, 15181.0, 26012.0, 45875.0, 83931.0, 176200.0, 1416673.0, 144180.0, 71443.0, 40016.0, 23199.0, 13386.0, 7802.0, 4643.0, 2718.0, 1654.0, 956.0, 546.0, 354.0, 188.0, 123.0, 91.0, 47.0, 40.0, 28.0, 21.0, 9.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.912109375, -2.829803466796875, -2.74749755859375, -2.665191650390625, -2.5828857421875, -2.500579833984375, -2.41827392578125, -2.335968017578125, -2.253662109375, -2.171356201171875, -2.08905029296875, -2.006744384765625, -1.9244384765625, -1.842132568359375, -1.75982666015625, -1.677520751953125, -1.59521484375, -1.512908935546875, -1.43060302734375, -1.348297119140625, -1.2659912109375, -1.183685302734375, -1.10137939453125, -1.019073486328125, -0.936767578125, -0.854461669921875, -0.77215576171875, -0.689849853515625, -0.6075439453125, -0.525238037109375, -0.44293212890625, -0.360626220703125, -0.2783203125, -0.196014404296875, -0.11370849609375, -0.031402587890625, 0.0509033203125, 0.133209228515625, 0.21551513671875, 0.297821044921875, 0.380126953125, 0.462432861328125, 0.54473876953125, 0.627044677734375, 0.7093505859375, 0.791656494140625, 0.87396240234375, 0.956268310546875, 1.03857421875, 1.120880126953125, 1.20318603515625, 1.285491943359375, 1.3677978515625, 1.450103759765625, 1.53240966796875, 1.614715576171875, 1.697021484375, 1.779327392578125, 1.86163330078125, 1.943939208984375, 2.0262451171875, 2.108551025390625, 2.19085693359375, 2.273162841796875, 2.35546875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 6.0, 16.0, 19.0, 30.0, 29.0, 50.0, 37.0, 52.0, 56.0, 78.0, 81.0, 81.0, 79.0, 74.0, 65.0, 57.0, 31.0, 44.0, 19.0, 24.0, 15.0, 10.0, 8.0, 4.0, 6.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011262893676757812, -0.001081913709640503, -0.0010375380516052246, -0.0009931623935699463, -0.000948786735534668, -0.0009044110774993896, -0.0008600354194641113, -0.000815659761428833, -0.0007712841033935547, -0.0007269084453582764, -0.000682532787322998, -0.0006381571292877197, -0.0005937814712524414, -0.0005494058132171631, -0.0005050301551818848, -0.00046065449714660645, -0.0004162788391113281, -0.0003719031810760498, -0.0003275275230407715, -0.00028315186500549316, -0.00023877620697021484, -0.00019440054893493652, -0.0001500248908996582, -0.00010564923286437988, -6.127357482910156e-05, -1.6897916793823242e-05, 2.7477741241455078e-05, 7.18533992767334e-05, 0.00011622905731201172, 0.00016060471534729004, 0.00020498037338256836, 0.0002493560314178467, 0.000293731689453125, 0.0003381073474884033, 0.00038248300552368164, 0.00042685866355895996, 0.0004712343215942383, 0.0005156099796295166, 0.0005599856376647949, 0.0006043612957000732, 0.0006487369537353516, 0.0006931126117706299, 0.0007374882698059082, 0.0007818639278411865, 0.0008262395858764648, 0.0008706152439117432, 0.0009149909019470215, 0.0009593665599822998, 0.0010037422180175781, 0.0010481178760528564, 0.0010924935340881348, 0.001136869192123413, 0.0011812448501586914, 0.0012256205081939697, 0.001269996166229248, 0.0013143718242645264, 0.0013587474822998047, 0.001403123140335083, 0.0014474987983703613, 0.0014918744564056396, 0.001536250114440918, 0.0015806257724761963, 0.0016250014305114746, 0.001669377088546753, 0.0017137527465820312]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 11.0, 7.0, 11.0, 9.0, 12.0, 19.0, 33.0, 35.0, 56.0, 55.0, 97.0, 168.0, 287.0, 586.0, 3576.0, 1033211.0, 8802.0, 687.0, 305.0, 179.0, 118.0, 66.0, 60.0, 44.0, 32.0, 20.0, 16.0, 12.0, 10.0, 12.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.033843994140625, -0.03296661376953125, -0.0320892333984375, -0.03121185302734375, -0.03033447265625, -0.02945709228515625, -0.0285797119140625, -0.02770233154296875, -0.026824951171875, -0.02594757080078125, -0.0250701904296875, -0.02419281005859375, -0.0233154296875, -0.02243804931640625, -0.0215606689453125, -0.02068328857421875, -0.019805908203125, -0.01892852783203125, -0.0180511474609375, -0.01717376708984375, -0.01629638671875, -0.01541900634765625, -0.0145416259765625, -0.01366424560546875, -0.012786865234375, -0.01190948486328125, -0.0110321044921875, -0.01015472412109375, -0.00927734375, -0.00839996337890625, -0.0075225830078125, -0.00664520263671875, -0.005767822265625, -0.00489044189453125, -0.0040130615234375, -0.00313568115234375, -0.00225830078125, -0.00138092041015625, -0.0005035400390625, 0.00037384033203125, 0.001251220703125, 0.00212860107421875, 0.0030059814453125, 0.00388336181640625, 0.0047607421875, 0.00563812255859375, 0.0065155029296875, 0.00739288330078125, 0.008270263671875, 0.00914764404296875, 0.0100250244140625, 0.01090240478515625, 0.01177978515625, 0.01265716552734375, 0.0135345458984375, 0.01441192626953125, 0.015289306640625, 0.01616668701171875, 0.0170440673828125, 0.01792144775390625, 0.018798828125, 0.01967620849609375, 0.0205535888671875, 0.02143096923828125, 0.022308349609375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 51.0, 465.0, 435.0, 55.0, 8.0, 4.0], "bins": [-0.006527237128466368, -0.006418544799089432, -0.0063098520040512085, -0.0062011596746742725, -0.006092467345297337, -0.005983775015920401, -0.005875082220882177, -0.005766389891505241, -0.0056576975621283054, -0.0055490052327513695, -0.005440312437713146, -0.00533162010833621, -0.005222927778959274, -0.005114235449582338, -0.005005542654544115, -0.004896850325167179, -0.004788157995790243, -0.004679465666413307, -0.004570772871375084, -0.004462080541998148, -0.004353388212621212, -0.004244695883244276, -0.004136003088206053, -0.004027310758829117, -0.003918618429452181, -0.0038099258672446012, -0.0037012335378676653, -0.0035925409756600857, -0.0034838486462831497, -0.00337515608407557, -0.003266463754698634, -0.0031577711924910545, -0.003049078630283475, -0.0029403860680758953, -0.0028316937386989594, -0.0027230011764913797, -0.0026143088471144438, -0.002505616284906864, -0.002396923955529928, -0.0022882313933223486, -0.0021795390639454126, -0.002070846501737833, -0.001962154172360897, -0.0018534617265686393, -0.0017447692807763815, -0.0016360767185688019, -0.001527384389191866, -0.0014186918269842863, -0.0013099993811920285, -0.0012013069353997707, -0.001092614489607513, -0.0009839220438152552, -0.0008752295980229974, -0.0007665370940230787, -0.0006578446482308209, -0.0005491522024385631, -0.00044045972754247487, -0.0003317672817502171, -0.00022307482140604407, -0.00011438236106187105, -5.689915269613266e-06, 0.00010300255962647498, 0.00021169500541873276, 0.00032038745121099055, 0.00042907989700324833]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 4.0, 4.0, 2.0, 8.0, 14.0, 16.0, 14.0, 20.0, 15.0, 27.0, 12.0, 31.0, 22.0, 30.0, 30.0, 37.0, 35.0, 41.0, 39.0, 39.0, 45.0, 46.0, 52.0, 29.0, 43.0, 42.0, 33.0, 35.0, 25.0, 37.0, 18.0, 22.0, 21.0, 19.0, 10.0, 16.0, 14.0, 8.0, 14.0, 5.0, 5.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0005852580070495605, -0.000567510724067688, -0.0005497634410858154, -0.0005320161581039429, -0.0005142688751220703, -0.0004965215921401978, -0.0004787743091583252, -0.00046102702617645264, -0.0004432797431945801, -0.0004255324602127075, -0.00040778517723083496, -0.0003900378942489624, -0.00037229061126708984, -0.0003545433282852173, -0.0003367960453033447, -0.00031904876232147217, -0.0003013014793395996, -0.00028355419635772705, -0.0002658069133758545, -0.00024805963039398193, -0.00023031234741210938, -0.00021256506443023682, -0.00019481778144836426, -0.0001770704984664917, -0.00015932321548461914, -0.00014157593250274658, -0.00012382864952087402, -0.00010608136653900146, -8.83340835571289e-05, -7.058680057525635e-05, -5.283951759338379e-05, -3.509223461151123e-05, -1.7344951629638672e-05, 4.023313522338867e-07, 1.8149614334106445e-05, 3.5896897315979004e-05, 5.364418029785156e-05, 7.139146327972412e-05, 8.913874626159668e-05, 0.00010688602924346924, 0.0001246333122253418, 0.00014238059520721436, 0.00016012787818908691, 0.00017787516117095947, 0.00019562244415283203, 0.0002133697271347046, 0.00023111701011657715, 0.0002488642930984497, 0.00026661157608032227, 0.0002843588590621948, 0.0003021061420440674, 0.00031985342502593994, 0.0003376007080078125, 0.00035534799098968506, 0.0003730952739715576, 0.0003908425569534302, 0.00040858983993530273, 0.0004263371229171753, 0.00044408440589904785, 0.0004618316888809204, 0.00047957897186279297, 0.0004973262548446655, 0.0005150735378265381, 0.0005328208208084106, 0.0005505681037902832]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 13.0, 10.0, 12.0, 15.0, 17.0, 21.0, 15.0, 26.0, 26.0, 25.0, 42.0, 38.0, 35.0, 35.0, 36.0, 41.0, 42.0, 38.0, 34.0, 45.0, 44.0, 32.0, 32.0, 35.0, 29.0, 33.0, 26.0, 18.0, 28.0, 23.0, 31.0, 11.0, 14.0, 7.0, 8.0, 11.0, 6.0, 12.0, 1.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-10.6875, -10.37109375, -10.0546875, -9.73828125, -9.421875, -9.10546875, -8.7890625, -8.47265625, -8.15625, -7.83984375, -7.5234375, -7.20703125, -6.890625, -6.57421875, -6.2578125, -5.94140625, -5.625, -5.30859375, -4.9921875, -4.67578125, -4.359375, -4.04296875, -3.7265625, -3.41015625, -3.09375, -2.77734375, -2.4609375, -2.14453125, -1.828125, -1.51171875, -1.1953125, -0.87890625, -0.5625, -0.24609375, 0.0703125, 0.38671875, 0.703125, 1.01953125, 1.3359375, 1.65234375, 1.96875, 2.28515625, 2.6015625, 2.91796875, 3.234375, 3.55078125, 3.8671875, 4.18359375, 4.5, 4.81640625, 5.1328125, 5.44921875, 5.765625, 6.08203125, 6.3984375, 6.71484375, 7.03125, 7.34765625, 7.6640625, 7.98046875, 8.296875, 8.61328125, 8.9296875, 9.24609375, 9.5625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 8.0, 8.0, 11.0, 18.0, 24.0, 31.0, 37.0, 41.0, 63.0, 66.0, 100.0, 136.0, 188.0, 232.0, 351.0, 498.0, 793.0, 1639.0, 4732.0, 17432.0, 117753.0, 809321.0, 73972.0, 13409.0, 3839.0, 1468.0, 677.0, 477.0, 307.0, 200.0, 160.0, 126.0, 101.0, 70.0, 67.0, 40.0, 21.0, 28.0, 22.0, 19.0, 13.0, 9.0, 10.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-26.578125, -25.782470703125, -24.98681640625, -24.191162109375, -23.3955078125, -22.599853515625, -21.80419921875, -21.008544921875, -20.212890625, -19.417236328125, -18.62158203125, -17.825927734375, -17.0302734375, -16.234619140625, -15.43896484375, -14.643310546875, -13.84765625, -13.052001953125, -12.25634765625, -11.460693359375, -10.6650390625, -9.869384765625, -9.07373046875, -8.278076171875, -7.482421875, -6.686767578125, -5.89111328125, -5.095458984375, -4.2998046875, -3.504150390625, -2.70849609375, -1.912841796875, -1.1171875, -0.321533203125, 0.47412109375, 1.269775390625, 2.0654296875, 2.861083984375, 3.65673828125, 4.452392578125, 5.248046875, 6.043701171875, 6.83935546875, 7.635009765625, 8.4306640625, 9.226318359375, 10.02197265625, 10.817626953125, 11.61328125, 12.408935546875, 13.20458984375, 14.000244140625, 14.7958984375, 15.591552734375, 16.38720703125, 17.182861328125, 17.978515625, 18.774169921875, 19.56982421875, 20.365478515625, 21.1611328125, 21.956787109375, 22.75244140625, 23.548095703125, 24.34375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 12.0, 7.0, 13.0, 8.0, 17.0, 21.0, 13.0, 26.0, 22.0, 28.0, 44.0, 40.0, 50.0, 53.0, 57.0, 133.0, 427.0, 1484.0, 137.0, 52.0, 67.0, 44.0, 31.0, 38.0, 28.0, 30.0, 23.0, 22.0, 15.0, 20.0, 14.0, 12.0, 8.0, 12.0, 6.0, 2.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.5625, -31.576171875, -30.58984375, -29.603515625, -28.6171875, -27.630859375, -26.64453125, -25.658203125, -24.671875, -23.685546875, -22.69921875, -21.712890625, -20.7265625, -19.740234375, -18.75390625, -17.767578125, -16.78125, -15.794921875, -14.80859375, -13.822265625, -12.8359375, -11.849609375, -10.86328125, -9.876953125, -8.890625, -7.904296875, -6.91796875, -5.931640625, -4.9453125, -3.958984375, -2.97265625, -1.986328125, -1.0, -0.013671875, 0.97265625, 1.958984375, 2.9453125, 3.931640625, 4.91796875, 5.904296875, 6.890625, 7.876953125, 8.86328125, 9.849609375, 10.8359375, 11.822265625, 12.80859375, 13.794921875, 14.78125, 15.767578125, 16.75390625, 17.740234375, 18.7265625, 19.712890625, 20.69921875, 21.685546875, 22.671875, 23.658203125, 24.64453125, 25.630859375, 26.6171875, 27.603515625, 28.58984375, 29.576171875, 30.5625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 10.0, 5.0, 5.0, 4.0, 12.0, 7.0, 17.0, 23.0, 13.0, 13.0, 31.0, 43.0, 42.0, 42.0, 47.0, 99.0, 152.0, 319.0, 997.0, 12698.0, 3082412.0, 45993.0, 1715.0, 360.0, 187.0, 115.0, 62.0, 68.0, 29.0, 31.0, 29.0, 21.0, 18.0, 21.0, 8.0, 11.0, 10.0, 11.0, 11.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-83.5, -80.775390625, -78.05078125, -75.326171875, -72.6015625, -69.876953125, -67.15234375, -64.427734375, -61.703125, -58.978515625, -56.25390625, -53.529296875, -50.8046875, -48.080078125, -45.35546875, -42.630859375, -39.90625, -37.181640625, -34.45703125, -31.732421875, -29.0078125, -26.283203125, -23.55859375, -20.833984375, -18.109375, -15.384765625, -12.66015625, -9.935546875, -7.2109375, -4.486328125, -1.76171875, 0.962890625, 3.6875, 6.412109375, 9.13671875, 11.861328125, 14.5859375, 17.310546875, 20.03515625, 22.759765625, 25.484375, 28.208984375, 30.93359375, 33.658203125, 36.3828125, 39.107421875, 41.83203125, 44.556640625, 47.28125, 50.005859375, 52.73046875, 55.455078125, 58.1796875, 60.904296875, 63.62890625, 66.353515625, 69.078125, 71.802734375, 74.52734375, 77.251953125, 79.9765625, 82.701171875, 85.42578125, 88.150390625, 90.875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 20.0, 328.0, 602.0, 66.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.14654541015625, -188.8876953125, -182.62884521484375, -176.37001037597656, -170.1111602783203, -163.85231018066406, -157.59347534179688, -151.33462524414062, -145.07577514648438, -138.81692504882812, -132.55807495117188, -126.29924011230469, -120.04039001464844, -113.78153991699219, -107.52269744873047, -101.26385498046875, -95.0050048828125, -88.74615478515625, -82.48731231689453, -76.22846984863281, -69.96961975097656, -63.71077346801758, -57.451927185058594, -51.19308090209961, -44.934234619140625, -38.67538833618164, -32.416542053222656, -26.157695770263672, -19.898849487304688, -13.640003204345703, -7.381156921386719, -1.1223106384277344, 5.1365509033203125, 11.395397186279297, 17.65424346923828, 23.913089752197266, 30.17193603515625, 36.430782318115234, 42.68962860107422, 48.9484748840332, 55.20732116699219, 61.46616744995117, 67.72501373291016, 73.98385620117188, 80.24270629882812, 86.50155639648438, 92.7603988647461, 99.01924133300781, 105.27809143066406, 111.53694152832031, 117.79578399658203, 124.05462646484375, 130.3134765625, 136.57232666015625, 142.8311767578125, 149.0900115966797, 155.34886169433594, 161.6077117919922, 167.86654663085938, 174.12539672851562, 180.38424682617188, 186.64309692382812, 192.90194702148438, 199.16078186035156, 205.4196319580078]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 10.0, 11.0, 14.0, 6.0, 14.0, 11.0, 15.0, 29.0, 19.0, 24.0, 28.0, 27.0, 39.0, 40.0, 38.0, 44.0, 49.0, 47.0, 42.0, 39.0, 34.0, 41.0, 40.0, 34.0, 41.0, 30.0, 29.0, 33.0, 28.0, 18.0, 12.0, 13.0, 19.0, 16.0, 15.0, 7.0, 15.0, 6.0, 5.0, 6.0, 1.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-84.1413803100586, -81.71475982666016, -79.28813171386719, -76.86151123046875, -74.43488311767578, -72.00826263427734, -69.58163452148438, -67.15501403808594, -64.72838592529297, -62.301761627197266, -59.87513732910156, -57.44851303100586, -55.021888732910156, -52.59526443481445, -50.16864013671875, -47.74201965332031, -45.31539535522461, -42.888771057128906, -40.4621467590332, -38.0355224609375, -35.6088981628418, -33.182273864746094, -30.755651473999023, -28.32902717590332, -25.902402877807617, -23.475778579711914, -21.04915428161621, -18.62253189086914, -16.195907592773438, -13.769282341003418, -11.342658996582031, -8.916034698486328, -6.489410400390625, -4.062786102294922, -1.636162281036377, 0.790461540222168, 3.217085838317871, 5.643710136413574, 8.070333480834961, 10.496957778930664, 12.923582077026367, 15.35020637512207, 17.776830673217773, 20.203453063964844, 22.630077362060547, 25.05670166015625, 27.483325958251953, 29.909950256347656, 32.33657455444336, 34.76319885253906, 37.189823150634766, 39.61644744873047, 42.04307174682617, 44.469696044921875, 46.89631652832031, 49.32294464111328, 51.74956512451172, 54.17618942260742, 56.602813720703125, 59.02943801879883, 61.45606231689453, 63.882686614990234, 66.30931091308594, 68.73593139648438, 71.16255950927734]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 0.0, 4.0, 0.0, 7.0, 5.0, 11.0, 12.0, 15.0, 12.0, 21.0, 19.0, 22.0, 25.0, 34.0, 26.0, 31.0, 42.0, 44.0, 38.0, 39.0, 34.0, 43.0, 45.0, 33.0, 37.0, 38.0, 37.0, 32.0, 24.0, 35.0, 27.0, 33.0, 33.0, 24.0, 12.0, 20.0, 17.0, 14.0, 9.0, 7.0, 5.0, 11.0, 7.0, 5.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.0703125, -10.739990234375, -10.40966796875, -10.079345703125, -9.7490234375, -9.418701171875, -9.08837890625, -8.758056640625, -8.427734375, -8.097412109375, -7.76708984375, -7.436767578125, -7.1064453125, -6.776123046875, -6.44580078125, -6.115478515625, -5.78515625, -5.454833984375, -5.12451171875, -4.794189453125, -4.4638671875, -4.133544921875, -3.80322265625, -3.472900390625, -3.142578125, -2.812255859375, -2.48193359375, -2.151611328125, -1.8212890625, -1.490966796875, -1.16064453125, -0.830322265625, -0.5, -0.169677734375, 0.16064453125, 0.490966796875, 0.8212890625, 1.151611328125, 1.48193359375, 1.812255859375, 2.142578125, 2.472900390625, 2.80322265625, 3.133544921875, 3.4638671875, 3.794189453125, 4.12451171875, 4.454833984375, 4.78515625, 5.115478515625, 5.44580078125, 5.776123046875, 6.1064453125, 6.436767578125, 6.76708984375, 7.097412109375, 7.427734375, 7.758056640625, 8.08837890625, 8.418701171875, 8.7490234375, 9.079345703125, 9.40966796875, 9.739990234375, 10.0703125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 4.0, 14.0, 12.0, 18.0, 18.0, 24.0, 39.0, 41.0, 58.0, 75.0, 95.0, 149.0, 164.0, 279.0, 455.0, 851.0, 1751.0, 4632.0, 14289.0, 67237.0, 727936.0, 2666645.0, 625876.0, 61462.0, 13458.0, 4405.0, 1825.0, 869.0, 497.0, 296.0, 209.0, 138.0, 98.0, 72.0, 51.0, 55.0, 33.0, 27.0, 20.0, 16.0, 13.0, 18.0, 6.0, 11.0, 9.0, 7.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0], "bins": [-23.984375, -23.267822265625, -22.55126953125, -21.834716796875, -21.1181640625, -20.401611328125, -19.68505859375, -18.968505859375, -18.251953125, -17.535400390625, -16.81884765625, -16.102294921875, -15.3857421875, -14.669189453125, -13.95263671875, -13.236083984375, -12.51953125, -11.802978515625, -11.08642578125, -10.369873046875, -9.6533203125, -8.936767578125, -8.22021484375, -7.503662109375, -6.787109375, -6.070556640625, -5.35400390625, -4.637451171875, -3.9208984375, -3.204345703125, -2.48779296875, -1.771240234375, -1.0546875, -0.338134765625, 0.37841796875, 1.094970703125, 1.8115234375, 2.528076171875, 3.24462890625, 3.961181640625, 4.677734375, 5.394287109375, 6.11083984375, 6.827392578125, 7.5439453125, 8.260498046875, 8.97705078125, 9.693603515625, 10.41015625, 11.126708984375, 11.84326171875, 12.559814453125, 13.2763671875, 13.992919921875, 14.70947265625, 15.426025390625, 16.142578125, 16.859130859375, 17.57568359375, 18.292236328125, 19.0087890625, 19.725341796875, 20.44189453125, 21.158447265625, 21.875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 9.0, 7.0, 11.0, 14.0, 14.0, 22.0, 28.0, 34.0, 58.0, 84.0, 108.0, 143.0, 223.0, 322.0, 448.0, 513.0, 530.0, 412.0, 327.0, 225.0, 168.0, 103.0, 72.0, 69.0, 42.0, 21.0, 16.0, 17.0, 9.0, 5.0, 6.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0], "bins": [-26.796875, -26.1727294921875, -25.548583984375, -24.9244384765625, -24.30029296875, -23.6761474609375, -23.052001953125, -22.4278564453125, -21.8037109375, -21.1795654296875, -20.555419921875, -19.9312744140625, -19.30712890625, -18.6829833984375, -18.058837890625, -17.4346923828125, -16.810546875, -16.1864013671875, -15.562255859375, -14.9381103515625, -14.31396484375, -13.6898193359375, -13.065673828125, -12.4415283203125, -11.8173828125, -11.1932373046875, -10.569091796875, -9.9449462890625, -9.32080078125, -8.6966552734375, -8.072509765625, -7.4483642578125, -6.82421875, -6.2000732421875, -5.575927734375, -4.9517822265625, -4.32763671875, -3.7034912109375, -3.079345703125, -2.4552001953125, -1.8310546875, -1.2069091796875, -0.582763671875, 0.0413818359375, 0.66552734375, 1.2896728515625, 1.913818359375, 2.5379638671875, 3.162109375, 3.7862548828125, 4.410400390625, 5.0345458984375, 5.65869140625, 6.2828369140625, 6.906982421875, 7.5311279296875, 8.1552734375, 8.7794189453125, 9.403564453125, 10.0277099609375, 10.65185546875, 11.2760009765625, 11.900146484375, 12.5242919921875, 13.1484375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 4.0, 12.0, 10.0, 16.0, 19.0, 34.0, 33.0, 47.0, 57.0, 81.0, 98.0, 159.0, 230.0, 361.0, 696.0, 1855.0, 10401.0, 161117.0, 3785103.0, 218021.0, 12084.0, 1997.0, 690.0, 348.0, 223.0, 141.0, 95.0, 77.0, 63.0, 40.0, 53.0, 33.0, 19.0, 15.0, 10.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-50.46875, -48.63623046875, -46.8037109375, -44.97119140625, -43.138671875, -41.30615234375, -39.4736328125, -37.64111328125, -35.80859375, -33.97607421875, -32.1435546875, -30.31103515625, -28.478515625, -26.64599609375, -24.8134765625, -22.98095703125, -21.1484375, -19.31591796875, -17.4833984375, -15.65087890625, -13.818359375, -11.98583984375, -10.1533203125, -8.32080078125, -6.48828125, -4.65576171875, -2.8232421875, -0.99072265625, 0.841796875, 2.67431640625, 4.5068359375, 6.33935546875, 8.171875, 10.00439453125, 11.8369140625, 13.66943359375, 15.501953125, 17.33447265625, 19.1669921875, 20.99951171875, 22.83203125, 24.66455078125, 26.4970703125, 28.32958984375, 30.162109375, 31.99462890625, 33.8271484375, 35.65966796875, 37.4921875, 39.32470703125, 41.1572265625, 42.98974609375, 44.822265625, 46.65478515625, 48.4873046875, 50.31982421875, 52.15234375, 53.98486328125, 55.8173828125, 57.64990234375, 59.482421875, 61.31494140625, 63.1474609375, 64.97998046875, 66.8125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 58.0, 432.0, 458.0, 60.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-499.60028076171875, -487.4222412109375, -475.2442321777344, -463.0661926269531, -450.88818359375, -438.71014404296875, -426.5321044921875, -414.35406494140625, -402.1760559082031, -389.9980163574219, -377.82000732421875, -365.6419677734375, -353.46392822265625, -341.2859191894531, -329.1078796386719, -316.92987060546875, -304.7518310546875, -292.57379150390625, -280.3957824707031, -268.2177429199219, -256.03973388671875, -243.8616943359375, -231.68365478515625, -219.50563049316406, -207.32760620117188, -195.1495819091797, -182.9715576171875, -170.79351806640625, -158.61549377441406, -146.43746948242188, -134.25942993164062, -122.08140563964844, -109.90335083007812, -97.72532653808594, -85.54729461669922, -73.3692626953125, -61.19123840332031, -49.01321029663086, -36.835182189941406, -24.657150268554688, -12.4791259765625, -0.3010978698730469, 11.876930236816406, 24.05495834350586, 36.23298645019531, 48.411014556884766, 60.58904266357422, 72.76707458496094, 84.94509887695312, 97.12312316894531, 109.30115509033203, 121.47918701171875, 133.65721130371094, 145.83523559570312, 158.01327514648438, 170.19129943847656, 182.36932373046875, 194.54734802246094, 206.72537231445312, 218.90341186523438, 231.08143615722656, 243.25946044921875, 255.4375, 267.61553955078125, 279.7935485839844]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 7.0, 5.0, 10.0, 9.0, 14.0, 15.0, 16.0, 22.0, 18.0, 26.0, 17.0, 39.0, 34.0, 46.0, 33.0, 43.0, 42.0, 35.0, 35.0, 44.0, 44.0, 40.0, 35.0, 41.0, 48.0, 35.0, 22.0, 31.0, 26.0, 26.0, 14.0, 21.0, 22.0, 16.0, 7.0, 9.0, 16.0, 9.0, 7.0, 4.0, 5.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.89879608154297, -51.96471405029297, -50.03063201904297, -48.09654998779297, -46.1624641418457, -44.2283821105957, -42.2943000793457, -40.3602180480957, -38.4261360168457, -36.4920539855957, -34.5579719543457, -32.62388610839844, -30.68980598449707, -28.755722045898438, -26.821640014648438, -24.887557983398438, -22.953474044799805, -21.019392013549805, -19.085308074951172, -17.151226043701172, -15.217144012451172, -13.283061027526855, -11.348978042602539, -9.414896011352539, -7.480813026428223, -5.5467305183410645, -3.612647771835327, -1.6785650253295898, 0.25551748275756836, 2.1895999908447266, 4.123682975769043, 6.057765007019043, 7.991847991943359, 9.925930976867676, 11.860013008117676, 13.794095993041992, 15.728178024291992, 17.662261962890625, 19.596343994140625, 21.530426025390625, 23.464508056640625, 25.398590087890625, 27.332674026489258, 29.266756057739258, 31.200838088989258, 33.13492202758789, 35.06900405883789, 37.00308609008789, 38.937171936035156, 40.871253967285156, 42.805335998535156, 44.739418029785156, 46.67350387573242, 48.60758590698242, 50.54166793823242, 52.47574996948242, 54.40983200073242, 56.34391403198242, 58.27799606323242, 60.21208190917969, 62.14616394042969, 64.08024597167969, 66.01432800292969, 67.94841003417969, 69.88249206542969]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 9.0, 6.0, 3.0, 11.0, 15.0, 21.0, 21.0, 24.0, 36.0, 27.0, 26.0, 36.0, 43.0, 37.0, 23.0, 36.0, 46.0, 38.0, 28.0, 39.0, 54.0, 46.0, 38.0, 35.0, 39.0, 39.0, 38.0, 15.0, 30.0, 21.0, 18.0, 17.0, 14.0, 10.0, 7.0, 10.0, 3.0, 4.0, 6.0, 2.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.604736328125, -10.25634765625, -9.907958984375, -9.5595703125, -9.211181640625, -8.86279296875, -8.514404296875, -8.166015625, -7.817626953125, -7.46923828125, -7.120849609375, -6.7724609375, -6.424072265625, -6.07568359375, -5.727294921875, -5.37890625, -5.030517578125, -4.68212890625, -4.333740234375, -3.9853515625, -3.636962890625, -3.28857421875, -2.940185546875, -2.591796875, -2.243408203125, -1.89501953125, -1.546630859375, -1.1982421875, -0.849853515625, -0.50146484375, -0.153076171875, 0.1953125, 0.543701171875, 0.89208984375, 1.240478515625, 1.5888671875, 1.937255859375, 2.28564453125, 2.634033203125, 2.982421875, 3.330810546875, 3.67919921875, 4.027587890625, 4.3759765625, 4.724365234375, 5.07275390625, 5.421142578125, 5.76953125, 6.117919921875, 6.46630859375, 6.814697265625, 7.1630859375, 7.511474609375, 7.85986328125, 8.208251953125, 8.556640625, 8.905029296875, 9.25341796875, 9.601806640625, 9.9501953125, 10.298583984375, 10.64697265625, 10.995361328125, 11.34375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 11.0, 4.0, 14.0, 27.0, 36.0, 42.0, 65.0, 97.0, 136.0, 213.0, 323.0, 452.0, 690.0, 971.0, 1425.0, 2006.0, 3080.0, 4744.0, 7262.0, 11478.0, 18028.0, 30144.0, 51135.0, 90022.0, 185515.0, 325507.0, 134375.0, 71484.0, 41531.0, 24430.0, 15330.0, 9548.0, 6184.0, 3889.0, 2740.0, 1777.0, 1167.0, 870.0, 584.0, 408.0, 247.0, 188.0, 135.0, 75.0, 55.0, 41.0, 26.0, 17.0, 16.0, 8.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.37890625, -2.30291748046875, -2.2269287109375, -2.15093994140625, -2.074951171875, -1.99896240234375, -1.9229736328125, -1.84698486328125, -1.77099609375, -1.69500732421875, -1.6190185546875, -1.54302978515625, -1.467041015625, -1.39105224609375, -1.3150634765625, -1.23907470703125, -1.1630859375, -1.08709716796875, -1.0111083984375, -0.93511962890625, -0.859130859375, -0.78314208984375, -0.7071533203125, -0.63116455078125, -0.55517578125, -0.47918701171875, -0.4031982421875, -0.32720947265625, -0.251220703125, -0.17523193359375, -0.0992431640625, -0.02325439453125, 0.052734375, 0.12872314453125, 0.2047119140625, 0.28070068359375, 0.356689453125, 0.43267822265625, 0.5086669921875, 0.58465576171875, 0.66064453125, 0.73663330078125, 0.8126220703125, 0.88861083984375, 0.964599609375, 1.04058837890625, 1.1165771484375, 1.19256591796875, 1.2685546875, 1.34454345703125, 1.4205322265625, 1.49652099609375, 1.572509765625, 1.64849853515625, 1.7244873046875, 1.80047607421875, 1.87646484375, 1.95245361328125, 2.0284423828125, 2.10443115234375, 2.180419921875, 2.25640869140625, 2.3323974609375, 2.40838623046875, 2.484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 0.0, 9.0, 6.0, 5.0, 9.0, 11.0, 14.0, 10.0, 14.0, 18.0, 20.0, 17.0, 22.0, 29.0, 27.0, 34.0, 41.0, 50.0, 52.0, 35.0, 43.0, 1058.0, 52.0, 44.0, 46.0, 39.0, 44.0, 38.0, 33.0, 32.0, 27.0, 32.0, 13.0, 13.0, 22.0, 14.0, 17.0, 14.0, 7.0, 3.0, 2.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.98046875, -7.75146484375, -7.5224609375, -7.29345703125, -7.064453125, -6.83544921875, -6.6064453125, -6.37744140625, -6.1484375, -5.91943359375, -5.6904296875, -5.46142578125, -5.232421875, -5.00341796875, -4.7744140625, -4.54541015625, -4.31640625, -4.08740234375, -3.8583984375, -3.62939453125, -3.400390625, -3.17138671875, -2.9423828125, -2.71337890625, -2.484375, -2.25537109375, -2.0263671875, -1.79736328125, -1.568359375, -1.33935546875, -1.1103515625, -0.88134765625, -0.65234375, -0.42333984375, -0.1943359375, 0.03466796875, 0.263671875, 0.49267578125, 0.7216796875, 0.95068359375, 1.1796875, 1.40869140625, 1.6376953125, 1.86669921875, 2.095703125, 2.32470703125, 2.5537109375, 2.78271484375, 3.01171875, 3.24072265625, 3.4697265625, 3.69873046875, 3.927734375, 4.15673828125, 4.3857421875, 4.61474609375, 4.84375, 5.07275390625, 5.3017578125, 5.53076171875, 5.759765625, 5.98876953125, 6.2177734375, 6.44677734375, 6.67578125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 8.0, 5.0, 5.0, 13.0, 20.0, 26.0, 38.0, 75.0, 114.0, 167.0, 263.0, 439.0, 697.0, 1109.0, 1824.0, 2854.0, 4791.0, 7360.0, 12097.0, 19921.0, 34567.0, 61239.0, 122583.0, 1396629.0, 217455.0, 93180.0, 48554.0, 27593.0, 16449.0, 10278.0, 6320.0, 3921.0, 2482.0, 1520.0, 952.0, 593.0, 368.0, 250.0, 139.0, 91.0, 60.0, 32.0, 15.0, 17.0, 14.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.78125, -2.70135498046875, -2.6214599609375, -2.54156494140625, -2.461669921875, -2.38177490234375, -2.3018798828125, -2.22198486328125, -2.14208984375, -2.06219482421875, -1.9822998046875, -1.90240478515625, -1.822509765625, -1.74261474609375, -1.6627197265625, -1.58282470703125, -1.5029296875, -1.42303466796875, -1.3431396484375, -1.26324462890625, -1.183349609375, -1.10345458984375, -1.0235595703125, -0.94366455078125, -0.86376953125, -0.78387451171875, -0.7039794921875, -0.62408447265625, -0.544189453125, -0.46429443359375, -0.3843994140625, -0.30450439453125, -0.224609375, -0.14471435546875, -0.0648193359375, 0.01507568359375, 0.094970703125, 0.17486572265625, 0.2547607421875, 0.33465576171875, 0.41455078125, 0.49444580078125, 0.5743408203125, 0.65423583984375, 0.734130859375, 0.81402587890625, 0.8939208984375, 0.97381591796875, 1.0537109375, 1.13360595703125, 1.2135009765625, 1.29339599609375, 1.373291015625, 1.45318603515625, 1.5330810546875, 1.61297607421875, 1.69287109375, 1.77276611328125, 1.8526611328125, 1.93255615234375, 2.012451171875, 2.09234619140625, 2.1722412109375, 2.25213623046875, 2.33203125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 3.0, 7.0, 7.0, 8.0, 17.0, 23.0, 26.0, 26.0, 46.0, 53.0, 79.0, 105.0, 124.0, 101.0, 92.0, 61.0, 49.0, 35.0, 17.0, 19.0, 13.0, 15.0, 13.0, 7.0, 9.0, 3.0, 2.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015707015991210938, -0.0015177279710769653, -0.001464754343032837, -0.0014117807149887085, -0.00135880708694458, -0.0013058334589004517, -0.0012528598308563232, -0.0011998862028121948, -0.0011469125747680664, -0.001093938946723938, -0.0010409653186798096, -0.0009879916906356812, -0.0009350180625915527, -0.0008820444345474243, -0.0008290708065032959, -0.0007760971784591675, -0.0007231235504150391, -0.0006701499223709106, -0.0006171762943267822, -0.0005642026662826538, -0.0005112290382385254, -0.00045825541019439697, -0.00040528178215026855, -0.00035230815410614014, -0.0002993345260620117, -0.0002463608980178833, -0.00019338726997375488, -0.00014041364192962646, -8.744001388549805e-05, -3.446638584136963e-05, 1.850724220275879e-05, 7.148087024688721e-05, 0.00012445449829101562, 0.00017742812633514404, 0.00023040175437927246, 0.0002833753824234009, 0.0003363490104675293, 0.0003893226385116577, 0.00044229626655578613, 0.0004952698945999146, 0.000548243522644043, 0.0006012171506881714, 0.0006541907787322998, 0.0007071644067764282, 0.0007601380348205566, 0.0008131116628646851, 0.0008660852909088135, 0.0009190589189529419, 0.0009720325469970703, 0.0010250061750411987, 0.0010779798030853271, 0.0011309534311294556, 0.001183927059173584, 0.0012369006872177124, 0.0012898743152618408, 0.0013428479433059692, 0.0013958215713500977, 0.001448795199394226, 0.0015017688274383545, 0.001554742455482483, 0.0016077160835266113, 0.0016606897115707397, 0.0017136633396148682, 0.0017666369676589966, 0.001819610595703125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 4.0, 6.0, 9.0, 10.0, 10.0, 19.0, 14.0, 30.0, 41.0, 51.0, 47.0, 72.0, 121.0, 220.0, 353.0, 1089.0, 789650.0, 254894.0, 960.0, 301.0, 180.0, 133.0, 75.0, 71.0, 35.0, 27.0, 20.0, 14.0, 14.0, 14.0, 11.0, 8.0, 5.0, 7.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.032257080078125, -0.03127789497375488, -0.030298709869384766, -0.02931952476501465, -0.02834033966064453, -0.027361154556274414, -0.026381969451904297, -0.02540278434753418, -0.024423599243164062, -0.023444414138793945, -0.022465229034423828, -0.02148604393005371, -0.020506858825683594, -0.019527673721313477, -0.01854848861694336, -0.017569303512573242, -0.016590118408203125, -0.015610933303833008, -0.01463174819946289, -0.013652563095092773, -0.012673377990722656, -0.011694192886352539, -0.010715007781982422, -0.009735822677612305, -0.008756637573242188, -0.00777745246887207, -0.006798267364501953, -0.005819082260131836, -0.004839897155761719, -0.0038607120513916016, -0.0028815269470214844, -0.0019023418426513672, -0.00092315673828125, 5.602836608886719e-05, 0.0010352134704589844, 0.0020143985748291016, 0.0029935836791992188, 0.003972768783569336, 0.004951953887939453, 0.00593113899230957, 0.0069103240966796875, 0.007889509201049805, 0.008868694305419922, 0.009847879409790039, 0.010827064514160156, 0.011806249618530273, 0.01278543472290039, 0.013764619827270508, 0.014743804931640625, 0.015722990036010742, 0.01670217514038086, 0.017681360244750977, 0.018660545349121094, 0.01963973045349121, 0.020618915557861328, 0.021598100662231445, 0.022577285766601562, 0.02355647087097168, 0.024535655975341797, 0.025514841079711914, 0.02649402618408203, 0.02747321128845215, 0.028452396392822266, 0.029431581497192383, 0.0304107666015625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 12.0, 31.0, 59.0, 92.0, 171.0, 185.0, 181.0, 118.0, 88.0, 42.0, 17.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004482787335291505, -0.0004132545436732471, -0.0003782303538173437, -0.0003432061639614403, -0.00030818197410553694, -0.00027315778424963355, -0.00023813362349756062, -0.00020310943364165723, -0.00016808524378575385, -0.00013306105392985046, -9.803687134990469e-05, -6.301268876995891e-05, -2.7988498914055526e-05, 7.035690941847861e-06, 4.205986624583602e-05, 7.70840561017394e-05, 0.0001121082459576428, 0.00014713243581354618, 0.00018215662566944957, 0.00021718080097343773, 0.00025220500538125634, 0.00028722919523715973, 0.00032225335598923266, 0.00035727754584513605, 0.00039230173570103943, 0.0004273259255569428, 0.0004623501154128462, 0.0004973742761649191, 0.0005323984660208225, 0.0005674226558767259, 0.0006024468457326293, 0.0006374710355885327, 0.0006724952254444361, 0.0007075194153003395, 0.0007425436051562428, 0.0007775677950121462, 0.0008125919848680496, 0.000847616174723953, 0.0008826403645798564, 0.0009176644962280989, 0.0009526887442916632, 0.0009877128759399056, 0.00102273712400347, 0.0010577612556517124, 0.0010927855037152767, 0.0011278096353635192, 0.0011628338834270835, 0.001197858015075326, 0.0012328822631388903, 0.0012679063947871327, 0.001302930642850697, 0.0013379547744989395, 0.0013729790225625038, 0.0014080031542107463, 0.0014430274022743106, 0.001478051533922553, 0.0015130756655707955, 0.001548099797219038, 0.0015831240452826023, 0.0016181481769308448, 0.001653172424994409, 0.0016881965566426516, 0.0017232208047062159, 0.0017582449363544583, 0.0017932691844180226]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 5.0, 11.0, 10.0, 12.0, 14.0, 16.0, 22.0, 24.0, 29.0, 31.0, 23.0, 28.0, 25.0, 41.0, 32.0, 29.0, 40.0, 38.0, 46.0, 36.0, 37.0, 46.0, 33.0, 25.0, 28.0, 39.0, 34.0, 36.0, 29.0, 21.0, 18.0, 26.0, 18.0, 11.0, 11.0, 12.0, 5.0, 9.0, 7.0, 5.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0006909370422363281, -0.0006699580699205399, -0.0006489790976047516, -0.0006280001252889633, -0.000607021152973175, -0.0005860421806573868, -0.0005650632083415985, -0.0005440842360258102, -0.000523105263710022, -0.0005021262913942337, -0.00048114731907844543, -0.00046016834676265717, -0.0004391893744468689, -0.00041821040213108063, -0.00039723142981529236, -0.0003762524574995041, -0.0003552734851837158, -0.00033429451286792755, -0.0003133155405521393, -0.000292336568236351, -0.00027135759592056274, -0.0002503786236047745, -0.0002293996512889862, -0.00020842067897319794, -0.00018744170665740967, -0.0001664627343416214, -0.00014548376202583313, -0.00012450478971004486, -0.00010352581739425659, -8.254684507846832e-05, -6.156787276268005e-05, -4.0588900446891785e-05, -1.9609928131103516e-05, 1.3690441846847534e-06, 2.2348016500473022e-05, 4.332698881626129e-05, 6.430596113204956e-05, 8.528493344783783e-05, 0.0001062639057636261, 0.00012724287807941437, 0.00014822185039520264, 0.0001692008227109909, 0.00019017979502677917, 0.00021115876734256744, 0.0002321377396583557, 0.000253116711974144, 0.00027409568428993225, 0.0002950746566057205, 0.0003160536289215088, 0.00033703260123729706, 0.00035801157355308533, 0.0003789905458688736, 0.00039996951818466187, 0.00042094849050045013, 0.0004419274628162384, 0.00046290643513202667, 0.00048388540744781494, 0.0005048643797636032, 0.0005258433520793915, 0.0005468223243951797, 0.000567801296710968, 0.0005887802690267563, 0.0006097592413425446, 0.0006307382136583328, 0.0006517171859741211]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 9.0, 6.0, 3.0, 11.0, 15.0, 21.0, 21.0, 24.0, 36.0, 27.0, 26.0, 36.0, 43.0, 37.0, 23.0, 36.0, 46.0, 38.0, 28.0, 39.0, 54.0, 46.0, 38.0, 35.0, 39.0, 39.0, 38.0, 15.0, 30.0, 21.0, 18.0, 17.0, 14.0, 10.0, 7.0, 10.0, 3.0, 4.0, 6.0, 2.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.604736328125, -10.25634765625, -9.907958984375, -9.5595703125, -9.211181640625, -8.86279296875, -8.514404296875, -8.166015625, -7.817626953125, -7.46923828125, -7.120849609375, -6.7724609375, -6.424072265625, -6.07568359375, -5.727294921875, -5.37890625, -5.030517578125, -4.68212890625, -4.333740234375, -3.9853515625, -3.636962890625, -3.28857421875, -2.940185546875, -2.591796875, -2.243408203125, -1.89501953125, -1.546630859375, -1.1982421875, -0.849853515625, -0.50146484375, -0.153076171875, 0.1953125, 0.543701171875, 0.89208984375, 1.240478515625, 1.5888671875, 1.937255859375, 2.28564453125, 2.634033203125, 2.982421875, 3.330810546875, 3.67919921875, 4.027587890625, 4.3759765625, 4.724365234375, 5.07275390625, 5.421142578125, 5.76953125, 6.117919921875, 6.46630859375, 6.814697265625, 7.1630859375, 7.511474609375, 7.85986328125, 8.208251953125, 8.556640625, 8.905029296875, 9.25341796875, 9.601806640625, 9.9501953125, 10.298583984375, 10.64697265625, 10.995361328125, 11.34375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 12.0, 4.0, 8.0, 15.0, 23.0, 18.0, 25.0, 44.0, 53.0, 84.0, 112.0, 148.0, 244.0, 399.0, 732.0, 1280.0, 2453.0, 5004.0, 10679.0, 25415.0, 68400.0, 233418.0, 475855.0, 142778.0, 46652.0, 18276.0, 8076.0, 3822.0, 1916.0, 1004.0, 586.0, 330.0, 214.0, 141.0, 98.0, 48.0, 45.0, 26.0, 29.0, 30.0, 14.0, 12.0, 12.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1328125, -13.6815185546875, -13.230224609375, -12.7789306640625, -12.32763671875, -11.8763427734375, -11.425048828125, -10.9737548828125, -10.5224609375, -10.0711669921875, -9.619873046875, -9.1685791015625, -8.71728515625, -8.2659912109375, -7.814697265625, -7.3634033203125, -6.912109375, -6.4608154296875, -6.009521484375, -5.5582275390625, -5.10693359375, -4.6556396484375, -4.204345703125, -3.7530517578125, -3.3017578125, -2.8504638671875, -2.399169921875, -1.9478759765625, -1.49658203125, -1.0452880859375, -0.593994140625, -0.1427001953125, 0.30859375, 0.7598876953125, 1.211181640625, 1.6624755859375, 2.11376953125, 2.5650634765625, 3.016357421875, 3.4676513671875, 3.9189453125, 4.3702392578125, 4.821533203125, 5.2728271484375, 5.72412109375, 6.1754150390625, 6.626708984375, 7.0780029296875, 7.529296875, 7.9805908203125, 8.431884765625, 8.8831787109375, 9.33447265625, 9.7857666015625, 10.237060546875, 10.6883544921875, 11.1396484375, 11.5909423828125, 12.042236328125, 12.4935302734375, 12.94482421875, 13.3961181640625, 13.847412109375, 14.2987060546875, 14.75]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 7.0, 5.0, 8.0, 6.0, 9.0, 11.0, 17.0, 20.0, 23.0, 22.0, 22.0, 32.0, 29.0, 34.0, 39.0, 44.0, 65.0, 90.0, 165.0, 1464.0, 299.0, 140.0, 80.0, 61.0, 45.0, 45.0, 41.0, 35.0, 32.0, 31.0, 26.0, 15.0, 16.0, 15.0, 18.0, 11.0, 7.0, 5.0, 5.0, 4.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.6875, -32.75, -31.8125, -30.875, -29.9375, -29.0, -28.0625, -27.125, -26.1875, -25.25, -24.3125, -23.375, -22.4375, -21.5, -20.5625, -19.625, -18.6875, -17.75, -16.8125, -15.875, -14.9375, -14.0, -13.0625, -12.125, -11.1875, -10.25, -9.3125, -8.375, -7.4375, -6.5, -5.5625, -4.625, -3.6875, -2.75, -1.8125, -0.875, 0.0625, 1.0, 1.9375, 2.875, 3.8125, 4.75, 5.6875, 6.625, 7.5625, 8.5, 9.4375, 10.375, 11.3125, 12.25, 13.1875, 14.125, 15.0625, 16.0, 16.9375, 17.875, 18.8125, 19.75, 20.6875, 21.625, 22.5625, 23.5, 24.4375, 25.375, 26.3125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 17.0, 11.0, 19.0, 23.0, 31.0, 38.0, 68.0, 89.0, 148.0, 260.0, 426.0, 1173.0, 7141.0, 140189.0, 2922461.0, 67232.0, 4429.0, 918.0, 367.0, 220.0, 133.0, 93.0, 61.0, 38.0, 32.0, 24.0, 11.0, 5.0, 8.0, 7.0, 4.0, 12.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-64.625, -62.89697265625, -61.1689453125, -59.44091796875, -57.712890625, -55.98486328125, -54.2568359375, -52.52880859375, -50.80078125, -49.07275390625, -47.3447265625, -45.61669921875, -43.888671875, -42.16064453125, -40.4326171875, -38.70458984375, -36.9765625, -35.24853515625, -33.5205078125, -31.79248046875, -30.064453125, -28.33642578125, -26.6083984375, -24.88037109375, -23.15234375, -21.42431640625, -19.6962890625, -17.96826171875, -16.240234375, -14.51220703125, -12.7841796875, -11.05615234375, -9.328125, -7.60009765625, -5.8720703125, -4.14404296875, -2.416015625, -0.68798828125, 1.0400390625, 2.76806640625, 4.49609375, 6.22412109375, 7.9521484375, 9.68017578125, 11.408203125, 13.13623046875, 14.8642578125, 16.59228515625, 18.3203125, 20.04833984375, 21.7763671875, 23.50439453125, 25.232421875, 26.96044921875, 28.6884765625, 30.41650390625, 32.14453125, 33.87255859375, 35.6005859375, 37.32861328125, 39.056640625, 40.78466796875, 42.5126953125, 44.24072265625, 45.96875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 586.0, 419.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-586.7003784179688, -574.4678955078125, -562.2354125976562, -550.0028686523438, -537.7703857421875, -525.5379028320312, -513.305419921875, -501.0729064941406, -488.84039306640625, -476.60791015625, -464.3753967285156, -452.1429138183594, -439.910400390625, -427.67791748046875, -415.4454040527344, -403.2129211425781, -390.98040771484375, -378.7479248046875, -366.5154113769531, -354.2829284667969, -342.0504150390625, -329.81793212890625, -317.5854187011719, -305.3529357910156, -293.1204528808594, -280.8879699707031, -268.65545654296875, -256.4229736328125, -244.19046020507812, -231.9579620361328, -219.7254638671875, -207.49298095703125, -195.26048278808594, -183.02798461914062, -170.7954864501953, -158.56298828125, -146.3304901123047, -134.09799194335938, -121.8655014038086, -109.63300323486328, -97.40050506591797, -85.16800689697266, -72.93550872802734, -60.7030143737793, -48.470516204833984, -36.23801803588867, -24.005523681640625, -11.773025512695312, 0.45947265625, 12.691969871520996, 24.924467086791992, 37.15696334838867, 49.389461517333984, 61.6219596862793, 73.85445404052734, 86.08695220947266, 98.31945037841797, 110.55194854736328, 122.7844467163086, 135.01693725585938, 147.2494354248047, 159.48193359375, 171.7144317626953, 183.94692993164062, 196.17942810058594]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 7.0, 8.0, 12.0, 13.0, 10.0, 8.0, 32.0, 20.0, 38.0, 26.0, 38.0, 37.0, 36.0, 54.0, 41.0, 51.0, 41.0, 46.0, 58.0, 33.0, 41.0, 36.0, 23.0, 37.0, 27.0, 26.0, 33.0, 28.0, 20.0, 13.0, 19.0, 14.0, 16.0, 3.0, 10.0, 9.0, 11.0, 2.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.1690902709961, -70.10309600830078, -68.037109375, -65.97111511230469, -63.905120849609375, -61.83912658691406, -59.773136138916016, -57.70714569091797, -55.641151428222656, -53.575157165527344, -51.5091667175293, -49.44317626953125, -47.37718200683594, -45.311187744140625, -43.24519729614258, -41.17920684814453, -39.11321258544922, -37.047218322753906, -34.98122787475586, -32.91523742675781, -30.8492431640625, -28.78325080871582, -26.71725845336914, -24.65126609802246, -22.58527374267578, -20.5192813873291, -18.453289031982422, -16.387296676635742, -14.321304321289062, -12.255311965942383, -10.189319610595703, -8.123327255249023, -6.057338714599609, -3.9913463592529297, -1.92535400390625, 0.1406383514404297, 2.2066307067871094, 4.272623062133789, 6.338615417480469, 8.404607772827148, 10.470600128173828, 12.536592483520508, 14.602584838867188, 16.668577194213867, 18.734569549560547, 20.800561904907227, 22.866554260253906, 24.932546615600586, 26.998538970947266, 29.064531326293945, 31.130523681640625, 33.19651794433594, 35.262508392333984, 37.32849884033203, 39.394493103027344, 41.460487365722656, 43.5264778137207, 45.59246826171875, 47.65846252441406, 49.724456787109375, 51.79044723510742, 53.85643768310547, 55.92243194580078, 57.988426208496094, 60.05441665649414]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 6.0, 8.0, 12.0, 8.0, 7.0, 10.0, 22.0, 24.0, 30.0, 20.0, 28.0, 32.0, 38.0, 41.0, 28.0, 33.0, 32.0, 36.0, 47.0, 41.0, 48.0, 33.0, 42.0, 42.0, 31.0, 43.0, 32.0, 29.0, 28.0, 24.0, 26.0, 20.0, 15.0, 13.0, 6.0, 11.0, 7.0, 6.0, 7.0, 6.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.828125, -10.47216796875, -10.1162109375, -9.76025390625, -9.404296875, -9.04833984375, -8.6923828125, -8.33642578125, -7.98046875, -7.62451171875, -7.2685546875, -6.91259765625, -6.556640625, -6.20068359375, -5.8447265625, -5.48876953125, -5.1328125, -4.77685546875, -4.4208984375, -4.06494140625, -3.708984375, -3.35302734375, -2.9970703125, -2.64111328125, -2.28515625, -1.92919921875, -1.5732421875, -1.21728515625, -0.861328125, -0.50537109375, -0.1494140625, 0.20654296875, 0.5625, 0.91845703125, 1.2744140625, 1.63037109375, 1.986328125, 2.34228515625, 2.6982421875, 3.05419921875, 3.41015625, 3.76611328125, 4.1220703125, 4.47802734375, 4.833984375, 5.18994140625, 5.5458984375, 5.90185546875, 6.2578125, 6.61376953125, 6.9697265625, 7.32568359375, 7.681640625, 8.03759765625, 8.3935546875, 8.74951171875, 9.10546875, 9.46142578125, 9.8173828125, 10.17333984375, 10.529296875, 10.88525390625, 11.2412109375, 11.59716796875, 11.953125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 3.0, 10.0, 9.0, 12.0, 11.0, 15.0, 16.0, 18.0, 25.0, 29.0, 31.0, 44.0, 87.0, 179.0, 483.0, 1582.0, 6037.0, 39708.0, 1047218.0, 2933597.0, 148285.0, 12687.0, 2726.0, 802.0, 260.0, 117.0, 64.0, 45.0, 32.0, 28.0, 19.0, 22.0, 10.0, 12.0, 11.0, 12.0, 7.0, 4.0, 3.0, 5.0, 1.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.625, -32.5126953125, -31.400390625, -30.2880859375, -29.17578125, -28.0634765625, -26.951171875, -25.8388671875, -24.7265625, -23.6142578125, -22.501953125, -21.3896484375, -20.27734375, -19.1650390625, -18.052734375, -16.9404296875, -15.828125, -14.7158203125, -13.603515625, -12.4912109375, -11.37890625, -10.2666015625, -9.154296875, -8.0419921875, -6.9296875, -5.8173828125, -4.705078125, -3.5927734375, -2.48046875, -1.3681640625, -0.255859375, 0.8564453125, 1.96875, 3.0810546875, 4.193359375, 5.3056640625, 6.41796875, 7.5302734375, 8.642578125, 9.7548828125, 10.8671875, 11.9794921875, 13.091796875, 14.2041015625, 15.31640625, 16.4287109375, 17.541015625, 18.6533203125, 19.765625, 20.8779296875, 21.990234375, 23.1025390625, 24.21484375, 25.3271484375, 26.439453125, 27.5517578125, 28.6640625, 29.7763671875, 30.888671875, 32.0009765625, 33.11328125, 34.2255859375, 35.337890625, 36.4501953125, 37.5625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 17.0, 21.0, 16.0, 28.0, 28.0, 57.0, 70.0, 94.0, 123.0, 176.0, 257.0, 339.0, 431.0, 518.0, 477.0, 385.0, 232.0, 210.0, 152.0, 112.0, 48.0, 53.0, 39.0, 49.0, 18.0, 21.0, 23.0, 12.0, 11.0, 10.0, 5.0, 6.0, 0.0, 3.0, 2.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.2418212890625, -14.710205078125, -14.1785888671875, -13.64697265625, -13.1153564453125, -12.583740234375, -12.0521240234375, -11.5205078125, -10.9888916015625, -10.457275390625, -9.9256591796875, -9.39404296875, -8.8624267578125, -8.330810546875, -7.7991943359375, -7.267578125, -6.7359619140625, -6.204345703125, -5.6727294921875, -5.14111328125, -4.6094970703125, -4.077880859375, -3.5462646484375, -3.0146484375, -2.4830322265625, -1.951416015625, -1.4197998046875, -0.88818359375, -0.3565673828125, 0.175048828125, 0.7066650390625, 1.23828125, 1.7698974609375, 2.301513671875, 2.8331298828125, 3.36474609375, 3.8963623046875, 4.427978515625, 4.9595947265625, 5.4912109375, 6.0228271484375, 6.554443359375, 7.0860595703125, 7.61767578125, 8.1492919921875, 8.680908203125, 9.2125244140625, 9.744140625, 10.2757568359375, 10.807373046875, 11.3389892578125, 11.87060546875, 12.4022216796875, 12.933837890625, 13.4654541015625, 13.9970703125, 14.5286865234375, 15.060302734375, 15.5919189453125, 16.12353515625, 16.6551513671875, 17.186767578125, 17.7183837890625, 18.25]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 8.0, 6.0, 7.0, 11.0, 23.0, 23.0, 22.0, 51.0, 54.0, 91.0, 135.0, 232.0, 427.0, 1326.0, 4981.0, 24011.0, 179879.0, 3122031.0, 784065.0, 61556.0, 11129.0, 2612.0, 790.0, 329.0, 173.0, 111.0, 51.0, 39.0, 30.0, 18.0, 19.0, 10.0, 8.0, 9.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.84375, -36.65185546875, -35.4599609375, -34.26806640625, -33.076171875, -31.88427734375, -30.6923828125, -29.50048828125, -28.30859375, -27.11669921875, -25.9248046875, -24.73291015625, -23.541015625, -22.34912109375, -21.1572265625, -19.96533203125, -18.7734375, -17.58154296875, -16.3896484375, -15.19775390625, -14.005859375, -12.81396484375, -11.6220703125, -10.43017578125, -9.23828125, -8.04638671875, -6.8544921875, -5.66259765625, -4.470703125, -3.27880859375, -2.0869140625, -0.89501953125, 0.296875, 1.48876953125, 2.6806640625, 3.87255859375, 5.064453125, 6.25634765625, 7.4482421875, 8.64013671875, 9.83203125, 11.02392578125, 12.2158203125, 13.40771484375, 14.599609375, 15.79150390625, 16.9833984375, 18.17529296875, 19.3671875, 20.55908203125, 21.7509765625, 22.94287109375, 24.134765625, 25.32666015625, 26.5185546875, 27.71044921875, 28.90234375, 30.09423828125, 31.2861328125, 32.47802734375, 33.669921875, 34.86181640625, 36.0537109375, 37.24560546875, 38.4375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 28.0, 158.0, 435.0, 317.0, 63.0, 10.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-407.2605285644531, -398.8970642089844, -390.53363037109375, -382.170166015625, -373.80670166015625, -365.4432373046875, -357.0798034667969, -348.7163391113281, -340.3529052734375, -331.98944091796875, -323.6260070800781, -315.2625427246094, -306.8990783691406, -298.53564453125, -290.17218017578125, -281.8087158203125, -273.44525146484375, -265.081787109375, -256.7183532714844, -248.35488891601562, -239.99142456054688, -231.6279754638672, -223.2645263671875, -214.90106201171875, -206.53761291503906, -198.17416381835938, -189.81069946289062, -181.44725036621094, -173.08380126953125, -164.7203369140625, -156.3568878173828, -147.99343872070312, -139.6299591064453, -131.26651000976562, -122.90304565429688, -114.53959655761719, -106.17613983154297, -97.81268310546875, -89.44923400878906, -81.08577728271484, -72.72232055664062, -64.3588638305664, -55.99541091918945, -47.6319580078125, -39.26850128173828, -30.905044555664062, -22.54159164428711, -14.178138732910156, -5.8146820068359375, 2.5487728118896484, 10.912227630615234, 19.27568244934082, 27.639137268066406, 36.002593994140625, 44.36604690551758, 52.72949981689453, 61.09295654296875, 69.45641326904297, 77.81986999511719, 86.18331909179688, 94.5467758178711, 102.91023254394531, 111.273681640625, 119.63713836669922, 128.00059509277344]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 4.0, 8.0, 8.0, 16.0, 17.0, 10.0, 11.0, 17.0, 28.0, 21.0, 27.0, 31.0, 25.0, 29.0, 27.0, 34.0, 38.0, 36.0, 56.0, 40.0, 33.0, 54.0, 37.0, 40.0, 31.0, 31.0, 38.0, 33.0, 22.0, 36.0, 24.0, 35.0, 16.0, 13.0, 16.0, 10.0, 6.0, 7.0, 3.0, 7.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-53.63995361328125, -51.88966751098633, -50.13938522338867, -48.38909912109375, -46.638816833496094, -44.88853073120117, -43.13824462890625, -41.387962341308594, -39.63767623901367, -37.88739013671875, -36.137107849121094, -34.38682174682617, -32.63653564453125, -30.886253356933594, -29.135967254638672, -27.385683059692383, -25.635398864746094, -23.885114669799805, -22.134830474853516, -20.384544372558594, -18.634260177612305, -16.883975982666016, -15.13369083404541, -13.383405685424805, -11.633121490478516, -9.882837295532227, -8.132552146911621, -6.382267475128174, -4.631982803344727, -2.8816986083984375, -1.131413459777832, 0.6188716888427734, 2.3691558837890625, 4.11944055557251, 5.869725227355957, 7.620009899139404, 9.370294570922852, 11.12057876586914, 12.870863914489746, 14.621149063110352, 16.37143325805664, 18.12171745300293, 19.87200164794922, 21.62228775024414, 23.37257194519043, 25.12285614013672, 26.87314224243164, 28.62342643737793, 30.37371063232422, 32.12399673461914, 33.8742790222168, 35.62456512451172, 37.374847412109375, 39.1251335144043, 40.87541961669922, 42.625701904296875, 44.3759880065918, 46.12627410888672, 47.876556396484375, 49.6268424987793, 51.37712860107422, 53.127410888671875, 54.8776969909668, 56.62798309326172, 58.378265380859375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 7.0, 2.0, 7.0, 3.0, 9.0, 10.0, 10.0, 9.0, 11.0, 18.0, 9.0, 26.0, 26.0, 24.0, 28.0, 28.0, 22.0, 22.0, 38.0, 32.0, 31.0, 32.0, 31.0, 38.0, 54.0, 45.0, 35.0, 32.0, 35.0, 34.0, 28.0, 29.0, 29.0, 23.0, 25.0, 19.0, 25.0, 20.0, 10.0, 12.0, 19.0, 13.0, 12.0, 11.0, 6.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.8125, -10.4697265625, -10.126953125, -9.7841796875, -9.44140625, -9.0986328125, -8.755859375, -8.4130859375, -8.0703125, -7.7275390625, -7.384765625, -7.0419921875, -6.69921875, -6.3564453125, -6.013671875, -5.6708984375, -5.328125, -4.9853515625, -4.642578125, -4.2998046875, -3.95703125, -3.6142578125, -3.271484375, -2.9287109375, -2.5859375, -2.2431640625, -1.900390625, -1.5576171875, -1.21484375, -0.8720703125, -0.529296875, -0.1865234375, 0.15625, 0.4990234375, 0.841796875, 1.1845703125, 1.52734375, 1.8701171875, 2.212890625, 2.5556640625, 2.8984375, 3.2412109375, 3.583984375, 3.9267578125, 4.26953125, 4.6123046875, 4.955078125, 5.2978515625, 5.640625, 5.9833984375, 6.326171875, 6.6689453125, 7.01171875, 7.3544921875, 7.697265625, 8.0400390625, 8.3828125, 8.7255859375, 9.068359375, 9.4111328125, 9.75390625, 10.0966796875, 10.439453125, 10.7822265625, 11.125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 5.0, 11.0, 3.0, 12.0, 18.0, 23.0, 43.0, 44.0, 79.0, 105.0, 157.0, 248.0, 320.0, 481.0, 676.0, 1039.0, 1566.0, 2387.0, 3589.0, 5610.0, 8568.0, 13075.0, 20368.0, 31751.0, 49570.0, 81773.0, 154699.0, 333046.0, 135035.0, 74283.0, 46251.0, 28992.0, 19140.0, 12369.0, 7955.0, 5186.0, 3303.0, 2237.0, 1472.0, 1052.0, 637.0, 431.0, 289.0, 215.0, 138.0, 76.0, 70.0, 51.0, 44.0, 22.0, 10.0, 16.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-2.4453125, -2.369873046875, -2.29443359375, -2.218994140625, -2.1435546875, -2.068115234375, -1.99267578125, -1.917236328125, -1.841796875, -1.766357421875, -1.69091796875, -1.615478515625, -1.5400390625, -1.464599609375, -1.38916015625, -1.313720703125, -1.23828125, -1.162841796875, -1.08740234375, -1.011962890625, -0.9365234375, -0.861083984375, -0.78564453125, -0.710205078125, -0.634765625, -0.559326171875, -0.48388671875, -0.408447265625, -0.3330078125, -0.257568359375, -0.18212890625, -0.106689453125, -0.03125, 0.044189453125, 0.11962890625, 0.195068359375, 0.2705078125, 0.345947265625, 0.42138671875, 0.496826171875, 0.572265625, 0.647705078125, 0.72314453125, 0.798583984375, 0.8740234375, 0.949462890625, 1.02490234375, 1.100341796875, 1.17578125, 1.251220703125, 1.32666015625, 1.402099609375, 1.4775390625, 1.552978515625, 1.62841796875, 1.703857421875, 1.779296875, 1.854736328125, 1.93017578125, 2.005615234375, 2.0810546875, 2.156494140625, 2.23193359375, 2.307373046875, 2.3828125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 10.0, 11.0, 13.0, 15.0, 16.0, 22.0, 22.0, 31.0, 33.0, 26.0, 39.0, 47.0, 36.0, 53.0, 43.0, 34.0, 1066.0, 47.0, 53.0, 46.0, 48.0, 58.0, 38.0, 30.0, 41.0, 17.0, 26.0, 20.0, 13.0, 11.0, 10.0, 15.0, 11.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.057373046875, -7.77880859375, -7.500244140625, -7.2216796875, -6.943115234375, -6.66455078125, -6.385986328125, -6.107421875, -5.828857421875, -5.55029296875, -5.271728515625, -4.9931640625, -4.714599609375, -4.43603515625, -4.157470703125, -3.87890625, -3.600341796875, -3.32177734375, -3.043212890625, -2.7646484375, -2.486083984375, -2.20751953125, -1.928955078125, -1.650390625, -1.371826171875, -1.09326171875, -0.814697265625, -0.5361328125, -0.257568359375, 0.02099609375, 0.299560546875, 0.578125, 0.856689453125, 1.13525390625, 1.413818359375, 1.6923828125, 1.970947265625, 2.24951171875, 2.528076171875, 2.806640625, 3.085205078125, 3.36376953125, 3.642333984375, 3.9208984375, 4.199462890625, 4.47802734375, 4.756591796875, 5.03515625, 5.313720703125, 5.59228515625, 5.870849609375, 6.1494140625, 6.427978515625, 6.70654296875, 6.985107421875, 7.263671875, 7.542236328125, 7.82080078125, 8.099365234375, 8.3779296875, 8.656494140625, 8.93505859375, 9.213623046875, 9.4921875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 10.0, 20.0, 20.0, 22.0, 58.0, 82.0, 114.0, 186.0, 273.0, 482.0, 735.0, 1179.0, 2050.0, 3475.0, 5661.0, 9788.0, 16599.0, 29577.0, 55754.0, 113268.0, 1370605.0, 266882.0, 102526.0, 51661.0, 28040.0, 15698.0, 8961.0, 5283.0, 3222.0, 1900.0, 1158.0, 678.0, 416.0, 261.0, 149.0, 121.0, 77.0, 48.0, 41.0, 17.0, 11.0, 12.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.921875, -2.82427978515625, -2.7266845703125, -2.62908935546875, -2.531494140625, -2.43389892578125, -2.3363037109375, -2.23870849609375, -2.14111328125, -2.04351806640625, -1.9459228515625, -1.84832763671875, -1.750732421875, -1.65313720703125, -1.5555419921875, -1.45794677734375, -1.3603515625, -1.26275634765625, -1.1651611328125, -1.06756591796875, -0.969970703125, -0.87237548828125, -0.7747802734375, -0.67718505859375, -0.57958984375, -0.48199462890625, -0.3843994140625, -0.28680419921875, -0.189208984375, -0.09161376953125, 0.0059814453125, 0.10357666015625, 0.201171875, 0.29876708984375, 0.3963623046875, 0.49395751953125, 0.591552734375, 0.68914794921875, 0.7867431640625, 0.88433837890625, 0.98193359375, 1.07952880859375, 1.1771240234375, 1.27471923828125, 1.372314453125, 1.46990966796875, 1.5675048828125, 1.66510009765625, 1.7626953125, 1.86029052734375, 1.9578857421875, 2.05548095703125, 2.153076171875, 2.25067138671875, 2.3482666015625, 2.44586181640625, 2.54345703125, 2.64105224609375, 2.7386474609375, 2.83624267578125, 2.933837890625, 3.03143310546875, 3.1290283203125, 3.22662353515625, 3.32421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 10.0, 8.0, 4.0, 13.0, 4.0, 13.0, 19.0, 15.0, 25.0, 28.0, 46.0, 40.0, 64.0, 72.0, 87.0, 89.0, 71.0, 78.0, 54.0, 55.0, 34.0, 25.0, 26.0, 30.0, 18.0, 11.0, 10.0, 9.0, 6.0, 11.0, 3.0, 2.0, 6.0, 3.0, 3.0, 2.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011234283447265625, -0.0010812878608703613, -0.0010391473770141602, -0.000997006893157959, -0.0009548664093017578, -0.0009127259254455566, -0.0008705854415893555, -0.0008284449577331543, -0.0007863044738769531, -0.000744163990020752, -0.0007020235061645508, -0.0006598830223083496, -0.0006177425384521484, -0.0005756020545959473, -0.0005334615707397461, -0.0004913210868835449, -0.00044918060302734375, -0.0004070401191711426, -0.0003648996353149414, -0.00032275915145874023, -0.00028061866760253906, -0.0002384781837463379, -0.00019633769989013672, -0.00015419721603393555, -0.00011205673217773438, -6.99162483215332e-05, -2.777576446533203e-05, 1.436471939086914e-05, 5.650520324707031e-05, 9.864568710327148e-05, 0.00014078617095947266, 0.00018292665481567383, 0.000225067138671875, 0.00026720762252807617, 0.00030934810638427734, 0.0003514885902404785, 0.0003936290740966797, 0.00043576955795288086, 0.00047791004180908203, 0.0005200505256652832, 0.0005621910095214844, 0.0006043314933776855, 0.0006464719772338867, 0.0006886124610900879, 0.0007307529449462891, 0.0007728934288024902, 0.0008150339126586914, 0.0008571743965148926, 0.0008993148803710938, 0.0009414553642272949, 0.000983595848083496, 0.0010257363319396973, 0.0010678768157958984, 0.0011100172996520996, 0.0011521577835083008, 0.001194298267364502, 0.0012364387512207031, 0.0012785792350769043, 0.0013207197189331055, 0.0013628602027893066, 0.0014050006866455078, 0.001447141170501709, 0.0014892816543579102, 0.0015314221382141113, 0.0015735626220703125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 5.0, 5.0, 7.0, 8.0, 10.0, 12.0, 12.0, 10.0, 17.0, 39.0, 34.0, 58.0, 56.0, 99.0, 118.0, 208.0, 357.0, 801.0, 33990.0, 1007664.0, 3631.0, 547.0, 276.0, 170.0, 104.0, 76.0, 53.0, 38.0, 34.0, 24.0, 21.0, 14.0, 18.0, 5.0, 7.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0305328369140625, -0.029714345932006836, -0.028895854949951172, -0.028077363967895508, -0.027258872985839844, -0.02644038200378418, -0.025621891021728516, -0.02480340003967285, -0.023984909057617188, -0.023166418075561523, -0.02234792709350586, -0.021529436111450195, -0.02071094512939453, -0.019892454147338867, -0.019073963165283203, -0.01825547218322754, -0.017436981201171875, -0.01661849021911621, -0.015799999237060547, -0.014981508255004883, -0.014163017272949219, -0.013344526290893555, -0.01252603530883789, -0.011707544326782227, -0.010889053344726562, -0.010070562362670898, -0.009252071380615234, -0.00843358039855957, -0.007615089416503906, -0.006796598434448242, -0.005978107452392578, -0.005159616470336914, -0.00434112548828125, -0.003522634506225586, -0.002704143524169922, -0.0018856525421142578, -0.0010671615600585938, -0.0002486705780029297, 0.0005698204040527344, 0.0013883113861083984, 0.0022068023681640625, 0.0030252933502197266, 0.0038437843322753906, 0.004662275314331055, 0.005480766296386719, 0.006299257278442383, 0.007117748260498047, 0.007936239242553711, 0.008754730224609375, 0.009573221206665039, 0.010391712188720703, 0.011210203170776367, 0.012028694152832031, 0.012847185134887695, 0.01366567611694336, 0.014484167098999023, 0.015302658081054688, 0.01612114906311035, 0.016939640045166016, 0.01775813102722168, 0.018576622009277344, 0.019395112991333008, 0.020213603973388672, 0.021032094955444336, 0.0218505859375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 22.0, 66.0, 165.0, 258.0, 258.0, 151.0, 53.0, 27.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002201684517785907, -0.002147956984117627, -0.0020942294504493475, -0.002040501683950424, -0.0019867741502821445, -0.001933046616613865, -0.0018793190829455853, -0.0018255914328619838, -0.0017718638991937041, -0.0017181363655254245, -0.001664408715441823, -0.0016106811817735434, -0.0015569535316899419, -0.0015032259980216622, -0.0014494983479380608, -0.0013957708142697811, -0.0013420432806015015, -0.0012883157469332218, -0.0012345880968496203, -0.0011808605631813407, -0.0011271329130977392, -0.0010734053794294596, -0.00101967784576118, -0.0009659501956775784, -0.000912222545593977, -0.0008584949537180364, -0.0008047673618420959, -0.0007510398281738162, -0.0006973122362978756, -0.0006435846444219351, -0.0005898570525459945, -0.000536129460670054, -0.0004824019270017743, -0.00042867433512583375, -0.00037494677235372365, -0.0003212191804777831, -0.000267491617705673, -0.00021376402582973242, -0.00016003643395379186, -0.00010630887118168175, -5.258127930574119e-05, 1.1463016562629491e-06, 5.487388261826709e-05, 0.00010860146721825004, 0.00016232904454227537, 0.0002160566218663007, 0.00026978421374224126, 0.00032351177651435137, 0.00037723936839029193, 0.0004309669602662325, 0.0004846945230383426, 0.0005384221440181136, 0.0005921496776863933, 0.0006458772695623338, 0.0006996048614382744, 0.000753332395106554, 0.0008070600451901555, 0.0008607876370660961, 0.0009145152289420366, 0.0009682427626103163, 0.0010219704126939178, 0.0010756979463621974, 0.0011294255964457989, 0.0011831531301140785, 0.0012368806637823582]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 5.0, 6.0, 10.0, 12.0, 12.0, 9.0, 19.0, 20.0, 22.0, 27.0, 39.0, 36.0, 33.0, 32.0, 34.0, 43.0, 48.0, 40.0, 50.0, 47.0, 38.0, 43.0, 44.0, 32.0, 37.0, 36.0, 24.0, 25.0, 31.0, 24.0, 16.0, 13.0, 20.0, 10.0, 9.0, 12.0, 17.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0006681084632873535, -0.0006476240232586861, -0.0006271395832300186, -0.0006066551432013512, -0.0005861707031726837, -0.0005656862631440163, -0.0005452018231153488, -0.0005247173830866814, -0.0005042329430580139, -0.00048374850302934647, -0.000463264063000679, -0.00044277962297201157, -0.0004222951829433441, -0.00040181074291467667, -0.0003813263028860092, -0.00036084186285734177, -0.0003403574228286743, -0.00031987298280000687, -0.0002993885427713394, -0.00027890410274267197, -0.0002584196627140045, -0.00023793522268533707, -0.00021745078265666962, -0.00019696634262800217, -0.00017648190259933472, -0.00015599746257066727, -0.00013551302254199982, -0.00011502858251333237, -9.454414248466492e-05, -7.405970245599747e-05, -5.357526242733002e-05, -3.309082239866257e-05, -1.2606382369995117e-05, 7.878057658672333e-06, 2.8362497687339783e-05, 4.884693771600723e-05, 6.933137774467468e-05, 8.981581777334213e-05, 0.00011030025780200958, 0.00013078469783067703, 0.00015126913785934448, 0.00017175357788801193, 0.00019223801791667938, 0.00021272245794534683, 0.00023320689797401428, 0.00025369133800268173, 0.0002741757780313492, 0.00029466021806001663, 0.0003151446580886841, 0.00033562909811735153, 0.000356113538146019, 0.00037659797817468643, 0.0003970824182033539, 0.00041756685823202133, 0.0004380512982606888, 0.00045853573828935623, 0.0004790201783180237, 0.0004995046183466911, 0.0005199890583753586, 0.000540473498404026, 0.0005609579384326935, 0.0005814423784613609, 0.0006019268184900284, 0.0006224112585186958, 0.0006428956985473633]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 7.0, 2.0, 7.0, 3.0, 9.0, 10.0, 10.0, 9.0, 11.0, 18.0, 9.0, 26.0, 26.0, 24.0, 28.0, 28.0, 22.0, 22.0, 38.0, 32.0, 31.0, 32.0, 31.0, 38.0, 54.0, 45.0, 35.0, 32.0, 35.0, 34.0, 28.0, 29.0, 29.0, 23.0, 25.0, 19.0, 25.0, 20.0, 10.0, 12.0, 19.0, 13.0, 12.0, 11.0, 6.0, 3.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.8125, -10.4697265625, -10.126953125, -9.7841796875, -9.44140625, -9.0986328125, -8.755859375, -8.4130859375, -8.0703125, -7.7275390625, -7.384765625, -7.0419921875, -6.69921875, -6.3564453125, -6.013671875, -5.6708984375, -5.328125, -4.9853515625, -4.642578125, -4.2998046875, -3.95703125, -3.6142578125, -3.271484375, -2.9287109375, -2.5859375, -2.2431640625, -1.900390625, -1.5576171875, -1.21484375, -0.8720703125, -0.529296875, -0.1865234375, 0.15625, 0.4990234375, 0.841796875, 1.1845703125, 1.52734375, 1.8701171875, 2.212890625, 2.5556640625, 2.8984375, 3.2412109375, 3.583984375, 3.9267578125, 4.26953125, 4.6123046875, 4.955078125, 5.2978515625, 5.640625, 5.9833984375, 6.326171875, 6.6689453125, 7.01171875, 7.3544921875, 7.697265625, 8.0400390625, 8.3828125, 8.7255859375, 9.068359375, 9.4111328125, 9.75390625, 10.0966796875, 10.439453125, 10.7822265625, 11.125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 6.0, 6.0, 7.0, 8.0, 11.0, 18.0, 19.0, 34.0, 34.0, 44.0, 75.0, 109.0, 109.0, 171.0, 220.0, 276.0, 413.0, 624.0, 912.0, 1342.0, 2131.0, 3555.0, 6074.0, 11531.0, 24751.0, 60623.0, 176820.0, 403838.0, 219630.0, 74622.0, 29345.0, 13192.0, 6934.0, 3973.0, 2349.0, 1502.0, 945.0, 666.0, 412.0, 321.0, 207.0, 175.0, 135.0, 93.0, 70.0, 61.0, 43.0, 24.0, 27.0, 19.0, 15.0, 15.0, 9.0, 7.0, 3.0, 3.0, 5.0, 6.0], "bins": [-12.625, -12.249267578125, -11.87353515625, -11.497802734375, -11.1220703125, -10.746337890625, -10.37060546875, -9.994873046875, -9.619140625, -9.243408203125, -8.86767578125, -8.491943359375, -8.1162109375, -7.740478515625, -7.36474609375, -6.989013671875, -6.61328125, -6.237548828125, -5.86181640625, -5.486083984375, -5.1103515625, -4.734619140625, -4.35888671875, -3.983154296875, -3.607421875, -3.231689453125, -2.85595703125, -2.480224609375, -2.1044921875, -1.728759765625, -1.35302734375, -0.977294921875, -0.6015625, -0.225830078125, 0.14990234375, 0.525634765625, 0.9013671875, 1.277099609375, 1.65283203125, 2.028564453125, 2.404296875, 2.780029296875, 3.15576171875, 3.531494140625, 3.9072265625, 4.282958984375, 4.65869140625, 5.034423828125, 5.41015625, 5.785888671875, 6.16162109375, 6.537353515625, 6.9130859375, 7.288818359375, 7.66455078125, 8.040283203125, 8.416015625, 8.791748046875, 9.16748046875, 9.543212890625, 9.9189453125, 10.294677734375, 10.67041015625, 11.046142578125, 11.421875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 2.0, 5.0, 5.0, 12.0, 11.0, 25.0, 15.0, 15.0, 32.0, 34.0, 19.0, 48.0, 45.0, 58.0, 59.0, 75.0, 144.0, 1534.0, 323.0, 127.0, 79.0, 47.0, 59.0, 47.0, 36.0, 25.0, 35.0, 27.0, 14.0, 23.0, 13.0, 10.0, 12.0, 4.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.625, -33.602783203125, -32.58056640625, -31.558349609375, -30.5361328125, -29.513916015625, -28.49169921875, -27.469482421875, -26.447265625, -25.425048828125, -24.40283203125, -23.380615234375, -22.3583984375, -21.336181640625, -20.31396484375, -19.291748046875, -18.26953125, -17.247314453125, -16.22509765625, -15.202880859375, -14.1806640625, -13.158447265625, -12.13623046875, -11.114013671875, -10.091796875, -9.069580078125, -8.04736328125, -7.025146484375, -6.0029296875, -4.980712890625, -3.95849609375, -2.936279296875, -1.9140625, -0.891845703125, 0.13037109375, 1.152587890625, 2.1748046875, 3.197021484375, 4.21923828125, 5.241455078125, 6.263671875, 7.285888671875, 8.30810546875, 9.330322265625, 10.3525390625, 11.374755859375, 12.39697265625, 13.419189453125, 14.44140625, 15.463623046875, 16.48583984375, 17.508056640625, 18.5302734375, 19.552490234375, 20.57470703125, 21.596923828125, 22.619140625, 23.641357421875, 24.66357421875, 25.685791015625, 26.7080078125, 27.730224609375, 28.75244140625, 29.774658203125, 30.796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 8.0, 5.0, 1.0, 7.0, 20.0, 19.0, 26.0, 32.0, 63.0, 65.0, 112.0, 121.0, 186.0, 313.0, 644.0, 3249.0, 44425.0, 2984006.0, 105326.0, 5166.0, 873.0, 340.0, 195.0, 137.0, 85.0, 75.0, 60.0, 33.0, 27.0, 17.0, 17.0, 8.0, 10.0, 7.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.6875, -54.83544921875, -52.9833984375, -51.13134765625, -49.279296875, -47.42724609375, -45.5751953125, -43.72314453125, -41.87109375, -40.01904296875, -38.1669921875, -36.31494140625, -34.462890625, -32.61083984375, -30.7587890625, -28.90673828125, -27.0546875, -25.20263671875, -23.3505859375, -21.49853515625, -19.646484375, -17.79443359375, -15.9423828125, -14.09033203125, -12.23828125, -10.38623046875, -8.5341796875, -6.68212890625, -4.830078125, -2.97802734375, -1.1259765625, 0.72607421875, 2.578125, 4.43017578125, 6.2822265625, 8.13427734375, 9.986328125, 11.83837890625, 13.6904296875, 15.54248046875, 17.39453125, 19.24658203125, 21.0986328125, 22.95068359375, 24.802734375, 26.65478515625, 28.5068359375, 30.35888671875, 32.2109375, 34.06298828125, 35.9150390625, 37.76708984375, 39.619140625, 41.47119140625, 43.3232421875, 45.17529296875, 47.02734375, 48.87939453125, 50.7314453125, 52.58349609375, 54.435546875, 56.28759765625, 58.1396484375, 59.99169921875, 61.84375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 19.0, 141.0, 380.0, 346.0, 108.0, 14.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-173.53314208984375, -169.75173950195312, -165.97032165527344, -162.1889190673828, -158.40750122070312, -154.6260986328125, -150.84469604492188, -147.0632781982422, -143.28187561035156, -139.50047302246094, -135.71905517578125, -131.93765258789062, -128.15623474121094, -124.37483215332031, -120.59342193603516, -116.81201171875, -113.03060150146484, -109.24919128417969, -105.46778106689453, -101.68637084960938, -97.90496826171875, -94.1235580444336, -90.34214782714844, -86.56073760986328, -82.77932739257812, -78.99791717529297, -75.21650695800781, -71.43510437011719, -67.65369415283203, -63.872283935546875, -60.09087371826172, -56.30946350097656, -52.52806854248047, -48.74665832519531, -44.96525192260742, -41.183841705322266, -37.402435302734375, -33.62102508544922, -29.839614868164062, -26.05820655822754, -22.276798248291016, -18.495389938354492, -14.713980674743652, -10.932571411132812, -7.151163101196289, -3.3697547912597656, 0.4116554260253906, 4.193063735961914, 7.9744720458984375, 11.755880355834961, 15.5372896194458, 19.31869888305664, 23.100107192993164, 26.881515502929688, 30.662925720214844, 34.4443359375, 38.22574234008789, 42.00715255737305, 45.78855895996094, 49.569969177246094, 53.35137939453125, 57.13278579711914, 60.9141960144043, 64.69560241699219, 68.47701263427734]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 11.0, 2.0, 7.0, 8.0, 6.0, 6.0, 17.0, 6.0, 16.0, 22.0, 19.0, 17.0, 20.0, 18.0, 26.0, 29.0, 32.0, 30.0, 33.0, 43.0, 30.0, 36.0, 36.0, 35.0, 47.0, 45.0, 42.0, 46.0, 34.0, 26.0, 29.0, 29.0, 20.0, 25.0, 16.0, 16.0, 22.0, 26.0, 13.0, 12.0, 10.0, 11.0, 4.0, 8.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-56.85185623168945, -55.06673812866211, -53.2816162109375, -51.496498107910156, -49.71138000488281, -47.92626190185547, -46.14113998413086, -44.356021881103516, -42.570899963378906, -40.78578186035156, -39.00065994262695, -37.21554183959961, -35.430423736572266, -33.645301818847656, -31.860183715820312, -30.07506561279297, -28.289947509765625, -26.50482749938965, -24.719709396362305, -22.934589385986328, -21.149471282958984, -19.364351272583008, -17.57923126220703, -15.794112205505371, -14.008993148803711, -12.22387409210205, -10.43875503540039, -8.653635025024414, -6.868515968322754, -5.083396911621094, -3.298276901245117, -1.513157844543457, 0.2719573974609375, 2.0570766925811768, 3.842195987701416, 5.627315521240234, 7.4124345779418945, 9.197553634643555, 10.982673645019531, 12.767792701721191, 14.552911758422852, 16.338031768798828, 18.123149871826172, 19.90826988220215, 21.693389892578125, 23.47850799560547, 25.263628005981445, 27.048748016357422, 28.833866119384766, 30.618986129760742, 32.40410614013672, 34.18922424316406, 35.974342346191406, 37.75946044921875, 39.54458236694336, 41.3297004699707, 43.11482238769531, 44.899940490722656, 46.685062408447266, 48.47018051147461, 50.25529861450195, 52.04042053222656, 53.825538635253906, 55.61065673828125, 57.395774841308594]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 6.0, 7.0, 6.0, 13.0, 11.0, 14.0, 16.0, 13.0, 33.0, 31.0, 21.0, 24.0, 27.0, 32.0, 38.0, 27.0, 33.0, 42.0, 35.0, 38.0, 43.0, 40.0, 38.0, 46.0, 22.0, 49.0, 23.0, 28.0, 26.0, 26.0, 25.0, 20.0, 21.0, 21.0, 16.0, 9.0, 9.0, 9.0, 14.0, 10.0, 13.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.1328125, -10.7784423828125, -10.424072265625, -10.0697021484375, -9.71533203125, -9.3609619140625, -9.006591796875, -8.6522216796875, -8.2978515625, -7.9434814453125, -7.589111328125, -7.2347412109375, -6.88037109375, -6.5260009765625, -6.171630859375, -5.8172607421875, -5.462890625, -5.1085205078125, -4.754150390625, -4.3997802734375, -4.04541015625, -3.6910400390625, -3.336669921875, -2.9822998046875, -2.6279296875, -2.2735595703125, -1.919189453125, -1.5648193359375, -1.21044921875, -0.8560791015625, -0.501708984375, -0.1473388671875, 0.20703125, 0.5614013671875, 0.915771484375, 1.2701416015625, 1.62451171875, 1.9788818359375, 2.333251953125, 2.6876220703125, 3.0419921875, 3.3963623046875, 3.750732421875, 4.1051025390625, 4.45947265625, 4.8138427734375, 5.168212890625, 5.5225830078125, 5.876953125, 6.2313232421875, 6.585693359375, 6.9400634765625, 7.29443359375, 7.6488037109375, 8.003173828125, 8.3575439453125, 8.7119140625, 9.0662841796875, 9.420654296875, 9.7750244140625, 10.12939453125, 10.4837646484375, 10.838134765625, 11.1925048828125, 11.546875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 6.0, 8.0, 13.0, 11.0, 19.0, 15.0, 23.0, 27.0, 48.0, 56.0, 56.0, 77.0, 127.0, 174.0, 225.0, 326.0, 368.0, 640.0, 328104.0, 3861617.0, 651.0, 434.0, 302.0, 242.0, 172.0, 129.0, 93.0, 62.0, 60.0, 40.0, 33.0, 28.0, 14.0, 12.0, 20.0, 9.0, 7.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-280.5, -271.171875, -261.84375, -252.515625, -243.1875, -233.859375, -224.53125, -215.203125, -205.875, -196.546875, -187.21875, -177.890625, -168.5625, -159.234375, -149.90625, -140.578125, -131.25, -121.921875, -112.59375, -103.265625, -93.9375, -84.609375, -75.28125, -65.953125, -56.625, -47.296875, -37.96875, -28.640625, -19.3125, -9.984375, -0.65625, 8.671875, 18.0, 27.328125, 36.65625, 45.984375, 55.3125, 64.640625, 73.96875, 83.296875, 92.625, 101.953125, 111.28125, 120.609375, 129.9375, 139.265625, 148.59375, 157.921875, 167.25, 176.578125, 185.90625, 195.234375, 204.5625, 213.890625, 223.21875, 232.546875, 241.875, 251.203125, 260.53125, 269.859375, 279.1875, 288.515625, 297.84375, 307.171875, 316.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 2.0, 11.0, 4.0, 13.0, 15.0, 24.0, 27.0, 28.0, 49.0, 57.0, 69.0, 108.0, 156.0, 237.0, 356.0, 534.0, 659.0, 530.0, 387.0, 237.0, 177.0, 116.0, 65.0, 56.0, 29.0, 39.0, 24.0, 18.0, 11.0, 6.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.341552734375, -19.71435546875, -19.087158203125, -18.4599609375, -17.832763671875, -17.20556640625, -16.578369140625, -15.951171875, -15.323974609375, -14.69677734375, -14.069580078125, -13.4423828125, -12.815185546875, -12.18798828125, -11.560791015625, -10.93359375, -10.306396484375, -9.67919921875, -9.052001953125, -8.4248046875, -7.797607421875, -7.17041015625, -6.543212890625, -5.916015625, -5.288818359375, -4.66162109375, -4.034423828125, -3.4072265625, -2.780029296875, -2.15283203125, -1.525634765625, -0.8984375, -0.271240234375, 0.35595703125, 0.983154296875, 1.6103515625, 2.237548828125, 2.86474609375, 3.491943359375, 4.119140625, 4.746337890625, 5.37353515625, 6.000732421875, 6.6279296875, 7.255126953125, 7.88232421875, 8.509521484375, 9.13671875, 9.763916015625, 10.39111328125, 11.018310546875, 11.6455078125, 12.272705078125, 12.89990234375, 13.527099609375, 14.154296875, 14.781494140625, 15.40869140625, 16.035888671875, 16.6630859375, 17.290283203125, 17.91748046875, 18.544677734375, 19.171875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 11.0, 4.0, 7.0, 13.0, 22.0, 19.0, 25.0, 24.0, 43.0, 39.0, 42.0, 64.0, 72.0, 122.0, 601.0, 54608.0, 4134721.0, 3111.0, 294.0, 94.0, 72.0, 51.0, 42.0, 36.0, 26.0, 24.0, 17.0, 18.0, 18.0, 15.0, 4.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-187.75, -182.576171875, -177.40234375, -172.228515625, -167.0546875, -161.880859375, -156.70703125, -151.533203125, -146.359375, -141.185546875, -136.01171875, -130.837890625, -125.6640625, -120.490234375, -115.31640625, -110.142578125, -104.96875, -99.794921875, -94.62109375, -89.447265625, -84.2734375, -79.099609375, -73.92578125, -68.751953125, -63.578125, -58.404296875, -53.23046875, -48.056640625, -42.8828125, -37.708984375, -32.53515625, -27.361328125, -22.1875, -17.013671875, -11.83984375, -6.666015625, -1.4921875, 3.681640625, 8.85546875, 14.029296875, 19.203125, 24.376953125, 29.55078125, 34.724609375, 39.8984375, 45.072265625, 50.24609375, 55.419921875, 60.59375, 65.767578125, 70.94140625, 76.115234375, 81.2890625, 86.462890625, 91.63671875, 96.810546875, 101.984375, 107.158203125, 112.33203125, 117.505859375, 122.6796875, 127.853515625, 133.02734375, 138.201171875, 143.375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 13.0, 77.0, 319.0, 437.0, 144.0, 23.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.91010284423828, -79.19217681884766, -71.47425079345703, -63.756324768066406, -56.03839874267578, -48.32046890258789, -40.602542877197266, -32.88461685180664, -25.166690826416016, -17.44876480102539, -9.73083782196045, -2.012910842895508, 5.705015182495117, 13.422943115234375, 21.140869140625, 28.858795166015625, 36.57672119140625, 44.294647216796875, 52.0125732421875, 59.730499267578125, 67.44842529296875, 75.16635131835938, 82.88427734375, 90.60220336914062, 98.32012939453125, 106.03805541992188, 113.7559814453125, 121.47390747070312, 129.19183349609375, 136.90975952148438, 144.627685546875, 152.34561157226562, 160.0635528564453, 167.78147888183594, 175.49940490722656, 183.2173309326172, 190.9352569580078, 198.65318298339844, 206.37110900878906, 214.0890350341797, 221.8069610595703, 229.52488708496094, 237.24281311035156, 244.9607391357422, 252.6786651611328, 260.3966064453125, 268.1145324707031, 275.83245849609375, 283.5503845214844, 291.268310546875, 298.9862365722656, 306.70416259765625, 314.4220886230469, 322.1400146484375, 329.8579406738281, 337.57586669921875, 345.2937927246094, 353.01171875, 360.7296447753906, 368.44757080078125, 376.1654968261719, 383.8834228515625, 391.6013488769531, 399.31927490234375, 407.0372009277344]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 2.0, 7.0, 4.0, 6.0, 13.0, 7.0, 10.0, 23.0, 20.0, 16.0, 27.0, 21.0, 22.0, 27.0, 35.0, 44.0, 41.0, 30.0, 48.0, 39.0, 50.0, 45.0, 40.0, 42.0, 37.0, 42.0, 42.0, 33.0, 24.0, 33.0, 30.0, 27.0, 20.0, 15.0, 11.0, 14.0, 9.0, 13.0, 8.0, 6.0, 5.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.14898681640625, -55.15084457397461, -53.152706146240234, -51.154563903808594, -49.15642166137695, -47.15827941894531, -45.16014099121094, -43.1619987487793, -41.163856506347656, -39.165714263916016, -37.16757583618164, -35.16943359375, -33.17129135131836, -31.17315101623535, -29.175010681152344, -27.176868438720703, -25.178730010986328, -23.18058967590332, -21.18244743347168, -19.184307098388672, -17.18616485595703, -15.188024520874023, -13.189884185791016, -11.191742897033691, -9.193601608276367, -7.195460319519043, -5.197319507598877, -3.199178695678711, -1.2010374069213867, 0.7971038818359375, 2.7952442169189453, 4.7933855056762695, 6.791526794433594, 8.789668083190918, 10.787809371948242, 12.78594970703125, 14.784090995788574, 16.7822322845459, 18.780372619628906, 20.778514862060547, 22.776655197143555, 24.774795532226562, 26.772937774658203, 28.77107810974121, 30.76921844482422, 32.76736068725586, 34.7655029296875, 36.763641357421875, 38.761783599853516, 40.759925842285156, 42.75806427001953, 44.75620651245117, 46.75434875488281, 48.75248718261719, 50.75062942504883, 52.74877166748047, 54.746910095214844, 56.745052337646484, 58.74319076538086, 60.7413330078125, 62.73947525024414, 64.73761749267578, 66.73575592041016, 68.73389434814453, 70.73204040527344]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 1.0, 3.0, 8.0, 9.0, 8.0, 5.0, 10.0, 15.0, 11.0, 16.0, 22.0, 13.0, 31.0, 29.0, 26.0, 37.0, 37.0, 37.0, 37.0, 38.0, 44.0, 39.0, 47.0, 31.0, 40.0, 36.0, 28.0, 36.0, 31.0, 24.0, 31.0, 26.0, 23.0, 28.0, 25.0, 20.0, 21.0, 17.0, 13.0, 7.0, 6.0, 10.0, 4.0, 3.0, 7.0, 2.0, 2.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.328125, -10.972412109375, -10.61669921875, -10.260986328125, -9.9052734375, -9.549560546875, -9.19384765625, -8.838134765625, -8.482421875, -8.126708984375, -7.77099609375, -7.415283203125, -7.0595703125, -6.703857421875, -6.34814453125, -5.992431640625, -5.63671875, -5.281005859375, -4.92529296875, -4.569580078125, -4.2138671875, -3.858154296875, -3.50244140625, -3.146728515625, -2.791015625, -2.435302734375, -2.07958984375, -1.723876953125, -1.3681640625, -1.012451171875, -0.65673828125, -0.301025390625, 0.0546875, 0.410400390625, 0.76611328125, 1.121826171875, 1.4775390625, 1.833251953125, 2.18896484375, 2.544677734375, 2.900390625, 3.256103515625, 3.61181640625, 3.967529296875, 4.3232421875, 4.678955078125, 5.03466796875, 5.390380859375, 5.74609375, 6.101806640625, 6.45751953125, 6.813232421875, 7.1689453125, 7.524658203125, 7.88037109375, 8.236083984375, 8.591796875, 8.947509765625, 9.30322265625, 9.658935546875, 10.0146484375, 10.370361328125, 10.72607421875, 11.081787109375, 11.4375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 5.0, 16.0, 26.0, 36.0, 45.0, 70.0, 102.0, 156.0, 225.0, 306.0, 504.0, 730.0, 1111.0, 1655.0, 2445.0, 3788.0, 5797.0, 9276.0, 14371.0, 22987.0, 37892.0, 63955.0, 116034.0, 297505.0, 222635.0, 99466.0, 56369.0, 33852.0, 20650.0, 12867.0, 8365.0, 5142.0, 3352.0, 2233.0, 1500.0, 1017.0, 709.0, 437.0, 300.0, 193.0, 136.0, 96.0, 53.0, 30.0, 31.0, 37.0, 16.0, 4.0, 5.0, 6.0, 9.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.65625, -2.57293701171875, -2.4896240234375, -2.40631103515625, -2.322998046875, -2.23968505859375, -2.1563720703125, -2.07305908203125, -1.98974609375, -1.90643310546875, -1.8231201171875, -1.73980712890625, -1.656494140625, -1.57318115234375, -1.4898681640625, -1.40655517578125, -1.3232421875, -1.23992919921875, -1.1566162109375, -1.07330322265625, -0.989990234375, -0.90667724609375, -0.8233642578125, -0.74005126953125, -0.65673828125, -0.57342529296875, -0.4901123046875, -0.40679931640625, -0.323486328125, -0.24017333984375, -0.1568603515625, -0.07354736328125, 0.009765625, 0.09307861328125, 0.1763916015625, 0.25970458984375, 0.343017578125, 0.42633056640625, 0.5096435546875, 0.59295654296875, 0.67626953125, 0.75958251953125, 0.8428955078125, 0.92620849609375, 1.009521484375, 1.09283447265625, 1.1761474609375, 1.25946044921875, 1.3427734375, 1.42608642578125, 1.5093994140625, 1.59271240234375, 1.676025390625, 1.75933837890625, 1.8426513671875, 1.92596435546875, 2.00927734375, 2.09259033203125, 2.1759033203125, 2.25921630859375, 2.342529296875, 2.42584228515625, 2.5091552734375, 2.59246826171875, 2.67578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 7.0, 4.0, 8.0, 12.0, 20.0, 21.0, 12.0, 30.0, 34.0, 27.0, 32.0, 29.0, 47.0, 33.0, 35.0, 30.0, 39.0, 43.0, 1054.0, 38.0, 34.0, 45.0, 38.0, 43.0, 35.0, 38.0, 32.0, 23.0, 20.0, 29.0, 20.0, 12.0, 20.0, 17.0, 14.0, 10.0, 12.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.35223388671875, -7.1146240234375, -6.87701416015625, -6.639404296875, -6.40179443359375, -6.1641845703125, -5.92657470703125, -5.68896484375, -5.45135498046875, -5.2137451171875, -4.97613525390625, -4.738525390625, -4.50091552734375, -4.2633056640625, -4.02569580078125, -3.7880859375, -3.55047607421875, -3.3128662109375, -3.07525634765625, -2.837646484375, -2.60003662109375, -2.3624267578125, -2.12481689453125, -1.88720703125, -1.64959716796875, -1.4119873046875, -1.17437744140625, -0.936767578125, -0.69915771484375, -0.4615478515625, -0.22393798828125, 0.013671875, 0.25128173828125, 0.4888916015625, 0.72650146484375, 0.964111328125, 1.20172119140625, 1.4393310546875, 1.67694091796875, 1.91455078125, 2.15216064453125, 2.3897705078125, 2.62738037109375, 2.864990234375, 3.10260009765625, 3.3402099609375, 3.57781982421875, 3.8154296875, 4.05303955078125, 4.2906494140625, 4.52825927734375, 4.765869140625, 5.00347900390625, 5.2410888671875, 5.47869873046875, 5.71630859375, 5.95391845703125, 6.1915283203125, 6.42913818359375, 6.666748046875, 6.90435791015625, 7.1419677734375, 7.37957763671875, 7.6171875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 13.0, 18.0, 37.0, 41.0, 73.0, 136.0, 198.0, 311.0, 477.0, 718.0, 1190.0, 1862.0, 3016.0, 4904.0, 7861.0, 13122.0, 21010.0, 35427.0, 60743.0, 112450.0, 1332828.0, 251279.0, 104508.0, 58351.0, 33887.0, 20048.0, 12434.0, 7649.0, 4786.0, 2873.0, 1774.0, 1126.0, 712.0, 441.0, 297.0, 194.0, 119.0, 83.0, 56.0, 24.0, 17.0, 8.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.658203125, -2.57501220703125, -2.4918212890625, -2.40863037109375, -2.325439453125, -2.24224853515625, -2.1590576171875, -2.07586669921875, -1.99267578125, -1.90948486328125, -1.8262939453125, -1.74310302734375, -1.659912109375, -1.57672119140625, -1.4935302734375, -1.41033935546875, -1.3271484375, -1.24395751953125, -1.1607666015625, -1.07757568359375, -0.994384765625, -0.91119384765625, -0.8280029296875, -0.74481201171875, -0.66162109375, -0.57843017578125, -0.4952392578125, -0.41204833984375, -0.328857421875, -0.24566650390625, -0.1624755859375, -0.07928466796875, 0.00390625, 0.08709716796875, 0.1702880859375, 0.25347900390625, 0.336669921875, 0.41986083984375, 0.5030517578125, 0.58624267578125, 0.66943359375, 0.75262451171875, 0.8358154296875, 0.91900634765625, 1.002197265625, 1.08538818359375, 1.1685791015625, 1.25177001953125, 1.3349609375, 1.41815185546875, 1.5013427734375, 1.58453369140625, 1.667724609375, 1.75091552734375, 1.8341064453125, 1.91729736328125, 2.00048828125, 2.08367919921875, 2.1668701171875, 2.25006103515625, 2.333251953125, 2.41644287109375, 2.4996337890625, 2.58282470703125, 2.666015625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 7.0, 6.0, 6.0, 9.0, 10.0, 11.0, 17.0, 25.0, 25.0, 33.0, 60.0, 65.0, 84.0, 101.0, 109.0, 100.0, 78.0, 53.0, 53.0, 27.0, 25.0, 10.0, 10.0, 8.0, 9.0, 4.0, 8.0, 5.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0016679763793945312, -0.0016219466924667358, -0.0015759170055389404, -0.001529887318611145, -0.0014838576316833496, -0.0014378279447555542, -0.0013917982578277588, -0.0013457685708999634, -0.001299738883972168, -0.0012537091970443726, -0.0012076795101165771, -0.0011616498231887817, -0.0011156201362609863, -0.001069590449333191, -0.0010235607624053955, -0.0009775310754776, -0.0009315013885498047, -0.0008854717016220093, -0.0008394420146942139, -0.0007934123277664185, -0.000747382640838623, -0.0007013529539108276, -0.0006553232669830322, -0.0006092935800552368, -0.0005632638931274414, -0.000517234206199646, -0.0004712045192718506, -0.0004251748323440552, -0.00037914514541625977, -0.00033311545848846436, -0.00028708577156066895, -0.00024105608463287354, -0.00019502639770507812, -0.00014899671077728271, -0.0001029670238494873, -5.6937336921691895e-05, -1.0907649993896484e-05, 3.5122036933898926e-05, 8.115172386169434e-05, 0.00012718141078948975, 0.00017321109771728516, 0.00021924078464508057, 0.000265270471572876, 0.0003113001585006714, 0.0003573298454284668, 0.0004033595323562622, 0.0004493892192840576, 0.000495418906211853, 0.0005414485931396484, 0.0005874782800674438, 0.0006335079669952393, 0.0006795376539230347, 0.0007255673408508301, 0.0007715970277786255, 0.0008176267147064209, 0.0008636564016342163, 0.0009096860885620117, 0.0009557157754898071, 0.0010017454624176025, 0.001047775149345398, 0.0010938048362731934, 0.0011398345232009888, 0.0011858642101287842, 0.0012318938970565796, 0.001277923583984375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 16.0, 12.0, 15.0, 20.0, 35.0, 30.0, 45.0, 68.0, 104.0, 182.0, 276.0, 461.0, 1307.0, 151667.0, 890455.0, 2201.0, 628.0, 303.0, 195.0, 136.0, 92.0, 62.0, 48.0, 33.0, 24.0, 20.0, 14.0, 14.0, 16.0, 8.0, 9.0, 9.0, 7.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0214385986328125, -0.020648479461669922, -0.019858360290527344, -0.019068241119384766, -0.018278121948242188, -0.01748800277709961, -0.01669788360595703, -0.015907764434814453, -0.015117645263671875, -0.014327526092529297, -0.013537406921386719, -0.01274728775024414, -0.011957168579101562, -0.011167049407958984, -0.010376930236816406, -0.009586811065673828, -0.00879669189453125, -0.008006572723388672, -0.007216453552246094, -0.006426334381103516, -0.0056362152099609375, -0.004846096038818359, -0.004055976867675781, -0.003265857696533203, -0.002475738525390625, -0.0016856193542480469, -0.0008955001831054688, -0.00010538101196289062, 0.0006847381591796875, 0.0014748573303222656, 0.0022649765014648438, 0.003055095672607422, 0.00384521484375, 0.004635334014892578, 0.005425453186035156, 0.006215572357177734, 0.0070056915283203125, 0.007795810699462891, 0.008585929870605469, 0.009376049041748047, 0.010166168212890625, 0.010956287384033203, 0.011746406555175781, 0.01253652572631836, 0.013326644897460938, 0.014116764068603516, 0.014906883239746094, 0.015697002410888672, 0.01648712158203125, 0.017277240753173828, 0.018067359924316406, 0.018857479095458984, 0.019647598266601562, 0.02043771743774414, 0.02122783660888672, 0.022017955780029297, 0.022808074951171875, 0.023598194122314453, 0.02438831329345703, 0.02517843246459961, 0.025968551635742188, 0.026758670806884766, 0.027548789978027344, 0.028338909149169922, 0.0291290283203125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 48.0, 452.0, 442.0, 63.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002346406225115061, -0.0022229135502129793, -0.002099420875310898, -0.0019759282004088163, -0.0018524355255067348, -0.0017289428506046534, -0.0016054501757025719, -0.0014819575008004904, -0.0013584648258984089, -0.0012349721509963274, -0.001111479476094246, -0.0009879868011921644, -0.0008644941262900829, -0.0007410014513880014, -0.00061750877648592, -0.0004940161015838385, -0.000370523426681757, -0.0002470307517796755, -0.000123538076877594, -4.540197551250458e-08, 0.00012344727292656898, 0.0002469399478286505, 0.00037043262273073196, 0.0004939252976328135, 0.0006174179725348949, 0.0007409106474369764, 0.0008644033223390579, 0.0009878959972411394, 0.001111388672143221, 0.0012348813470453024, 0.0013583740219473839, 0.0014818666968494654, 0.0016053589060902596, 0.001728851580992341, 0.0018523442558944225, 0.001975836930796504, 0.0020993296056985855, 0.002222822280600667, 0.0023463149555027485, 0.00246980763040483, 0.0025933003053069115, 0.002716792980208993, 0.0028402856551110744, 0.002963778330013156, 0.0030872710049152374, 0.003210763679817319, 0.0033342563547194004, 0.003457749029621482, 0.0035812417045235634, 0.003704734379425645, 0.0038282270543277264, 0.0039517199620604515, 0.004075212404131889, 0.004198704846203327, 0.004322197753936052, 0.0044456906616687775, 0.004569183103740215, 0.004692675545811653, 0.004816168453544378, 0.004939661361277103, 0.005063153803348541, 0.005186646245419979, 0.005310139153152704, 0.005433632060885429, 0.005557124502956867]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 6.0, 2.0, 6.0, 6.0, 5.0, 8.0, 11.0, 16.0, 28.0, 26.0, 18.0, 24.0, 28.0, 25.0, 33.0, 29.0, 37.0, 32.0, 45.0, 47.0, 40.0, 44.0, 47.0, 49.0, 29.0, 29.0, 46.0, 37.0, 26.0, 34.0, 36.0, 24.0, 20.0, 15.0, 20.0, 9.0, 14.0, 11.0, 12.0, 6.0, 3.0, 9.0, 6.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006265044212341309, -0.0006060497835278511, -0.0005855951458215714, -0.0005651405081152916, -0.0005446858704090118, -0.0005242312327027321, -0.0005037765949964523, -0.0004833219572901726, -0.0004628673195838928, -0.00044241268187761307, -0.0004219580441713333, -0.00040150340646505356, -0.0003810487687587738, -0.00036059413105249405, -0.0003401394933462143, -0.00031968485563993454, -0.0002992302179336548, -0.00027877558022737503, -0.0002583209425210953, -0.00023786630481481552, -0.00021741166710853577, -0.000196957029402256, -0.00017650239169597626, -0.0001560477539896965, -0.00013559311628341675, -0.000115138478577137, -9.468384087085724e-05, -7.422920316457748e-05, -5.377456545829773e-05, -3.3319927752017975e-05, -1.286529004573822e-05, 7.5893476605415344e-06, 2.804398536682129e-05, 4.8498623073101044e-05, 6.89532607793808e-05, 8.940789848566055e-05, 0.00010986253619194031, 0.00013031717389822006, 0.00015077181160449982, 0.00017122644931077957, 0.00019168108701705933, 0.00021213572472333908, 0.00023259036242961884, 0.0002530450001358986, 0.00027349963784217834, 0.0002939542755484581, 0.00031440891325473785, 0.0003348635509610176, 0.00035531818866729736, 0.0003757728263735771, 0.00039622746407985687, 0.00041668210178613663, 0.0004371367394924164, 0.00045759137719869614, 0.0004780460149049759, 0.0004985006526112556, 0.0005189552903175354, 0.0005394099280238152, 0.0005598645657300949, 0.0005803192034363747, 0.0006007738411426544, 0.0006212284788489342, 0.0006416831165552139, 0.0006621377542614937, 0.0006825923919677734]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 1.0, 3.0, 8.0, 9.0, 8.0, 5.0, 10.0, 15.0, 11.0, 16.0, 22.0, 13.0, 31.0, 29.0, 26.0, 37.0, 37.0, 37.0, 37.0, 38.0, 44.0, 39.0, 47.0, 31.0, 40.0, 36.0, 28.0, 36.0, 31.0, 24.0, 31.0, 26.0, 23.0, 28.0, 25.0, 20.0, 21.0, 17.0, 13.0, 7.0, 6.0, 10.0, 4.0, 3.0, 7.0, 2.0, 2.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.328125, -10.972412109375, -10.61669921875, -10.260986328125, -9.9052734375, -9.549560546875, -9.19384765625, -8.838134765625, -8.482421875, -8.126708984375, -7.77099609375, -7.415283203125, -7.0595703125, -6.703857421875, -6.34814453125, -5.992431640625, -5.63671875, -5.281005859375, -4.92529296875, -4.569580078125, -4.2138671875, -3.858154296875, -3.50244140625, -3.146728515625, -2.791015625, -2.435302734375, -2.07958984375, -1.723876953125, -1.3681640625, -1.012451171875, -0.65673828125, -0.301025390625, 0.0546875, 0.410400390625, 0.76611328125, 1.121826171875, 1.4775390625, 1.833251953125, 2.18896484375, 2.544677734375, 2.900390625, 3.256103515625, 3.61181640625, 3.967529296875, 4.3232421875, 4.678955078125, 5.03466796875, 5.390380859375, 5.74609375, 6.101806640625, 6.45751953125, 6.813232421875, 7.1689453125, 7.524658203125, 7.88037109375, 8.236083984375, 8.591796875, 8.947509765625, 9.30322265625, 9.658935546875, 10.0146484375, 10.370361328125, 10.72607421875, 11.081787109375, 11.4375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 14.0, 18.0, 19.0, 22.0, 41.0, 40.0, 57.0, 73.0, 117.0, 135.0, 176.0, 215.0, 295.0, 359.0, 537.0, 740.0, 965.0, 1399.0, 2389.0, 4668.0, 12947.0, 54100.0, 254122.0, 512918.0, 151129.0, 32026.0, 8822.0, 3555.0, 1949.0, 1252.0, 849.0, 636.0, 483.0, 362.0, 264.0, 227.0, 153.0, 110.0, 86.0, 72.0, 52.0, 45.0, 30.0, 29.0, 21.0, 8.0, 10.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-19.40625, -18.823974609375, -18.24169921875, -17.659423828125, -17.0771484375, -16.494873046875, -15.91259765625, -15.330322265625, -14.748046875, -14.165771484375, -13.58349609375, -13.001220703125, -12.4189453125, -11.836669921875, -11.25439453125, -10.672119140625, -10.08984375, -9.507568359375, -8.92529296875, -8.343017578125, -7.7607421875, -7.178466796875, -6.59619140625, -6.013916015625, -5.431640625, -4.849365234375, -4.26708984375, -3.684814453125, -3.1025390625, -2.520263671875, -1.93798828125, -1.355712890625, -0.7734375, -0.191162109375, 0.39111328125, 0.973388671875, 1.5556640625, 2.137939453125, 2.72021484375, 3.302490234375, 3.884765625, 4.467041015625, 5.04931640625, 5.631591796875, 6.2138671875, 6.796142578125, 7.37841796875, 7.960693359375, 8.54296875, 9.125244140625, 9.70751953125, 10.289794921875, 10.8720703125, 11.454345703125, 12.03662109375, 12.618896484375, 13.201171875, 13.783447265625, 14.36572265625, 14.947998046875, 15.5302734375, 16.112548828125, 16.69482421875, 17.277099609375, 17.859375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 16.0, 6.0, 15.0, 15.0, 12.0, 24.0, 30.0, 32.0, 46.0, 62.0, 67.0, 80.0, 134.0, 376.0, 1524.0, 161.0, 108.0, 66.0, 50.0, 39.0, 45.0, 40.0, 25.0, 20.0, 18.0, 12.0, 6.0, 3.0, 9.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.3125, -45.96435546875, -44.6162109375, -43.26806640625, -41.919921875, -40.57177734375, -39.2236328125, -37.87548828125, -36.52734375, -35.17919921875, -33.8310546875, -32.48291015625, -31.134765625, -29.78662109375, -28.4384765625, -27.09033203125, -25.7421875, -24.39404296875, -23.0458984375, -21.69775390625, -20.349609375, -19.00146484375, -17.6533203125, -16.30517578125, -14.95703125, -13.60888671875, -12.2607421875, -10.91259765625, -9.564453125, -8.21630859375, -6.8681640625, -5.52001953125, -4.171875, -2.82373046875, -1.4755859375, -0.12744140625, 1.220703125, 2.56884765625, 3.9169921875, 5.26513671875, 6.61328125, 7.96142578125, 9.3095703125, 10.65771484375, 12.005859375, 13.35400390625, 14.7021484375, 16.05029296875, 17.3984375, 18.74658203125, 20.0947265625, 21.44287109375, 22.791015625, 24.13916015625, 25.4873046875, 26.83544921875, 28.18359375, 29.53173828125, 30.8798828125, 32.22802734375, 33.576171875, 34.92431640625, 36.2724609375, 37.62060546875, 38.96875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 7.0, 8.0, 17.0, 11.0, 25.0, 29.0, 33.0, 36.0, 45.0, 65.0, 92.0, 176.0, 316.0, 554.0, 1395.0, 66426.0, 3071952.0, 2714.0, 769.0, 366.0, 223.0, 123.0, 81.0, 60.0, 39.0, 30.0, 26.0, 24.0, 15.0, 8.0, 8.0, 2.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-130.875, -126.93359375, -122.9921875, -119.05078125, -115.109375, -111.16796875, -107.2265625, -103.28515625, -99.34375, -95.40234375, -91.4609375, -87.51953125, -83.578125, -79.63671875, -75.6953125, -71.75390625, -67.8125, -63.87109375, -59.9296875, -55.98828125, -52.046875, -48.10546875, -44.1640625, -40.22265625, -36.28125, -32.33984375, -28.3984375, -24.45703125, -20.515625, -16.57421875, -12.6328125, -8.69140625, -4.75, -0.80859375, 3.1328125, 7.07421875, 11.015625, 14.95703125, 18.8984375, 22.83984375, 26.78125, 30.72265625, 34.6640625, 38.60546875, 42.546875, 46.48828125, 50.4296875, 54.37109375, 58.3125, 62.25390625, 66.1953125, 70.13671875, 74.078125, 78.01953125, 81.9609375, 85.90234375, 89.84375, 93.78515625, 97.7265625, 101.66796875, 105.609375, 109.55078125, 113.4921875, 117.43359375, 121.375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 10.0, 31.0, 107.0, 270.0, 336.0, 180.0, 52.0, 17.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-194.27806091308594, -190.63124084472656, -186.9844207763672, -183.33758544921875, -179.69076538085938, -176.0439453125, -172.39712524414062, -168.75030517578125, -165.10348510742188, -161.4566650390625, -157.80984497070312, -154.16302490234375, -150.5161895751953, -146.86936950683594, -143.22254943847656, -139.5757293701172, -135.92889404296875, -132.28207397460938, -128.63525390625, -124.9884262084961, -121.34160614013672, -117.69477844238281, -114.04795837402344, -110.40113830566406, -106.75431823730469, -103.10749816894531, -99.4606704711914, -95.81385040283203, -92.16703033447266, -88.52020263671875, -84.87338256835938, -81.2265625, -77.57974243164062, -73.93292236328125, -70.28609466552734, -66.63927459716797, -62.992454528808594, -59.34563064575195, -55.69880676269531, -52.05198669433594, -48.40515899658203, -44.75833511352539, -41.111515045166016, -37.464691162109375, -33.81787109375, -30.17104721069336, -26.52422332763672, -22.87740135192871, -19.230579376220703, -15.583757400512695, -11.936934471130371, -8.290111541748047, -4.643289566040039, -0.9964675903320312, 2.6503562927246094, 6.297178268432617, 9.944000244140625, 13.590822219848633, 17.23764419555664, 20.88446807861328, 24.53129005432129, 28.178112030029297, 31.824935913085938, 35.47175598144531, 39.11857986450195]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 4.0, 5.0, 17.0, 10.0, 15.0, 21.0, 19.0, 21.0, 29.0, 25.0, 29.0, 25.0, 29.0, 32.0, 29.0, 31.0, 37.0, 48.0, 38.0, 22.0, 52.0, 41.0, 37.0, 33.0, 41.0, 40.0, 30.0, 30.0, 22.0, 30.0, 24.0, 20.0, 26.0, 16.0, 15.0, 7.0, 9.0, 7.0, 4.0, 4.0, 3.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-94.528564453125, -91.73275756835938, -88.93695831298828, -86.14115142822266, -83.34535217285156, -80.54954528808594, -77.75374603271484, -74.95793914794922, -72.16213989257812, -69.3663330078125, -66.5705337524414, -63.77473068237305, -60.97892761230469, -58.18312454223633, -55.38732147216797, -52.591514587402344, -49.795711517333984, -46.999908447265625, -44.204105377197266, -41.408302307128906, -38.61249923706055, -35.81669616699219, -33.02088928222656, -30.225088119506836, -27.429285049438477, -24.633481979370117, -21.837678909301758, -19.041873931884766, -16.246070861816406, -13.450268745422363, -10.654464721679688, -7.858661651611328, -5.062858581542969, -2.2670552730560303, 0.5287480354309082, 3.324551582336426, 6.120354652404785, 8.916157722473145, 11.71196174621582, 14.50776481628418, 17.30356788635254, 20.0993709564209, 22.895174026489258, 25.69097900390625, 28.48678207397461, 31.28258514404297, 34.07838821411133, 36.87419128417969, 39.66999435424805, 42.465797424316406, 45.261600494384766, 48.057403564453125, 50.853206634521484, 53.649009704589844, 56.44481658935547, 59.24061584472656, 62.03642272949219, 64.83222961425781, 67.6280288696289, 70.42383575439453, 73.21963500976562, 76.01544189453125, 78.81124114990234, 81.60704803466797, 84.40284729003906]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 6.0, 10.0, 4.0, 5.0, 9.0, 11.0, 12.0, 16.0, 18.0, 17.0, 15.0, 29.0, 30.0, 29.0, 23.0, 39.0, 33.0, 49.0, 44.0, 45.0, 29.0, 29.0, 32.0, 32.0, 34.0, 27.0, 30.0, 33.0, 33.0, 41.0, 29.0, 28.0, 29.0, 20.0, 12.0, 20.0, 15.0, 8.0, 17.0, 10.0, 6.0, 13.0, 4.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-11.125, -10.7886962890625, -10.452392578125, -10.1160888671875, -9.77978515625, -9.4434814453125, -9.107177734375, -8.7708740234375, -8.4345703125, -8.0982666015625, -7.761962890625, -7.4256591796875, -7.08935546875, -6.7530517578125, -6.416748046875, -6.0804443359375, -5.744140625, -5.4078369140625, -5.071533203125, -4.7352294921875, -4.39892578125, -4.0626220703125, -3.726318359375, -3.3900146484375, -3.0537109375, -2.7174072265625, -2.381103515625, -2.0447998046875, -1.70849609375, -1.3721923828125, -1.035888671875, -0.6995849609375, -0.36328125, -0.0269775390625, 0.309326171875, 0.6456298828125, 0.98193359375, 1.3182373046875, 1.654541015625, 1.9908447265625, 2.3271484375, 2.6634521484375, 2.999755859375, 3.3360595703125, 3.67236328125, 4.0086669921875, 4.344970703125, 4.6812744140625, 5.017578125, 5.3538818359375, 5.690185546875, 6.0264892578125, 6.36279296875, 6.6990966796875, 7.035400390625, 7.3717041015625, 7.7080078125, 8.0443115234375, 8.380615234375, 8.7169189453125, 9.05322265625, 9.3895263671875, 9.725830078125, 10.0621337890625, 10.3984375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 10.0, 5.0, 6.0, 21.0, 12.0, 19.0, 23.0, 38.0, 27.0, 53.0, 53.0, 64.0, 87.0, 107.0, 165.0, 226.0, 535.0, 1460.0, 4500.0, 25185.0, 665233.0, 3164020.0, 311178.0, 15416.0, 3402.0, 1120.0, 436.0, 238.0, 149.0, 119.0, 75.0, 66.0, 46.0, 54.0, 31.0, 18.0, 21.0, 15.0, 12.0, 13.0, 8.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.421875, -29.311279296875, -28.20068359375, -27.090087890625, -25.9794921875, -24.868896484375, -23.75830078125, -22.647705078125, -21.537109375, -20.426513671875, -19.31591796875, -18.205322265625, -17.0947265625, -15.984130859375, -14.87353515625, -13.762939453125, -12.65234375, -11.541748046875, -10.43115234375, -9.320556640625, -8.2099609375, -7.099365234375, -5.98876953125, -4.878173828125, -3.767578125, -2.656982421875, -1.54638671875, -0.435791015625, 0.6748046875, 1.785400390625, 2.89599609375, 4.006591796875, 5.1171875, 6.227783203125, 7.33837890625, 8.448974609375, 9.5595703125, 10.670166015625, 11.78076171875, 12.891357421875, 14.001953125, 15.112548828125, 16.22314453125, 17.333740234375, 18.4443359375, 19.554931640625, 20.66552734375, 21.776123046875, 22.88671875, 23.997314453125, 25.10791015625, 26.218505859375, 27.3291015625, 28.439697265625, 29.55029296875, 30.660888671875, 31.771484375, 32.882080078125, 33.99267578125, 35.103271484375, 36.2138671875, 37.324462890625, 38.43505859375, 39.545654296875, 40.65625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 11.0, 20.0, 12.0, 22.0, 32.0, 35.0, 50.0, 51.0, 82.0, 108.0, 135.0, 159.0, 212.0, 275.0, 356.0, 454.0, 479.0, 340.0, 265.0, 216.0, 137.0, 138.0, 105.0, 78.0, 66.0, 36.0, 36.0, 32.0, 24.0, 14.0, 17.0, 15.0, 9.0, 9.0, 0.0, 1.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-17.875, -17.332275390625, -16.78955078125, -16.246826171875, -15.7041015625, -15.161376953125, -14.61865234375, -14.075927734375, -13.533203125, -12.990478515625, -12.44775390625, -11.905029296875, -11.3623046875, -10.819580078125, -10.27685546875, -9.734130859375, -9.19140625, -8.648681640625, -8.10595703125, -7.563232421875, -7.0205078125, -6.477783203125, -5.93505859375, -5.392333984375, -4.849609375, -4.306884765625, -3.76416015625, -3.221435546875, -2.6787109375, -2.135986328125, -1.59326171875, -1.050537109375, -0.5078125, 0.034912109375, 0.57763671875, 1.120361328125, 1.6630859375, 2.205810546875, 2.74853515625, 3.291259765625, 3.833984375, 4.376708984375, 4.91943359375, 5.462158203125, 6.0048828125, 6.547607421875, 7.09033203125, 7.633056640625, 8.17578125, 8.718505859375, 9.26123046875, 9.803955078125, 10.3466796875, 10.889404296875, 11.43212890625, 11.974853515625, 12.517578125, 13.060302734375, 13.60302734375, 14.145751953125, 14.6884765625, 15.231201171875, 15.77392578125, 16.316650390625, 16.859375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 11.0, 10.0, 13.0, 23.0, 23.0, 37.0, 52.0, 89.0, 141.0, 203.0, 432.0, 1010.0, 3062.0, 28286.0, 3071853.0, 1070112.0, 14948.0, 2313.0, 780.0, 358.0, 186.0, 107.0, 61.0, 43.0, 38.0, 25.0, 17.0, 16.0, 10.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.71875, -44.84228515625, -42.9658203125, -41.08935546875, -39.212890625, -37.33642578125, -35.4599609375, -33.58349609375, -31.70703125, -29.83056640625, -27.9541015625, -26.07763671875, -24.201171875, -22.32470703125, -20.4482421875, -18.57177734375, -16.6953125, -14.81884765625, -12.9423828125, -11.06591796875, -9.189453125, -7.31298828125, -5.4365234375, -3.56005859375, -1.68359375, 0.19287109375, 2.0693359375, 3.94580078125, 5.822265625, 7.69873046875, 9.5751953125, 11.45166015625, 13.328125, 15.20458984375, 17.0810546875, 18.95751953125, 20.833984375, 22.71044921875, 24.5869140625, 26.46337890625, 28.33984375, 30.21630859375, 32.0927734375, 33.96923828125, 35.845703125, 37.72216796875, 39.5986328125, 41.47509765625, 43.3515625, 45.22802734375, 47.1044921875, 48.98095703125, 50.857421875, 52.73388671875, 54.6103515625, 56.48681640625, 58.36328125, 60.23974609375, 62.1162109375, 63.99267578125, 65.869140625, 67.74560546875, 69.6220703125, 71.49853515625, 73.375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 102.0, 836.0, 77.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-833.9146118164062, -812.7756958007812, -791.6367797851562, -770.4978637695312, -749.3589477539062, -728.2200317382812, -707.0811157226562, -685.9421997070312, -664.8032836914062, -643.6643676757812, -622.5254516601562, -601.3865356445312, -580.2476196289062, -559.1087036132812, -537.9697875976562, -516.8308715820312, -495.69195556640625, -474.55303955078125, -453.41412353515625, -432.27520751953125, -411.13629150390625, -389.99737548828125, -368.85845947265625, -347.71954345703125, -326.58062744140625, -305.44171142578125, -284.30279541015625, -263.16387939453125, -242.02496337890625, -220.88604736328125, -199.74713134765625, -178.60821533203125, -157.4693603515625, -136.3304443359375, -115.1915283203125, -94.0526123046875, -72.9136962890625, -51.7747802734375, -30.6358642578125, -9.4969482421875, 11.6419677734375, 32.7808837890625, 53.9197998046875, 75.0587158203125, 96.1976318359375, 117.3365478515625, 138.4754638671875, 159.6143798828125, 180.7532958984375, 201.8922119140625, 223.0311279296875, 244.1700439453125, 265.3089599609375, 286.4478759765625, 307.5867919921875, 328.7257080078125, 349.8646240234375, 371.0035400390625, 392.1424560546875, 413.2813720703125, 434.4202880859375, 455.5592041015625, 476.6981201171875, 497.8370361328125, 518.9759521484375]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 6.0, 5.0, 8.0, 7.0, 11.0, 9.0, 10.0, 20.0, 18.0, 14.0, 28.0, 29.0, 15.0, 31.0, 27.0, 33.0, 43.0, 41.0, 27.0, 39.0, 48.0, 42.0, 41.0, 35.0, 33.0, 37.0, 43.0, 40.0, 32.0, 28.0, 21.0, 27.0, 19.0, 23.0, 24.0, 17.0, 12.0, 8.0, 13.0, 8.0, 8.0, 4.0, 2.0, 4.0, 7.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-75.9619140625, -73.80117797851562, -71.64043426513672, -69.47969818115234, -67.31895446777344, -65.15821838378906, -62.99747848510742, -60.83673858642578, -58.67599868774414, -56.5152587890625, -54.35451889038086, -52.19377899169922, -50.033042907714844, -47.87229919433594, -45.71156311035156, -43.55082321166992, -41.39008331298828, -39.22934341430664, -37.068603515625, -34.90786361694336, -32.74712371826172, -30.58638572692871, -28.425647735595703, -26.264907836914062, -24.104167938232422, -21.94342803955078, -19.78268814086914, -17.621950149536133, -15.461210250854492, -13.300470352172852, -11.139731407165527, -8.978992462158203, -6.8182525634765625, -4.65751314163208, -2.4967737197875977, -0.33603429794311523, 1.8247051239013672, 3.985445022583008, 6.146183967590332, 8.306922912597656, 10.467662811279297, 12.628402709960938, 14.789141654968262, 16.949880599975586, 19.110620498657227, 21.271360397338867, 23.432098388671875, 25.592838287353516, 27.753578186035156, 29.914318084716797, 32.07505798339844, 34.23579788208008, 36.39653778076172, 38.557273864746094, 40.718013763427734, 42.878753662109375, 45.039493560791016, 47.200233459472656, 49.3609733581543, 51.52171325683594, 53.68244934082031, 55.84319305419922, 58.003929138183594, 60.164669036865234, 62.325408935546875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 3.0, 7.0, 8.0, 12.0, 10.0, 8.0, 22.0, 20.0, 29.0, 26.0, 30.0, 31.0, 41.0, 31.0, 40.0, 37.0, 39.0, 33.0, 46.0, 45.0, 34.0, 32.0, 44.0, 43.0, 29.0, 39.0, 30.0, 26.0, 37.0, 24.0, 16.0, 22.0, 12.0, 7.0, 19.0, 15.0, 14.0, 4.0, 6.0, 7.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.9375, -9.6417236328125, -9.345947265625, -9.0501708984375, -8.75439453125, -8.4586181640625, -8.162841796875, -7.8670654296875, -7.5712890625, -7.2755126953125, -6.979736328125, -6.6839599609375, -6.38818359375, -6.0924072265625, -5.796630859375, -5.5008544921875, -5.205078125, -4.9093017578125, -4.613525390625, -4.3177490234375, -4.02197265625, -3.7261962890625, -3.430419921875, -3.1346435546875, -2.8388671875, -2.5430908203125, -2.247314453125, -1.9515380859375, -1.65576171875, -1.3599853515625, -1.064208984375, -0.7684326171875, -0.47265625, -0.1768798828125, 0.118896484375, 0.4146728515625, 0.71044921875, 1.0062255859375, 1.302001953125, 1.5977783203125, 1.8935546875, 2.1893310546875, 2.485107421875, 2.7808837890625, 3.07666015625, 3.3724365234375, 3.668212890625, 3.9639892578125, 4.259765625, 4.5555419921875, 4.851318359375, 5.1470947265625, 5.44287109375, 5.7386474609375, 6.034423828125, 6.3302001953125, 6.6259765625, 6.9217529296875, 7.217529296875, 7.5133056640625, 7.80908203125, 8.1048583984375, 8.400634765625, 8.6964111328125, 8.9921875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 13.0, 12.0, 20.0, 29.0, 40.0, 82.0, 104.0, 175.0, 245.0, 404.0, 623.0, 1020.0, 1581.0, 2614.0, 4065.0, 6331.0, 10218.0, 16441.0, 26975.0, 44604.0, 76582.0, 141068.0, 322343.0, 171594.0, 89294.0, 51634.0, 30873.0, 18766.0, 11308.0, 7305.0, 4446.0, 2909.0, 1706.0, 1128.0, 716.0, 443.0, 268.0, 215.0, 122.0, 77.0, 54.0, 38.0, 21.0, 17.0, 8.0, 11.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.294921875, -2.2266845703125, -2.158447265625, -2.0902099609375, -2.02197265625, -1.9537353515625, -1.885498046875, -1.8172607421875, -1.7490234375, -1.6807861328125, -1.612548828125, -1.5443115234375, -1.47607421875, -1.4078369140625, -1.339599609375, -1.2713623046875, -1.203125, -1.1348876953125, -1.066650390625, -0.9984130859375, -0.93017578125, -0.8619384765625, -0.793701171875, -0.7254638671875, -0.6572265625, -0.5889892578125, -0.520751953125, -0.4525146484375, -0.38427734375, -0.3160400390625, -0.247802734375, -0.1795654296875, -0.111328125, -0.0430908203125, 0.025146484375, 0.0933837890625, 0.16162109375, 0.2298583984375, 0.298095703125, 0.3663330078125, 0.4345703125, 0.5028076171875, 0.571044921875, 0.6392822265625, 0.70751953125, 0.7757568359375, 0.843994140625, 0.9122314453125, 0.98046875, 1.0487060546875, 1.116943359375, 1.1851806640625, 1.25341796875, 1.3216552734375, 1.389892578125, 1.4581298828125, 1.5263671875, 1.5946044921875, 1.662841796875, 1.7310791015625, 1.79931640625, 1.8675537109375, 1.935791015625, 2.0040283203125, 2.072265625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 4.0, 11.0, 17.0, 21.0, 18.0, 17.0, 25.0, 28.0, 23.0, 22.0, 46.0, 35.0, 43.0, 40.0, 52.0, 53.0, 1065.0, 47.0, 41.0, 47.0, 40.0, 36.0, 38.0, 36.0, 29.0, 32.0, 30.0, 23.0, 26.0, 25.0, 10.0, 11.0, 6.0, 3.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.52734375, -7.3179931640625, -7.108642578125, -6.8992919921875, -6.68994140625, -6.4805908203125, -6.271240234375, -6.0618896484375, -5.8525390625, -5.6431884765625, -5.433837890625, -5.2244873046875, -5.01513671875, -4.8057861328125, -4.596435546875, -4.3870849609375, -4.177734375, -3.9683837890625, -3.759033203125, -3.5496826171875, -3.34033203125, -3.1309814453125, -2.921630859375, -2.7122802734375, -2.5029296875, -2.2935791015625, -2.084228515625, -1.8748779296875, -1.66552734375, -1.4561767578125, -1.246826171875, -1.0374755859375, -0.828125, -0.6187744140625, -0.409423828125, -0.2000732421875, 0.00927734375, 0.2186279296875, 0.427978515625, 0.6373291015625, 0.8466796875, 1.0560302734375, 1.265380859375, 1.4747314453125, 1.68408203125, 1.8934326171875, 2.102783203125, 2.3121337890625, 2.521484375, 2.7308349609375, 2.940185546875, 3.1495361328125, 3.35888671875, 3.5682373046875, 3.777587890625, 3.9869384765625, 4.1962890625, 4.4056396484375, 4.614990234375, 4.8243408203125, 5.03369140625, 5.2430419921875, 5.452392578125, 5.6617431640625, 5.87109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 10.0, 14.0, 17.0, 23.0, 42.0, 81.0, 103.0, 182.0, 250.0, 445.0, 749.0, 1228.0, 2076.0, 3671.0, 6327.0, 10784.0, 18246.0, 32165.0, 57917.0, 111638.0, 1374514.0, 255263.0, 99402.0, 51950.0, 29148.0, 17027.0, 9869.0, 5742.0, 3361.0, 1997.0, 1087.0, 705.0, 413.0, 264.0, 151.0, 99.0, 60.0, 28.0, 31.0, 17.0, 12.0, 11.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.623046875, -2.550018310546875, -2.47698974609375, -2.403961181640625, -2.3309326171875, -2.257904052734375, -2.18487548828125, -2.111846923828125, -2.038818359375, -1.965789794921875, -1.89276123046875, -1.819732666015625, -1.7467041015625, -1.673675537109375, -1.60064697265625, -1.527618408203125, -1.45458984375, -1.381561279296875, -1.30853271484375, -1.235504150390625, -1.1624755859375, -1.089447021484375, -1.01641845703125, -0.943389892578125, -0.870361328125, -0.797332763671875, -0.72430419921875, -0.651275634765625, -0.5782470703125, -0.505218505859375, -0.43218994140625, -0.359161376953125, -0.2861328125, -0.213104248046875, -0.14007568359375, -0.067047119140625, 0.0059814453125, 0.079010009765625, 0.15203857421875, 0.225067138671875, 0.298095703125, 0.371124267578125, 0.44415283203125, 0.517181396484375, 0.5902099609375, 0.663238525390625, 0.73626708984375, 0.809295654296875, 0.88232421875, 0.955352783203125, 1.02838134765625, 1.101409912109375, 1.1744384765625, 1.247467041015625, 1.32049560546875, 1.393524169921875, 1.466552734375, 1.539581298828125, 1.61260986328125, 1.685638427734375, 1.7586669921875, 1.831695556640625, 1.90472412109375, 1.977752685546875, 2.05078125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 4.0, 14.0, 11.0, 13.0, 17.0, 22.0, 21.0, 22.0, 31.0, 36.0, 39.0, 72.0, 82.0, 109.0, 93.0, 79.0, 72.0, 54.0, 41.0, 28.0, 12.0, 27.0, 17.0, 13.0, 13.0, 7.0, 6.0, 9.0, 2.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012607574462890625, -0.0012213587760925293, -0.001181960105895996, -0.0011425614356994629, -0.0011031627655029297, -0.0010637640953063965, -0.0010243654251098633, -0.00098496675491333, -0.0009455680847167969, -0.0009061694145202637, -0.0008667707443237305, -0.0008273720741271973, -0.0007879734039306641, -0.0007485747337341309, -0.0007091760635375977, -0.0006697773933410645, -0.0006303787231445312, -0.000590980052947998, -0.0005515813827514648, -0.0005121827125549316, -0.00047278404235839844, -0.00043338537216186523, -0.00039398670196533203, -0.00035458803176879883, -0.0003151893615722656, -0.0002757906913757324, -0.00023639202117919922, -0.00019699335098266602, -0.0001575946807861328, -0.00011819601058959961, -7.87973403930664e-05, -3.93986701965332e-05, 0.0, 3.93986701965332e-05, 7.87973403930664e-05, 0.00011819601058959961, 0.0001575946807861328, 0.00019699335098266602, 0.00023639202117919922, 0.0002757906913757324, 0.0003151893615722656, 0.00035458803176879883, 0.00039398670196533203, 0.00043338537216186523, 0.00047278404235839844, 0.0005121827125549316, 0.0005515813827514648, 0.000590980052947998, 0.0006303787231445312, 0.0006697773933410645, 0.0007091760635375977, 0.0007485747337341309, 0.0007879734039306641, 0.0008273720741271973, 0.0008667707443237305, 0.0009061694145202637, 0.0009455680847167969, 0.00098496675491333, 0.0010243654251098633, 0.0010637640953063965, 0.0011031627655029297, 0.0011425614356994629, 0.001181960105895996, 0.0012213587760925293, 0.0012607574462890625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 11.0, 12.0, 13.0, 13.0, 19.0, 25.0, 23.0, 36.0, 56.0, 86.0, 123.0, 165.0, 283.0, 516.0, 1256.0, 742587.0, 300848.0, 1115.0, 490.0, 249.0, 177.0, 117.0, 74.0, 65.0, 43.0, 40.0, 28.0, 20.0, 14.0, 14.0, 5.0, 6.0, 4.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.032073974609375, -0.031206130981445312, -0.030338287353515625, -0.029470443725585938, -0.02860260009765625, -0.027734756469726562, -0.026866912841796875, -0.025999069213867188, -0.0251312255859375, -0.024263381958007812, -0.023395538330078125, -0.022527694702148438, -0.02165985107421875, -0.020792007446289062, -0.019924163818359375, -0.019056320190429688, -0.0181884765625, -0.017320632934570312, -0.016452789306640625, -0.015584945678710938, -0.01471710205078125, -0.013849258422851562, -0.012981414794921875, -0.012113571166992188, -0.0112457275390625, -0.010377883911132812, -0.009510040283203125, -0.008642196655273438, -0.00777435302734375, -0.0069065093994140625, -0.006038665771484375, -0.0051708221435546875, -0.004302978515625, -0.0034351348876953125, -0.002567291259765625, -0.0016994476318359375, -0.00083160400390625, 3.62396240234375e-05, 0.000904083251953125, 0.0017719268798828125, 0.0026397705078125, 0.0035076141357421875, 0.004375457763671875, 0.0052433013916015625, 0.00611114501953125, 0.0069789886474609375, 0.007846832275390625, 0.008714675903320312, 0.00958251953125, 0.010450363159179688, 0.011318206787109375, 0.012186050415039062, 0.01305389404296875, 0.013921737670898438, 0.014789581298828125, 0.015657424926757812, 0.0165252685546875, 0.017393112182617188, 0.018260955810546875, 0.019128799438476562, 0.01999664306640625, 0.020864486694335938, 0.021732330322265625, 0.022600173950195312, 0.023468017578125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 12.0, 25.0, 69.0, 149.0, 226.0, 247.0, 159.0, 62.0, 40.0, 7.0, 12.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007082309457473457, -0.0006711359019391239, -0.000634040858130902, -0.0005969458725303411, -0.0005598508287221193, -0.0005227557849138975, -0.0004856607411056757, -0.00044856572640128434, -0.0004114706825930625, -0.0003743756387848407, -0.00033728062408044934, -0.0003001855802722275, -0.0002630905364640057, -0.00022599552175961435, -0.00018890047795139253, -0.00015180546324700117, -0.00011471041943877935, -7.761539018247277e-05, -4.052035365020856e-05, -3.4253171179443598e-06, 3.366971213836223e-05, 7.076474139466882e-05, 0.00010785978520289063, 0.000144954799907282, 0.0001820498437155038, 0.0002191448729718104, 0.000256239902228117, 0.0002933349460363388, 0.0003304299898445606, 0.000367525004548952, 0.0004046200483571738, 0.00044171506306156516, 0.00047881004866212606, 0.0005159050924703479, 0.0005530001362785697, 0.0005900951800867915, 0.0006271901656873524, 0.0006642852094955742, 0.000701380253303796, 0.000738475238904357, 0.0007755702827125788, 0.0008126653265208006, 0.0008497603703290224, 0.0008868554141372442, 0.0009239503997378051, 0.0009610454435460269, 0.0009981405455619097, 0.0010352354729548097, 0.0010723306331783533, 0.0011094256769865751, 0.001146520720794797, 0.0011836157646030188, 0.0012207108084112406, 0.0012578058522194624, 0.0012949008960276842, 0.0013319958234205842, 0.001369090867228806, 0.0014061859110370278, 0.0014432809548452497, 0.0014803759986534715, 0.0015174710424616933, 0.0015545659698545933, 0.001591661013662815, 0.001628756057471037, 0.0016658511012792587]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 7.0, 6.0, 7.0, 7.0, 11.0, 18.0, 15.0, 28.0, 20.0, 19.0, 30.0, 28.0, 35.0, 20.0, 31.0, 24.0, 44.0, 34.0, 58.0, 49.0, 38.0, 40.0, 42.0, 36.0, 37.0, 43.0, 21.0, 33.0, 34.0, 23.0, 26.0, 20.0, 20.0, 19.0, 22.0, 9.0, 4.0, 8.0, 4.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0005674958229064941, -0.0005499254912137985, -0.0005323551595211029, -0.0005147848278284073, -0.0004972144961357117, -0.00047964416444301605, -0.00046207383275032043, -0.0004445035010576248, -0.0004269331693649292, -0.0004093628376722336, -0.00039179250597953796, -0.00037422217428684235, -0.00035665184259414673, -0.0003390815109014511, -0.0003215111792087555, -0.0003039408475160599, -0.00028637051582336426, -0.00026880018413066864, -0.000251229852437973, -0.0002336595207452774, -0.0002160891890525818, -0.00019851885735988617, -0.00018094852566719055, -0.00016337819397449493, -0.00014580786228179932, -0.0001282375305891037, -0.00011066719889640808, -9.309686720371246e-05, -7.552653551101685e-05, -5.795620381832123e-05, -4.038587212562561e-05, -2.2815540432929993e-05, -5.245208740234375e-06, 1.2325122952461243e-05, 2.989545464515686e-05, 4.746578633785248e-05, 6.50361180305481e-05, 8.260644972324371e-05, 0.00010017678141593933, 0.00011774711310863495, 0.00013531744480133057, 0.00015288777649402618, 0.0001704581081867218, 0.00018802843987941742, 0.00020559877157211304, 0.00022316910326480865, 0.00024073943495750427, 0.0002583097666501999, 0.0002758800983428955, 0.0002934504300355911, 0.00031102076172828674, 0.00032859109342098236, 0.000346161425113678, 0.0003637317568063736, 0.0003813020884990692, 0.00039887242019176483, 0.00041644275188446045, 0.00043401308357715607, 0.0004515834152698517, 0.0004691537469625473, 0.0004867240786552429, 0.0005042944103479385, 0.0005218647420406342, 0.0005394350737333298, 0.0005570054054260254]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 3.0, 7.0, 8.0, 12.0, 10.0, 8.0, 22.0, 20.0, 29.0, 26.0, 30.0, 31.0, 41.0, 31.0, 40.0, 37.0, 39.0, 34.0, 45.0, 45.0, 35.0, 32.0, 43.0, 43.0, 30.0, 38.0, 30.0, 27.0, 37.0, 23.0, 16.0, 22.0, 13.0, 6.0, 19.0, 17.0, 12.0, 4.0, 6.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.9375, -9.6416015625, -9.345703125, -9.0498046875, -8.75390625, -8.4580078125, -8.162109375, -7.8662109375, -7.5703125, -7.2744140625, -6.978515625, -6.6826171875, -6.38671875, -6.0908203125, -5.794921875, -5.4990234375, -5.203125, -4.9072265625, -4.611328125, -4.3154296875, -4.01953125, -3.7236328125, -3.427734375, -3.1318359375, -2.8359375, -2.5400390625, -2.244140625, -1.9482421875, -1.65234375, -1.3564453125, -1.060546875, -0.7646484375, -0.46875, -0.1728515625, 0.123046875, 0.4189453125, 0.71484375, 1.0107421875, 1.306640625, 1.6025390625, 1.8984375, 2.1943359375, 2.490234375, 2.7861328125, 3.08203125, 3.3779296875, 3.673828125, 3.9697265625, 4.265625, 4.5615234375, 4.857421875, 5.1533203125, 5.44921875, 5.7451171875, 6.041015625, 6.3369140625, 6.6328125, 6.9287109375, 7.224609375, 7.5205078125, 7.81640625, 8.1123046875, 8.408203125, 8.7041015625, 9.0]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 6.0, 12.0, 18.0, 24.0, 30.0, 40.0, 57.0, 86.0, 104.0, 168.0, 210.0, 311.0, 420.0, 576.0, 818.0, 1201.0, 1789.0, 3075.0, 6211.0, 19166.0, 115386.0, 641382.0, 209791.0, 29302.0, 8048.0, 3638.0, 2122.0, 1360.0, 888.0, 670.0, 449.0, 334.0, 242.0, 179.0, 126.0, 95.0, 60.0, 35.0, 28.0, 29.0, 13.0, 15.0, 10.0, 8.0, 8.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.0, -21.3046875, -20.609375, -19.9140625, -19.21875, -18.5234375, -17.828125, -17.1328125, -16.4375, -15.7421875, -15.046875, -14.3515625, -13.65625, -12.9609375, -12.265625, -11.5703125, -10.875, -10.1796875, -9.484375, -8.7890625, -8.09375, -7.3984375, -6.703125, -6.0078125, -5.3125, -4.6171875, -3.921875, -3.2265625, -2.53125, -1.8359375, -1.140625, -0.4453125, 0.25, 0.9453125, 1.640625, 2.3359375, 3.03125, 3.7265625, 4.421875, 5.1171875, 5.8125, 6.5078125, 7.203125, 7.8984375, 8.59375, 9.2890625, 9.984375, 10.6796875, 11.375, 12.0703125, 12.765625, 13.4609375, 14.15625, 14.8515625, 15.546875, 16.2421875, 16.9375, 17.6328125, 18.328125, 19.0234375, 19.71875, 20.4140625, 21.109375, 21.8046875, 22.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 2.0, 4.0, 7.0, 12.0, 18.0, 20.0, 24.0, 24.0, 46.0, 56.0, 65.0, 85.0, 186.0, 1737.0, 301.0, 112.0, 63.0, 68.0, 47.0, 43.0, 38.0, 18.0, 15.0, 10.0, 9.0, 11.0, 10.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.40625, -33.2060546875, -32.005859375, -30.8056640625, -29.60546875, -28.4052734375, -27.205078125, -26.0048828125, -24.8046875, -23.6044921875, -22.404296875, -21.2041015625, -20.00390625, -18.8037109375, -17.603515625, -16.4033203125, -15.203125, -14.0029296875, -12.802734375, -11.6025390625, -10.40234375, -9.2021484375, -8.001953125, -6.8017578125, -5.6015625, -4.4013671875, -3.201171875, -2.0009765625, -0.80078125, 0.3994140625, 1.599609375, 2.7998046875, 4.0, 5.2001953125, 6.400390625, 7.6005859375, 8.80078125, 10.0009765625, 11.201171875, 12.4013671875, 13.6015625, 14.8017578125, 16.001953125, 17.2021484375, 18.40234375, 19.6025390625, 20.802734375, 22.0029296875, 23.203125, 24.4033203125, 25.603515625, 26.8037109375, 28.00390625, 29.2041015625, 30.404296875, 31.6044921875, 32.8046875, 34.0048828125, 35.205078125, 36.4052734375, 37.60546875, 38.8056640625, 40.005859375, 41.2060546875, 42.40625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 8.0, 11.0, 12.0, 31.0, 28.0, 37.0, 78.0, 115.0, 144.0, 247.0, 565.0, 1974.0, 3082102.0, 58279.0, 1130.0, 382.0, 212.0, 129.0, 75.0, 49.0, 32.0, 31.0, 13.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-127.4375, -123.6708984375, -119.904296875, -116.1376953125, -112.37109375, -108.6044921875, -104.837890625, -101.0712890625, -97.3046875, -93.5380859375, -89.771484375, -86.0048828125, -82.23828125, -78.4716796875, -74.705078125, -70.9384765625, -67.171875, -63.4052734375, -59.638671875, -55.8720703125, -52.10546875, -48.3388671875, -44.572265625, -40.8056640625, -37.0390625, -33.2724609375, -29.505859375, -25.7392578125, -21.97265625, -18.2060546875, -14.439453125, -10.6728515625, -6.90625, -3.1396484375, 0.626953125, 4.3935546875, 8.16015625, 11.9267578125, 15.693359375, 19.4599609375, 23.2265625, 26.9931640625, 30.759765625, 34.5263671875, 38.29296875, 42.0595703125, 45.826171875, 49.5927734375, 53.359375, 57.1259765625, 60.892578125, 64.6591796875, 68.42578125, 72.1923828125, 75.958984375, 79.7255859375, 83.4921875, 87.2587890625, 91.025390625, 94.7919921875, 98.55859375, 102.3251953125, 106.091796875, 109.8583984375, 113.625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 77.0, 408.0, 454.0, 62.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-307.7058410644531, -299.8295593261719, -291.9532470703125, -284.07696533203125, -276.20068359375, -268.32440185546875, -260.4480895996094, -252.57180786132812, -244.69552612304688, -236.81922912597656, -228.9429473876953, -221.066650390625, -213.19036865234375, -205.31407165527344, -197.43777465820312, -189.56149291992188, -181.68519592285156, -173.80889892578125, -165.9326171875, -158.0563201904297, -150.18003845214844, -142.30374145507812, -134.42745971679688, -126.55116271972656, -118.67487335205078, -110.798583984375, -102.92229461669922, -95.04600524902344, -87.16970825195312, -79.29342651367188, -71.41712951660156, -63.54084014892578, -55.66453552246094, -47.788246154785156, -39.911956787109375, -32.03566360473633, -24.159374237060547, -16.283084869384766, -8.406791687011719, -0.5305023193359375, 7.345787048339844, 15.222077369689941, 23.09836769104004, 30.974658966064453, 38.850948333740234, 46.727237701416016, 54.60353088378906, 62.479820251464844, 70.35610961914062, 78.2323989868164, 86.10868835449219, 93.9849853515625, 101.86126708984375, 109.73756408691406, 117.61385345458984, 125.49014282226562, 133.36642456054688, 141.2427215576172, 149.11900329589844, 156.99530029296875, 164.87158203125, 172.7478790283203, 180.62417602539062, 188.50045776367188, 196.3767547607422]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 2.0, 6.0, 9.0, 10.0, 12.0, 10.0, 14.0, 13.0, 11.0, 17.0, 20.0, 26.0, 23.0, 37.0, 27.0, 35.0, 28.0, 28.0, 38.0, 46.0, 33.0, 35.0, 43.0, 40.0, 32.0, 38.0, 38.0, 42.0, 44.0, 37.0, 25.0, 22.0, 31.0, 18.0, 21.0, 16.0, 15.0, 6.0, 7.0, 11.0, 6.0, 5.0, 3.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-83.14376831054688, -80.77043914794922, -78.39710998535156, -76.0237808227539, -73.65045166015625, -71.27713012695312, -68.90379333496094, -66.53047180175781, -64.15714263916016, -61.7838134765625, -59.410484313964844, -57.03715515136719, -54.6638298034668, -52.29050064086914, -49.917171478271484, -47.543846130371094, -45.17051315307617, -42.797183990478516, -40.42385482788086, -38.05052947998047, -35.67720031738281, -33.303871154785156, -30.9305419921875, -28.557214736938477, -26.18388557434082, -23.810556411743164, -21.43722915649414, -19.063899993896484, -16.690570831298828, -14.317243576049805, -11.943914413452148, -9.570587158203125, -7.197257995605469, -4.823929786682129, -2.450601100921631, -0.07727241516113281, 2.296055793762207, 4.669384002685547, 7.042713165283203, 9.416040420532227, 11.789369583129883, 14.162697792053223, 16.536026000976562, 18.90935516357422, 21.282684326171875, 23.6560115814209, 26.029340744018555, 28.402667999267578, 30.775997161865234, 33.14932632446289, 35.52265548706055, 37.89598083496094, 40.269309997558594, 42.64263916015625, 45.015968322753906, 47.38929748535156, 49.76262664794922, 52.135955810546875, 54.50928497314453, 56.88261413574219, 59.25593948364258, 61.629268646240234, 64.00259399414062, 66.37592315673828, 68.74925231933594]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 12.0, 12.0, 20.0, 15.0, 18.0, 17.0, 24.0, 20.0, 29.0, 21.0, 28.0, 37.0, 47.0, 27.0, 46.0, 40.0, 35.0, 36.0, 47.0, 39.0, 40.0, 32.0, 34.0, 24.0, 34.0, 33.0, 34.0, 21.0, 28.0, 20.0, 16.0, 12.0, 12.0, 10.0, 7.0, 9.0, 9.0, 11.0, 9.0, 7.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.53125, -9.2303466796875, -8.929443359375, -8.6285400390625, -8.32763671875, -8.0267333984375, -7.725830078125, -7.4249267578125, -7.1240234375, -6.8231201171875, -6.522216796875, -6.2213134765625, -5.92041015625, -5.6195068359375, -5.318603515625, -5.0177001953125, -4.716796875, -4.4158935546875, -4.114990234375, -3.8140869140625, -3.51318359375, -3.2122802734375, -2.911376953125, -2.6104736328125, -2.3095703125, -2.0086669921875, -1.707763671875, -1.4068603515625, -1.10595703125, -0.8050537109375, -0.504150390625, -0.2032470703125, 0.09765625, 0.3985595703125, 0.699462890625, 1.0003662109375, 1.30126953125, 1.6021728515625, 1.903076171875, 2.2039794921875, 2.5048828125, 2.8057861328125, 3.106689453125, 3.4075927734375, 3.70849609375, 4.0093994140625, 4.310302734375, 4.6112060546875, 4.912109375, 5.2130126953125, 5.513916015625, 5.8148193359375, 6.11572265625, 6.4166259765625, 6.717529296875, 7.0184326171875, 7.3193359375, 7.6202392578125, 7.921142578125, 8.2220458984375, 8.52294921875, 8.8238525390625, 9.124755859375, 9.4256591796875, 9.7265625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 7.0, 8.0, 9.0, 15.0, 30.0, 39.0, 48.0, 73.0, 96.0, 118.0, 172.0, 319.0, 416.0, 697.0, 1142.0, 1989.0, 3734.0, 8079.0, 23092.0, 117522.0, 818443.0, 2235849.0, 825819.0, 117239.0, 22547.0, 7825.0, 3808.0, 1930.0, 1148.0, 704.0, 472.0, 269.0, 196.0, 127.0, 82.0, 59.0, 34.0, 30.0, 25.0, 23.0, 19.0, 13.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.734375, -17.188720703125, -16.64306640625, -16.097412109375, -15.5517578125, -15.006103515625, -14.46044921875, -13.914794921875, -13.369140625, -12.823486328125, -12.27783203125, -11.732177734375, -11.1865234375, -10.640869140625, -10.09521484375, -9.549560546875, -9.00390625, -8.458251953125, -7.91259765625, -7.366943359375, -6.8212890625, -6.275634765625, -5.72998046875, -5.184326171875, -4.638671875, -4.093017578125, -3.54736328125, -3.001708984375, -2.4560546875, -1.910400390625, -1.36474609375, -0.819091796875, -0.2734375, 0.272216796875, 0.81787109375, 1.363525390625, 1.9091796875, 2.454833984375, 3.00048828125, 3.546142578125, 4.091796875, 4.637451171875, 5.18310546875, 5.728759765625, 6.2744140625, 6.820068359375, 7.36572265625, 7.911376953125, 8.45703125, 9.002685546875, 9.54833984375, 10.093994140625, 10.6396484375, 11.185302734375, 11.73095703125, 12.276611328125, 12.822265625, 13.367919921875, 13.91357421875, 14.459228515625, 15.0048828125, 15.550537109375, 16.09619140625, 16.641845703125, 17.1875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 8.0, 13.0, 14.0, 20.0, 27.0, 55.0, 56.0, 77.0, 106.0, 182.0, 274.0, 407.0, 571.0, 598.0, 477.0, 360.0, 229.0, 182.0, 102.0, 92.0, 68.0, 46.0, 35.0, 17.0, 16.0, 6.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.109375, -20.455078125, -19.80078125, -19.146484375, -18.4921875, -17.837890625, -17.18359375, -16.529296875, -15.875, -15.220703125, -14.56640625, -13.912109375, -13.2578125, -12.603515625, -11.94921875, -11.294921875, -10.640625, -9.986328125, -9.33203125, -8.677734375, -8.0234375, -7.369140625, -6.71484375, -6.060546875, -5.40625, -4.751953125, -4.09765625, -3.443359375, -2.7890625, -2.134765625, -1.48046875, -0.826171875, -0.171875, 0.482421875, 1.13671875, 1.791015625, 2.4453125, 3.099609375, 3.75390625, 4.408203125, 5.0625, 5.716796875, 6.37109375, 7.025390625, 7.6796875, 8.333984375, 8.98828125, 9.642578125, 10.296875, 10.951171875, 11.60546875, 12.259765625, 12.9140625, 13.568359375, 14.22265625, 14.876953125, 15.53125, 16.185546875, 16.83984375, 17.494140625, 18.1484375, 18.802734375, 19.45703125, 20.111328125, 20.765625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 15.0, 23.0, 56.0, 108.0, 215.0, 490.0, 1368.0, 9256.0, 4123715.0, 55921.0, 2026.0, 592.0, 230.0, 124.0, 54.0, 32.0, 18.0, 11.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.5, -87.6416015625, -84.783203125, -81.9248046875, -79.06640625, -76.2080078125, -73.349609375, -70.4912109375, -67.6328125, -64.7744140625, -61.916015625, -59.0576171875, -56.19921875, -53.3408203125, -50.482421875, -47.6240234375, -44.765625, -41.9072265625, -39.048828125, -36.1904296875, -33.33203125, -30.4736328125, -27.615234375, -24.7568359375, -21.8984375, -19.0400390625, -16.181640625, -13.3232421875, -10.46484375, -7.6064453125, -4.748046875, -1.8896484375, 0.96875, 3.8271484375, 6.685546875, 9.5439453125, 12.40234375, 15.2607421875, 18.119140625, 20.9775390625, 23.8359375, 26.6943359375, 29.552734375, 32.4111328125, 35.26953125, 38.1279296875, 40.986328125, 43.8447265625, 46.703125, 49.5615234375, 52.419921875, 55.2783203125, 58.13671875, 60.9951171875, 63.853515625, 66.7119140625, 69.5703125, 72.4287109375, 75.287109375, 78.1455078125, 81.00390625, 83.8623046875, 86.720703125, 89.5791015625, 92.4375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 26.0, 405.0, 523.0, 59.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-584.51513671875, -572.3607177734375, -560.206298828125, -548.0519409179688, -535.8975219726562, -523.7431030273438, -511.5887145996094, -499.434326171875, -487.2799072265625, -475.12548828125, -462.9710998535156, -450.81671142578125, -438.66229248046875, -426.50787353515625, -414.3534851074219, -402.1990966796875, -390.044677734375, -377.8902587890625, -365.7358703613281, -353.58148193359375, -341.42706298828125, -329.27264404296875, -317.1182556152344, -304.9638671875, -292.8094482421875, -280.655029296875, -268.5006408691406, -256.34625244140625, -244.19183349609375, -232.0374298095703, -219.88302612304688, -207.72862243652344, -195.57420349121094, -183.4197998046875, -171.26539611816406, -159.11099243164062, -146.9565887451172, -134.80218505859375, -122.64778137207031, -110.49337768554688, -98.33897399902344, -86.1845703125, -74.03016662597656, -61.875762939453125, -49.72135925292969, -37.56695556640625, -25.412551879882812, -13.258148193359375, -1.1037445068359375, 11.0506591796875, 23.205062866210938, 35.359466552734375, 47.51387023925781, 59.66827392578125, 71.82267761230469, 83.97708129882812, 96.13148498535156, 108.285888671875, 120.44029235839844, 132.59469604492188, 144.7490997314453, 156.90350341796875, 169.0579071044922, 181.21231079101562, 193.36671447753906]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 1.0, 2.0, 3.0, 10.0, 8.0, 9.0, 4.0, 7.0, 17.0, 8.0, 16.0, 16.0, 21.0, 22.0, 19.0, 28.0, 36.0, 30.0, 37.0, 38.0, 37.0, 34.0, 52.0, 41.0, 41.0, 44.0, 36.0, 40.0, 28.0, 31.0, 28.0, 28.0, 34.0, 25.0, 26.0, 20.0, 22.0, 21.0, 14.0, 7.0, 14.0, 11.0, 12.0, 4.0, 3.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.023529052734375, -60.97969436645508, -58.93585968017578, -56.89202117919922, -54.84818649291992, -52.804351806640625, -50.76051330566406, -48.716678619384766, -46.67284393310547, -44.62900924682617, -42.585174560546875, -40.54133605957031, -38.497501373291016, -36.45366668701172, -34.409828186035156, -32.36599349975586, -30.322158813476562, -28.278324127197266, -26.234487533569336, -24.190650939941406, -22.14681625366211, -20.102981567382812, -18.059144973754883, -16.015308380126953, -13.971473693847656, -11.927638053894043, -9.88380241394043, -7.839966773986816, -5.796131134033203, -3.75229549407959, -1.7084598541259766, 0.3353757858276367, 2.37921142578125, 4.423047065734863, 6.466882705688477, 8.51071834564209, 10.554553985595703, 12.598389625549316, 14.64222526550293, 16.68606185913086, 18.729896545410156, 20.773731231689453, 22.817567825317383, 24.861404418945312, 26.90523910522461, 28.949073791503906, 30.992910385131836, 33.036746978759766, 35.08058166503906, 37.12441635131836, 39.168251037597656, 41.21208953857422, 43.255924224853516, 45.29975891113281, 47.343597412109375, 49.38743209838867, 51.43126678466797, 53.475101470947266, 55.51893615722656, 57.562774658203125, 59.60660934448242, 61.65044403076172, 63.69428253173828, 65.73811340332031, 67.78195190429688]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 6.0, 7.0, 13.0, 8.0, 14.0, 16.0, 23.0, 29.0, 30.0, 24.0, 26.0, 36.0, 36.0, 42.0, 29.0, 40.0, 43.0, 33.0, 42.0, 42.0, 47.0, 39.0, 42.0, 25.0, 32.0, 44.0, 34.0, 31.0, 27.0, 19.0, 22.0, 14.0, 8.0, 11.0, 9.0, 13.0, 15.0, 3.0, 5.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.7080078125, -8.439453125, -8.1708984375, -7.90234375, -7.6337890625, -7.365234375, -7.0966796875, -6.828125, -6.5595703125, -6.291015625, -6.0224609375, -5.75390625, -5.4853515625, -5.216796875, -4.9482421875, -4.6796875, -4.4111328125, -4.142578125, -3.8740234375, -3.60546875, -3.3369140625, -3.068359375, -2.7998046875, -2.53125, -2.2626953125, -1.994140625, -1.7255859375, -1.45703125, -1.1884765625, -0.919921875, -0.6513671875, -0.3828125, -0.1142578125, 0.154296875, 0.4228515625, 0.69140625, 0.9599609375, 1.228515625, 1.4970703125, 1.765625, 2.0341796875, 2.302734375, 2.5712890625, 2.83984375, 3.1083984375, 3.376953125, 3.6455078125, 3.9140625, 4.1826171875, 4.451171875, 4.7197265625, 4.98828125, 5.2568359375, 5.525390625, 5.7939453125, 6.0625, 6.3310546875, 6.599609375, 6.8681640625, 7.13671875, 7.4052734375, 7.673828125, 7.9423828125, 8.2109375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 9.0, 3.0, 8.0, 14.0, 24.0, 30.0, 74.0, 90.0, 124.0, 241.0, 349.0, 514.0, 798.0, 1243.0, 1909.0, 2839.0, 4418.0, 6756.0, 10586.0, 16759.0, 27230.0, 45164.0, 77238.0, 146826.0, 338812.0, 159409.0, 82028.0, 47325.0, 28674.0, 17932.0, 10970.0, 7002.0, 4552.0, 2972.0, 1950.0, 1285.0, 905.0, 573.0, 309.0, 218.0, 145.0, 103.0, 55.0, 33.0, 17.0, 24.0, 9.0, 10.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6823272705078125, -1.625396728515625, -1.5684661865234375, -1.51153564453125, -1.4546051025390625, -1.397674560546875, -1.3407440185546875, -1.2838134765625, -1.2268829345703125, -1.169952392578125, -1.1130218505859375, -1.05609130859375, -0.9991607666015625, -0.942230224609375, -0.8852996826171875, -0.828369140625, -0.7714385986328125, -0.714508056640625, -0.6575775146484375, -0.60064697265625, -0.5437164306640625, -0.486785888671875, -0.4298553466796875, -0.3729248046875, -0.3159942626953125, -0.259063720703125, -0.2021331787109375, -0.14520263671875, -0.0882720947265625, -0.031341552734375, 0.0255889892578125, 0.08251953125, 0.1394500732421875, 0.196380615234375, 0.2533111572265625, 0.31024169921875, 0.3671722412109375, 0.424102783203125, 0.4810333251953125, 0.5379638671875, 0.5948944091796875, 0.651824951171875, 0.7087554931640625, 0.76568603515625, 0.8226165771484375, 0.879547119140625, 0.9364776611328125, 0.993408203125, 1.0503387451171875, 1.107269287109375, 1.1641998291015625, 1.22113037109375, 1.2780609130859375, 1.334991455078125, 1.3919219970703125, 1.4488525390625, 1.5057830810546875, 1.562713623046875, 1.6196441650390625, 1.67657470703125, 1.7335052490234375, 1.790435791015625, 1.8473663330078125, 1.904296875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 12.0, 16.0, 13.0, 22.0, 21.0, 23.0, 27.0, 23.0, 30.0, 34.0, 42.0, 29.0, 39.0, 29.0, 36.0, 24.0, 1062.0, 42.0, 49.0, 38.0, 35.0, 36.0, 35.0, 25.0, 33.0, 27.0, 25.0, 26.0, 18.0, 23.0, 11.0, 17.0, 6.0, 9.0, 7.0, 13.0, 5.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.51220703125, -4.3564453125, -4.20068359375, -4.044921875, -3.88916015625, -3.7333984375, -3.57763671875, -3.421875, -3.26611328125, -3.1103515625, -2.95458984375, -2.798828125, -2.64306640625, -2.4873046875, -2.33154296875, -2.17578125, -2.02001953125, -1.8642578125, -1.70849609375, -1.552734375, -1.39697265625, -1.2412109375, -1.08544921875, -0.9296875, -0.77392578125, -0.6181640625, -0.46240234375, -0.306640625, -0.15087890625, 0.0048828125, 0.16064453125, 0.31640625, 0.47216796875, 0.6279296875, 0.78369140625, 0.939453125, 1.09521484375, 1.2509765625, 1.40673828125, 1.5625, 1.71826171875, 1.8740234375, 2.02978515625, 2.185546875, 2.34130859375, 2.4970703125, 2.65283203125, 2.80859375, 2.96435546875, 3.1201171875, 3.27587890625, 3.431640625, 3.58740234375, 3.7431640625, 3.89892578125, 4.0546875, 4.21044921875, 4.3662109375, 4.52197265625, 4.677734375, 4.83349609375, 4.9892578125, 5.14501953125, 5.30078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 6.0, 5.0, 11.0, 21.0, 32.0, 46.0, 76.0, 136.0, 228.0, 297.0, 499.0, 745.0, 1151.0, 1770.0, 2493.0, 3803.0, 5981.0, 9328.0, 14324.0, 22959.0, 36767.0, 61816.0, 111800.0, 1342328.0, 231321.0, 99096.0, 56520.0, 34164.0, 21188.0, 13484.0, 8465.0, 5584.0, 3671.0, 2430.0, 1548.0, 1034.0, 714.0, 472.0, 325.0, 173.0, 118.0, 77.0, 44.0, 29.0, 18.0, 14.0, 8.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.630859375, -1.5763397216796875, -1.521820068359375, -1.4673004150390625, -1.41278076171875, -1.3582611083984375, -1.303741455078125, -1.2492218017578125, -1.1947021484375, -1.1401824951171875, -1.085662841796875, -1.0311431884765625, -0.97662353515625, -0.9221038818359375, -0.867584228515625, -0.8130645751953125, -0.758544921875, -0.7040252685546875, -0.649505615234375, -0.5949859619140625, -0.54046630859375, -0.4859466552734375, -0.431427001953125, -0.3769073486328125, -0.3223876953125, -0.2678680419921875, -0.213348388671875, -0.1588287353515625, -0.10430908203125, -0.0497894287109375, 0.004730224609375, 0.0592498779296875, 0.11376953125, 0.1682891845703125, 0.222808837890625, 0.2773284912109375, 0.33184814453125, 0.3863677978515625, 0.440887451171875, 0.4954071044921875, 0.5499267578125, 0.6044464111328125, 0.658966064453125, 0.7134857177734375, 0.76800537109375, 0.8225250244140625, 0.877044677734375, 0.9315643310546875, 0.986083984375, 1.0406036376953125, 1.095123291015625, 1.1496429443359375, 1.20416259765625, 1.2586822509765625, 1.313201904296875, 1.3677215576171875, 1.4222412109375, 1.4767608642578125, 1.531280517578125, 1.5858001708984375, 1.64031982421875, 1.6948394775390625, 1.749359130859375, 1.8038787841796875, 1.8583984375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 7.0, 11.0, 15.0, 24.0, 13.0, 17.0, 20.0, 36.0, 47.0, 61.0, 60.0, 86.0, 79.0, 84.0, 67.0, 56.0, 57.0, 34.0, 28.0, 20.0, 34.0, 17.0, 16.0, 18.0, 14.0, 9.0, 6.0, 6.0, 4.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0008897781372070312, -0.0008617416024208069, -0.0008337050676345825, -0.0008056685328483582, -0.0007776319980621338, -0.0007495954632759094, -0.0007215589284896851, -0.0006935223937034607, -0.0006654858589172363, -0.000637449324131012, -0.0006094127893447876, -0.0005813762545585632, -0.0005533397197723389, -0.0005253031849861145, -0.0004972666501998901, -0.00046923011541366577, -0.0004411935806274414, -0.00041315704584121704, -0.0003851205110549927, -0.0003570839762687683, -0.00032904744148254395, -0.0003010109066963196, -0.0002729743719100952, -0.00024493783712387085, -0.00021690130233764648, -0.00018886476755142212, -0.00016082823276519775, -0.0001327916979789734, -0.00010475516319274902, -7.671862840652466e-05, -4.868209362030029e-05, -2.0645558834075928e-05, 7.3909759521484375e-06, 3.54275107383728e-05, 6.346404552459717e-05, 9.150058031082153e-05, 0.0001195371150970459, 0.00014757364988327026, 0.00017561018466949463, 0.000203646719455719, 0.00023168325424194336, 0.0002597197890281677, 0.0002877563238143921, 0.00031579285860061646, 0.0003438293933868408, 0.0003718659281730652, 0.00039990246295928955, 0.0004279389977455139, 0.0004559755325317383, 0.00048401206731796265, 0.000512048602104187, 0.0005400851368904114, 0.0005681216716766357, 0.0005961582064628601, 0.0006241947412490845, 0.0006522312760353088, 0.0006802678108215332, 0.0007083043456077576, 0.0007363408803939819, 0.0007643774151802063, 0.0007924139499664307, 0.000820450484752655, 0.0008484870195388794, 0.0008765235543251038, 0.0009045600891113281]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 7.0, 13.0, 25.0, 18.0, 17.0, 23.0, 41.0, 57.0, 68.0, 90.0, 112.0, 195.0, 299.0, 456.0, 1014.0, 43239.0, 999408.0, 1704.0, 641.0, 314.0, 237.0, 153.0, 95.0, 78.0, 57.0, 41.0, 23.0, 25.0, 13.0, 13.0, 15.0, 8.0, 7.0, 12.0, 5.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017578125, -0.01701498031616211, -0.01645183563232422, -0.015888690948486328, -0.015325546264648438, -0.014762401580810547, -0.014199256896972656, -0.013636112213134766, -0.013072967529296875, -0.012509822845458984, -0.011946678161621094, -0.011383533477783203, -0.010820388793945312, -0.010257244110107422, -0.009694099426269531, -0.00913095474243164, -0.00856781005859375, -0.00800466537475586, -0.007441520690917969, -0.006878376007080078, -0.0063152313232421875, -0.005752086639404297, -0.005188941955566406, -0.004625797271728516, -0.004062652587890625, -0.0034995079040527344, -0.0029363632202148438, -0.002373218536376953, -0.0018100738525390625, -0.0012469291687011719, -0.0006837844848632812, -0.00012063980102539062, 0.0004425048828125, 0.0010056495666503906, 0.0015687942504882812, 0.002131938934326172, 0.0026950836181640625, 0.003258228302001953, 0.0038213729858398438, 0.004384517669677734, 0.004947662353515625, 0.005510807037353516, 0.006073951721191406, 0.006637096405029297, 0.0072002410888671875, 0.007763385772705078, 0.008326530456542969, 0.00888967514038086, 0.00945281982421875, 0.01001596450805664, 0.010579109191894531, 0.011142253875732422, 0.011705398559570312, 0.012268543243408203, 0.012831687927246094, 0.013394832611083984, 0.013957977294921875, 0.014521121978759766, 0.015084266662597656, 0.015647411346435547, 0.016210556030273438, 0.016773700714111328, 0.01733684539794922, 0.01789999008178711, 0.018463134765625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 38.0, 508.0, 437.0, 25.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002544370014220476, -0.002467023441568017, -0.002389676868915558, -0.002312330063432455, -0.002234983490779996, -0.0021576369181275368, -0.0020802903454750776, -0.0020029437728226185, -0.0019255972001701593, -0.0018482506275177002, -0.0017709039384499192, -0.00169355736579746, -0.001616210793145001, -0.00153886410407722, -0.0014615175314247608, -0.0013841709587723017, -0.0013068242697045207, -0.0012294776970520616, -0.0011521310079842806, -0.0010747844353318214, -0.0009974378626793623, -0.0009200912318192422, -0.0008427446009591222, -0.000765398028306663, -0.000688051397446543, -0.0006107047665864229, -0.0005333581939339638, -0.0004560115630738437, -0.0003786649613175541, -0.0003013183595612645, -0.00022397172870114446, -0.0001466251560486853, -6.927852518856525e-05, 8.068083843681961e-06, 8.541469287592918e-05, 0.000162761309184134, 0.0002401079109404236, 0.0003174545126967132, 0.00039480114355683327, 0.0004721477162092924, 0.0005494943470694125, 0.0006268409779295325, 0.0007041875505819917, 0.0007815341814421117, 0.0008588808123022318, 0.0009362273849546909, 0.00101357395760715, 0.0010909205302596092, 0.0011682672193273902, 0.0012456137919798493, 0.0013229604810476303, 0.0014003070537000895, 0.0014776536263525486, 0.0015550001990050077, 0.0016323468880727887, 0.0017096934607252479, 0.0017870401497930288, 0.001864386722445488, 0.001941733411513269, 0.0020190798677504063, 0.002096426673233509, 0.002173773245885968, 0.0022511198185384274, 0.0023284663911908865, 0.0024058129638433456]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 5.0, 9.0, 8.0, 21.0, 14.0, 14.0, 14.0, 24.0, 19.0, 30.0, 35.0, 27.0, 24.0, 24.0, 40.0, 44.0, 41.0, 41.0, 43.0, 44.0, 39.0, 49.0, 53.0, 36.0, 35.0, 46.0, 36.0, 28.0, 23.0, 19.0, 20.0, 23.0, 12.0, 8.0, 9.0, 7.0, 7.0, 13.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041800737380981445, -0.00040341727435588837, -0.0003888271749019623, -0.0003742370754480362, -0.0003596469759941101, -0.000345056876540184, -0.00033046677708625793, -0.00031587667763233185, -0.00030128657817840576, -0.0002866964787244797, -0.0002721063792705536, -0.0002575162798166275, -0.00024292618036270142, -0.00022833608090877533, -0.00021374598145484924, -0.00019915588200092316, -0.00018456578254699707, -0.00016997568309307098, -0.0001553855836391449, -0.0001407954841852188, -0.00012620538473129272, -0.00011161528527736664, -9.702518582344055e-05, -8.243508636951447e-05, -6.784498691558838e-05, -5.325488746166229e-05, -3.8664788007736206e-05, -2.407468855381012e-05, -9.484589099884033e-06, 5.105510354042053e-06, 1.969560980796814e-05, 3.4285709261894226e-05, 4.887580871582031e-05, 6.34659081697464e-05, 7.805600762367249e-05, 9.264610707759857e-05, 0.00010723620653152466, 0.00012182630598545074, 0.00013641640543937683, 0.00015100650489330292, 0.000165596604347229, 0.0001801867038011551, 0.00019477680325508118, 0.00020936690270900726, 0.00022395700216293335, 0.00023854710161685944, 0.0002531372010707855, 0.0002677273005247116, 0.0002823173999786377, 0.0002969074994325638, 0.00031149759888648987, 0.00032608769834041595, 0.00034067779779434204, 0.00035526789724826813, 0.0003698579967021942, 0.0003844480961561203, 0.0003990381956100464, 0.0004136282950639725, 0.00042821839451789856, 0.00044280849397182465, 0.00045739859342575073, 0.0004719886928796768, 0.0004865787923336029, 0.000501168891787529, 0.0005157589912414551]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 6.0, 7.0, 13.0, 8.0, 14.0, 16.0, 23.0, 29.0, 30.0, 24.0, 26.0, 36.0, 36.0, 42.0, 29.0, 40.0, 43.0, 33.0, 41.0, 43.0, 47.0, 39.0, 42.0, 25.0, 32.0, 44.0, 34.0, 31.0, 27.0, 19.0, 22.0, 14.0, 8.0, 11.0, 9.0, 13.0, 15.0, 3.0, 5.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.7080078125, -8.439453125, -8.1708984375, -7.90234375, -7.6337890625, -7.365234375, -7.0966796875, -6.828125, -6.5595703125, -6.291015625, -6.0224609375, -5.75390625, -5.4853515625, -5.216796875, -4.9482421875, -4.6796875, -4.4111328125, -4.142578125, -3.8740234375, -3.60546875, -3.3369140625, -3.068359375, -2.7998046875, -2.53125, -2.2626953125, -1.994140625, -1.7255859375, -1.45703125, -1.1884765625, -0.919921875, -0.6513671875, -0.3828125, -0.1142578125, 0.154296875, 0.4228515625, 0.69140625, 0.9599609375, 1.228515625, 1.4970703125, 1.765625, 2.0341796875, 2.302734375, 2.5712890625, 2.83984375, 3.1083984375, 3.376953125, 3.6455078125, 3.9140625, 4.1826171875, 4.451171875, 4.7197265625, 4.98828125, 5.2568359375, 5.525390625, 5.7939453125, 6.0625, 6.3310546875, 6.599609375, 6.8681640625, 7.13671875, 7.4052734375, 7.673828125, 7.9423828125, 8.2109375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 8.0, 10.0, 17.0, 21.0, 18.0, 31.0, 42.0, 60.0, 88.0, 119.0, 156.0, 233.0, 347.0, 478.0, 766.0, 1368.0, 2466.0, 5403.0, 14252.0, 47087.0, 224529.0, 581956.0, 120497.0, 29747.0, 9616.0, 4083.0, 1934.0, 1091.0, 663.0, 439.0, 299.0, 196.0, 156.0, 107.0, 75.0, 47.0, 36.0, 27.0, 23.0, 16.0, 14.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-16.546875, -16.078369140625, -15.60986328125, -15.141357421875, -14.6728515625, -14.204345703125, -13.73583984375, -13.267333984375, -12.798828125, -12.330322265625, -11.86181640625, -11.393310546875, -10.9248046875, -10.456298828125, -9.98779296875, -9.519287109375, -9.05078125, -8.582275390625, -8.11376953125, -7.645263671875, -7.1767578125, -6.708251953125, -6.23974609375, -5.771240234375, -5.302734375, -4.834228515625, -4.36572265625, -3.897216796875, -3.4287109375, -2.960205078125, -2.49169921875, -2.023193359375, -1.5546875, -1.086181640625, -0.61767578125, -0.149169921875, 0.3193359375, 0.787841796875, 1.25634765625, 1.724853515625, 2.193359375, 2.661865234375, 3.13037109375, 3.598876953125, 4.0673828125, 4.535888671875, 5.00439453125, 5.472900390625, 5.94140625, 6.409912109375, 6.87841796875, 7.346923828125, 7.8154296875, 8.283935546875, 8.75244140625, 9.220947265625, 9.689453125, 10.157958984375, 10.62646484375, 11.094970703125, 11.5634765625, 12.031982421875, 12.50048828125, 12.968994140625, 13.4375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 7.0, 9.0, 14.0, 15.0, 19.0, 26.0, 21.0, 32.0, 35.0, 48.0, 49.0, 57.0, 94.0, 419.0, 1660.0, 112.0, 86.0, 59.0, 51.0, 49.0, 32.0, 31.0, 26.0, 15.0, 15.0, 7.0, 14.0, 9.0, 4.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.3125, -23.416015625, -22.51953125, -21.623046875, -20.7265625, -19.830078125, -18.93359375, -18.037109375, -17.140625, -16.244140625, -15.34765625, -14.451171875, -13.5546875, -12.658203125, -11.76171875, -10.865234375, -9.96875, -9.072265625, -8.17578125, -7.279296875, -6.3828125, -5.486328125, -4.58984375, -3.693359375, -2.796875, -1.900390625, -1.00390625, -0.107421875, 0.7890625, 1.685546875, 2.58203125, 3.478515625, 4.375, 5.271484375, 6.16796875, 7.064453125, 7.9609375, 8.857421875, 9.75390625, 10.650390625, 11.546875, 12.443359375, 13.33984375, 14.236328125, 15.1328125, 16.029296875, 16.92578125, 17.822265625, 18.71875, 19.615234375, 20.51171875, 21.408203125, 22.3046875, 23.201171875, 24.09765625, 24.994140625, 25.890625, 26.787109375, 27.68359375, 28.580078125, 29.4765625, 30.373046875, 31.26953125, 32.166015625, 33.0625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 4.0, 6.0, 11.0, 9.0, 12.0, 13.0, 20.0, 33.0, 52.0, 69.0, 116.0, 181.0, 340.0, 848.0, 5489.0, 3132434.0, 4488.0, 716.0, 355.0, 191.0, 89.0, 60.0, 31.0, 26.0, 30.0, 16.0, 15.0, 13.0, 12.0, 4.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-91.625, -89.11328125, -86.6015625, -84.08984375, -81.578125, -79.06640625, -76.5546875, -74.04296875, -71.53125, -69.01953125, -66.5078125, -63.99609375, -61.484375, -58.97265625, -56.4609375, -53.94921875, -51.4375, -48.92578125, -46.4140625, -43.90234375, -41.390625, -38.87890625, -36.3671875, -33.85546875, -31.34375, -28.83203125, -26.3203125, -23.80859375, -21.296875, -18.78515625, -16.2734375, -13.76171875, -11.25, -8.73828125, -6.2265625, -3.71484375, -1.203125, 1.30859375, 3.8203125, 6.33203125, 8.84375, 11.35546875, 13.8671875, 16.37890625, 18.890625, 21.40234375, 23.9140625, 26.42578125, 28.9375, 31.44921875, 33.9609375, 36.47265625, 38.984375, 41.49609375, 44.0078125, 46.51953125, 49.03125, 51.54296875, 54.0546875, 56.56640625, 59.078125, 61.58984375, 64.1015625, 66.61328125, 69.125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 59.0, 740.0, 200.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-277.339111328125, -272.443359375, -267.5476379394531, -262.6518859863281, -257.75616455078125, -252.8604278564453, -247.96469116210938, -243.06893920898438, -238.1732177734375, -233.27748107910156, -228.38174438476562, -223.4860076904297, -218.59027099609375, -213.6945343017578, -208.79879760742188, -203.90304565429688, -199.00730895996094, -194.111572265625, -189.21583557128906, -184.32009887695312, -179.4243621826172, -174.52862548828125, -169.6328887939453, -164.73715209960938, -159.84140014648438, -154.94566345214844, -150.0499267578125, -145.15419006347656, -140.25845336914062, -135.3627166748047, -130.46697998046875, -125.57123565673828, -120.67550659179688, -115.77976989746094, -110.884033203125, -105.98829650878906, -101.09255981445312, -96.19682312011719, -91.30107879638672, -86.40534210205078, -81.50961303710938, -76.61387634277344, -71.7181396484375, -66.82240295410156, -61.92666244506836, -57.03092575073242, -52.13518524169922, -47.23944854736328, -42.34370803833008, -37.44797134399414, -32.55223083496094, -27.656494140625, -22.760757446289062, -17.865020751953125, -12.969282150268555, -8.073543548583984, -3.177806854248047, 1.717930793762207, 6.613668441772461, 11.509406089782715, 16.40514373779297, 21.300880432128906, 26.196619033813477, 31.092357635498047, 35.988094329833984]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 7.0, 4.0, 4.0, 6.0, 7.0, 14.0, 16.0, 14.0, 9.0, 26.0, 17.0, 25.0, 30.0, 27.0, 34.0, 37.0, 36.0, 37.0, 44.0, 34.0, 40.0, 43.0, 50.0, 44.0, 41.0, 46.0, 34.0, 34.0, 25.0, 25.0, 26.0, 27.0, 18.0, 19.0, 10.0, 11.0, 20.0, 20.0, 7.0, 7.0, 8.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-53.08030700683594, -51.53553009033203, -49.990753173828125, -48.44597244262695, -46.90119552612305, -45.35641860961914, -43.81163787841797, -42.26686096191406, -40.722084045410156, -39.17730712890625, -37.632530212402344, -36.08774948120117, -34.542972564697266, -32.99819564819336, -31.45341682434082, -29.90863800048828, -28.363861083984375, -26.81908416748047, -25.27430534362793, -23.72952651977539, -22.184749603271484, -20.639972686767578, -19.09519386291504, -17.5504150390625, -16.005638122558594, -14.460860252380371, -12.916082382202148, -11.371304512023926, -9.826526641845703, -8.28174877166748, -6.736970901489258, -5.192193031311035, -3.6474151611328125, -2.10263729095459, -0.5578594207763672, 0.9869184494018555, 2.531696319580078, 4.076474189758301, 5.621252059936523, 7.166029930114746, 8.710807800292969, 10.255585670471191, 11.800363540649414, 13.345141410827637, 14.88991928100586, 16.434696197509766, 17.979475021362305, 19.524253845214844, 21.06903076171875, 22.613807678222656, 24.158586502075195, 25.703365325927734, 27.24814224243164, 28.792919158935547, 30.337697982788086, 31.882476806640625, 33.42725372314453, 34.97203063964844, 36.516807556152344, 38.061588287353516, 39.60636520385742, 41.15114212036133, 42.6959228515625, 44.240699768066406, 45.78547668457031]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 7.0, 12.0, 17.0, 13.0, 14.0, 12.0, 13.0, 23.0, 29.0, 27.0, 36.0, 42.0, 39.0, 36.0, 47.0, 43.0, 34.0, 33.0, 33.0, 38.0, 45.0, 40.0, 38.0, 50.0, 33.0, 30.0, 28.0, 19.0, 19.0, 25.0, 20.0, 15.0, 13.0, 11.0, 9.0, 11.0, 3.0, 5.0, 5.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9765625, -9.6536865234375, -9.330810546875, -9.0079345703125, -8.68505859375, -8.3621826171875, -8.039306640625, -7.7164306640625, -7.3935546875, -7.0706787109375, -6.747802734375, -6.4249267578125, -6.10205078125, -5.7791748046875, -5.456298828125, -5.1334228515625, -4.810546875, -4.4876708984375, -4.164794921875, -3.8419189453125, -3.51904296875, -3.1961669921875, -2.873291015625, -2.5504150390625, -2.2275390625, -1.9046630859375, -1.581787109375, -1.2589111328125, -0.93603515625, -0.6131591796875, -0.290283203125, 0.0325927734375, 0.35546875, 0.6783447265625, 1.001220703125, 1.3240966796875, 1.64697265625, 1.9698486328125, 2.292724609375, 2.6156005859375, 2.9384765625, 3.2613525390625, 3.584228515625, 3.9071044921875, 4.22998046875, 4.5528564453125, 4.875732421875, 5.1986083984375, 5.521484375, 5.8443603515625, 6.167236328125, 6.4901123046875, 6.81298828125, 7.1358642578125, 7.458740234375, 7.7816162109375, 8.1044921875, 8.4273681640625, 8.750244140625, 9.0731201171875, 9.39599609375, 9.7188720703125, 10.041748046875, 10.3646240234375, 10.6875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 6.0, 10.0, 11.0, 13.0, 26.0, 30.0, 43.0, 45.0, 60.0, 65.0, 84.0, 111.0, 127.0, 186.0, 286.0, 345.0, 571.0, 960.0, 2661.0, 21955.0, 3082172.0, 1070613.0, 9388.0, 1842.0, 778.0, 503.0, 345.0, 222.0, 170.0, 145.0, 112.0, 87.0, 70.0, 55.0, 40.0, 27.0, 27.0, 18.0, 20.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.09375, -58.14599609375, -56.1982421875, -54.25048828125, -52.302734375, -50.35498046875, -48.4072265625, -46.45947265625, -44.51171875, -42.56396484375, -40.6162109375, -38.66845703125, -36.720703125, -34.77294921875, -32.8251953125, -30.87744140625, -28.9296875, -26.98193359375, -25.0341796875, -23.08642578125, -21.138671875, -19.19091796875, -17.2431640625, -15.29541015625, -13.34765625, -11.39990234375, -9.4521484375, -7.50439453125, -5.556640625, -3.60888671875, -1.6611328125, 0.28662109375, 2.234375, 4.18212890625, 6.1298828125, 8.07763671875, 10.025390625, 11.97314453125, 13.9208984375, 15.86865234375, 17.81640625, 19.76416015625, 21.7119140625, 23.65966796875, 25.607421875, 27.55517578125, 29.5029296875, 31.45068359375, 33.3984375, 35.34619140625, 37.2939453125, 39.24169921875, 41.189453125, 43.13720703125, 45.0849609375, 47.03271484375, 48.98046875, 50.92822265625, 52.8759765625, 54.82373046875, 56.771484375, 58.71923828125, 60.6669921875, 62.61474609375, 64.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 26.0, 54.0, 132.0, 438.0, 1195.0, 1372.0, 546.0, 187.0, 62.0, 29.0, 10.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.28125, -46.77783203125, -45.2744140625, -43.77099609375, -42.267578125, -40.76416015625, -39.2607421875, -37.75732421875, -36.25390625, -34.75048828125, -33.2470703125, -31.74365234375, -30.240234375, -28.73681640625, -27.2333984375, -25.72998046875, -24.2265625, -22.72314453125, -21.2197265625, -19.71630859375, -18.212890625, -16.70947265625, -15.2060546875, -13.70263671875, -12.19921875, -10.69580078125, -9.1923828125, -7.68896484375, -6.185546875, -4.68212890625, -3.1787109375, -1.67529296875, -0.171875, 1.33154296875, 2.8349609375, 4.33837890625, 5.841796875, 7.34521484375, 8.8486328125, 10.35205078125, 11.85546875, 13.35888671875, 14.8623046875, 16.36572265625, 17.869140625, 19.37255859375, 20.8759765625, 22.37939453125, 23.8828125, 25.38623046875, 26.8896484375, 28.39306640625, 29.896484375, 31.39990234375, 32.9033203125, 34.40673828125, 35.91015625, 37.41357421875, 38.9169921875, 40.42041015625, 41.923828125, 43.42724609375, 44.9306640625, 46.43408203125, 47.9375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 22.0, 34.0, 68.0, 166.0, 367.0, 1163.0, 6938.0, 709009.0, 3459077.0, 14886.0, 1631.0, 496.0, 188.0, 102.0, 38.0, 25.0, 16.0, 11.0, 7.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.625, -60.84228515625, -59.0595703125, -57.27685546875, -55.494140625, -53.71142578125, -51.9287109375, -50.14599609375, -48.36328125, -46.58056640625, -44.7978515625, -43.01513671875, -41.232421875, -39.44970703125, -37.6669921875, -35.88427734375, -34.1015625, -32.31884765625, -30.5361328125, -28.75341796875, -26.970703125, -25.18798828125, -23.4052734375, -21.62255859375, -19.83984375, -18.05712890625, -16.2744140625, -14.49169921875, -12.708984375, -10.92626953125, -9.1435546875, -7.36083984375, -5.578125, -3.79541015625, -2.0126953125, -0.22998046875, 1.552734375, 3.33544921875, 5.1181640625, 6.90087890625, 8.68359375, 10.46630859375, 12.2490234375, 14.03173828125, 15.814453125, 17.59716796875, 19.3798828125, 21.16259765625, 22.9453125, 24.72802734375, 26.5107421875, 28.29345703125, 30.076171875, 31.85888671875, 33.6416015625, 35.42431640625, 37.20703125, 38.98974609375, 40.7724609375, 42.55517578125, 44.337890625, 46.12060546875, 47.9033203125, 49.68603515625, 51.46875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 23.0, 62.0, 110.0, 198.0, 235.0, 198.0, 104.0, 40.0, 15.0, 10.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-438.64544677734375, -430.4537048339844, -422.2619934082031, -414.07025146484375, -405.8785400390625, -397.6867980957031, -389.49505615234375, -381.3033447265625, -373.1116027832031, -364.91986083984375, -356.7281494140625, -348.5364074707031, -340.3446960449219, -332.1529541015625, -323.96124267578125, -315.7695007324219, -307.5777587890625, -299.3860168457031, -291.1943054199219, -283.0025634765625, -274.81085205078125, -266.6191101074219, -258.4273681640625, -250.23565673828125, -242.0439453125, -233.8522186279297, -225.66049194335938, -217.46875, -209.2770233154297, -201.08529663085938, -192.89356994628906, -184.70184326171875, -176.5101318359375, -168.3184051513672, -160.12667846679688, -151.9349365234375, -143.7432098388672, -135.55148315429688, -127.35975646972656, -119.16802978515625, -110.97628784179688, -102.78456115722656, -94.59282684326172, -86.4011001586914, -78.20936584472656, -70.01763916015625, -61.82591247558594, -53.63418197631836, -45.44245147705078, -37.2507209777832, -29.058992385864258, -20.867263793945312, -12.675533294677734, -4.483802795410156, 3.7079238891601562, 11.899654388427734, 20.091384887695312, 28.28311538696289, 36.47484588623047, 44.66657257080078, 52.85830307006836, 61.05003356933594, 69.24176025390625, 77.43348693847656, 85.6252212524414]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 8.0, 6.0, 10.0, 13.0, 13.0, 15.0, 18.0, 23.0, 28.0, 27.0, 40.0, 40.0, 48.0, 53.0, 55.0, 53.0, 49.0, 36.0, 41.0, 45.0, 49.0, 45.0, 37.0, 31.0, 37.0, 33.0, 28.0, 23.0, 18.0, 17.0, 15.0, 9.0, 6.0, 11.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.0462646484375, -78.68144989013672, -76.31664276123047, -73.95182800292969, -71.58702087402344, -69.22220611572266, -66.8573989868164, -64.49258422851562, -62.127777099609375, -59.76296615600586, -57.398155212402344, -55.03334426879883, -52.66853332519531, -50.3037223815918, -47.93891143798828, -45.5740966796875, -43.209285736083984, -40.84447479248047, -38.47966384887695, -36.11485290527344, -33.75004196166992, -31.385231018066406, -29.020418167114258, -26.655607223510742, -24.290796279907227, -21.92598533630371, -19.561174392700195, -17.196361541748047, -14.831551551818848, -12.466740608215332, -10.1019287109375, -7.737117767333984, -5.372306823730469, -3.007495641708374, -0.6426844596862793, 1.7221269607543945, 4.08693790435791, 6.451748847961426, 8.816560745239258, 11.181371688842773, 13.546182632446289, 15.910993576049805, 18.27580451965332, 20.64061737060547, 23.005428314208984, 25.3702392578125, 27.735050201416016, 30.09986114501953, 32.46467208862305, 34.82948303222656, 37.19429397583008, 39.559104919433594, 41.92391586303711, 44.288726806640625, 46.653541564941406, 49.018348693847656, 51.38316345214844, 53.74797439575195, 56.11278533935547, 58.477596282958984, 60.8424072265625, 63.207218170166016, 65.57202911376953, 67.93684387207031, 70.30165100097656]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 5.0, 9.0, 6.0, 7.0, 13.0, 9.0, 11.0, 22.0, 19.0, 29.0, 34.0, 27.0, 27.0, 38.0, 49.0, 45.0, 51.0, 34.0, 41.0, 41.0, 38.0, 41.0, 39.0, 33.0, 41.0, 31.0, 25.0, 42.0, 30.0, 17.0, 22.0, 23.0, 17.0, 14.0, 14.0, 11.0, 8.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-96.0, -92.955078125, -89.91015625, -86.865234375, -83.8203125, -80.775390625, -77.73046875, -74.685546875, -71.640625, -68.595703125, -65.55078125, -62.505859375, -59.4609375, -56.416015625, -53.37109375, -50.326171875, -47.28125, -44.236328125, -41.19140625, -38.146484375, -35.1015625, -32.056640625, -29.01171875, -25.966796875, -22.921875, -19.876953125, -16.83203125, -13.787109375, -10.7421875, -7.697265625, -4.65234375, -1.607421875, 1.4375, 4.482421875, 7.52734375, 10.572265625, 13.6171875, 16.662109375, 19.70703125, 22.751953125, 25.796875, 28.841796875, 31.88671875, 34.931640625, 37.9765625, 41.021484375, 44.06640625, 47.111328125, 50.15625, 53.201171875, 56.24609375, 59.291015625, 62.3359375, 65.380859375, 68.42578125, 71.470703125, 74.515625, 77.560546875, 80.60546875, 83.650390625, 86.6953125, 89.740234375, 92.78515625, 95.830078125, 98.875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 6.0, 15.0, 15.0, 32.0, 38.0, 43.0, 65.0, 85.0, 124.0, 184.0, 219.0, 299.0, 423.0, 556.0, 751.0, 1073.0, 1428.0, 2090.0, 2833.0, 3997.0, 5549.0, 7999.0, 11469.0, 16835.0, 25055.0, 37844.0, 58334.0, 93646.0, 174261.0, 272603.0, 118062.0, 70995.0, 45368.0, 29947.0, 19962.0, 13729.0, 9595.0, 6605.0, 4557.0, 3323.0, 2260.0, 1736.0, 1187.0, 905.0, 697.0, 441.0, 378.0, 273.0, 185.0, 125.0, 102.0, 86.0, 56.0, 37.0, 26.0, 23.0, 13.0, 11.0, 5.0, 4.0, 3.0], "bins": [-16.109375, -15.609375, -15.109375, -14.609375, -14.109375, -13.609375, -13.109375, -12.609375, -12.109375, -11.609375, -11.109375, -10.609375, -10.109375, -9.609375, -9.109375, -8.609375, -8.109375, -7.609375, -7.109375, -6.609375, -6.109375, -5.609375, -5.109375, -4.609375, -4.109375, -3.609375, -3.109375, -2.609375, -2.109375, -1.609375, -1.109375, -0.609375, -0.109375, 0.390625, 0.890625, 1.390625, 1.890625, 2.390625, 2.890625, 3.390625, 3.890625, 4.390625, 4.890625, 5.390625, 5.890625, 6.390625, 6.890625, 7.390625, 7.890625, 8.390625, 8.890625, 9.390625, 9.890625, 10.390625, 10.890625, 11.390625, 11.890625, 12.390625, 12.890625, 13.390625, 13.890625, 14.390625, 14.890625, 15.390625, 15.890625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 0.0, 6.0, 7.0, 7.0, 5.0, 9.0, 17.0, 16.0, 18.0, 16.0, 28.0, 17.0, 19.0, 36.0, 37.0, 36.0, 46.0, 49.0, 38.0, 38.0, 49.0, 1062.0, 48.0, 34.0, 41.0, 35.0, 39.0, 36.0, 27.0, 24.0, 33.0, 27.0, 22.0, 13.0, 14.0, 16.0, 12.0, 14.0, 6.0, 7.0, 8.0, 7.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.625, -68.57958984375, -66.5341796875, -64.48876953125, -62.443359375, -60.39794921875, -58.3525390625, -56.30712890625, -54.26171875, -52.21630859375, -50.1708984375, -48.12548828125, -46.080078125, -44.03466796875, -41.9892578125, -39.94384765625, -37.8984375, -35.85302734375, -33.8076171875, -31.76220703125, -29.716796875, -27.67138671875, -25.6259765625, -23.58056640625, -21.53515625, -19.48974609375, -17.4443359375, -15.39892578125, -13.353515625, -11.30810546875, -9.2626953125, -7.21728515625, -5.171875, -3.12646484375, -1.0810546875, 0.96435546875, 3.009765625, 5.05517578125, 7.1005859375, 9.14599609375, 11.19140625, 13.23681640625, 15.2822265625, 17.32763671875, 19.373046875, 21.41845703125, 23.4638671875, 25.50927734375, 27.5546875, 29.60009765625, 31.6455078125, 33.69091796875, 35.736328125, 37.78173828125, 39.8271484375, 41.87255859375, 43.91796875, 45.96337890625, 48.0087890625, 50.05419921875, 52.099609375, 54.14501953125, 56.1904296875, 58.23583984375, 60.28125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 11.0, 9.0, 8.0, 16.0, 24.0, 37.0, 55.0, 85.0, 144.0, 232.0, 339.0, 520.0, 885.0, 1379.0, 2274.0, 3538.0, 5660.0, 9165.0, 14858.0, 24489.0, 41857.0, 75079.0, 153367.0, 1424084.0, 155684.0, 76616.0, 42107.0, 25031.0, 14739.0, 9212.0, 5875.0, 3620.0, 2259.0, 1431.0, 916.0, 560.0, 356.0, 226.0, 121.0, 82.0, 66.0, 40.0, 31.0, 25.0, 9.0, 4.0, 2.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-24.703125, -23.9873046875, -23.271484375, -22.5556640625, -21.83984375, -21.1240234375, -20.408203125, -19.6923828125, -18.9765625, -18.2607421875, -17.544921875, -16.8291015625, -16.11328125, -15.3974609375, -14.681640625, -13.9658203125, -13.25, -12.5341796875, -11.818359375, -11.1025390625, -10.38671875, -9.6708984375, -8.955078125, -8.2392578125, -7.5234375, -6.8076171875, -6.091796875, -5.3759765625, -4.66015625, -3.9443359375, -3.228515625, -2.5126953125, -1.796875, -1.0810546875, -0.365234375, 0.3505859375, 1.06640625, 1.7822265625, 2.498046875, 3.2138671875, 3.9296875, 4.6455078125, 5.361328125, 6.0771484375, 6.79296875, 7.5087890625, 8.224609375, 8.9404296875, 9.65625, 10.3720703125, 11.087890625, 11.8037109375, 12.51953125, 13.2353515625, 13.951171875, 14.6669921875, 15.3828125, 16.0986328125, 16.814453125, 17.5302734375, 18.24609375, 18.9619140625, 19.677734375, 20.3935546875, 21.109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 8.0, 10.0, 9.0, 18.0, 11.0, 17.0, 16.0, 25.0, 28.0, 38.0, 44.0, 58.0, 56.0, 75.0, 70.0, 85.0, 68.0, 57.0, 44.0, 35.0, 27.0, 30.0, 25.0, 16.0, 23.0, 21.0, 7.0, 13.0, 10.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00864410400390625, -0.008378744125366211, -0.008113384246826172, -0.007848024368286133, -0.007582664489746094, -0.007317304611206055, -0.007051944732666016, -0.0067865848541259766, -0.0065212249755859375, -0.0062558650970458984, -0.005990505218505859, -0.00572514533996582, -0.005459785461425781, -0.005194425582885742, -0.004929065704345703, -0.004663705825805664, -0.004398345947265625, -0.004132986068725586, -0.003867626190185547, -0.003602266311645508, -0.0033369064331054688, -0.0030715465545654297, -0.0028061866760253906, -0.0025408267974853516, -0.0022754669189453125, -0.0020101070404052734, -0.0017447471618652344, -0.0014793872833251953, -0.0012140274047851562, -0.0009486675262451172, -0.0006833076477050781, -0.00041794776916503906, -0.000152587890625, 0.00011277198791503906, 0.0003781318664550781, 0.0006434917449951172, 0.0009088516235351562, 0.0011742115020751953, 0.0014395713806152344, 0.0017049312591552734, 0.0019702911376953125, 0.0022356510162353516, 0.0025010108947753906, 0.0027663707733154297, 0.0030317306518554688, 0.003297090530395508, 0.003562450408935547, 0.003827810287475586, 0.004093170166015625, 0.004358530044555664, 0.004623889923095703, 0.004889249801635742, 0.005154609680175781, 0.00541996955871582, 0.005685329437255859, 0.0059506893157958984, 0.0062160491943359375, 0.0064814090728759766, 0.006746768951416016, 0.007012128829956055, 0.007277488708496094, 0.007542848587036133, 0.007808208465576172, 0.008073568344116211, 0.00833892822265625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 7.0, 11.0, 12.0, 21.0, 29.0, 35.0, 72.0, 71.0, 110.0, 205.0, 384.0, 868.0, 2702.0, 14756.0, 156763.0, 777730.0, 82181.0, 9172.0, 1858.0, 658.0, 330.0, 186.0, 112.0, 79.0, 61.0, 30.0, 35.0, 25.0, 11.0, 5.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.12396240234375, -0.12035655975341797, -0.11675071716308594, -0.1131448745727539, -0.10953903198242188, -0.10593318939208984, -0.10232734680175781, -0.09872150421142578, -0.09511566162109375, -0.09150981903076172, -0.08790397644042969, -0.08429813385009766, -0.08069229125976562, -0.0770864486694336, -0.07348060607910156, -0.06987476348876953, -0.0662689208984375, -0.06266307830810547, -0.05905723571777344, -0.055451393127441406, -0.051845550537109375, -0.048239707946777344, -0.04463386535644531, -0.04102802276611328, -0.03742218017578125, -0.03381633758544922, -0.030210494995117188, -0.026604652404785156, -0.022998809814453125, -0.019392967224121094, -0.015787124633789062, -0.012181282043457031, -0.008575439453125, -0.004969596862792969, -0.0013637542724609375, 0.0022420883178710938, 0.005847930908203125, 0.009453773498535156, 0.013059616088867188, 0.01666545867919922, 0.02027130126953125, 0.02387714385986328, 0.027482986450195312, 0.031088829040527344, 0.034694671630859375, 0.038300514221191406, 0.04190635681152344, 0.04551219940185547, 0.0491180419921875, 0.05272388458251953, 0.05632972717285156, 0.059935569763183594, 0.06354141235351562, 0.06714725494384766, 0.07075309753417969, 0.07435894012451172, 0.07796478271484375, 0.08157062530517578, 0.08517646789550781, 0.08878231048583984, 0.09238815307617188, 0.0959939956665039, 0.09959983825683594, 0.10320568084716797, 0.1068115234375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 19.0, 71.0, 203.0, 365.0, 236.0, 78.0, 29.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009550882503390312, -0.008557799272239208, -0.007564716041088104, -0.006571632809937, -0.005578549578785896, -0.004585466347634792, -0.0035923831164836884, -0.0025992998853325844, -0.0016062166541814804, -0.0006131334230303764, 0.00037994980812072754, 0.0013730330392718315, 0.0023661162704229355, 0.0033591995015740395, 0.004352282732725143, 0.005345365963876247, 0.006338449195027351, 0.007331532426178455, 0.00832461565732956, 0.009317698888480663, 0.010310782119631767, 0.011303865350782871, 0.012296948581933975, 0.01329003181308508, 0.014283115044236183, 0.015276198275387287, 0.01626928150653839, 0.01726236566901207, 0.0182554479688406, 0.01924853026866913, 0.020241614431142807, 0.021234698593616486, 0.022227782756090164, 0.023220866918563843, 0.024213949218392372, 0.0252070315182209, 0.02620011568069458, 0.02719319984316826, 0.028186282142996788, 0.029179364442825317, 0.030172448605298996, 0.031165532767772675, 0.032158613204956055, 0.03315169736742973, 0.03414478152990341, 0.03513786569237709, 0.03613094985485077, 0.03712403029203415, 0.03811711445450783, 0.039110198616981506, 0.040103279054164886, 0.041096363216638565, 0.042089447379112244, 0.04308253154158592, 0.0440756157040596, 0.04506869614124298, 0.04606178030371666, 0.04705486446619034, 0.04804794490337372, 0.0490410290658474, 0.050034113228321075, 0.051027197390794754, 0.05202028155326843, 0.05301336199045181, 0.05400644615292549]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 9.0, 12.0, 10.0, 11.0, 18.0, 19.0, 17.0, 33.0, 20.0, 37.0, 40.0, 34.0, 34.0, 40.0, 31.0, 45.0, 49.0, 38.0, 47.0, 49.0, 35.0, 39.0, 39.0, 36.0, 38.0, 33.0, 27.0, 31.0, 17.0, 25.0, 14.0, 12.0, 14.0, 12.0, 9.0, 8.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004798293113708496, -0.004652886651456356, -0.004507480189204216, -0.004362073726952076, -0.004216667264699936, -0.004071260802447796, -0.003925854340195656, -0.0037804478779435158, -0.0036350414156913757, -0.0034896349534392357, -0.0033442284911870956, -0.0031988220289349556, -0.0030534155666828156, -0.0029080091044306755, -0.0027626026421785355, -0.0026171961799263954, -0.0024717897176742554, -0.0023263832554221153, -0.0021809767931699753, -0.0020355703309178352, -0.0018901638686656952, -0.0017447574064135551, -0.001599350944161415, -0.001453944481909275, -0.001308538019657135, -0.001163131557404995, -0.001017725095152855, -0.0008723186329007149, -0.0007269121706485748, -0.0005815057083964348, -0.00043609924614429474, -0.0002906927838921547, -0.00014528632164001465, 1.2014061212539673e-07, 0.00014552660286426544, 0.0002909330651164055, 0.00043633952736854553, 0.0005817459896206856, 0.0007271524518728256, 0.0008725589141249657, 0.0010179653763771057, 0.0011633718386292458, 0.0013087783008813858, 0.0014541847631335258, 0.001599591225385666, 0.001744997687637806, 0.001890404149889946, 0.002035810612142086, 0.002181217074394226, 0.002326623536646366, 0.002472029998898506, 0.002617436461150646, 0.0027628429234027863, 0.0029082493856549263, 0.0030536558479070663, 0.0031990623101592064, 0.0033444687724113464, 0.0034898752346634865, 0.0036352816969156265, 0.0037806881591677666, 0.003926094621419907, 0.004071501083672047, 0.004216907545924187, 0.004362314008176327, 0.004507720470428467]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 5.0, 9.0, 6.0, 7.0, 12.0, 10.0, 11.0, 22.0, 19.0, 29.0, 31.0, 30.0, 27.0, 37.0, 50.0, 45.0, 49.0, 36.0, 41.0, 41.0, 38.0, 41.0, 37.0, 35.0, 41.0, 31.0, 25.0, 43.0, 28.0, 18.0, 22.0, 23.0, 17.0, 14.0, 14.0, 11.0, 7.0, 5.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-96.0625, -93.0166015625, -89.970703125, -86.9248046875, -83.87890625, -80.8330078125, -77.787109375, -74.7412109375, -71.6953125, -68.6494140625, -65.603515625, -62.5576171875, -59.51171875, -56.4658203125, -53.419921875, -50.3740234375, -47.328125, -44.2822265625, -41.236328125, -38.1904296875, -35.14453125, -32.0986328125, -29.052734375, -26.0068359375, -22.9609375, -19.9150390625, -16.869140625, -13.8232421875, -10.77734375, -7.7314453125, -4.685546875, -1.6396484375, 1.40625, 4.4521484375, 7.498046875, 10.5439453125, 13.58984375, 16.6357421875, 19.681640625, 22.7275390625, 25.7734375, 28.8193359375, 31.865234375, 34.9111328125, 37.95703125, 41.0029296875, 44.048828125, 47.0947265625, 50.140625, 53.1865234375, 56.232421875, 59.2783203125, 62.32421875, 65.3701171875, 68.416015625, 71.4619140625, 74.5078125, 77.5537109375, 80.599609375, 83.6455078125, 86.69140625, 89.7373046875, 92.783203125, 95.8291015625, 98.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 7.0, 7.0, 14.0, 23.0, 28.0, 26.0, 41.0, 40.0, 79.0, 132.0, 200.0, 356.0, 538.0, 1065.0, 2083.0, 4511.0, 11422.0, 41681.0, 273248.0, 586643.0, 93733.0, 19530.0, 6642.0, 2977.0, 1515.0, 761.0, 455.0, 263.0, 162.0, 117.0, 70.0, 33.0, 37.0, 23.0, 25.0, 15.0, 12.0, 6.0, 5.0, 4.0, 6.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-31.34375, -30.42822265625, -29.5126953125, -28.59716796875, -27.681640625, -26.76611328125, -25.8505859375, -24.93505859375, -24.01953125, -23.10400390625, -22.1884765625, -21.27294921875, -20.357421875, -19.44189453125, -18.5263671875, -17.61083984375, -16.6953125, -15.77978515625, -14.8642578125, -13.94873046875, -13.033203125, -12.11767578125, -11.2021484375, -10.28662109375, -9.37109375, -8.45556640625, -7.5400390625, -6.62451171875, -5.708984375, -4.79345703125, -3.8779296875, -2.96240234375, -2.046875, -1.13134765625, -0.2158203125, 0.69970703125, 1.615234375, 2.53076171875, 3.4462890625, 4.36181640625, 5.27734375, 6.19287109375, 7.1083984375, 8.02392578125, 8.939453125, 9.85498046875, 10.7705078125, 11.68603515625, 12.6015625, 13.51708984375, 14.4326171875, 15.34814453125, 16.263671875, 17.17919921875, 18.0947265625, 19.01025390625, 19.92578125, 20.84130859375, 21.7568359375, 22.67236328125, 23.587890625, 24.50341796875, 25.4189453125, 26.33447265625, 27.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 10.0, 12.0, 15.0, 8.0, 12.0, 24.0, 28.0, 26.0, 40.0, 33.0, 47.0, 54.0, 65.0, 48.0, 2090.0, 109.0, 70.0, 42.0, 43.0, 43.0, 54.0, 40.0, 27.0, 32.0, 12.0, 9.0, 12.0, 13.0, 3.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-244.0, -237.544921875, -231.08984375, -224.634765625, -218.1796875, -211.724609375, -205.26953125, -198.814453125, -192.359375, -185.904296875, -179.44921875, -172.994140625, -166.5390625, -160.083984375, -153.62890625, -147.173828125, -140.71875, -134.263671875, -127.80859375, -121.353515625, -114.8984375, -108.443359375, -101.98828125, -95.533203125, -89.078125, -82.623046875, -76.16796875, -69.712890625, -63.2578125, -56.802734375, -50.34765625, -43.892578125, -37.4375, -30.982421875, -24.52734375, -18.072265625, -11.6171875, -5.162109375, 1.29296875, 7.748046875, 14.203125, 20.658203125, 27.11328125, 33.568359375, 40.0234375, 46.478515625, 52.93359375, 59.388671875, 65.84375, 72.298828125, 78.75390625, 85.208984375, 91.6640625, 98.119140625, 104.57421875, 111.029296875, 117.484375, 123.939453125, 130.39453125, 136.849609375, 143.3046875, 149.759765625, 156.21484375, 162.669921875, 169.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 13.0, 12.0, 16.0, 20.0, 26.0, 55.0, 40.0, 89.0, 115.0, 207.0, 282.0, 482.0, 820.0, 2079.0, 9019.0, 114275.0, 2928803.0, 78086.0, 7400.0, 1795.0, 756.0, 420.0, 275.0, 177.0, 135.0, 78.0, 63.0, 33.0, 30.0, 33.0, 16.0, 16.0, 7.0, 4.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.40625, -47.88330078125, -46.3603515625, -44.83740234375, -43.314453125, -41.79150390625, -40.2685546875, -38.74560546875, -37.22265625, -35.69970703125, -34.1767578125, -32.65380859375, -31.130859375, -29.60791015625, -28.0849609375, -26.56201171875, -25.0390625, -23.51611328125, -21.9931640625, -20.47021484375, -18.947265625, -17.42431640625, -15.9013671875, -14.37841796875, -12.85546875, -11.33251953125, -9.8095703125, -8.28662109375, -6.763671875, -5.24072265625, -3.7177734375, -2.19482421875, -0.671875, 0.85107421875, 2.3740234375, 3.89697265625, 5.419921875, 6.94287109375, 8.4658203125, 9.98876953125, 11.51171875, 13.03466796875, 14.5576171875, 16.08056640625, 17.603515625, 19.12646484375, 20.6494140625, 22.17236328125, 23.6953125, 25.21826171875, 26.7412109375, 28.26416015625, 29.787109375, 31.31005859375, 32.8330078125, 34.35595703125, 35.87890625, 37.40185546875, 38.9248046875, 40.44775390625, 41.970703125, 43.49365234375, 45.0166015625, 46.53955078125, 48.0625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 7.0, 18.0, 45.0, 128.0, 426.0, 303.0, 56.0, 16.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1186.9801025390625, -1163.1593017578125, -1139.3385009765625, -1115.517578125, -1091.69677734375, -1067.8759765625, -1044.05517578125, -1020.234375, -996.41357421875, -972.5927734375, -948.7719116210938, -924.9511108398438, -901.1303100585938, -877.3094482421875, -853.4886474609375, -829.6678466796875, -805.8469848632812, -782.0261840820312, -758.205322265625, -734.384521484375, -710.563720703125, -686.742919921875, -662.9220581054688, -639.1012573242188, -615.2803955078125, -591.4595947265625, -567.6387329101562, -543.8179321289062, -519.9971313476562, -496.1763000488281, -472.35546875, -448.53466796875, -424.71380615234375, -400.8929748535156, -377.0721740722656, -353.2513427734375, -329.4305419921875, -305.6097106933594, -281.78887939453125, -257.96807861328125, -234.14724731445312, -210.32643127441406, -186.505615234375, -162.68478393554688, -138.8639678955078, -115.04315185546875, -91.22232055664062, -67.40150451660156, -43.5806884765625, -19.759868621826172, 4.060951232910156, 27.88177490234375, 51.70259094238281, 75.52340698242188, 99.34423828125, 123.16505432128906, 146.98587036132812, 170.8066864013672, 194.62750244140625, 218.44833374023438, 242.26914978027344, 266.0899658203125, 289.9107971191406, 313.73162841796875, 337.55242919921875]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 1.0, 7.0, 7.0, 10.0, 18.0, 7.0, 18.0, 28.0, 20.0, 30.0, 44.0, 39.0, 40.0, 46.0, 48.0, 51.0, 70.0, 48.0, 54.0, 50.0, 60.0, 41.0, 43.0, 28.0, 40.0, 36.0, 22.0, 16.0, 20.0, 14.0, 10.0, 6.0, 2.0, 5.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-212.32843017578125, -204.2517852783203, -196.17515563964844, -188.0985107421875, -180.02188110351562, -171.9452362060547, -163.86859130859375, -155.79196166992188, -147.71531677246094, -139.638671875, -131.56204223632812, -123.48539733886719, -115.40876007080078, -107.33212280273438, -99.25547790527344, -91.17884063720703, -83.10220336914062, -75.02556610107422, -66.94892883300781, -58.872283935546875, -50.79564666748047, -42.71900939941406, -34.64236831665039, -26.56572723388672, -18.489089965820312, -10.412450790405273, -2.3358116149902344, 5.740827560424805, 13.817466735839844, 21.89410400390625, 29.970745086669922, 38.047386169433594, 46.123992919921875, 54.20063018798828, 62.27727127075195, 70.35391235351562, 78.43054962158203, 86.50718688964844, 94.58383178710938, 102.66046905517578, 110.73710632324219, 118.8137435913086, 126.890380859375, 134.96702575683594, 143.04367065429688, 151.12030029296875, 159.1969451904297, 167.27359008789062, 175.3502197265625, 183.42686462402344, 191.5034942626953, 199.58013916015625, 207.65676879882812, 215.73341369628906, 223.81005859375, 231.88668823242188, 239.9633331298828, 248.03997802734375, 256.1166076660156, 264.1932373046875, 272.2698974609375, 280.3465270996094, 288.42315673828125, 296.49981689453125, 304.5764465332031]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 13.0, 10.0, 13.0, 27.0, 23.0, 26.0, 53.0, 59.0, 73.0, 112.0, 153.0, 182.0, 274.0, 357.0, 525.0, 689.0, 845.0, 948.0, 1040353.0, 881.0, 735.0, 550.0, 446.0, 299.0, 220.0, 161.0, 136.0, 94.0, 82.0, 51.0, 40.0, 29.0, 21.0, 9.0, 16.0, 10.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.965755462646484, -57.98029327392578, -55.99482727050781, -54.00936508178711, -52.02389907836914, -50.03843688964844, -48.05297088623047, -46.067508697509766, -44.08204650878906, -42.09658432006836, -40.11111831665039, -38.12565612792969, -36.14019012451172, -34.154727935791016, -32.16926574707031, -30.183799743652344, -28.198333740234375, -26.21286964416504, -24.227405548095703, -22.241943359375, -20.25647735595703, -18.271015167236328, -16.285551071166992, -14.300086975097656, -12.31462287902832, -10.329158782958984, -8.343694686889648, -6.358231544494629, -4.372767448425293, -2.387303352355957, -0.4018402099609375, 1.5836238861083984, 3.569091796875, 5.554555892944336, 7.540019512176514, 9.525483131408691, 11.510947227478027, 13.496411323547363, 15.481874465942383, 17.46733856201172, 19.452802658081055, 21.43826675415039, 23.423730850219727, 25.409194946289062, 27.394657135009766, 29.380123138427734, 31.365585327148438, 33.351051330566406, 35.33651351928711, 37.32197570800781, 39.30744171142578, 41.292903900146484, 43.27836990356445, 45.263832092285156, 47.249298095703125, 49.23476028442383, 51.22022247314453, 53.205684661865234, 55.1911506652832, 57.176612854003906, 59.162078857421875, 61.14754104614258, 63.13300323486328, 65.11846923828125, 67.10393524169922]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 0.0, 4.0, 6.0, 6.0, 8.0, 2.0, 7.0, 22.0, 44.0, 142.0, 51461428.0, 1325.0, 59.0, 15.0, 15.0, 16.0, 8.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6288.0, -5986.9443359375, -5685.888671875, -5384.8330078125, -5083.77734375, -4782.7216796875, -4481.666015625, -4180.6103515625, -3879.5546875, -3578.4990234375, -3277.443359375, -2976.3876953125, -2675.33203125, -2374.2763671875, -2073.220703125, -1772.1650390625, -1471.109375, -1170.0537109375, -868.998046875, -567.9423828125, -266.88671875, 34.1689453125, 335.224609375, 636.2802734375, 937.3359375, 1238.3916015625, 1539.447265625, 1840.5029296875, 2141.55859375, 2442.6142578125, 2743.669921875, 3044.7255859375, 3345.7822265625, 3646.837890625, 3947.8935546875, 4248.94921875, 4550.0048828125, 4851.060546875, 5152.1162109375, 5453.171875, 5754.2275390625, 6055.283203125, 6356.3388671875, 6657.39453125, 6958.4501953125, 7259.505859375, 7560.5615234375, 7861.6171875, 8162.6728515625, 8463.728515625, 8764.7841796875, 9065.83984375, 9366.8955078125, 9667.951171875, 9969.0068359375, 10270.0625, 10571.1181640625, 10872.173828125, 11173.2294921875, 11474.28515625, 11775.3408203125, 12076.396484375, 12377.4521484375, 12678.5078125, 12979.5634765625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [4.0, 4.0, 7.0, 7.0, 14.0, 21.0, 31.0, 40.0, 70.0, 95.0, 136.0, 188.0, 286.0, 403.0, 522.0, 841.0, 1224.0, 1700.0, 2390.0, 3346.0, 4904.0, 7078.0, 10051.0, 14957.0, 22236.0, 32375.0, 47943.0, 71490.0, 109060.0, 174054.0, 305371.0, 1122901.0, 3434972.0, 361578.0, 194373.0, 122357.0, 79121.0, 52685.0, 35506.0, 23627.0, 16409.0, 11451.0, 7963.0, 5329.0, 3788.0, 2544.0, 1758.0, 1253.0, 864.0, 642.0, 456.0, 301.0, 234.0, 157.0, 89.0, 84.0, 66.0, 41.0, 21.0, 13.0, 7.0, 6.0, 7.0, 5.0], "bins": [-8.5625, -8.2958984375, -8.029296875, -7.7626953125, -7.49609375, -7.2294921875, -6.962890625, -6.6962890625, -6.4296875, -6.1630859375, -5.896484375, -5.6298828125, -5.36328125, -5.0966796875, -4.830078125, -4.5634765625, -4.296875, -4.0302734375, -3.763671875, -3.4970703125, -3.23046875, -2.9638671875, -2.697265625, -2.4306640625, -2.1640625, -1.8974609375, -1.630859375, -1.3642578125, -1.09765625, -0.8310546875, -0.564453125, -0.2978515625, -0.03125, 0.2353515625, 0.501953125, 0.7685546875, 1.03515625, 1.3017578125, 1.568359375, 1.8349609375, 2.1015625, 2.3681640625, 2.634765625, 2.9013671875, 3.16796875, 3.4345703125, 3.701171875, 3.9677734375, 4.234375, 4.5009765625, 4.767578125, 5.0341796875, 5.30078125, 5.5673828125, 5.833984375, 6.1005859375, 6.3671875, 6.6337890625, 6.900390625, 7.1669921875, 7.43359375, 7.7001953125, 7.966796875, 8.2333984375, 8.5]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 12.0, 10.0, 10.0, 9.0, 10.0, 18.0, 17.0, 23.0, 29.0, 26.0, 29.0, 38.0, 46.0, 38.0, 37.0, 41.0, 78.0, 216.0, 652.0, 191.0, 60.0, 64.0, 40.0, 32.0, 37.0, 26.0, 28.0, 19.0, 21.0, 22.0, 19.0, 23.0, 20.0, 13.0, 12.0, 11.0, 3.0, 7.0, 4.0, 7.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.140625, -20.488525390625, -19.83642578125, -19.184326171875, -18.5322265625, -17.880126953125, -17.22802734375, -16.575927734375, -15.923828125, -15.271728515625, -14.61962890625, -13.967529296875, -13.3154296875, -12.663330078125, -12.01123046875, -11.359130859375, -10.70703125, -10.054931640625, -9.40283203125, -8.750732421875, -8.0986328125, -7.446533203125, -6.79443359375, -6.142333984375, -5.490234375, -4.838134765625, -4.18603515625, -3.533935546875, -2.8818359375, -2.229736328125, -1.57763671875, -0.925537109375, -0.2734375, 0.378662109375, 1.03076171875, 1.682861328125, 2.3349609375, 2.987060546875, 3.63916015625, 4.291259765625, 4.943359375, 5.595458984375, 6.24755859375, 6.899658203125, 7.5517578125, 8.203857421875, 8.85595703125, 9.508056640625, 10.16015625, 10.812255859375, 11.46435546875, 12.116455078125, 12.7685546875, 13.420654296875, 14.07275390625, 14.724853515625, 15.376953125, 16.029052734375, 16.68115234375, 17.333251953125, 17.9853515625, 18.637451171875, 19.28955078125, 19.941650390625, 20.59375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 7.0, 2.0, 17.0, 20.0, 23.0, 22.0, 44.0, 93.0, 125.0, 176.0, 337.0, 420.0, 576.0, 974.0, 1446.0, 2467.0, 4102.0, 6456.0, 10836.0, 18972.0, 33625.0, 61865.0, 120152.0, 259712.0, 885277.0, 4110713.0, 413777.0, 169695.0, 83835.0, 45195.0, 24566.0, 13957.0, 8548.0, 4934.0, 2953.0, 1938.0, 1339.0, 831.0, 441.0, 327.0, 204.0, 124.0, 72.0, 84.0, 37.0, 47.0, 31.0, 15.0, 14.0, 6.0, 1.0, 5.0, 0.0, 3.0, 0.0, 3.0], "bins": [-13.8359375, -13.419677734375, -13.00341796875, -12.587158203125, -12.1708984375, -11.754638671875, -11.33837890625, -10.922119140625, -10.505859375, -10.089599609375, -9.67333984375, -9.257080078125, -8.8408203125, -8.424560546875, -8.00830078125, -7.592041015625, -7.17578125, -6.759521484375, -6.34326171875, -5.927001953125, -5.5107421875, -5.094482421875, -4.67822265625, -4.261962890625, -3.845703125, -3.429443359375, -3.01318359375, -2.596923828125, -2.1806640625, -1.764404296875, -1.34814453125, -0.931884765625, -0.515625, -0.099365234375, 0.31689453125, 0.733154296875, 1.1494140625, 1.565673828125, 1.98193359375, 2.398193359375, 2.814453125, 3.230712890625, 3.64697265625, 4.063232421875, 4.4794921875, 4.895751953125, 5.31201171875, 5.728271484375, 6.14453125, 6.560791015625, 6.97705078125, 7.393310546875, 7.8095703125, 8.225830078125, 8.64208984375, 9.058349609375, 9.474609375, 9.890869140625, 10.30712890625, 10.723388671875, 11.1396484375, 11.555908203125, 11.97216796875, 12.388427734375, 12.8046875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 9.0, 8.0, 8.0, 17.0, 19.0, 22.0, 17.0, 25.0, 30.0, 35.0, 47.0, 56.0, 50.0, 59.0, 79.0, 170.0, 605.0, 253.0, 109.0, 61.0, 50.0, 42.0, 36.0, 39.0, 21.0, 22.0, 27.0, 19.0, 18.0, 13.0, 14.0, 13.0, 11.0, 4.0, 7.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.630126953125, -15.10400390625, -14.577880859375, -14.0517578125, -13.525634765625, -12.99951171875, -12.473388671875, -11.947265625, -11.421142578125, -10.89501953125, -10.368896484375, -9.8427734375, -9.316650390625, -8.79052734375, -8.264404296875, -7.73828125, -7.212158203125, -6.68603515625, -6.159912109375, -5.6337890625, -5.107666015625, -4.58154296875, -4.055419921875, -3.529296875, -3.003173828125, -2.47705078125, -1.950927734375, -1.4248046875, -0.898681640625, -0.37255859375, 0.153564453125, 0.6796875, 1.205810546875, 1.73193359375, 2.258056640625, 2.7841796875, 3.310302734375, 3.83642578125, 4.362548828125, 4.888671875, 5.414794921875, 5.94091796875, 6.467041015625, 6.9931640625, 7.519287109375, 8.04541015625, 8.571533203125, 9.09765625, 9.623779296875, 10.14990234375, 10.676025390625, 11.2021484375, 11.728271484375, 12.25439453125, 12.780517578125, 13.306640625, 13.832763671875, 14.35888671875, 14.885009765625, 15.4111328125, 15.937255859375, 16.46337890625, 16.989501953125, 17.515625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 12.0, 3.0, 12.0, 16.0, 18.0, 22.0, 28.0, 19.0, 39.0, 42.0, 46.0, 76.0, 113.0, 122.0, 205.0, 253.0, 280.0, 415.0, 566.0, 791.0, 1054.0, 1555.0, 2346.0, 3799.0, 7346.0, 14896.0, 36948.0, 152924.0, 5922392.0, 89500.0, 27235.0, 11651.0, 5978.0, 3518.0, 2190.0, 1354.0, 964.0, 698.0, 470.0, 317.0, 264.0, 209.0, 176.0, 153.0, 94.0, 84.0, 63.0, 63.0, 30.0, 10.0, 22.0, 18.0, 5.0, 8.0, 5.0, 15.0, 8.0, 4.0, 0.0, 6.0], "bins": [-29.6875, -28.769775390625, -27.85205078125, -26.934326171875, -26.0166015625, -25.098876953125, -24.18115234375, -23.263427734375, -22.345703125, -21.427978515625, -20.51025390625, -19.592529296875, -18.6748046875, -17.757080078125, -16.83935546875, -15.921630859375, -15.00390625, -14.086181640625, -13.16845703125, -12.250732421875, -11.3330078125, -10.415283203125, -9.49755859375, -8.579833984375, -7.662109375, -6.744384765625, -5.82666015625, -4.908935546875, -3.9912109375, -3.073486328125, -2.15576171875, -1.238037109375, -0.3203125, 0.597412109375, 1.51513671875, 2.432861328125, 3.3505859375, 4.268310546875, 5.18603515625, 6.103759765625, 7.021484375, 7.939208984375, 8.85693359375, 9.774658203125, 10.6923828125, 11.610107421875, 12.52783203125, 13.445556640625, 14.36328125, 15.281005859375, 16.19873046875, 17.116455078125, 18.0341796875, 18.951904296875, 19.86962890625, 20.787353515625, 21.705078125, 22.622802734375, 23.54052734375, 24.458251953125, 25.3759765625, 26.293701171875, 27.21142578125, 28.129150390625, 29.046875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 4.0, 7.0, 5.0, 7.0, 7.0, 11.0, 9.0, 16.0, 9.0, 15.0, 20.0, 22.0, 20.0, 38.0, 47.0, 41.0, 43.0, 64.0, 64.0, 111.0, 264.0, 507.0, 157.0, 108.0, 65.0, 48.0, 36.0, 40.0, 30.0, 30.0, 13.0, 28.0, 25.0, 13.0, 15.0, 18.0, 19.0, 13.0, 8.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.234375, -9.91748046875, -9.6005859375, -9.28369140625, -8.966796875, -8.64990234375, -8.3330078125, -8.01611328125, -7.69921875, -7.38232421875, -7.0654296875, -6.74853515625, -6.431640625, -6.11474609375, -5.7978515625, -5.48095703125, -5.1640625, -4.84716796875, -4.5302734375, -4.21337890625, -3.896484375, -3.57958984375, -3.2626953125, -2.94580078125, -2.62890625, -2.31201171875, -1.9951171875, -1.67822265625, -1.361328125, -1.04443359375, -0.7275390625, -0.41064453125, -0.09375, 0.22314453125, 0.5400390625, 0.85693359375, 1.173828125, 1.49072265625, 1.8076171875, 2.12451171875, 2.44140625, 2.75830078125, 3.0751953125, 3.39208984375, 3.708984375, 4.02587890625, 4.3427734375, 4.65966796875, 4.9765625, 5.29345703125, 5.6103515625, 5.92724609375, 6.244140625, 6.56103515625, 6.8779296875, 7.19482421875, 7.51171875, 7.82861328125, 8.1455078125, 8.46240234375, 8.779296875, 9.09619140625, 9.4130859375, 9.72998046875, 10.046875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 4.0, 8.0, 12.0, 9.0, 22.0, 37.0, 44.0, 97.0, 244.0, 234.0, 114.0, 55.0, 43.0, 19.0, 14.0, 10.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.19587516784668, -23.298669815063477, -22.40146255493164, -21.504257202148438, -20.607051849365234, -19.7098445892334, -18.812639236450195, -17.91543197631836, -17.018226623535156, -16.121021270751953, -15.223814010620117, -14.326608657836914, -13.429402351379395, -12.532196044921875, -11.634990692138672, -10.737784385681152, -9.840578079223633, -8.943371772766113, -8.046165466308594, -7.148960113525391, -6.251753807067871, -5.354547500610352, -4.45734167098999, -3.560135841369629, -2.6629295349121094, -1.765723466873169, -0.8685173988342285, 0.028688669204711914, 0.9258947372436523, 1.8231010437011719, 2.720306873321533, 3.6175127029418945, 4.514717102050781, 5.411923408508301, 6.309129238128662, 7.206335067749023, 8.103541374206543, 9.000747680664062, 9.897953033447266, 10.795159339904785, 11.692365646362305, 12.589571952819824, 13.486778259277344, 14.383983612060547, 15.281189918518066, 16.178396224975586, 17.07560157775879, 17.972808837890625, 18.870014190673828, 19.76721954345703, 20.664426803588867, 21.56163215637207, 22.458839416503906, 23.35604476928711, 24.253250122070312, 25.150455474853516, 26.04766273498535, 26.944868087768555, 27.84207534790039, 28.739280700683594, 29.636486053466797, 30.533693313598633, 31.430898666381836, 32.32810592651367, 33.225311279296875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 5.0, 10.0, 13.0, 7.0, 16.0, 16.0, 12.0, 13.0, 15.0, 22.0, 30.0, 26.0, 32.0, 29.0, 16.0, 40.0, 28.0, 37.0, 34.0, 34.0, 36.0, 31.0, 29.0, 34.0, 40.0, 38.0, 40.0, 27.0, 39.0, 32.0, 27.0, 17.0, 11.0, 18.0, 17.0, 16.0, 11.0, 14.0, 10.0, 12.0, 11.0, 7.0, 8.0, 6.0, 3.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0], "bins": [-12.512365341186523, -12.137743949890137, -11.763121604919434, -11.388500213623047, -11.01387882232666, -10.639257431030273, -10.26463508605957, -9.890013694763184, -9.515392303466797, -9.14077091217041, -8.766148567199707, -8.39152717590332, -8.016905784606934, -7.642283916473389, -7.267662048339844, -6.893040657043457, -6.518418788909912, -6.143796920776367, -5.7691755294799805, -5.3945536613464355, -5.019932270050049, -4.645310401916504, -4.270689010620117, -3.8960671424865723, -3.5214455127716064, -3.1468238830566406, -2.772202253341675, -2.397580623626709, -2.022958755493164, -1.6483372449874878, -1.2737154960632324, -0.8990938663482666, -0.5244722366333008, -0.14985057711601257, 0.22477108240127563, 0.5993927717208862, 0.974014401435852, 1.3486360311508179, 1.7232577800750732, 2.097879409790039, 2.472501039505005, 2.8471226692199707, 3.2217442989349365, 3.5963659286499023, 3.9709877967834473, 4.345609188079834, 4.720231056213379, 5.094852447509766, 5.4694743156433105, 5.8440961837768555, 6.218717575073242, 6.593339443206787, 6.967960834503174, 7.342582702636719, 7.7172040939331055, 8.091825485229492, 8.466447830200195, 8.841069221496582, 9.215691566467285, 9.590312957763672, 9.964934349060059, 10.339555740356445, 10.714178085327148, 11.088799476623535, 11.463420867919922]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 0.0, 7.0, 2.0, 4.0, 10.0, 14.0, 8.0, 14.0, 22.0, 27.0, 36.0, 43.0, 60.0, 95.0, 125.0, 156.0, 226.0, 305.0, 492.0, 739.0, 1155.0, 2022.0, 3751.0, 8359.0, 26049.0, 4082613.0, 45196.0, 11016.0, 4848.0, 2502.0, 1447.0, 914.0, 655.0, 440.0, 263.0, 198.0, 139.0, 78.0, 71.0, 46.0, 22.0, 25.0, 18.0, 20.0, 8.0, 16.0, 3.0, 11.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0], "bins": [-0.037841796875, -0.03678178787231445, -0.035721778869628906, -0.03466176986694336, -0.03360176086425781, -0.032541751861572266, -0.03148174285888672, -0.030421733856201172, -0.029361724853515625, -0.028301715850830078, -0.02724170684814453, -0.026181697845458984, -0.025121688842773438, -0.02406167984008789, -0.023001670837402344, -0.021941661834716797, -0.02088165283203125, -0.019821643829345703, -0.018761634826660156, -0.01770162582397461, -0.016641616821289062, -0.015581607818603516, -0.014521598815917969, -0.013461589813232422, -0.012401580810546875, -0.011341571807861328, -0.010281562805175781, -0.009221553802490234, -0.008161544799804688, -0.007101535797119141, -0.006041526794433594, -0.004981517791748047, -0.0039215087890625, -0.002861499786376953, -0.0018014907836914062, -0.0007414817810058594, 0.0003185272216796875, 0.0013785362243652344, 0.0024385452270507812, 0.003498554229736328, 0.004558563232421875, 0.005618572235107422, 0.006678581237792969, 0.007738590240478516, 0.008798599243164062, 0.00985860824584961, 0.010918617248535156, 0.011978626251220703, 0.01303863525390625, 0.014098644256591797, 0.015158653259277344, 0.01621866226196289, 0.017278671264648438, 0.018338680267333984, 0.01939868927001953, 0.020458698272705078, 0.021518707275390625, 0.022578716278076172, 0.02363872528076172, 0.024698734283447266, 0.025758743286132812, 0.02681875228881836, 0.027878761291503906, 0.028938770294189453, 0.029998779296875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 3.0, 3.0, 9.0, 9.0, 7.0, 7.0, 12.0, 7.0, 12.0, 11.0, 21.0, 769.0, 19.0, 21.0, 9.0, 5.0, 11.0, 9.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 5.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0026092529296875, -0.002535790205001831, -0.002462327480316162, -0.002388864755630493, -0.0023154020309448242, -0.0022419393062591553, -0.0021684765815734863, -0.0020950138568878174, -0.0020215511322021484, -0.0019480884075164795, -0.0018746256828308105, -0.0018011629581451416, -0.0017277002334594727, -0.0016542375087738037, -0.0015807747840881348, -0.0015073120594024658, -0.0014338493347167969, -0.001360386610031128, -0.001286923885345459, -0.00121346116065979, -0.001139998435974121, -0.0010665357112884521, -0.0009930729866027832, -0.0009196102619171143, -0.0008461475372314453, -0.0007726848125457764, -0.0006992220878601074, -0.0006257593631744385, -0.0005522966384887695, -0.0004788339138031006, -0.00040537118911743164, -0.0003319084644317627, -0.00025844573974609375, -0.0001849830150604248, -0.00011152029037475586, -3.8057565689086914e-05, 3.540515899658203e-05, 0.00010886788368225098, 0.00018233060836791992, 0.00025579333305358887, 0.0003292560577392578, 0.00040271878242492676, 0.0004761815071105957, 0.0005496442317962646, 0.0006231069564819336, 0.0006965696811676025, 0.0007700324058532715, 0.0008434951305389404, 0.0009169578552246094, 0.0009904205799102783, 0.0010638833045959473, 0.0011373460292816162, 0.0012108087539672852, 0.001284271478652954, 0.001357734203338623, 0.001431196928024292, 0.001504659652709961, 0.0015781223773956299, 0.0016515851020812988, 0.0017250478267669678, 0.0017985105514526367, 0.0018719732761383057, 0.0019454360008239746, 0.0020188987255096436, 0.0020923614501953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 11.0, 11.0, 12.0, 23.0, 31.0, 35.0, 45.0, 75.0, 101.0, 139.0, 206.0, 321.0, 534.0, 916.0, 1792.0, 4098.0, 14531.0, 152681.0, 3955141.0, 48994.0, 8255.0, 2912.0, 1327.0, 695.0, 479.0, 281.0, 166.0, 130.0, 96.0, 62.0, 50.0, 36.0, 24.0, 14.0, 7.0, 17.0, 8.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04486083984375, -0.0433807373046875, -0.041900634765625, -0.0404205322265625, -0.0389404296875, -0.0374603271484375, -0.035980224609375, -0.0345001220703125, -0.03302001953125, -0.0315399169921875, -0.030059814453125, -0.0285797119140625, -0.027099609375, -0.0256195068359375, -0.024139404296875, -0.0226593017578125, -0.02117919921875, -0.0196990966796875, -0.018218994140625, -0.0167388916015625, -0.0152587890625, -0.0137786865234375, -0.012298583984375, -0.0108184814453125, -0.00933837890625, -0.0078582763671875, -0.006378173828125, -0.0048980712890625, -0.00341796875, -0.0019378662109375, -0.000457763671875, 0.0010223388671875, 0.00250244140625, 0.0039825439453125, 0.005462646484375, 0.0069427490234375, 0.0084228515625, 0.0099029541015625, 0.011383056640625, 0.0128631591796875, 0.01434326171875, 0.0158233642578125, 0.017303466796875, 0.0187835693359375, 0.020263671875, 0.0217437744140625, 0.023223876953125, 0.0247039794921875, 0.02618408203125, 0.0276641845703125, 0.029144287109375, 0.0306243896484375, 0.0321044921875, 0.0335845947265625, 0.035064697265625, 0.0365447998046875, 0.03802490234375, 0.0395050048828125, 0.040985107421875, 0.0424652099609375, 0.0439453125, 0.0454254150390625, 0.046905517578125, 0.0483856201171875, 0.04986572265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 9.0, 8.0, 9.0, 12.0, 10.0, 17.0, 19.0, 20.0, 32.0, 24.0, 43.0, 53.0, 47.0, 57.0, 82.0, 149.0, 548.0, 2080.0, 309.0, 131.0, 82.0, 69.0, 45.0, 52.0, 30.0, 25.0, 21.0, 18.0, 18.0, 10.0, 8.0, 7.0, 8.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004180908203125, -0.004033267498016357, -0.003885626792907715, -0.0037379860877990723, -0.0035903453826904297, -0.003442704677581787, -0.0032950639724731445, -0.003147423267364502, -0.0029997825622558594, -0.002852141857147217, -0.0027045011520385742, -0.0025568604469299316, -0.002409219741821289, -0.0022615790367126465, -0.002113938331604004, -0.0019662976264953613, -0.0018186569213867188, -0.0016710162162780762, -0.0015233755111694336, -0.001375734806060791, -0.0012280941009521484, -0.0010804533958435059, -0.0009328126907348633, -0.0007851719856262207, -0.0006375312805175781, -0.0004898905754089355, -0.00034224987030029297, -0.0001946091651916504, -4.696846008300781e-05, 0.00010067224502563477, 0.00024831295013427734, 0.0003959536552429199, 0.0005435943603515625, 0.0006912350654602051, 0.0008388757705688477, 0.0009865164756774902, 0.0011341571807861328, 0.0012817978858947754, 0.001429438591003418, 0.0015770792961120605, 0.0017247200012207031, 0.0018723607063293457, 0.0020200014114379883, 0.002167642116546631, 0.0023152828216552734, 0.002462923526763916, 0.0026105642318725586, 0.002758204936981201, 0.0029058456420898438, 0.0030534863471984863, 0.003201127052307129, 0.0033487677574157715, 0.003496408462524414, 0.0036440491676330566, 0.0037916898727416992, 0.003939330577850342, 0.004086971282958984, 0.004234611988067627, 0.0043822526931762695, 0.004529893398284912, 0.004677534103393555, 0.004825174808502197, 0.00497281551361084, 0.005120456218719482, 0.005268096923828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 19.0, 59.0, 133.0, 486.0, 202.0, 45.0, 28.0, 13.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.061979569494724274, -0.05988351255655289, -0.0577874556183815, -0.055691398680210114, -0.05359534174203873, -0.05149928480386734, -0.049403224140405655, -0.04730716720223427, -0.04521111026406288, -0.043115053325891495, -0.04101899638772011, -0.03892293944954872, -0.036826878786087036, -0.03473082184791565, -0.03263476490974426, -0.030538707971572876, -0.02844265103340149, -0.026346594095230103, -0.024250537157058716, -0.02215447835624218, -0.020058421418070793, -0.017962364479899406, -0.01586630567908287, -0.013770248740911484, -0.011674191802740097, -0.00957813486456871, -0.007482076995074749, -0.005386019591242075, -0.003289962187409401, -0.0011939052492380142, 0.0009021526202559471, 0.0029982104897499084, 0.005094274878501892, 0.007190332282334566, 0.00928638968616724, 0.011382447555661201, 0.013478504493832588, 0.015574561432003975, 0.01767062023282051, 0.019766677170991898, 0.021862734109163284, 0.02395879104733467, 0.026054847985506058, 0.028150906786322594, 0.03024696372449398, 0.032343022525310516, 0.0344390794634819, 0.03653513640165329, 0.038631193339824677, 0.04072725027799606, 0.04282330721616745, 0.04491936415433884, 0.04701542109251022, 0.04911147803068161, 0.051207538694143295, 0.05330359563231468, 0.05539965257048607, 0.057495709508657455, 0.05959176644682884, 0.06168782338500023, 0.06378388404846191, 0.0658799409866333, 0.06797599792480469, 0.07007205486297607, 0.07216811180114746]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 8.0, 9.0, 9.0, 8.0, 11.0, 16.0, 18.0, 22.0, 40.0, 50.0, 44.0, 61.0, 59.0, 62.0, 60.0, 56.0, 69.0, 55.0, 52.0, 66.0, 45.0, 36.0, 35.0, 32.0, 19.0, 14.0, 11.0, 5.0, 9.0, 3.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017933547496795654, -0.017298541963100433, -0.016663534566760063, -0.016028527170419693, -0.015393521636724472, -0.014758515171706676, -0.014123508706688881, -0.013488502241671085, -0.01285349577665329, -0.012218489311635494, -0.011583482846617699, -0.010948476381599903, -0.010313469916582108, -0.009678463451564312, -0.009043456986546516, -0.00840845052152872, -0.007773444056510925, -0.00713843759149313, -0.006503431126475334, -0.005868424661457539, -0.005233418196439743, -0.0045984117314219475, -0.003963405266404152, -0.0033283988013863564, -0.002693392336368561, -0.0020583858713507652, -0.0014233794063329697, -0.0007883729413151741, -0.00015336647629737854, 0.000481639988720417, 0.0011166464537382126, 0.0017516529187560081, 0.0023866593837738037, 0.0030216658487915993, 0.003656672313809395, 0.00429167877882719, 0.004926685243844986, 0.0055616917088627815, 0.006196698173880577, 0.006831704638898373, 0.007466711103916168, 0.008101717568933964, 0.00873672403395176, 0.009371730498969555, 0.01000673696398735, 0.010641743429005146, 0.011276749894022942, 0.011911756359040737, 0.012546762824058533, 0.013181769289076328, 0.013816775754094124, 0.01445178221911192, 0.015086788684129715, 0.015721794217824936, 0.016356801614165306, 0.016991809010505676, 0.017626814544200897, 0.018261820077896118, 0.01889682747423649, 0.01953183487057686, 0.02016684040427208, 0.0208018459379673, 0.02143685333430767, 0.02207186073064804, 0.02270686626434326]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 11.0, 9.0, 13.0, 23.0, 18.0, 39.0, 43.0, 67.0, 79.0, 117.0, 157.0, 213.0, 305.0, 389.0, 522.0, 771.0, 1133.0, 1762.0, 2593.0, 4100.0, 6511.0, 11860.0, 25201.0, 854825.0, 92053.0, 19630.0, 9552.0, 5621.0, 3576.0, 2254.0, 1577.0, 1016.0, 684.0, 519.0, 347.0, 258.0, 192.0, 136.0, 92.0, 86.0, 62.0, 45.0, 28.0, 18.0, 18.0, 11.0, 10.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.028289794921875, -0.02740168571472168, -0.02651357650756836, -0.02562546730041504, -0.02473735809326172, -0.0238492488861084, -0.022961139678955078, -0.022073030471801758, -0.021184921264648438, -0.020296812057495117, -0.019408702850341797, -0.018520593643188477, -0.017632484436035156, -0.016744375228881836, -0.015856266021728516, -0.014968156814575195, -0.014080047607421875, -0.013191938400268555, -0.012303829193115234, -0.011415719985961914, -0.010527610778808594, -0.009639501571655273, -0.008751392364501953, -0.007863283157348633, -0.0069751739501953125, -0.006087064743041992, -0.005198955535888672, -0.0043108463287353516, -0.0034227371215820312, -0.002534627914428711, -0.0016465187072753906, -0.0007584095001220703, 0.00012969970703125, 0.0010178089141845703, 0.0019059181213378906, 0.002794027328491211, 0.0036821365356445312, 0.0045702457427978516, 0.005458354949951172, 0.006346464157104492, 0.0072345733642578125, 0.008122682571411133, 0.009010791778564453, 0.009898900985717773, 0.010787010192871094, 0.011675119400024414, 0.012563228607177734, 0.013451337814331055, 0.014339447021484375, 0.015227556228637695, 0.016115665435791016, 0.017003774642944336, 0.017891883850097656, 0.018779993057250977, 0.019668102264404297, 0.020556211471557617, 0.021444320678710938, 0.022332429885864258, 0.023220539093017578, 0.0241086483001709, 0.02499675750732422, 0.02588486671447754, 0.02677297592163086, 0.02766108512878418, 0.0285491943359375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 9.0, 14.0, 4.0, 9.0, 10.0, 8.0, 11.0, 14.0, 33.0, 706.0, 64.0, 25.0, 10.0, 5.0, 10.0, 7.0, 8.0, 6.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00269317626953125, -0.0026192069053649902, -0.0025452375411987305, -0.0024712681770324707, -0.002397298812866211, -0.002323329448699951, -0.0022493600845336914, -0.0021753907203674316, -0.002101421356201172, -0.002027451992034912, -0.0019534826278686523, -0.0018795132637023926, -0.0018055438995361328, -0.001731574535369873, -0.0016576051712036133, -0.0015836358070373535, -0.0015096664428710938, -0.001435697078704834, -0.0013617277145385742, -0.0012877583503723145, -0.0012137889862060547, -0.001139819622039795, -0.0010658502578735352, -0.0009918808937072754, -0.0009179115295410156, -0.0008439421653747559, -0.0007699728012084961, -0.0006960034370422363, -0.0006220340728759766, -0.0005480647087097168, -0.00047409534454345703, -0.00040012598037719727, -0.0003261566162109375, -0.00025218725204467773, -0.00017821788787841797, -0.0001042485237121582, -3.0279159545898438e-05, 4.369020462036133e-05, 0.0001176595687866211, 0.00019162893295288086, 0.0002655982971191406, 0.0003395676612854004, 0.00041353702545166016, 0.0004875063896179199, 0.0005614757537841797, 0.0006354451179504395, 0.0007094144821166992, 0.000783383846282959, 0.0008573532104492188, 0.0009313225746154785, 0.0010052919387817383, 0.001079261302947998, 0.0011532306671142578, 0.0012272000312805176, 0.0013011693954467773, 0.0013751387596130371, 0.0014491081237792969, 0.0015230774879455566, 0.0015970468521118164, 0.0016710162162780762, 0.001744985580444336, 0.0018189549446105957, 0.0018929243087768555, 0.0019668936729431152, 0.002040863037109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 13.0, 7.0, 13.0, 15.0, 28.0, 38.0, 40.0, 60.0, 88.0, 135.0, 207.0, 335.0, 473.0, 769.0, 1146.0, 2114.0, 4429.0, 11413.0, 64459.0, 885065.0, 57126.0, 10895.0, 4241.0, 2163.0, 1218.0, 663.0, 434.0, 286.0, 204.0, 141.0, 99.0, 67.0, 59.0, 29.0, 27.0, 19.0, 9.0, 7.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.050445556640625, -0.048938751220703125, -0.04743194580078125, -0.045925140380859375, -0.0444183349609375, -0.042911529541015625, -0.04140472412109375, -0.039897918701171875, -0.03839111328125, -0.036884307861328125, -0.03537750244140625, -0.033870697021484375, -0.0323638916015625, -0.030857086181640625, -0.02935028076171875, -0.027843475341796875, -0.026336669921875, -0.024829864501953125, -0.02332305908203125, -0.021816253662109375, -0.0203094482421875, -0.018802642822265625, -0.01729583740234375, -0.015789031982421875, -0.0142822265625, -0.012775421142578125, -0.01126861572265625, -0.009761810302734375, -0.0082550048828125, -0.006748199462890625, -0.00524139404296875, -0.003734588623046875, -0.002227783203125, -0.000720977783203125, 0.00078582763671875, 0.002292633056640625, 0.0037994384765625, 0.005306243896484375, 0.00681304931640625, 0.008319854736328125, 0.00982666015625, 0.011333465576171875, 0.01284027099609375, 0.014347076416015625, 0.0158538818359375, 0.017360687255859375, 0.01886749267578125, 0.020374298095703125, 0.021881103515625, 0.023387908935546875, 0.02489471435546875, 0.026401519775390625, 0.0279083251953125, 0.029415130615234375, 0.03092193603515625, 0.032428741455078125, 0.033935546875, 0.035442352294921875, 0.03694915771484375, 0.038455963134765625, 0.0399627685546875, 0.041469573974609375, 0.04297637939453125, 0.044483184814453125, 0.045989990234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 12.0, 10.0, 8.0, 7.0, 12.0, 13.0, 18.0, 21.0, 25.0, 26.0, 29.0, 31.0, 34.0, 37.0, 42.0, 56.0, 41.0, 41.0, 59.0, 37.0, 57.0, 41.0, 35.0, 35.0, 22.0, 24.0, 34.0, 24.0, 25.0, 22.0, 27.0, 30.0, 11.0, 11.0, 17.0, 4.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01035308837890625, -0.010038256645202637, -0.009723424911499023, -0.00940859317779541, -0.009093761444091797, -0.008778929710388184, -0.00846409797668457, -0.008149266242980957, -0.007834434509277344, -0.0075196027755737305, -0.007204771041870117, -0.006889939308166504, -0.006575107574462891, -0.006260275840759277, -0.005945444107055664, -0.005630612373352051, -0.0053157806396484375, -0.005000948905944824, -0.004686117172241211, -0.004371285438537598, -0.004056453704833984, -0.003741621971130371, -0.003426790237426758, -0.0031119585037231445, -0.0027971267700195312, -0.002482295036315918, -0.0021674633026123047, -0.0018526315689086914, -0.0015377998352050781, -0.0012229681015014648, -0.0009081363677978516, -0.0005933046340942383, -0.000278472900390625, 3.635883331298828e-05, 0.00035119056701660156, 0.0006660223007202148, 0.0009808540344238281, 0.0012956857681274414, 0.0016105175018310547, 0.001925349235534668, 0.0022401809692382812, 0.0025550127029418945, 0.002869844436645508, 0.003184676170349121, 0.0034995079040527344, 0.0038143396377563477, 0.004129171371459961, 0.004444003105163574, 0.0047588348388671875, 0.005073666572570801, 0.005388498306274414, 0.005703330039978027, 0.006018161773681641, 0.006332993507385254, 0.006647825241088867, 0.0069626569747924805, 0.007277488708496094, 0.007592320442199707, 0.00790715217590332, 0.008221983909606934, 0.008536815643310547, 0.00885164737701416, 0.009166479110717773, 0.009481310844421387, 0.009796142578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 3.0, 7.0, 18.0, 10.0, 19.0, 23.0, 30.0, 53.0, 57.0, 101.0, 150.0, 269.0, 519.0, 1283.0, 5505.0, 892096.0, 141621.0, 4425.0, 1124.0, 467.0, 258.0, 136.0, 96.0, 78.0, 46.0, 33.0, 28.0, 19.0, 14.0, 8.0, 13.0, 7.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03363037109375, -0.032468318939208984, -0.03130626678466797, -0.030144214630126953, -0.028982162475585938, -0.027820110321044922, -0.026658058166503906, -0.02549600601196289, -0.024333953857421875, -0.02317190170288086, -0.022009849548339844, -0.020847797393798828, -0.019685745239257812, -0.018523693084716797, -0.01736164093017578, -0.016199588775634766, -0.01503753662109375, -0.013875484466552734, -0.012713432312011719, -0.011551380157470703, -0.010389328002929688, -0.009227275848388672, -0.008065223693847656, -0.006903171539306641, -0.005741119384765625, -0.004579067230224609, -0.0034170150756835938, -0.002254962921142578, -0.0010929107666015625, 6.914138793945312e-05, 0.0012311935424804688, 0.0023932456970214844, 0.0035552978515625, 0.004717350006103516, 0.005879402160644531, 0.007041454315185547, 0.008203506469726562, 0.009365558624267578, 0.010527610778808594, 0.01168966293334961, 0.012851715087890625, 0.01401376724243164, 0.015175819396972656, 0.016337871551513672, 0.017499923706054688, 0.018661975860595703, 0.01982402801513672, 0.020986080169677734, 0.02214813232421875, 0.023310184478759766, 0.02447223663330078, 0.025634288787841797, 0.026796340942382812, 0.027958393096923828, 0.029120445251464844, 0.03028249740600586, 0.031444549560546875, 0.03260660171508789, 0.033768653869628906, 0.03493070602416992, 0.03609275817871094, 0.03725481033325195, 0.03841686248779297, 0.039578914642333984, 0.040740966796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 10.0, 6.0, 13.0, 10.0, 12.0, 22.0, 32.0, 33.0, 69.0, 137.0, 187.0, 148.0, 108.0, 70.0, 24.0, 25.0, 8.0, 20.0, 12.0, 7.0, 13.0, 5.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.823902130126953e-05, -1.7697922885417938e-05, -1.7156824469566345e-05, -1.6615726053714752e-05, -1.607462763786316e-05, -1.5533529222011566e-05, -1.4992430806159973e-05, -1.445133239030838e-05, -1.3910233974456787e-05, -1.3369135558605194e-05, -1.2828037142753601e-05, -1.2286938726902008e-05, -1.1745840311050415e-05, -1.1204741895198822e-05, -1.0663643479347229e-05, -1.0122545063495636e-05, -9.581446647644043e-06, -9.04034823179245e-06, -8.499249815940857e-06, -7.958151400089264e-06, -7.417052984237671e-06, -6.875954568386078e-06, -6.334856152534485e-06, -5.793757736682892e-06, -5.252659320831299e-06, -4.711560904979706e-06, -4.170462489128113e-06, -3.6293640732765198e-06, -3.0882656574249268e-06, -2.5471672415733337e-06, -2.0060688257217407e-06, -1.4649704098701477e-06, -9.238719940185547e-07, -3.8277357816696167e-07, 1.5832483768463135e-07, 6.994232535362244e-07, 1.2405216693878174e-06, 1.7816200852394104e-06, 2.3227185010910034e-06, 2.8638169169425964e-06, 3.4049153327941895e-06, 3.9460137486457825e-06, 4.4871121644973755e-06, 5.0282105803489685e-06, 5.5693089962005615e-06, 6.1104074120521545e-06, 6.6515058279037476e-06, 7.1926042437553406e-06, 7.733702659606934e-06, 8.274801075458527e-06, 8.81589949131012e-06, 9.356997907161713e-06, 9.898096323013306e-06, 1.0439194738864899e-05, 1.0980293154716492e-05, 1.1521391570568085e-05, 1.2062489986419678e-05, 1.260358840227127e-05, 1.3144686818122864e-05, 1.3685785233974457e-05, 1.422688364982605e-05, 1.4767982065677643e-05, 1.5309080481529236e-05, 1.585017889738083e-05, 1.6391277313232422e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 9.0, 3.0, 12.0, 17.0, 6.0, 18.0, 32.0, 61.0, 59.0, 88.0, 174.0, 306.0, 685.0, 2374.0, 62587.0, 977061.0, 3423.0, 798.0, 373.0, 154.0, 103.0, 66.0, 43.0, 23.0, 14.0, 14.0, 12.0, 9.0, 8.0, 8.0, 6.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1324462890625, -0.1289691925048828, -0.12549209594726562, -0.12201499938964844, -0.11853790283203125, -0.11506080627441406, -0.11158370971679688, -0.10810661315917969, -0.1046295166015625, -0.10115242004394531, -0.09767532348632812, -0.09419822692871094, -0.09072113037109375, -0.08724403381347656, -0.08376693725585938, -0.08028984069824219, -0.076812744140625, -0.07333564758300781, -0.06985855102539062, -0.06638145446777344, -0.06290435791015625, -0.05942726135253906, -0.055950164794921875, -0.05247306823730469, -0.0489959716796875, -0.04551887512207031, -0.042041778564453125, -0.03856468200683594, -0.03508758544921875, -0.03161048889160156, -0.028133392333984375, -0.024656295776367188, -0.02117919921875, -0.017702102661132812, -0.014225006103515625, -0.010747909545898438, -0.00727081298828125, -0.0037937164306640625, -0.000316619873046875, 0.0031604766845703125, 0.0066375732421875, 0.010114669799804688, 0.013591766357421875, 0.017068862915039062, 0.02054595947265625, 0.024023056030273438, 0.027500152587890625, 0.030977249145507812, 0.034454345703125, 0.03793144226074219, 0.041408538818359375, 0.04488563537597656, 0.04836273193359375, 0.05183982849121094, 0.055316925048828125, 0.05879402160644531, 0.0622711181640625, 0.06574821472167969, 0.06922531127929688, 0.07270240783691406, 0.07617950439453125, 0.07965660095214844, 0.08313369750976562, 0.08661079406738281, 0.090087890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 5.0, 6.0, 14.0, 27.0, 99.0, 601.0, 147.0, 37.0, 9.0, 6.0, 8.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0272369384765625, -0.026582002639770508, -0.025927066802978516, -0.025272130966186523, -0.02461719512939453, -0.02396225929260254, -0.023307323455810547, -0.022652387619018555, -0.021997451782226562, -0.02134251594543457, -0.020687580108642578, -0.020032644271850586, -0.019377708435058594, -0.0187227725982666, -0.01806783676147461, -0.017412900924682617, -0.016757965087890625, -0.016103029251098633, -0.01544809341430664, -0.014793157577514648, -0.014138221740722656, -0.013483285903930664, -0.012828350067138672, -0.01217341423034668, -0.011518478393554688, -0.010863542556762695, -0.010208606719970703, -0.009553670883178711, -0.008898735046386719, -0.008243799209594727, -0.007588863372802734, -0.006933927536010742, -0.00627899169921875, -0.005624055862426758, -0.004969120025634766, -0.0043141841888427734, -0.0036592483520507812, -0.003004312515258789, -0.002349376678466797, -0.0016944408416748047, -0.0010395050048828125, -0.0003845691680908203, 0.0002703666687011719, 0.0009253025054931641, 0.0015802383422851562, 0.0022351741790771484, 0.0028901100158691406, 0.003545045852661133, 0.004199981689453125, 0.004854917526245117, 0.005509853363037109, 0.0061647891998291016, 0.006819725036621094, 0.007474660873413086, 0.008129596710205078, 0.00878453254699707, 0.009439468383789062, 0.010094404220581055, 0.010749340057373047, 0.011404275894165039, 0.012059211730957031, 0.012714147567749023, 0.013369083404541016, 0.014024019241333008, 0.014678955078125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 12.0, 8.0, 16.0, 42.0, 712.0, 149.0, 24.0, 14.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5015972852706909, -0.4820994436740875, -0.46260160207748413, -0.44310376048088074, -0.42360591888427734, -0.40410804748535156, -0.38461020588874817, -0.3651123642921448, -0.3456145226955414, -0.326116681098938, -0.3066188395023346, -0.2871209979057312, -0.2676231265068054, -0.24812529981136322, -0.22862744331359863, -0.20912960171699524, -0.18963176012039185, -0.17013391852378845, -0.15063607692718506, -0.13113822042942047, -0.11164037883281708, -0.09214253723621368, -0.0726446881890297, -0.0531468391418457, -0.03364899754524231, -0.014151152223348618, 0.0053466930985450745, 0.024844538420438766, 0.04434238374233246, 0.06384022533893585, 0.08333807438611984, 0.10283592343330383, 0.12233376502990723, 0.14183160662651062, 0.161329448223114, 0.1808273047208786, 0.200325146317482, 0.2198229879140854, 0.23932084441184998, 0.25881868600845337, 0.27831652760505676, 0.29781436920166016, 0.31731221079826355, 0.33681005239486694, 0.3563079237937927, 0.37580573558807373, 0.3953036069869995, 0.4148014485836029, 0.4342992901802063, 0.4537971317768097, 0.4732949733734131, 0.4927928149700165, 0.5122906565666199, 0.5317885279655457, 0.5512863397598267, 0.5707842111587524, 0.5902820825576782, 0.609779953956604, 0.629277765750885, 0.6487756371498108, 0.6682734489440918, 0.6877713203430176, 0.7072691321372986, 0.7267670035362244, 0.7462648153305054]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 2.0, 10.0, 7.0, 19.0, 35.0, 37.0, 69.0, 111.0, 151.0, 163.0, 116.0, 79.0, 54.0, 41.0, 17.0, 6.0, 16.0, 8.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1800197958946228, -0.17422284185886383, -0.16842590272426605, -0.16262894868850708, -0.1568319946527481, -0.15103504061698914, -0.14523810148239136, -0.13944114744663239, -0.1336441934108734, -0.12784723937511444, -0.12205029278993607, -0.11625334620475769, -0.11045639216899872, -0.10465944558382034, -0.09886249899864197, -0.093065544962883, -0.08726860582828522, -0.08147165924310684, -0.07567470520734787, -0.0698777586221695, -0.06408080458641052, -0.05828385800123215, -0.05248691141605377, -0.0466899611055851, -0.040893010795116425, -0.03509606048464775, -0.029299112036824226, -0.023502163589000702, -0.017705213278532028, -0.011908262968063354, -0.006111316382884979, -0.00031436607241630554, 0.005482584238052368, 0.011279533617198467, 0.017076482996344566, 0.02287343144416809, 0.028670381754636765, 0.03446733206510544, 0.040264278650283813, 0.04606122896075249, 0.05185817927122116, 0.057655129581689835, 0.06345207989215851, 0.06924902647733688, 0.07504597306251526, 0.08084292709827423, 0.0866398736834526, 0.09243682026863098, 0.09823377430438995, 0.10403072088956833, 0.1098276749253273, 0.11562462151050568, 0.12142157554626465, 0.12721851468086243, 0.1330154687166214, 0.13881242275238037, 0.14460936188697815, 0.15040631592273712, 0.1562032550573349, 0.16200020909309387, 0.16779716312885284, 0.17359411716461182, 0.1793910562992096, 0.18518801033496857, 0.19098496437072754]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 6.0, 2.0, 15.0, 14.0, 17.0, 29.0, 46.0, 59.0, 223.0, 3246.0, 4157350.0, 32252.0, 734.0, 103.0, 44.0, 22.0, 20.0, 9.0, 16.0, 17.0, 4.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.34765625, -4.22607421875, -4.1044921875, -3.98291015625, -3.861328125, -3.73974609375, -3.6181640625, -3.49658203125, -3.375, -3.25341796875, -3.1318359375, -3.01025390625, -2.888671875, -2.76708984375, -2.6455078125, -2.52392578125, -2.40234375, -2.28076171875, -2.1591796875, -2.03759765625, -1.916015625, -1.79443359375, -1.6728515625, -1.55126953125, -1.4296875, -1.30810546875, -1.1865234375, -1.06494140625, -0.943359375, -0.82177734375, -0.7001953125, -0.57861328125, -0.45703125, -0.33544921875, -0.2138671875, -0.09228515625, 0.029296875, 0.15087890625, 0.2724609375, 0.39404296875, 0.515625, 0.63720703125, 0.7587890625, 0.88037109375, 1.001953125, 1.12353515625, 1.2451171875, 1.36669921875, 1.48828125, 1.60986328125, 1.7314453125, 1.85302734375, 1.974609375, 2.09619140625, 2.2177734375, 2.33935546875, 2.4609375, 2.58251953125, 2.7041015625, 2.82568359375, 2.947265625, 3.06884765625, 3.1904296875, 3.31201171875, 3.43359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 10.0, 8.0, 6.0, 11.0, 3.0, 13.0, 15.0, 18.0, 240.0, 526.0, 35.0, 19.0, 9.0, 4.0, 9.0, 10.0, 7.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00260162353515625, -0.002531304955482483, -0.002460986375808716, -0.0023906677961349487, -0.0023203492164611816, -0.0022500306367874146, -0.0021797120571136475, -0.0021093934774398804, -0.0020390748977661133, -0.001968756318092346, -0.001898437738418579, -0.001828119158744812, -0.001757800579071045, -0.0016874819993972778, -0.0016171634197235107, -0.0015468448400497437, -0.0014765262603759766, -0.0014062076807022095, -0.0013358891010284424, -0.0012655705213546753, -0.0011952519416809082, -0.0011249333620071411, -0.001054614782333374, -0.000984296202659607, -0.0009139776229858398, -0.0008436590433120728, -0.0007733404636383057, -0.0007030218839645386, -0.0006327033042907715, -0.0005623847246170044, -0.0004920661449432373, -0.0004217475652694702, -0.0003514289855957031, -0.00028111040592193604, -0.00021079182624816895, -0.00014047324657440186, -7.015466690063477e-05, 1.6391277313232422e-07, 7.048249244689941e-05, 0.0001408010721206665, 0.0002111196517944336, 0.0002814382314682007, 0.0003517568111419678, 0.00042207539081573486, 0.000492393970489502, 0.000562712550163269, 0.0006330311298370361, 0.0007033497095108032, 0.0007736682891845703, 0.0008439868688583374, 0.0009143054485321045, 0.0009846240282058716, 0.0010549426078796387, 0.0011252611875534058, 0.0011955797672271729, 0.00126589834690094, 0.001336216926574707, 0.0014065355062484741, 0.0014768540859222412, 0.0015471726655960083, 0.0016174912452697754, 0.0016878098249435425, 0.0017581284046173096, 0.0018284469842910767, 0.0018987655639648438]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 3.0, 0.0, 5.0, 8.0, 7.0, 13.0, 17.0, 19.0, 16.0, 24.0, 33.0, 44.0, 50.0, 51.0, 72.0, 91.0, 133.0, 136.0, 191.0, 764.0, 44451.0, 4145035.0, 2286.0, 250.0, 122.0, 99.0, 66.0, 67.0, 42.0, 36.0, 24.0, 27.0, 18.0, 20.0, 13.0, 10.0, 9.0, 7.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.7666015625, -0.7454299926757812, -0.7242584228515625, -0.7030868530273438, -0.681915283203125, -0.6607437133789062, -0.6395721435546875, -0.6184005737304688, -0.59722900390625, -0.5760574340820312, -0.5548858642578125, -0.5337142944335938, -0.512542724609375, -0.49137115478515625, -0.4701995849609375, -0.44902801513671875, -0.4278564453125, -0.40668487548828125, -0.3855133056640625, -0.36434173583984375, -0.343170166015625, -0.32199859619140625, -0.3008270263671875, -0.27965545654296875, -0.25848388671875, -0.23731231689453125, -0.2161407470703125, -0.19496917724609375, -0.173797607421875, -0.15262603759765625, -0.1314544677734375, -0.11028289794921875, -0.089111328125, -0.06793975830078125, -0.0467681884765625, -0.02559661865234375, -0.004425048828125, 0.01674652099609375, 0.0379180908203125, 0.05908966064453125, 0.08026123046875, 0.10143280029296875, 0.1226043701171875, 0.14377593994140625, 0.164947509765625, 0.18611907958984375, 0.2072906494140625, 0.22846221923828125, 0.2496337890625, 0.27080535888671875, 0.2919769287109375, 0.31314849853515625, 0.334320068359375, 0.35549163818359375, 0.3766632080078125, 0.39783477783203125, 0.41900634765625, 0.44017791748046875, 0.4613494873046875, 0.48252105712890625, 0.503692626953125, 0.5248641967773438, 0.5460357666015625, 0.5672073364257812, 0.58837890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 3.0, 4.0, 6.0, 9.0, 13.0, 19.0, 20.0, 21.0, 30.0, 41.0, 40.0, 59.0, 74.0, 85.0, 99.0, 140.0, 185.0, 173.0, 284.0, 1356.0, 414.0, 236.0, 167.0, 132.0, 92.0, 78.0, 70.0, 43.0, 31.0, 31.0, 21.0, 26.0, 11.0, 14.0, 7.0, 11.0, 6.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.006175994873046875, -0.006008446216583252, -0.005840897560119629, -0.005673348903656006, -0.005505800247192383, -0.00533825159072876, -0.005170702934265137, -0.005003154277801514, -0.004835605621337891, -0.004668056964874268, -0.0045005083084106445, -0.0043329596519470215, -0.0041654109954833984, -0.003997862339019775, -0.0038303136825561523, -0.0036627650260925293, -0.0034952163696289062, -0.003327667713165283, -0.00316011905670166, -0.002992570400238037, -0.002825021743774414, -0.002657473087310791, -0.002489924430847168, -0.002322375774383545, -0.002154827117919922, -0.001987278461456299, -0.0018197298049926758, -0.0016521811485290527, -0.0014846324920654297, -0.0013170838356018066, -0.0011495351791381836, -0.0009819865226745605, -0.0008144378662109375, -0.0006468892097473145, -0.0004793405532836914, -0.00031179189682006836, -0.0001442432403564453, 2.3305416107177734e-05, 0.00019085407257080078, 0.00035840272903442383, 0.0005259513854980469, 0.0006935000419616699, 0.000861048698425293, 0.001028597354888916, 0.001196146011352539, 0.0013636946678161621, 0.0015312433242797852, 0.0016987919807434082, 0.0018663406372070312, 0.0020338892936706543, 0.0022014379501342773, 0.0023689866065979004, 0.0025365352630615234, 0.0027040839195251465, 0.0028716325759887695, 0.0030391812324523926, 0.0032067298889160156, 0.0033742785453796387, 0.0035418272018432617, 0.0037093758583068848, 0.003876924514770508, 0.004044473171234131, 0.004212021827697754, 0.004379570484161377, 0.004547119140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 55.0, 953.0, 8.0], "bins": [-2.7687370777130127, -2.7244925498962402, -2.6802477836608887, -2.636003255844116, -2.5917587280273438, -2.547513961791992, -2.5032694339752197, -2.4590249061584473, -2.4147801399230957, -2.3705356121063232, -2.3262908458709717, -2.282046318054199, -2.2378017902374268, -2.193557024002075, -2.1493124961853027, -2.1050679683685303, -2.060823440551758, -2.0165789127349854, -1.9723342657089233, -1.9280896186828613, -1.8838449716567993, -1.8396003246307373, -1.7953557968139648, -1.7511111497879028, -1.7068665027618408, -1.6626218557357788, -1.6183773279190063, -1.5741326808929443, -1.5298880338668823, -1.4856433868408203, -1.4413988590240479, -1.3971542119979858, -1.3529095649719238, -1.3086649179458618, -1.2644203901290894, -1.2201757431030273, -1.1759310960769653, -1.1316864490509033, -1.0874419212341309, -1.0431972742080688, -0.9989526271820068, -0.9547080397605896, -0.9104633927345276, -0.8662188053131104, -0.8219741582870483, -0.7777295708656311, -0.7334849834442139, -0.6892403364181519, -0.6449957489967346, -0.6007511615753174, -0.5565065145492554, -0.5122619271278381, -0.4680173099040985, -0.4237726926803589, -0.37952810525894165, -0.335283488035202, -0.2910388708114624, -0.24679425358772278, -0.20254965126514435, -0.15830504894256592, -0.1140604317188263, -0.06981581449508667, -0.025571227073669434, 0.01867339015007019, 0.06291799247264862]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 11.0, 17.0, 25.0, 30.0, 44.0, 73.0, 109.0, 109.0, 135.0, 113.0, 108.0, 82.0, 52.0, 44.0, 28.0, 14.0, 7.0, 2.0, 3.0, 3.0], "bins": [-0.17797493934631348, -0.17456719279289246, -0.17115946114063263, -0.1677517145872116, -0.16434398293495178, -0.16093623638153076, -0.15752850472927094, -0.15412075817584991, -0.1507130265235901, -0.14730527997016907, -0.14389754831790924, -0.14048980176448822, -0.1370820701122284, -0.13367432355880737, -0.13026659190654755, -0.12685884535312653, -0.1234510987997055, -0.12004335969686508, -0.11663562059402466, -0.11322788149118423, -0.10982014238834381, -0.10641239583492279, -0.10300465673208237, -0.09959691762924194, -0.09618917852640152, -0.0927814394235611, -0.08937370032072067, -0.08596596121788025, -0.08255821466445923, -0.0791504830121994, -0.07574273645877838, -0.07233499735593796, -0.06892725825309753, -0.06551951915025711, -0.06211178004741669, -0.058704037219285965, -0.05529629811644554, -0.05188855901360512, -0.048480816185474396, -0.04507307708263397, -0.04166533797979355, -0.038257598876953125, -0.0348498597741127, -0.03144211694598198, -0.028034377843141556, -0.024626638740301132, -0.02121889777481556, -0.017811156809329987, -0.014403417706489563, -0.010995677672326565, -0.007587937638163567, -0.004180197604000568, -0.0007724575698375702, 0.0026352815330028534, 0.006043022498488426, 0.009450763463973999, 0.012858502566814423, 0.016266241669654846, 0.01967398263514042, 0.023081723600625992, 0.026489462703466415, 0.02989720180630684, 0.03330494463443756, 0.036712683737277985, 0.04012042284011841]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 18.0, 28.0, 28.0, 52.0, 66.0, 75.0, 120.0, 151.0, 220.0, 282.0, 410.0, 534.0, 749.0, 1074.0, 1612.0, 2224.0, 3550.0, 5847.0, 9793.0, 18607.0, 76016.0, 854550.0, 35207.0, 14584.0, 7960.0, 4881.0, 3018.0, 2074.0, 1364.0, 938.0, 689.0, 433.0, 403.0, 260.0, 181.0, 153.0, 110.0, 61.0, 48.0, 44.0, 42.0, 20.0, 20.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.03448486328125, -0.033383846282958984, -0.03228282928466797, -0.031181812286376953, -0.030080795288085938, -0.028979778289794922, -0.027878761291503906, -0.02677774429321289, -0.025676727294921875, -0.02457571029663086, -0.023474693298339844, -0.022373676300048828, -0.021272659301757812, -0.020171642303466797, -0.01907062530517578, -0.017969608306884766, -0.01686859130859375, -0.015767574310302734, -0.014666557312011719, -0.013565540313720703, -0.012464523315429688, -0.011363506317138672, -0.010262489318847656, -0.00916147232055664, -0.008060455322265625, -0.006959438323974609, -0.005858421325683594, -0.004757404327392578, -0.0036563873291015625, -0.002555370330810547, -0.0014543533325195312, -0.0003533363342285156, 0.0007476806640625, 0.0018486976623535156, 0.0029497146606445312, 0.004050731658935547, 0.0051517486572265625, 0.006252765655517578, 0.007353782653808594, 0.00845479965209961, 0.009555816650390625, 0.01065683364868164, 0.011757850646972656, 0.012858867645263672, 0.013959884643554688, 0.015060901641845703, 0.01616191864013672, 0.017262935638427734, 0.01836395263671875, 0.019464969635009766, 0.02056598663330078, 0.021667003631591797, 0.022768020629882812, 0.023869037628173828, 0.024970054626464844, 0.02607107162475586, 0.027172088623046875, 0.02827310562133789, 0.029374122619628906, 0.030475139617919922, 0.03157615661621094, 0.03267717361450195, 0.03377819061279297, 0.034879207611083984, 0.035980224609375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 5.0, 6.0, 4.0, 7.0, 2.0, 8.0, 9.0, 9.0, 13.0, 5.0, 11.0, 26.0, 124.0, 355.0, 261.0, 58.0, 16.0, 6.0, 11.0, 6.0, 6.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.00201416015625, -0.0019574910402297974, -0.0019008219242095947, -0.001844152808189392, -0.0017874836921691895, -0.0017308145761489868, -0.0016741454601287842, -0.0016174763441085815, -0.001560807228088379, -0.0015041381120681763, -0.0014474689960479736, -0.001390799880027771, -0.0013341307640075684, -0.0012774616479873657, -0.001220792531967163, -0.0011641234159469604, -0.0011074542999267578, -0.0010507851839065552, -0.0009941160678863525, -0.0009374469518661499, -0.0008807778358459473, -0.0008241087198257446, -0.000767439603805542, -0.0007107704877853394, -0.0006541013717651367, -0.0005974322557449341, -0.0005407631397247314, -0.0004840940237045288, -0.00042742490768432617, -0.00037075579166412354, -0.0003140866756439209, -0.00025741755962371826, -0.00020074844360351562, -0.000144079327583313, -8.741021156311035e-05, -3.0741095542907715e-05, 2.5928020477294922e-05, 8.259713649749756e-05, 0.0001392662525177002, 0.00019593536853790283, 0.00025260448455810547, 0.0003092736005783081, 0.00036594271659851074, 0.0004226118326187134, 0.000479280948638916, 0.0005359500646591187, 0.0005926191806793213, 0.0006492882966995239, 0.0007059574127197266, 0.0007626265287399292, 0.0008192956447601318, 0.0008759647607803345, 0.0009326338768005371, 0.0009893029928207397, 0.0010459721088409424, 0.001102641224861145, 0.0011593103408813477, 0.0012159794569015503, 0.001272648572921753, 0.0013293176889419556, 0.0013859868049621582, 0.0014426559209823608, 0.0014993250370025635, 0.0015559941530227661, 0.0016126632690429688]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 2.0, 7.0, 11.0, 14.0, 11.0, 15.0, 9.0, 23.0, 20.0, 19.0, 31.0, 24.0, 33.0, 47.0, 68.0, 155.0, 870.0, 8769.0, 979073.0, 56158.0, 2444.0, 339.0, 102.0, 48.0, 34.0, 33.0, 24.0, 22.0, 15.0, 22.0, 14.0, 10.0, 11.0, 6.0, 15.0, 14.0, 7.0, 5.0, 5.0, 3.0, 1.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09950447082519531, -0.09604263305664062, -0.09258079528808594, -0.08911895751953125, -0.08565711975097656, -0.08219528198242188, -0.07873344421386719, -0.0752716064453125, -0.07180976867675781, -0.06834793090820312, -0.06488609313964844, -0.06142425537109375, -0.05796241760253906, -0.054500579833984375, -0.05103874206542969, -0.047576904296875, -0.04411506652832031, -0.040653228759765625, -0.03719139099121094, -0.03372955322265625, -0.030267715454101562, -0.026805877685546875, -0.023344039916992188, -0.0198822021484375, -0.016420364379882812, -0.012958526611328125, -0.009496688842773438, -0.00603485107421875, -0.0025730133056640625, 0.000888824462890625, 0.0043506622314453125, 0.0078125, 0.011274337768554688, 0.014736175537109375, 0.018198013305664062, 0.02165985107421875, 0.025121688842773438, 0.028583526611328125, 0.03204536437988281, 0.0355072021484375, 0.03896903991699219, 0.042430877685546875, 0.04589271545410156, 0.04935455322265625, 0.05281639099121094, 0.056278228759765625, 0.05974006652832031, 0.063201904296875, 0.06666374206542969, 0.07012557983398438, 0.07358741760253906, 0.07704925537109375, 0.08051109313964844, 0.08397293090820312, 0.08743476867675781, 0.0908966064453125, 0.09435844421386719, 0.09782028198242188, 0.10128211975097656, 0.10474395751953125, 0.10820579528808594, 0.11166763305664062, 0.11512947082519531, 0.11859130859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 3.0, 12.0, 8.0, 7.0, 14.0, 17.0, 21.0, 21.0, 24.0, 18.0, 21.0, 30.0, 31.0, 38.0, 28.0, 35.0, 31.0, 40.0, 32.0, 37.0, 35.0, 35.0, 41.0, 22.0, 33.0, 34.0, 30.0, 32.0, 36.0, 23.0, 20.0, 19.0, 19.0, 26.0, 10.0, 18.0, 10.0, 11.0, 18.0, 7.0, 9.0, 10.0, 4.0, 9.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.005672454833984375, -0.0054947733879089355, -0.005317091941833496, -0.005139410495758057, -0.004961729049682617, -0.004784047603607178, -0.004606366157531738, -0.004428684711456299, -0.004251003265380859, -0.00407332181930542, -0.0038956403732299805, -0.003717958927154541, -0.0035402774810791016, -0.003362596035003662, -0.0031849145889282227, -0.003007233142852783, -0.0028295516967773438, -0.0026518702507019043, -0.002474188804626465, -0.0022965073585510254, -0.002118825912475586, -0.0019411444664001465, -0.001763463020324707, -0.0015857815742492676, -0.0014081001281738281, -0.0012304186820983887, -0.0010527372360229492, -0.0008750557899475098, -0.0006973743438720703, -0.0005196928977966309, -0.0003420114517211914, -0.00016433000564575195, 1.33514404296875e-05, 0.00019103288650512695, 0.0003687143325805664, 0.0005463957786560059, 0.0007240772247314453, 0.0009017586708068848, 0.0010794401168823242, 0.0012571215629577637, 0.0014348030090332031, 0.0016124844551086426, 0.001790165901184082, 0.0019678473472595215, 0.002145528793334961, 0.0023232102394104004, 0.00250089168548584, 0.0026785731315612793, 0.0028562545776367188, 0.003033936023712158, 0.0032116174697875977, 0.003389298915863037, 0.0035669803619384766, 0.003744661808013916, 0.0039223432540893555, 0.004100024700164795, 0.004277706146240234, 0.004455387592315674, 0.004633069038391113, 0.004810750484466553, 0.004988431930541992, 0.005166113376617432, 0.005343794822692871, 0.0055214762687683105, 0.00569915771484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 1.0, 1.0, 5.0, 4.0, 10.0, 15.0, 15.0, 36.0, 91.0, 293.0, 2115.0, 1034331.0, 10897.0, 501.0, 112.0, 40.0, 19.0, 14.0, 9.0, 10.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.066162109375, -0.06435918807983398, -0.06255626678466797, -0.06075334548950195, -0.05895042419433594, -0.05714750289916992, -0.055344581604003906, -0.05354166030883789, -0.051738739013671875, -0.04993581771850586, -0.048132896423339844, -0.04632997512817383, -0.04452705383300781, -0.0427241325378418, -0.04092121124267578, -0.039118289947509766, -0.03731536865234375, -0.035512447357177734, -0.03370952606201172, -0.0319066047668457, -0.030103683471679688, -0.028300762176513672, -0.026497840881347656, -0.02469491958618164, -0.022891998291015625, -0.02108907699584961, -0.019286155700683594, -0.017483234405517578, -0.015680313110351562, -0.013877391815185547, -0.012074470520019531, -0.010271549224853516, -0.0084686279296875, -0.006665706634521484, -0.004862785339355469, -0.003059864044189453, -0.0012569427490234375, 0.0005459785461425781, 0.0023488998413085938, 0.004151821136474609, 0.005954742431640625, 0.007757663726806641, 0.009560585021972656, 0.011363506317138672, 0.013166427612304688, 0.014969348907470703, 0.01677227020263672, 0.018575191497802734, 0.02037811279296875, 0.022181034088134766, 0.02398395538330078, 0.025786876678466797, 0.027589797973632812, 0.029392719268798828, 0.031195640563964844, 0.03299856185913086, 0.034801483154296875, 0.03660440444946289, 0.038407325744628906, 0.04021024703979492, 0.04201316833496094, 0.04381608963012695, 0.04561901092529297, 0.047421932220458984, 0.049224853515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 8.0, 14.0, 19.0, 10.0, 28.0, 51.0, 80.0, 232.0, 272.0, 91.0, 44.0, 32.0, 26.0, 13.0, 18.0, 11.0, 7.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010591745376586914, -0.0001011071726679802, -9.629689157009125e-05, -9.14866104722023e-05, -8.667632937431335e-05, -8.186604827642441e-05, -7.705576717853546e-05, -7.224548608064651e-05, -6.743520498275757e-05, -6.262492388486862e-05, -5.7814642786979675e-05, -5.300436168909073e-05, -4.819408059120178e-05, -4.3383799493312836e-05, -3.857351839542389e-05, -3.376323729753494e-05, -2.8952956199645996e-05, -2.414267510175705e-05, -1.9332394003868103e-05, -1.4522112905979156e-05, -9.71183180809021e-06, -4.9015507102012634e-06, -9.12696123123169e-08, 4.71901148557663e-06, 9.529292583465576e-06, 1.4339573681354523e-05, 1.914985477924347e-05, 2.3960135877132416e-05, 2.8770416975021362e-05, 3.358069807291031e-05, 3.8390979170799255e-05, 4.32012602686882e-05, 4.801154136657715e-05, 5.2821822464466095e-05, 5.763210356235504e-05, 6.244238466024399e-05, 6.725266575813293e-05, 7.206294685602188e-05, 7.687322795391083e-05, 8.168350905179977e-05, 8.649379014968872e-05, 9.130407124757767e-05, 9.611435234546661e-05, 0.00010092463344335556, 0.00010573491454124451, 0.00011054519563913345, 0.0001153554767370224, 0.00012016575783491135, 0.0001249760389328003, 0.00012978632003068924, 0.00013459660112857819, 0.00013940688222646713, 0.00014421716332435608, 0.00014902744442224503, 0.00015383772552013397, 0.00015864800661802292, 0.00016345828771591187, 0.0001682685688138008, 0.00017307884991168976, 0.0001778891310095787, 0.00018269941210746765, 0.0001875096932053566, 0.00019231997430324554, 0.0001971302554011345, 0.00020194053649902344]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 9.0, 7.0, 9.0, 23.0, 48.0, 152.0, 613.0, 4563.0, 1011388.0, 29790.0, 1469.0, 298.0, 87.0, 35.0, 13.0, 10.0, 5.0, 12.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0758056640625, -0.07384967803955078, -0.07189369201660156, -0.06993770599365234, -0.06798171997070312, -0.0660257339477539, -0.06406974792480469, -0.06211376190185547, -0.06015777587890625, -0.05820178985595703, -0.05624580383300781, -0.054289817810058594, -0.052333831787109375, -0.050377845764160156, -0.04842185974121094, -0.04646587371826172, -0.0445098876953125, -0.04255390167236328, -0.04059791564941406, -0.038641929626464844, -0.036685943603515625, -0.034729957580566406, -0.03277397155761719, -0.03081798553466797, -0.02886199951171875, -0.02690601348876953, -0.024950027465820312, -0.022994041442871094, -0.021038055419921875, -0.019082069396972656, -0.017126083374023438, -0.015170097351074219, -0.013214111328125, -0.011258125305175781, -0.009302139282226562, -0.007346153259277344, -0.005390167236328125, -0.0034341812133789062, -0.0014781951904296875, 0.00047779083251953125, 0.00243377685546875, 0.004389762878417969, 0.0063457489013671875, 0.008301734924316406, 0.010257720947265625, 0.012213706970214844, 0.014169692993164062, 0.01612567901611328, 0.0180816650390625, 0.02003765106201172, 0.021993637084960938, 0.023949623107910156, 0.025905609130859375, 0.027861595153808594, 0.029817581176757812, 0.03177356719970703, 0.03372955322265625, 0.03568553924560547, 0.03764152526855469, 0.039597511291503906, 0.041553497314453125, 0.043509483337402344, 0.04546546936035156, 0.04742145538330078, 0.04937744140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 2.0, 5.0, 4.0, 11.0, 11.0, 14.0, 14.0, 26.0, 25.0, 54.0, 88.0, 403.0, 154.0, 58.0, 29.0, 25.0, 19.0, 8.0, 7.0, 12.0, 6.0, 3.0, 5.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.005466461181640625, -0.0052890777587890625, -0.0051116943359375, -0.0049343109130859375, -0.004756927490234375, -0.0045795440673828125, -0.00440216064453125, -0.0042247772216796875, -0.004047393798828125, -0.0038700103759765625, -0.003692626953125, -0.0035152435302734375, -0.003337860107421875, -0.0031604766845703125, -0.00298309326171875, -0.0028057098388671875, -0.002628326416015625, -0.0024509429931640625, -0.0022735595703125, -0.0020961761474609375, -0.001918792724609375, -0.0017414093017578125, -0.00156402587890625, -0.0013866424560546875, -0.001209259033203125, -0.0010318756103515625, -0.0008544921875, -0.0006771087646484375, -0.000499725341796875, -0.0003223419189453125, -0.00014495849609375, 3.24249267578125e-05, 0.000209808349609375, 0.0003871917724609375, 0.0005645751953125, 0.0007419586181640625, 0.000919342041015625, 0.0010967254638671875, 0.00127410888671875, 0.0014514923095703125, 0.001628875732421875, 0.0018062591552734375, 0.001983642578125, 0.0021610260009765625, 0.002338409423828125, 0.0025157928466796875, 0.00269317626953125, 0.0028705596923828125, 0.003047943115234375, 0.0032253265380859375, 0.0034027099609375, 0.0035800933837890625, 0.003757476806640625, 0.0039348602294921875, 0.00411224365234375, 0.0042896270751953125, 0.004467010498046875, 0.0046443939208984375, 0.00482177734375, 0.0049991607666015625, 0.005176544189453125, 0.0053539276123046875, 0.00553131103515625, 0.0057086944580078125, 0.005886077880859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 5.0, 2.0, 5.0, 4.0, 4.0, 14.0, 33.0, 76.0, 368.0, 341.0, 94.0, 28.0, 9.0, 10.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21499013900756836, -0.20974375307559967, -0.20449736714363098, -0.1992509663105011, -0.1940045803785324, -0.18875819444656372, -0.18351180851459503, -0.17826542258262634, -0.17301903665065765, -0.16777265071868896, -0.16252626478672028, -0.1572798788547516, -0.1520334780216217, -0.14678709208965302, -0.14154070615768433, -0.13629432022571564, -0.13104793429374695, -0.12580154836177826, -0.12055515497922897, -0.11530876904726028, -0.1100623831152916, -0.10481598973274231, -0.09956960380077362, -0.09432321786880493, -0.08907681703567505, -0.08383043110370636, -0.07858403772115707, -0.07333765178918839, -0.0680912658572197, -0.06284487247467041, -0.05759848654270172, -0.05235210061073303, -0.04710571467876434, -0.041859325021505356, -0.03661293908953667, -0.03136654943227768, -0.02612016163766384, -0.020873773843050003, -0.015627384185791016, -0.010380998253822327, -0.005134608596563339, 0.00011177966371178627, 0.005358167923986912, 0.010604556649923325, 0.015850944444537163, 0.021097332239151, 0.02634372189640999, 0.03159010782837868, 0.036836497485637665, 0.04208288714289665, 0.04732927307486534, 0.05257566273212433, 0.05782204866409302, 0.0630684345960617, 0.06831482797861099, 0.07356121391057968, 0.07880760729312897, 0.08405399322509766, 0.08930038660764694, 0.09454677253961563, 0.09979315847158432, 0.1050395518541336, 0.1102859377861023, 0.11553232371807098, 0.12077870965003967]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 4.0, 6.0, 9.0, 22.0, 16.0, 35.0, 39.0, 45.0, 72.0, 77.0, 88.0, 84.0, 109.0, 82.0, 66.0, 62.0, 51.0, 35.0, 24.0, 15.0, 12.0, 6.0, 8.0, 7.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07322335243225098, -0.07085585594177246, -0.06848835945129395, -0.06612086296081543, -0.06375336647033691, -0.0613858662545681, -0.059018366038799286, -0.05665086954832077, -0.054283373057842255, -0.05191587656736374, -0.04954838007688522, -0.04718087986111641, -0.044813383370637894, -0.04244588688015938, -0.040078386664390564, -0.03771089017391205, -0.03534339368343353, -0.03297589719295502, -0.030608398839831352, -0.028240900486707687, -0.025873403996229172, -0.023505907505750656, -0.02113840915262699, -0.018770910799503326, -0.01640341430902481, -0.01403591688722372, -0.01166841946542263, -0.00930092204362154, -0.00693342462182045, -0.00456592720001936, -0.0021984297782182693, 0.0001690685749053955, 0.002536565065383911, 0.004904062487185001, 0.007271559908986092, 0.009639057330787182, 0.012006554752588272, 0.014374052174389362, 0.016741549596190453, 0.019109047949314117, 0.021476544439792633, 0.02384404093027115, 0.026211539283394814, 0.02857903763651848, 0.030946534126996994, 0.03331403061747551, 0.035681530833244324, 0.03804902732372284, 0.040416523814201355, 0.04278402030467987, 0.045151516795158386, 0.0475190170109272, 0.049886513501405716, 0.05225400999188423, 0.054621510207653046, 0.05698900669813156, 0.05935650318861008, 0.06172399967908859, 0.06409149616956711, 0.06645899266004562, 0.06882649660110474, 0.07119399309158325, 0.07356148958206177, 0.07592898607254028, 0.0782964825630188]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 10.0, 6.0, 4.0, 4.0, 10.0, 8.0, 8.0, 14.0, 12.0, 12.0, 20.0, 26.0, 36.0, 22.0, 32.0, 407631.0, 3786211.0, 34.0, 28.0, 20.0, 18.0, 20.0, 14.0, 14.0, 18.0, 6.0, 6.0, 2.0, 6.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 2.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.908203125, -2.827423095703125, -2.74664306640625, -2.665863037109375, -2.5850830078125, -2.504302978515625, -2.42352294921875, -2.342742919921875, -2.261962890625, -2.181182861328125, -2.10040283203125, -2.019622802734375, -1.9388427734375, -1.858062744140625, -1.77728271484375, -1.696502685546875, -1.61572265625, -1.534942626953125, -1.45416259765625, -1.373382568359375, -1.2926025390625, -1.211822509765625, -1.13104248046875, -1.050262451171875, -0.969482421875, -0.888702392578125, -0.80792236328125, -0.727142333984375, -0.6463623046875, -0.565582275390625, -0.48480224609375, -0.404022216796875, -0.3232421875, -0.242462158203125, -0.16168212890625, -0.080902099609375, -0.0001220703125, 0.080657958984375, 0.16143798828125, 0.242218017578125, 0.322998046875, 0.403778076171875, 0.48455810546875, 0.565338134765625, 0.6461181640625, 0.726898193359375, 0.80767822265625, 0.888458251953125, 0.96923828125, 1.050018310546875, 1.13079833984375, 1.211578369140625, 1.2923583984375, 1.373138427734375, 1.45391845703125, 1.534698486328125, 1.615478515625, 1.696258544921875, 1.77703857421875, 1.857818603515625, 1.9385986328125, 2.019378662109375, 2.10015869140625, 2.180938720703125, 2.26171875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 7.0, 3.0, 3.0, 3.0, 6.0, 11.0, 9.0, 7.0, 10.0, 12.0, 13.0, 9.0, 53.0, 158.0, 288.0, 205.0, 93.0, 26.0, 13.0, 12.0, 6.0, 4.0, 7.0, 3.0, 2.0, 3.0, 6.0, 5.0, 1.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018262863159179688, -0.001774802803993225, -0.0017233192920684814, -0.0016718357801437378, -0.0016203522682189941, -0.0015688687562942505, -0.0015173852443695068, -0.0014659017324447632, -0.0014144182205200195, -0.0013629347085952759, -0.0013114511966705322, -0.0012599676847457886, -0.001208484172821045, -0.0011570006608963013, -0.0011055171489715576, -0.001054033637046814, -0.0010025501251220703, -0.0009510666131973267, -0.000899583101272583, -0.0008480995893478394, -0.0007966160774230957, -0.000745132565498352, -0.0006936490535736084, -0.0006421655416488647, -0.0005906820297241211, -0.0005391985177993774, -0.0004877150058746338, -0.00043623149394989014, -0.0003847479820251465, -0.00033326447010040283, -0.0002817809581756592, -0.00023029744625091553, -0.00017881393432617188, -0.00012733042240142822, -7.584691047668457e-05, -2.4363398551940918e-05, 2.7120113372802734e-05, 7.860362529754639e-05, 0.00013008713722229004, 0.0001815706491470337, 0.00023305416107177734, 0.000284537672996521, 0.00033602118492126465, 0.0003875046968460083, 0.00043898820877075195, 0.0004904717206954956, 0.0005419552326202393, 0.0005934387445449829, 0.0006449222564697266, 0.0006964057683944702, 0.0007478892803192139, 0.0007993727922439575, 0.0008508563041687012, 0.0009023398160934448, 0.0009538233280181885, 0.0010053068399429321, 0.0010567903518676758, 0.0011082738637924194, 0.001159757375717163, 0.0012112408876419067, 0.0012627243995666504, 0.001314207911491394, 0.0013656914234161377, 0.0014171749353408813, 0.001468658447265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 13.0, 25.0, 24.0, 43.0, 89.0, 236.0, 1882.0, 4191409.0, 283.0, 149.0, 53.0, 27.0, 22.0, 16.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49462890625, -0.46196746826171875, -0.4293060302734375, -0.39664459228515625, -0.363983154296875, -0.33132171630859375, -0.2986602783203125, -0.26599884033203125, -0.23333740234375, -0.20067596435546875, -0.1680145263671875, -0.13535308837890625, -0.102691650390625, -0.07003021240234375, -0.0373687744140625, -0.00470733642578125, 0.0279541015625, 0.06061553955078125, 0.0932769775390625, 0.12593841552734375, 0.158599853515625, 0.19126129150390625, 0.2239227294921875, 0.25658416748046875, 0.28924560546875, 0.32190704345703125, 0.3545684814453125, 0.38722991943359375, 0.419891357421875, 0.45255279541015625, 0.4852142333984375, 0.5178756713867188, 0.550537109375, 0.5831985473632812, 0.6158599853515625, 0.6485214233398438, 0.681182861328125, 0.7138442993164062, 0.7465057373046875, 0.7791671752929688, 0.81182861328125, 0.8444900512695312, 0.8771514892578125, 0.9098129272460938, 0.942474365234375, 0.9751358032226562, 1.0077972412109375, 1.0404586791992188, 1.0731201171875, 1.1057815551757812, 1.1384429931640625, 1.1711044311523438, 1.203765869140625, 1.2364273071289062, 1.2690887451171875, 1.3017501831054688, 1.33441162109375, 1.3670730590820312, 1.3997344970703125, 1.4323959350585938, 1.465057373046875, 1.4977188110351562, 1.5303802490234375, 1.5630416870117188, 1.595703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 15.0, 5.0, 28.0, 23.0, 48.0, 102.0, 222.0, 549.0, 2095.0, 498.0, 218.0, 112.0, 64.0, 35.0, 24.0, 12.0, 11.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004314422607421875, -0.004103720188140869, -0.0038930177688598633, -0.0036823153495788574, -0.0034716129302978516, -0.0032609105110168457, -0.00305020809173584, -0.002839505672454834, -0.002628803253173828, -0.0024181008338928223, -0.0022073984146118164, -0.0019966959953308105, -0.0017859935760498047, -0.0015752911567687988, -0.001364588737487793, -0.0011538863182067871, -0.0009431838989257812, -0.0007324814796447754, -0.0005217790603637695, -0.00031107664108276367, -0.00010037422180175781, 0.00011032819747924805, 0.0003210306167602539, 0.0005317330360412598, 0.0007424354553222656, 0.0009531378746032715, 0.0011638402938842773, 0.0013745427131652832, 0.001585245132446289, 0.001795947551727295, 0.0020066499710083008, 0.0022173523902893066, 0.0024280548095703125, 0.0026387572288513184, 0.0028494596481323242, 0.00306016206741333, 0.003270864486694336, 0.003481566905975342, 0.0036922693252563477, 0.0039029717445373535, 0.004113674163818359, 0.004324376583099365, 0.004535079002380371, 0.004745781421661377, 0.004956483840942383, 0.005167186260223389, 0.0053778886795043945, 0.0055885910987854, 0.005799293518066406, 0.006009995937347412, 0.006220698356628418, 0.006431400775909424, 0.00664210319519043, 0.0068528056144714355, 0.007063508033752441, 0.007274210453033447, 0.007484912872314453, 0.007695615291595459, 0.007906317710876465, 0.00811702013015747, 0.008327722549438477, 0.008538424968719482, 0.008749127388000488, 0.008959829807281494, 0.0091705322265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1000.0, 21.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1173999160528183, -0.05539610609412193, 0.006607703864574432, 0.0686115175485611, 0.13061532378196716, 0.19261913001537323, 0.2546229362487793, 0.31662672758102417, 0.3786305785179138, 0.4406343996524811, 0.5026382207870483, 0.5646420121192932, 0.6266458034515381, 0.6886496543884277, 0.7506534457206726, 0.8126572370529175, 0.8746610283851624, 0.9366648197174072, 0.9986686706542969, 1.0606725215911865, 1.1226762533187866, 1.1846801042556763, 1.2466838359832764, 1.308687686920166, 1.3706915378570557, 1.4326953887939453, 1.4946991205215454, 1.556702971458435, 1.6187068223953247, 1.6807105541229248, 1.7427144050598145, 1.804718255996704, 1.8667219877243042, 1.9287258386611938, 1.990729570388794, 2.0527334213256836, 2.1147372722625732, 2.176741123199463, 2.2387447357177734, 2.300748586654663, 2.3627524375915527, 2.4247562885284424, 2.486760139465332, 2.5487637519836426, 2.6107676029205322, 2.672771453857422, 2.7347753047943115, 2.796779155731201, 2.858783006668091, 2.9207868576049805, 2.98279070854187, 3.0447945594787598, 3.1067981719970703, 3.16880202293396, 3.2308058738708496, 3.2928097248077393, 3.35481333732605, 3.4168171882629395, 3.478821039199829, 3.5408248901367188, 3.6028285026550293, 3.664832353591919, 3.7268362045288086, 3.7888400554656982, 3.850843906402588]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 22.0, 48.0, 139.0, 213.0, 252.0, 198.0, 86.0, 36.0, 12.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061533331871032715, -0.057570554316043854, -0.05360777676105499, -0.04964499920606613, -0.04568222165107727, -0.04171944409608841, -0.03775666654109955, -0.03379388898611069, -0.029831111431121826, -0.025868333876132965, -0.021905556321144104, -0.017942778766155243, -0.013980001211166382, -0.01001722365617752, -0.00605444610118866, -0.0020916685461997986, 0.0018711090087890625, 0.005833886563777924, 0.009796664118766785, 0.013759441673755646, 0.017722219228744507, 0.021684996783733368, 0.02564777433872223, 0.02961055189371109, 0.03357332944869995, 0.03753610700368881, 0.04149888455867767, 0.045461662113666534, 0.049424439668655396, 0.05338721722364426, 0.05734999477863312, 0.06131277233362198, 0.06527554988861084, 0.0692383274435997, 0.07320110499858856, 0.07716388255357742, 0.08112666010856628, 0.08508943766355515, 0.089052215218544, 0.09301499277353287, 0.09697777032852173, 0.10094054788351059, 0.10490332543849945, 0.10886610299348831, 0.11282888054847717, 0.11679165810346603, 0.1207544356584549, 0.12471721321344376, 0.12867999076843262, 0.13264277577400208, 0.13660554587841034, 0.1405683159828186, 0.14453110098838806, 0.14849388599395752, 0.15245665609836578, 0.15641942620277405, 0.1603822112083435, 0.16434499621391296, 0.16830776631832123, 0.1722705364227295, 0.17623332142829895, 0.1801961064338684, 0.18415887653827667, 0.18812164664268494, 0.1920844316482544]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 7.0, 8.0, 5.0, 16.0, 7.0, 27.0, 17.0, 23.0, 38.0, 42.0, 44.0, 68.0, 107.0, 630.0, 1012915.0, 34018.0, 188.0, 75.0, 58.0, 40.0, 40.0, 40.0, 26.0, 25.0, 11.0, 19.0, 10.0, 10.0, 8.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.205078125, -0.1981964111328125, -0.191314697265625, -0.1844329833984375, -0.17755126953125, -0.1706695556640625, -0.163787841796875, -0.1569061279296875, -0.1500244140625, -0.1431427001953125, -0.136260986328125, -0.1293792724609375, -0.12249755859375, -0.1156158447265625, -0.108734130859375, -0.1018524169921875, -0.094970703125, -0.0880889892578125, -0.081207275390625, -0.0743255615234375, -0.06744384765625, -0.0605621337890625, -0.053680419921875, -0.0467987060546875, -0.0399169921875, -0.0330352783203125, -0.026153564453125, -0.0192718505859375, -0.01239013671875, -0.0055084228515625, 0.001373291015625, 0.0082550048828125, 0.01513671875, 0.0220184326171875, 0.028900146484375, 0.0357818603515625, 0.04266357421875, 0.0495452880859375, 0.056427001953125, 0.0633087158203125, 0.0701904296875, 0.0770721435546875, 0.083953857421875, 0.0908355712890625, 0.09771728515625, 0.1045989990234375, 0.111480712890625, 0.1183624267578125, 0.125244140625, 0.1321258544921875, 0.139007568359375, 0.1458892822265625, 0.15277099609375, 0.1596527099609375, 0.166534423828125, 0.1734161376953125, 0.1802978515625, 0.1871795654296875, 0.194061279296875, 0.2009429931640625, 0.20782470703125, 0.2147064208984375, 0.221588134765625, 0.2284698486328125, 0.2353515625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 92.0, 345.0, 440.0, 118.0, 14.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006687164306640625, -0.005956590175628662, -0.005226016044616699, -0.004495441913604736, -0.0037648677825927734, -0.0030342936515808105, -0.0023037195205688477, -0.0015731453895568848, -0.0008425712585449219, -0.00011199712753295898, 0.0006185770034790039, 0.0013491511344909668, 0.0020797252655029297, 0.0028102993965148926, 0.0035408735275268555, 0.004271447658538818, 0.005002021789550781, 0.005732595920562744, 0.006463170051574707, 0.00719374418258667, 0.007924318313598633, 0.008654892444610596, 0.009385466575622559, 0.010116040706634521, 0.010846614837646484, 0.011577188968658447, 0.01230776309967041, 0.013038337230682373, 0.013768911361694336, 0.014499485492706299, 0.015230059623718262, 0.015960633754730225, 0.016691207885742188, 0.01742178201675415, 0.018152356147766113, 0.018882930278778076, 0.01961350440979004, 0.020344078540802002, 0.021074652671813965, 0.021805226802825928, 0.02253580093383789, 0.023266375064849854, 0.023996949195861816, 0.02472752332687378, 0.025458097457885742, 0.026188671588897705, 0.026919245719909668, 0.02764981985092163, 0.028380393981933594, 0.029110968112945557, 0.02984154224395752, 0.030572116374969482, 0.031302690505981445, 0.03203326463699341, 0.03276383876800537, 0.033494412899017334, 0.0342249870300293, 0.03495556116104126, 0.03568613529205322, 0.036416709423065186, 0.03714728355407715, 0.03787785768508911, 0.038608431816101074, 0.03933900594711304, 0.040069580078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 9.0, 8.0, 17.0, 22.0, 27.0, 45.0, 35.0, 79.0, 93.0, 153.0, 273.0, 503.0, 1537.0, 9449.0, 340031.0, 678264.0, 14746.0, 1833.0, 586.0, 246.0, 163.0, 117.0, 76.0, 51.0, 28.0, 35.0, 24.0, 12.0, 16.0, 12.0, 15.0, 4.0, 4.0, 7.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0858154296875, -0.08286476135253906, -0.07991409301757812, -0.07696342468261719, -0.07401275634765625, -0.07106208801269531, -0.06811141967773438, -0.06516075134277344, -0.0622100830078125, -0.05925941467285156, -0.056308746337890625, -0.05335807800292969, -0.05040740966796875, -0.04745674133300781, -0.044506072998046875, -0.04155540466308594, -0.038604736328125, -0.03565406799316406, -0.032703399658203125, -0.029752731323242188, -0.02680206298828125, -0.023851394653320312, -0.020900726318359375, -0.017950057983398438, -0.0149993896484375, -0.012048721313476562, -0.009098052978515625, -0.0061473846435546875, -0.00319671630859375, -0.0002460479736328125, 0.002704620361328125, 0.0056552886962890625, 0.00860595703125, 0.011556625366210938, 0.014507293701171875, 0.017457962036132812, 0.02040863037109375, 0.023359298706054688, 0.026309967041015625, 0.029260635375976562, 0.0322113037109375, 0.03516197204589844, 0.038112640380859375, 0.04106330871582031, 0.04401397705078125, 0.04696464538574219, 0.049915313720703125, 0.05286598205566406, 0.055816650390625, 0.05876731872558594, 0.061717987060546875, 0.06466865539550781, 0.06761932373046875, 0.07056999206542969, 0.07352066040039062, 0.07647132873535156, 0.0794219970703125, 0.08237266540527344, 0.08532333374023438, 0.08827400207519531, 0.09122467041015625, 0.09417533874511719, 0.09712600708007812, 0.10007667541503906, 0.10302734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 10.0, 10.0, 9.0, 12.0, 16.0, 24.0, 24.0, 32.0, 36.0, 30.0, 49.0, 56.0, 63.0, 60.0, 53.0, 51.0, 45.0, 53.0, 48.0, 52.0, 41.0, 32.0, 35.0, 26.0, 22.0, 18.0, 18.0, 16.0, 13.0, 6.0, 13.0, 4.0, 9.0, 2.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0, 5.0], "bins": [-0.03472900390625, -0.03382563591003418, -0.03292226791381836, -0.03201889991760254, -0.03111553192138672, -0.0302121639251709, -0.029308795928955078, -0.028405427932739258, -0.027502059936523438, -0.026598691940307617, -0.025695323944091797, -0.024791955947875977, -0.023888587951660156, -0.022985219955444336, -0.022081851959228516, -0.021178483963012695, -0.020275115966796875, -0.019371747970581055, -0.018468379974365234, -0.017565011978149414, -0.016661643981933594, -0.015758275985717773, -0.014854907989501953, -0.013951539993286133, -0.013048171997070312, -0.012144804000854492, -0.011241436004638672, -0.010338068008422852, -0.009434700012207031, -0.008531332015991211, -0.007627964019775391, -0.00672459602355957, -0.00582122802734375, -0.00491786003112793, -0.004014492034912109, -0.003111124038696289, -0.0022077560424804688, -0.0013043880462646484, -0.0004010200500488281, 0.0005023479461669922, 0.0014057159423828125, 0.002309083938598633, 0.003212451934814453, 0.0041158199310302734, 0.005019187927246094, 0.005922555923461914, 0.006825923919677734, 0.007729291915893555, 0.008632659912109375, 0.009536027908325195, 0.010439395904541016, 0.011342763900756836, 0.012246131896972656, 0.013149499893188477, 0.014052867889404297, 0.014956235885620117, 0.015859603881835938, 0.016762971878051758, 0.017666339874267578, 0.0185697078704834, 0.01947307586669922, 0.02037644386291504, 0.02127981185913086, 0.02218317985534668, 0.0230865478515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 2.0, 7.0, 3.0, 9.0, 7.0, 12.0, 13.0, 15.0, 22.0, 31.0, 53.0, 56.0, 99.0, 161.0, 341.0, 895.0, 3494.0, 24932.0, 929576.0, 80209.0, 6198.0, 1340.0, 488.0, 206.0, 118.0, 63.0, 52.0, 25.0, 29.0, 25.0, 17.0, 13.0, 12.0, 4.0, 7.0, 4.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.1060791015625, -0.10318660736083984, -0.10029411315917969, -0.09740161895751953, -0.09450912475585938, -0.09161663055419922, -0.08872413635253906, -0.0858316421508789, -0.08293914794921875, -0.0800466537475586, -0.07715415954589844, -0.07426166534423828, -0.07136917114257812, -0.06847667694091797, -0.06558418273925781, -0.06269168853759766, -0.0597991943359375, -0.056906700134277344, -0.05401420593261719, -0.05112171173095703, -0.048229217529296875, -0.04533672332763672, -0.04244422912597656, -0.039551734924316406, -0.03665924072265625, -0.033766746520996094, -0.030874252319335938, -0.02798175811767578, -0.025089263916015625, -0.02219676971435547, -0.019304275512695312, -0.016411781311035156, -0.013519287109375, -0.010626792907714844, -0.0077342987060546875, -0.004841804504394531, -0.001949310302734375, 0.0009431838989257812, 0.0038356781005859375, 0.006728172302246094, 0.00962066650390625, 0.012513160705566406, 0.015405654907226562, 0.01829814910888672, 0.021190643310546875, 0.02408313751220703, 0.026975631713867188, 0.029868125915527344, 0.0327606201171875, 0.035653114318847656, 0.03854560852050781, 0.04143810272216797, 0.044330596923828125, 0.04722309112548828, 0.05011558532714844, 0.053008079528808594, 0.05590057373046875, 0.058793067932128906, 0.06168556213378906, 0.06457805633544922, 0.06747055053710938, 0.07036304473876953, 0.07325553894042969, 0.07614803314208984, 0.07904052734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 11.0, 12.0, 29.0, 32.0, 49.0, 90.0, 90.0, 111.0, 108.0, 132.0, 85.0, 77.0, 54.0, 32.0, 22.0, 18.0, 7.0, 5.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.821487426757812e-06, -8.488073945045471e-06, -8.15466046333313e-06, -7.821246981620789e-06, -7.487833499908447e-06, -7.154420018196106e-06, -6.821006536483765e-06, -6.487593054771423e-06, -6.154179573059082e-06, -5.820766091346741e-06, -5.487352609634399e-06, -5.153939127922058e-06, -4.820525646209717e-06, -4.4871121644973755e-06, -4.153698682785034e-06, -3.820285201072693e-06, -3.4868717193603516e-06, -3.1534582376480103e-06, -2.820044755935669e-06, -2.4866312742233276e-06, -2.1532177925109863e-06, -1.819804310798645e-06, -1.4863908290863037e-06, -1.1529773473739624e-06, -8.195638656616211e-07, -4.861503839492798e-07, -1.5273690223693848e-07, 1.8067657947540283e-07, 5.140900611877441e-07, 8.475035429000854e-07, 1.1809170246124268e-06, 1.514330506324768e-06, 1.8477439880371094e-06, 2.1811574697494507e-06, 2.514570951461792e-06, 2.8479844331741333e-06, 3.1813979148864746e-06, 3.514811396598816e-06, 3.848224878311157e-06, 4.1816383600234985e-06, 4.51505184173584e-06, 4.848465323448181e-06, 5.1818788051605225e-06, 5.515292286872864e-06, 5.848705768585205e-06, 6.182119250297546e-06, 6.515532732009888e-06, 6.848946213722229e-06, 7.18235969543457e-06, 7.515773177146912e-06, 7.849186658859253e-06, 8.182600140571594e-06, 8.516013622283936e-06, 8.849427103996277e-06, 9.182840585708618e-06, 9.51625406742096e-06, 9.8496675491333e-06, 1.0183081030845642e-05, 1.0516494512557983e-05, 1.0849907994270325e-05, 1.1183321475982666e-05, 1.1516734957695007e-05, 1.1850148439407349e-05, 1.218356192111969e-05, 1.2516975402832031e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 10.0, 5.0, 8.0, 20.0, 9.0, 30.0, 34.0, 70.0, 131.0, 296.0, 882.0, 3529.0, 19892.0, 895607.0, 116330.0, 8842.0, 1812.0, 568.0, 214.0, 109.0, 54.0, 28.0, 28.0, 10.0, 9.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13232421875, -0.12862682342529297, -0.12492942810058594, -0.1212320327758789, -0.11753463745117188, -0.11383724212646484, -0.11013984680175781, -0.10644245147705078, -0.10274505615234375, -0.09904766082763672, -0.09535026550292969, -0.09165287017822266, -0.08795547485351562, -0.0842580795288086, -0.08056068420410156, -0.07686328887939453, -0.0731658935546875, -0.06946849822998047, -0.06577110290527344, -0.062073707580566406, -0.058376312255859375, -0.054678916931152344, -0.05098152160644531, -0.04728412628173828, -0.04358673095703125, -0.03988933563232422, -0.03619194030761719, -0.032494544982910156, -0.028797149658203125, -0.025099754333496094, -0.021402359008789062, -0.01770496368408203, -0.014007568359375, -0.010310173034667969, -0.0066127777099609375, -0.0029153823852539062, 0.000782012939453125, 0.004479408264160156, 0.008176803588867188, 0.011874198913574219, 0.01557159423828125, 0.01926898956298828, 0.022966384887695312, 0.026663780212402344, 0.030361175537109375, 0.034058570861816406, 0.03775596618652344, 0.04145336151123047, 0.0451507568359375, 0.04884815216064453, 0.05254554748535156, 0.056242942810058594, 0.059940338134765625, 0.06363773345947266, 0.06733512878417969, 0.07103252410888672, 0.07472991943359375, 0.07842731475830078, 0.08212471008300781, 0.08582210540771484, 0.08951950073242188, 0.0932168960571289, 0.09691429138183594, 0.10061168670654297, 0.10430908203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 9.0, 7.0, 6.0, 17.0, 21.0, 25.0, 38.0, 68.0, 102.0, 167.0, 202.0, 117.0, 66.0, 39.0, 29.0, 12.0, 10.0, 12.0, 8.0, 10.0, 3.0, 1.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0352783203125, -0.03432893753051758, -0.033379554748535156, -0.032430171966552734, -0.03148078918457031, -0.03053140640258789, -0.02958202362060547, -0.028632640838623047, -0.027683258056640625, -0.026733875274658203, -0.02578449249267578, -0.02483510971069336, -0.023885726928710938, -0.022936344146728516, -0.021986961364746094, -0.021037578582763672, -0.02008819580078125, -0.019138813018798828, -0.018189430236816406, -0.017240047454833984, -0.016290664672851562, -0.01534128189086914, -0.014391899108886719, -0.013442516326904297, -0.012493133544921875, -0.011543750762939453, -0.010594367980957031, -0.00964498519897461, -0.008695602416992188, -0.007746219635009766, -0.006796836853027344, -0.005847454071044922, -0.0048980712890625, -0.003948688507080078, -0.0029993057250976562, -0.0020499229431152344, -0.0011005401611328125, -0.00015115737915039062, 0.0007982254028320312, 0.0017476081848144531, 0.002696990966796875, 0.003646373748779297, 0.004595756530761719, 0.005545139312744141, 0.0064945220947265625, 0.007443904876708984, 0.008393287658691406, 0.009342670440673828, 0.01029205322265625, 0.011241436004638672, 0.012190818786621094, 0.013140201568603516, 0.014089584350585938, 0.01503896713256836, 0.01598834991455078, 0.016937732696533203, 0.017887115478515625, 0.018836498260498047, 0.01978588104248047, 0.02073526382446289, 0.021684646606445312, 0.022634029388427734, 0.023583412170410156, 0.024532794952392578, 0.025482177734375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 11.0, 989.0, 12.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5994638204574585, -0.43732643127441406, -0.27518904209136963, -0.1130516529083252, 0.04908573627471924, 0.21122312545776367, 0.3733605146408081, 0.5354979038238525, 0.697635293006897, 0.8597726821899414, 1.0219100713729858, 1.1840474605560303, 1.3461848497390747, 1.5083222389221191, 1.6704596281051636, 1.832597017288208, 1.9947344064712524, 2.156871795654297, 2.319009304046631, 2.4811465740203857, 2.6432838439941406, 2.8054213523864746, 2.9675588607788086, 3.1296961307525635, 3.2918334007263184, 3.4539709091186523, 3.6161081790924072, 3.778245449066162, 3.940382957458496, 4.10252046585083, 4.264657974243164, 4.42679500579834, 4.588932991027832, 4.751070499420166, 4.9132080078125, 5.075345039367676, 5.23748254776001, 5.399620056152344, 5.5617570877075195, 5.7238945960998535, 5.8860321044921875, 6.0481696128845215, 6.2103071212768555, 6.372444152832031, 6.534581661224365, 6.696719169616699, 6.858856201171875, 7.020993709564209, 7.183131217956543, 7.345268726348877, 7.507406234741211, 7.669543266296387, 7.831680774688721, 7.993818283081055, 8.15595531463623, 8.318093299865723, 8.480230331420898, 8.642367362976074, 8.804505348205566, 8.966642379760742, 9.128780364990234, 9.29091739654541, 9.453054428100586, 9.615192413330078, 9.777329444885254]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 10.0, 13.0, 14.0, 23.0, 33.0, 45.0, 57.0, 66.0, 93.0, 93.0, 102.0, 89.0, 98.0, 77.0, 56.0, 35.0, 39.0, 25.0, 20.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27286297082901, -0.26150915026664734, -0.2501552999019623, -0.2388014793395996, -0.22744764387607574, -0.21609380841255188, -0.20473997294902802, -0.19338613748550415, -0.18203231692314148, -0.17067848145961761, -0.15932464599609375, -0.14797082543373108, -0.13661698997020721, -0.12526315450668335, -0.11390931904315948, -0.10255549103021622, -0.09120164811611176, -0.07984781265258789, -0.06849398463964462, -0.05714014917612076, -0.04578631743788719, -0.034432485699653625, -0.02307865023612976, -0.011724822223186493, -0.0003709867596626282, 0.010982845909893513, 0.022336678579449654, 0.03369051218032837, 0.045044343918561935, 0.0563981756567955, 0.06775201112031937, 0.07910583913326263, 0.0904596745967865, 0.10181351006031036, 0.11316733807325363, 0.1245211735367775, 0.13587500154972076, 0.14722883701324463, 0.1585826724767685, 0.16993650794029236, 0.18129032850265503, 0.1926441639661789, 0.20399799942970276, 0.21535181999206543, 0.2267056554555893, 0.23805949091911316, 0.24941332638263702, 0.2607671618461609, 0.27212101221084595, 0.2834748327732086, 0.2948286831378937, 0.30618250370025635, 0.3175363540649414, 0.3288901746273041, 0.34024399518966675, 0.3515978455543518, 0.3629516661167145, 0.37430548667907715, 0.3856593370437622, 0.3970131576061249, 0.40836700797080994, 0.4197208285331726, 0.43107467889785767, 0.44242849946022034, 0.453782320022583]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 9.0, 40.0, 308.0, 3647831.0, 545033.0, 685.0, 225.0, 81.0, 44.0, 19.0, 11.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.261962890625, -0.23281478881835938, -0.20366668701171875, -0.17451858520507812, -0.1453704833984375, -0.11622238159179688, -0.08707427978515625, -0.057926177978515625, -0.028778076171875, 0.000370025634765625, 0.02951812744140625, 0.058666229248046875, 0.0878143310546875, 0.11696243286132812, 0.14611053466796875, 0.17525863647460938, 0.20440673828125, 0.23355484008789062, 0.26270294189453125, 0.2918510437011719, 0.3209991455078125, 0.3501472473144531, 0.37929534912109375, 0.4084434509277344, 0.437591552734375, 0.4667396545410156, 0.49588775634765625, 0.5250358581542969, 0.5541839599609375, 0.5833320617675781, 0.6124801635742188, 0.6416282653808594, 0.6707763671875, 0.6999244689941406, 0.7290725708007812, 0.7582206726074219, 0.7873687744140625, 0.8165168762207031, 0.8456649780273438, 0.8748130798339844, 0.903961181640625, 0.9331092834472656, 0.9622573852539062, 0.9914054870605469, 1.0205535888671875, 1.0497016906738281, 1.0788497924804688, 1.1079978942871094, 1.13714599609375, 1.1662940979003906, 1.1954421997070312, 1.2245903015136719, 1.2537384033203125, 1.2828865051269531, 1.3120346069335938, 1.3411827087402344, 1.370330810546875, 1.3994789123535156, 1.4286270141601562, 1.4577751159667969, 1.4869232177734375, 1.5160713195800781, 1.5452194213867188, 1.5743675231933594, 1.603515625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 13.0, 83.0, 246.0, 375.0, 225.0, 64.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00804901123046875, -0.007198452949523926, -0.0063478946685791016, -0.005497336387634277, -0.004646778106689453, -0.003796219825744629, -0.0029456615447998047, -0.0020951032638549805, -0.0012445449829101562, -0.00039398670196533203, 0.0004565715789794922, 0.0013071298599243164, 0.0021576881408691406, 0.003008246421813965, 0.003858804702758789, 0.004709362983703613, 0.0055599212646484375, 0.006410479545593262, 0.007261037826538086, 0.00811159610748291, 0.008962154388427734, 0.009812712669372559, 0.010663270950317383, 0.011513829231262207, 0.012364387512207031, 0.013214945793151855, 0.01406550407409668, 0.014916062355041504, 0.015766620635986328, 0.016617178916931152, 0.017467737197875977, 0.0183182954788208, 0.019168853759765625, 0.02001941204071045, 0.020869970321655273, 0.021720528602600098, 0.022571086883544922, 0.023421645164489746, 0.02427220344543457, 0.025122761726379395, 0.02597332000732422, 0.026823878288269043, 0.027674436569213867, 0.02852499485015869, 0.029375553131103516, 0.03022611141204834, 0.031076669692993164, 0.03192722797393799, 0.03277778625488281, 0.03362834453582764, 0.03447890281677246, 0.035329461097717285, 0.03618001937866211, 0.037030577659606934, 0.03788113594055176, 0.03873169422149658, 0.039582252502441406, 0.04043281078338623, 0.041283369064331055, 0.04213392734527588, 0.0429844856262207, 0.04383504390716553, 0.04468560218811035, 0.045536160469055176, 0.04638671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 14.0, 38.0, 87.0, 226.0, 594.0, 4192025.0, 697.0, 288.0, 188.0, 68.0, 35.0, 17.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.30078125, -1.2266845703125, -1.152587890625, -1.0784912109375, -1.00439453125, -0.9302978515625, -0.856201171875, -0.7821044921875, -0.7080078125, -0.6339111328125, -0.559814453125, -0.4857177734375, -0.41162109375, -0.3375244140625, -0.263427734375, -0.1893310546875, -0.115234375, -0.0411376953125, 0.032958984375, 0.1070556640625, 0.18115234375, 0.2552490234375, 0.329345703125, 0.4034423828125, 0.4775390625, 0.5516357421875, 0.625732421875, 0.6998291015625, 0.77392578125, 0.8480224609375, 0.922119140625, 0.9962158203125, 1.0703125, 1.1444091796875, 1.218505859375, 1.2926025390625, 1.36669921875, 1.4407958984375, 1.514892578125, 1.5889892578125, 1.6630859375, 1.7371826171875, 1.811279296875, 1.8853759765625, 1.95947265625, 2.0335693359375, 2.107666015625, 2.1817626953125, 2.255859375, 2.3299560546875, 2.404052734375, 2.4781494140625, 2.55224609375, 2.6263427734375, 2.700439453125, 2.7745361328125, 2.8486328125, 2.9227294921875, 2.996826171875, 3.0709228515625, 3.14501953125, 3.2191162109375, 3.293212890625, 3.3673095703125, 3.44140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 18.0, 113.0, 3906.0, 46.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.06262588500976562, -0.05664825439453125, -0.050670623779296875, -0.0446929931640625, -0.038715362548828125, -0.03273773193359375, -0.026760101318359375, -0.020782470703125, -0.014804840087890625, -0.00882720947265625, -0.002849578857421875, 0.0031280517578125, 0.009105682373046875, 0.01508331298828125, 0.021060943603515625, 0.02703857421875, 0.033016204833984375, 0.03899383544921875, 0.044971466064453125, 0.0509490966796875, 0.056926727294921875, 0.06290435791015625, 0.06888198852539062, 0.074859619140625, 0.08083724975585938, 0.08681488037109375, 0.09279251098632812, 0.0987701416015625, 0.10474777221679688, 0.11072540283203125, 0.11670303344726562, 0.1226806640625, 0.12865829467773438, 0.13463592529296875, 0.14061355590820312, 0.1465911865234375, 0.15256881713867188, 0.15854644775390625, 0.16452407836914062, 0.170501708984375, 0.17647933959960938, 0.18245697021484375, 0.18843460083007812, 0.1944122314453125, 0.20038986206054688, 0.20636749267578125, 0.21234512329101562, 0.21832275390625, 0.22430038452148438, 0.23027801513671875, 0.23625564575195312, 0.2422332763671875, 0.24821090698242188, 0.25418853759765625, 0.2601661682128906, 0.266143798828125, 0.2721214294433594, 0.27809906005859375, 0.2840766906738281, 0.2900543212890625, 0.2960319519042969, 0.30200958251953125, 0.3079872131347656, 0.31396484375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 22.0, 690.0, 274.0, 17.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1373865604400635, -1.0554683208465576, -0.9735502004623413, -0.8916320204734802, -0.8097138404846191, -0.7277956604957581, -0.645877480506897, -0.5639593005180359, -0.4820411205291748, -0.4001229405403137, -0.31820476055145264, -0.23628658056259155, -0.15436840057373047, -0.07245022058486938, 0.0094679594039917, 0.09138613939285278, 0.17330431938171387, 0.25522249937057495, 0.33714067935943604, 0.4190588593482971, 0.5009770393371582, 0.5828952193260193, 0.6648133993148804, 0.7467315793037415, 0.8286497592926025, 0.9105679392814636, 0.9924861192703247, 1.074404239654541, 1.1563224792480469, 1.2382407188415527, 1.320158839225769, 1.4020769596099854, 1.483994960784912, 1.565913200378418, 1.6478313207626343, 1.7297494411468506, 1.8116676807403564, 1.8935859203338623, 1.9755040407180786, 2.057422161102295, 2.139340400695801, 2.2212586402893066, 2.3031768798828125, 2.3850948810577393, 2.467013120651245, 2.548931360244751, 2.6308493614196777, 2.7127676010131836, 2.7946858406066895, 2.8766040802001953, 2.958522319793701, 3.040440320968628, 3.122358560562134, 3.2042768001556396, 3.2861948013305664, 3.3681130409240723, 3.450031280517578, 3.531949520111084, 3.61386775970459, 3.6957857608795166, 3.7777040004730225, 3.8596222400665283, 3.941540241241455, 4.023458480834961, 4.105376720428467]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 13.0, 20.0, 62.0, 87.0, 120.0, 158.0, 183.0, 138.0, 103.0, 53.0, 33.0, 18.0, 7.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0028475522994995, -0.9718499183654785, -0.9408523440361023, -0.9098547101020813, -0.8788571357727051, -0.8478595018386841, -0.8168618679046631, -0.7858642339706421, -0.7548666596412659, -0.7238690257072449, -0.6928714513778687, -0.6618738174438477, -0.6308761835098267, -0.5998786091804504, -0.5688809752464294, -0.5378834009170532, -0.5068857669830322, -0.4758881628513336, -0.444890558719635, -0.413892924785614, -0.3828953206539154, -0.3518977165222168, -0.3209000825881958, -0.2899024784564972, -0.2589048743247986, -0.22790727019309998, -0.19690965116024017, -0.16591203212738037, -0.13491442799568176, -0.10391682386398315, -0.07291920483112335, -0.04192158579826355, -0.010923981666564941, 0.020073629915714264, 0.05107124149799347, 0.08206885308027267, 0.11306646466255188, 0.1440640687942505, 0.1750616878271103, 0.2060593068599701, 0.2370569109916687, 0.2680545151233673, 0.2990521192550659, 0.3300497531890869, 0.3610473573207855, 0.39204496145248413, 0.4230425953865051, 0.45404019951820374, 0.48503780364990234, 0.5160354375839233, 0.5470330119132996, 0.5780306458473206, 0.6090282201766968, 0.6400258541107178, 0.6710234880447388, 0.7020211219787598, 0.733018696308136, 0.764016330242157, 0.7950139045715332, 0.8260115385055542, 0.8570091724395752, 0.8880067467689514, 0.9190043807029724, 0.9500019550323486, 0.9809995889663696]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 8.0, 9.0, 14.0, 10.0, 16.0, 39.0, 49.0, 85.0, 127.0, 238.0, 488.0, 1286.0, 5028.0, 46545.0, 915497.0, 70292.0, 6169.0, 1468.0, 564.0, 243.0, 124.0, 79.0, 49.0, 37.0, 19.0, 15.0, 12.0, 12.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.351318359375, -0.340850830078125, -0.33038330078125, -0.319915771484375, -0.3094482421875, -0.298980712890625, -0.28851318359375, -0.278045654296875, -0.267578125, -0.257110595703125, -0.24664306640625, -0.236175537109375, -0.2257080078125, -0.215240478515625, -0.20477294921875, -0.194305419921875, -0.183837890625, -0.173370361328125, -0.16290283203125, -0.152435302734375, -0.1419677734375, -0.131500244140625, -0.12103271484375, -0.110565185546875, -0.10009765625, -0.089630126953125, -0.07916259765625, -0.068695068359375, -0.0582275390625, -0.047760009765625, -0.03729248046875, -0.026824951171875, -0.016357421875, -0.005889892578125, 0.00457763671875, 0.015045166015625, 0.0255126953125, 0.035980224609375, 0.04644775390625, 0.056915283203125, 0.0673828125, 0.077850341796875, 0.08831787109375, 0.098785400390625, 0.1092529296875, 0.119720458984375, 0.13018798828125, 0.140655517578125, 0.151123046875, 0.161590576171875, 0.17205810546875, 0.182525634765625, 0.1929931640625, 0.203460693359375, 0.21392822265625, 0.224395751953125, 0.23486328125, 0.245330810546875, 0.25579833984375, 0.266265869140625, 0.2767333984375, 0.287200927734375, 0.29766845703125, 0.308135986328125, 0.318603515625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 26.0, 33.0, 63.0, 96.0, 142.0, 166.0, 167.0, 121.0, 92.0, 34.0, 29.0, 19.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03485107421875, -0.033184051513671875, -0.03151702880859375, -0.029850006103515625, -0.0281829833984375, -0.026515960693359375, -0.02484893798828125, -0.023181915283203125, -0.021514892578125, -0.019847869873046875, -0.01818084716796875, -0.016513824462890625, -0.0148468017578125, -0.013179779052734375, -0.01151275634765625, -0.009845733642578125, -0.0081787109375, -0.006511688232421875, -0.00484466552734375, -0.003177642822265625, -0.0015106201171875, 0.000156402587890625, 0.00182342529296875, 0.003490447998046875, 0.005157470703125, 0.006824493408203125, 0.00849151611328125, 0.010158538818359375, 0.0118255615234375, 0.013492584228515625, 0.01515960693359375, 0.016826629638671875, 0.01849365234375, 0.020160675048828125, 0.02182769775390625, 0.023494720458984375, 0.0251617431640625, 0.026828765869140625, 0.02849578857421875, 0.030162811279296875, 0.031829833984375, 0.033496856689453125, 0.03516387939453125, 0.036830902099609375, 0.0384979248046875, 0.040164947509765625, 0.04183197021484375, 0.043498992919921875, 0.045166015625, 0.046833038330078125, 0.04850006103515625, 0.050167083740234375, 0.0518341064453125, 0.053501129150390625, 0.05516815185546875, 0.056835174560546875, 0.058502197265625, 0.060169219970703125, 0.06183624267578125, 0.06350326538085938, 0.0651702880859375, 0.06683731079101562, 0.06850433349609375, 0.07017135620117188, 0.07183837890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 14.0, 10.0, 14.0, 21.0, 19.0, 31.0, 31.0, 80.0, 96.0, 184.0, 474.0, 1642.0, 19818.0, 936016.0, 85349.0, 3434.0, 673.0, 261.0, 130.0, 76.0, 40.0, 32.0, 23.0, 18.0, 15.0, 9.0, 8.0, 7.0, 3.0, 3.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2728996276855469, -0.26454925537109375, -0.2561988830566406, -0.2478485107421875, -0.23949813842773438, -0.23114776611328125, -0.22279739379882812, -0.214447021484375, -0.20609664916992188, -0.19774627685546875, -0.18939590454101562, -0.1810455322265625, -0.17269515991210938, -0.16434478759765625, -0.15599441528320312, -0.14764404296875, -0.13929367065429688, -0.13094329833984375, -0.12259292602539062, -0.1142425537109375, -0.10589218139648438, -0.09754180908203125, -0.08919143676757812, -0.080841064453125, -0.07249069213867188, -0.06414031982421875, -0.055789947509765625, -0.0474395751953125, -0.039089202880859375, -0.03073883056640625, -0.022388458251953125, -0.0140380859375, -0.005687713623046875, 0.00266265869140625, 0.011013031005859375, 0.0193634033203125, 0.027713775634765625, 0.03606414794921875, 0.044414520263671875, 0.052764892578125, 0.061115264892578125, 0.06946563720703125, 0.07781600952148438, 0.0861663818359375, 0.09451675415039062, 0.10286712646484375, 0.11121749877929688, 0.11956787109375, 0.12791824340820312, 0.13626861572265625, 0.14461898803710938, 0.1529693603515625, 0.16131973266601562, 0.16967010498046875, 0.17802047729492188, 0.186370849609375, 0.19472122192382812, 0.20307159423828125, 0.21142196655273438, 0.2197723388671875, 0.22812271118164062, 0.23647308349609375, 0.24482345581054688, 0.253173828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 7.0, 3.0, 3.0, 2.0, 7.0, 9.0, 12.0, 12.0, 21.0, 20.0, 21.0, 28.0, 37.0, 44.0, 46.0, 51.0, 56.0, 46.0, 48.0, 53.0, 54.0, 54.0, 63.0, 48.0, 42.0, 33.0, 34.0, 34.0, 28.0, 22.0, 21.0, 14.0, 9.0, 3.0, 6.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09820556640625, -0.09527778625488281, -0.09235000610351562, -0.08942222595214844, -0.08649444580078125, -0.08356666564941406, -0.08063888549804688, -0.07771110534667969, -0.0747833251953125, -0.07185554504394531, -0.06892776489257812, -0.06599998474121094, -0.06307220458984375, -0.06014442443847656, -0.057216644287109375, -0.05428886413574219, -0.051361083984375, -0.04843330383300781, -0.045505523681640625, -0.04257774353027344, -0.03964996337890625, -0.03672218322753906, -0.033794403076171875, -0.030866622924804688, -0.0279388427734375, -0.025011062622070312, -0.022083282470703125, -0.019155502319335938, -0.01622772216796875, -0.013299942016601562, -0.010372161865234375, -0.0074443817138671875, -0.0045166015625, -0.0015888214111328125, 0.001338958740234375, 0.0042667388916015625, 0.00719451904296875, 0.010122299194335938, 0.013050079345703125, 0.015977859497070312, 0.0189056396484375, 0.021833419799804688, 0.024761199951171875, 0.027688980102539062, 0.03061676025390625, 0.03354454040527344, 0.036472320556640625, 0.03940010070800781, 0.042327880859375, 0.04525566101074219, 0.048183441162109375, 0.05111122131347656, 0.05403900146484375, 0.05696678161621094, 0.059894561767578125, 0.06282234191894531, 0.0657501220703125, 0.06867790222167969, 0.07160568237304688, 0.07453346252441406, 0.07746124267578125, 0.08038902282714844, 0.08331680297851562, 0.08624458312988281, 0.08917236328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 14.0, 19.0, 14.0, 41.0, 94.0, 198.0, 461.0, 1427.0, 5341.0, 77841.0, 922197.0, 35220.0, 3854.0, 1093.0, 384.0, 174.0, 73.0, 31.0, 23.0, 13.0, 5.0, 7.0, 8.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1104736328125, -0.10683917999267578, -0.10320472717285156, -0.09957027435302734, -0.09593582153320312, -0.0923013687133789, -0.08866691589355469, -0.08503246307373047, -0.08139801025390625, -0.07776355743408203, -0.07412910461425781, -0.0704946517944336, -0.06686019897460938, -0.06322574615478516, -0.05959129333496094, -0.05595684051513672, -0.0523223876953125, -0.04868793487548828, -0.04505348205566406, -0.041419029235839844, -0.037784576416015625, -0.034150123596191406, -0.030515670776367188, -0.02688121795654297, -0.02324676513671875, -0.01961231231689453, -0.015977859497070312, -0.012343406677246094, -0.008708953857421875, -0.005074501037597656, -0.0014400482177734375, 0.0021944046020507812, 0.005828857421875, 0.009463310241699219, 0.013097763061523438, 0.016732215881347656, 0.020366668701171875, 0.024001121520996094, 0.027635574340820312, 0.03127002716064453, 0.03490447998046875, 0.03853893280029297, 0.04217338562011719, 0.045807838439941406, 0.049442291259765625, 0.053076744079589844, 0.05671119689941406, 0.06034564971923828, 0.0639801025390625, 0.06761455535888672, 0.07124900817871094, 0.07488346099853516, 0.07851791381835938, 0.0821523666381836, 0.08578681945800781, 0.08942127227783203, 0.09305572509765625, 0.09669017791748047, 0.10032463073730469, 0.1039590835571289, 0.10759353637695312, 0.11122798919677734, 0.11486244201660156, 0.11849689483642578, 0.12213134765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 11.0, 15.0, 22.0, 25.0, 53.0, 59.0, 79.0, 108.0, 99.0, 128.0, 118.0, 106.0, 59.0, 34.0, 27.0, 16.0, 16.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5437602996826172e-05, -1.509394496679306e-05, -1.4750286936759949e-05, -1.4406628906726837e-05, -1.4062970876693726e-05, -1.3719312846660614e-05, -1.3375654816627502e-05, -1.3031996786594391e-05, -1.268833875656128e-05, -1.2344680726528168e-05, -1.2001022696495056e-05, -1.1657364666461945e-05, -1.1313706636428833e-05, -1.0970048606395721e-05, -1.062639057636261e-05, -1.0282732546329498e-05, -9.939074516296387e-06, -9.595416486263275e-06, -9.251758456230164e-06, -8.908100426197052e-06, -8.56444239616394e-06, -8.220784366130829e-06, -7.877126336097717e-06, -7.533468306064606e-06, -7.189810276031494e-06, -6.8461522459983826e-06, -6.502494215965271e-06, -6.1588361859321594e-06, -5.815178155899048e-06, -5.471520125865936e-06, -5.127862095832825e-06, -4.784204065799713e-06, -4.4405460357666016e-06, -4.09688800573349e-06, -3.7532299757003784e-06, -3.409571945667267e-06, -3.0659139156341553e-06, -2.7222558856010437e-06, -2.378597855567932e-06, -2.0349398255348206e-06, -1.691281795501709e-06, -1.3476237654685974e-06, -1.0039657354354858e-06, -6.603077054023743e-07, -3.166496753692627e-07, 2.7008354663848877e-08, 3.7066638469696045e-07, 7.14324414730072e-07, 1.0579824447631836e-06, 1.4016404747962952e-06, 1.7452985048294067e-06, 2.0889565348625183e-06, 2.43261456489563e-06, 2.7762725949287415e-06, 3.119930624961853e-06, 3.4635886549949646e-06, 3.807246685028076e-06, 4.150904715061188e-06, 4.494562745094299e-06, 4.838220775127411e-06, 5.1818788051605225e-06, 5.525536835193634e-06, 5.869194865226746e-06, 6.212852895259857e-06, 6.556510925292969e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 8.0, 7.0, 15.0, 11.0, 40.0, 46.0, 92.0, 289.0, 934.0, 5874.0, 324370.0, 705858.0, 9212.0, 1219.0, 337.0, 104.0, 50.0, 33.0, 22.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1258544921875, -0.12137413024902344, -0.11689376831054688, -0.11241340637207031, -0.10793304443359375, -0.10345268249511719, -0.09897232055664062, -0.09449195861816406, -0.0900115966796875, -0.08553123474121094, -0.08105087280273438, -0.07657051086425781, -0.07209014892578125, -0.06760978698730469, -0.06312942504882812, -0.05864906311035156, -0.054168701171875, -0.04968833923339844, -0.045207977294921875, -0.04072761535644531, -0.03624725341796875, -0.03176689147949219, -0.027286529541015625, -0.022806167602539062, -0.0183258056640625, -0.013845443725585938, -0.009365081787109375, -0.0048847198486328125, -0.00040435791015625, 0.0040760040283203125, 0.008556365966796875, 0.013036727905273438, 0.01751708984375, 0.021997451782226562, 0.026477813720703125, 0.030958175659179688, 0.03543853759765625, 0.03991889953613281, 0.044399261474609375, 0.04887962341308594, 0.0533599853515625, 0.05784034729003906, 0.062320709228515625, 0.06680107116699219, 0.07128143310546875, 0.07576179504394531, 0.08024215698242188, 0.08472251892089844, 0.089202880859375, 0.09368324279785156, 0.09816360473632812, 0.10264396667480469, 0.10712432861328125, 0.11160469055175781, 0.11608505249023438, 0.12056541442871094, 0.1250457763671875, 0.12952613830566406, 0.13400650024414062, 0.1384868621826172, 0.14296722412109375, 0.1474475860595703, 0.15192794799804688, 0.15640830993652344, 0.160888671875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 7.0, 7.0, 9.0, 11.0, 15.0, 29.0, 37.0, 55.0, 70.0, 83.0, 121.0, 132.0, 102.0, 88.0, 76.0, 39.0, 25.0, 18.0, 18.0, 17.0, 10.0, 2.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04547119140625, -0.044148921966552734, -0.04282665252685547, -0.0415043830871582, -0.04018211364746094, -0.03885984420776367, -0.037537574768066406, -0.03621530532836914, -0.034893035888671875, -0.03357076644897461, -0.032248497009277344, -0.030926227569580078, -0.029603958129882812, -0.028281688690185547, -0.02695941925048828, -0.025637149810791016, -0.02431488037109375, -0.022992610931396484, -0.02167034149169922, -0.020348072052001953, -0.019025802612304688, -0.017703533172607422, -0.016381263732910156, -0.01505899429321289, -0.013736724853515625, -0.01241445541381836, -0.011092185974121094, -0.009769916534423828, -0.008447647094726562, -0.007125377655029297, -0.005803108215332031, -0.004480838775634766, -0.0031585693359375, -0.0018362998962402344, -0.0005140304565429688, 0.0008082389831542969, 0.0021305084228515625, 0.003452777862548828, 0.004775047302246094, 0.006097316741943359, 0.007419586181640625, 0.00874185562133789, 0.010064125061035156, 0.011386394500732422, 0.012708663940429688, 0.014030933380126953, 0.015353202819824219, 0.016675472259521484, 0.01799774169921875, 0.019320011138916016, 0.02064228057861328, 0.021964550018310547, 0.023286819458007812, 0.024609088897705078, 0.025931358337402344, 0.02725362777709961, 0.028575897216796875, 0.02989816665649414, 0.031220436096191406, 0.03254270553588867, 0.03386497497558594, 0.0351872444152832, 0.03650951385498047, 0.037831783294677734, 0.039154052734375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 5.0, 23.0, 80.0, 386.0, 436.0, 58.0, 10.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91969895362854, -1.8652253150939941, -1.8107515573501587, -1.7562779188156128, -1.701804280281067, -1.6473305225372314, -1.5928568840026855, -1.5383832454681396, -1.4839094877243042, -1.4294358491897583, -1.3749620914459229, -1.320488452911377, -1.266014814376831, -1.2115410566329956, -1.1570674180984497, -1.1025936603546143, -1.0481200218200684, -0.9936463236808777, -0.9391726851463318, -0.8846989870071411, -0.8302252888679504, -0.7757515907287598, -0.7212779521942139, -0.6668042540550232, -0.6123306751251221, -0.5578569769859314, -0.5033833384513855, -0.4489096403121948, -0.39443594217300415, -0.33996227383613586, -0.2854886054992676, -0.2310149073600769, -0.17654120922088623, -0.12206752598285675, -0.06759385019540787, -0.013120174407958984, 0.041353508830070496, 0.09582719206809998, 0.15030086040496826, 0.20477455854415894, 0.2592482268810272, 0.3137218952178955, 0.3681955933570862, 0.42266926169395447, 0.47714293003082275, 0.5316166281700134, 0.5860903263092041, 0.64056396484375, 0.6950376629829407, 0.7495113611221313, 0.8039849996566772, 0.8584586977958679, 0.9129323959350586, 0.9674060344696045, 1.0218796730041504, 1.0763534307479858, 1.1308270692825317, 1.1853007078170776, 1.239774465560913, 1.294248104095459, 1.3487217426300049, 1.4031955003738403, 1.4576691389083862, 1.5121428966522217, 1.5666165351867676]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 2.0, 2.0, 5.0, 5.0, 8.0, 8.0, 9.0, 19.0, 19.0, 26.0, 26.0, 34.0, 41.0, 60.0, 43.0, 68.0, 64.0, 65.0, 56.0, 68.0, 68.0, 49.0, 51.0, 33.0, 38.0, 34.0, 22.0, 24.0, 19.0, 9.0, 8.0, 10.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.699747622013092, -0.6778216361999512, -0.6558957099914551, -0.6339697241783142, -0.6120437383651733, -0.5901177525520325, -0.5681917667388916, -0.5462658405303955, -0.5243398547172546, -0.5024138689041138, -0.4804879128932953, -0.4585619568824768, -0.43663597106933594, -0.41470998525619507, -0.3927840292453766, -0.3708580732345581, -0.34893208742141724, -0.32700610160827637, -0.3050801455974579, -0.2831541895866394, -0.26122820377349854, -0.23930223286151886, -0.21737626194953918, -0.1954502910375595, -0.17352432012557983, -0.15159834921360016, -0.12967237830162048, -0.10774640738964081, -0.08582043647766113, -0.06389446556568146, -0.04196849465370178, -0.020042523741722107, 0.0018834471702575684, 0.023809418082237244, 0.04573538899421692, 0.0676613599061966, 0.08958733081817627, 0.11151330173015594, 0.13343927264213562, 0.1553652435541153, 0.17729121446609497, 0.19921718537807465, 0.22114315629005432, 0.243069127202034, 0.26499509811401367, 0.28692108392715454, 0.308847039937973, 0.3307729959487915, 0.3526989817619324, 0.37462496757507324, 0.3965509235858917, 0.4184768795967102, 0.4404028654098511, 0.46232885122299194, 0.4842548072338104, 0.5061807632446289, 0.5281067490577698, 0.5500327348709106, 0.5719586610794067, 0.5938846468925476, 0.6158106327056885, 0.6377366185188293, 0.6596626043319702, 0.6815885305404663, 0.7035145163536072]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 8.0, 12.0, 20.0, 31.0, 123.0, 385.0, 1395.0, 8794.0, 269802.0, 3887548.0, 21000.0, 3122.0, 994.0, 425.0, 204.0, 121.0, 86.0, 54.0, 46.0, 24.0, 28.0, 17.0, 12.0, 9.0, 6.0, 3.0, 8.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1927490234375, -0.1781177520751953, -0.16348648071289062, -0.14885520935058594, -0.13422393798828125, -0.11959266662597656, -0.10496139526367188, -0.09033012390136719, -0.0756988525390625, -0.06106758117675781, -0.046436309814453125, -0.03180503845214844, -0.01717376708984375, -0.0025424957275390625, 0.012088775634765625, 0.026720046997070312, 0.041351318359375, 0.05598258972167969, 0.07061386108398438, 0.08524513244628906, 0.09987640380859375, 0.11450767517089844, 0.12913894653320312, 0.1437702178955078, 0.1584014892578125, 0.1730327606201172, 0.18766403198242188, 0.20229530334472656, 0.21692657470703125, 0.23155784606933594, 0.24618911743164062, 0.2608203887939453, 0.27545166015625, 0.2900829315185547, 0.3047142028808594, 0.31934547424316406, 0.33397674560546875, 0.34860801696777344, 0.3632392883300781, 0.3778705596923828, 0.3925018310546875, 0.4071331024169922, 0.4217643737792969, 0.43639564514160156, 0.45102691650390625, 0.46565818786621094, 0.4802894592285156, 0.4949207305908203, 0.509552001953125, 0.5241832733154297, 0.5388145446777344, 0.5534458160400391, 0.5680770874023438, 0.5827083587646484, 0.5973396301269531, 0.6119709014892578, 0.6266021728515625, 0.6412334442138672, 0.6558647155761719, 0.6704959869384766, 0.6851272583007812, 0.6997585296630859, 0.7143898010253906, 0.7290210723876953, 0.74365234375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 4.0, 6.0, 9.0, 24.0, 44.0, 61.0, 81.0, 124.0, 163.0, 141.0, 122.0, 91.0, 64.0, 34.0, 16.0, 13.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020111083984375, -0.018572330474853516, -0.01703357696533203, -0.015494823455810547, -0.013956069946289062, -0.012417316436767578, -0.010878562927246094, -0.00933980941772461, -0.007801055908203125, -0.006262302398681641, -0.004723548889160156, -0.003184795379638672, -0.0016460418701171875, -0.00010728836059570312, 0.0014314651489257812, 0.0029702186584472656, 0.00450897216796875, 0.006047725677490234, 0.007586479187011719, 0.009125232696533203, 0.010663986206054688, 0.012202739715576172, 0.013741493225097656, 0.01528024673461914, 0.016819000244140625, 0.01835775375366211, 0.019896507263183594, 0.021435260772705078, 0.022974014282226562, 0.024512767791748047, 0.02605152130126953, 0.027590274810791016, 0.0291290283203125, 0.030667781829833984, 0.03220653533935547, 0.03374528884887695, 0.03528404235839844, 0.03682279586791992, 0.038361549377441406, 0.03990030288696289, 0.041439056396484375, 0.04297780990600586, 0.044516563415527344, 0.04605531692504883, 0.04759407043457031, 0.0491328239440918, 0.05067157745361328, 0.052210330963134766, 0.05374908447265625, 0.055287837982177734, 0.05682659149169922, 0.0583653450012207, 0.05990409851074219, 0.06144285202026367, 0.06298160552978516, 0.06452035903930664, 0.06605911254882812, 0.06759786605834961, 0.0691366195678711, 0.07067537307739258, 0.07221412658691406, 0.07375288009643555, 0.07529163360595703, 0.07683038711547852, 0.078369140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 8.0, 36.0, 85.0, 312.0, 86642.0, 4106266.0, 678.0, 164.0, 63.0, 20.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.194091796875, -1.11474609375, -1.035400390625, -0.9560546875, -0.876708984375, -0.79736328125, -0.718017578125, -0.638671875, -0.559326171875, -0.47998046875, -0.400634765625, -0.3212890625, -0.241943359375, -0.16259765625, -0.083251953125, -0.00390625, 0.075439453125, 0.15478515625, 0.234130859375, 0.3134765625, 0.392822265625, 0.47216796875, 0.551513671875, 0.630859375, 0.710205078125, 0.78955078125, 0.868896484375, 0.9482421875, 1.027587890625, 1.10693359375, 1.186279296875, 1.265625, 1.344970703125, 1.42431640625, 1.503662109375, 1.5830078125, 1.662353515625, 1.74169921875, 1.821044921875, 1.900390625, 1.979736328125, 2.05908203125, 2.138427734375, 2.2177734375, 2.297119140625, 2.37646484375, 2.455810546875, 2.53515625, 2.614501953125, 2.69384765625, 2.773193359375, 2.8525390625, 2.931884765625, 3.01123046875, 3.090576171875, 3.169921875, 3.249267578125, 3.32861328125, 3.407958984375, 3.4873046875, 3.566650390625, 3.64599609375, 3.725341796875, 3.8046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 8.0, 20.0, 61.0, 508.0, 3299.0, 141.0, 31.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050628662109375, -0.04443979263305664, -0.03825092315673828, -0.03206205368041992, -0.025873184204101562, -0.019684314727783203, -0.013495445251464844, -0.007306575775146484, -0.001117706298828125, 0.005071163177490234, 0.011260032653808594, 0.017448902130126953, 0.023637771606445312, 0.029826641082763672, 0.03601551055908203, 0.04220438003540039, 0.04839324951171875, 0.05458211898803711, 0.06077098846435547, 0.06695985794067383, 0.07314872741699219, 0.07933759689331055, 0.0855264663696289, 0.09171533584594727, 0.09790420532226562, 0.10409307479858398, 0.11028194427490234, 0.1164708137512207, 0.12265968322753906, 0.12884855270385742, 0.13503742218017578, 0.14122629165649414, 0.1474151611328125, 0.15360403060913086, 0.15979290008544922, 0.16598176956176758, 0.17217063903808594, 0.1783595085144043, 0.18454837799072266, 0.19073724746704102, 0.19692611694335938, 0.20311498641967773, 0.2093038558959961, 0.21549272537231445, 0.2216815948486328, 0.22787046432495117, 0.23405933380126953, 0.2402482032775879, 0.24643707275390625, 0.2526259422302246, 0.25881481170654297, 0.26500368118286133, 0.2711925506591797, 0.27738142013549805, 0.2835702896118164, 0.28975915908813477, 0.2959480285644531, 0.3021368980407715, 0.30832576751708984, 0.3145146369934082, 0.32070350646972656, 0.3268923759460449, 0.3330812454223633, 0.33927011489868164, 0.345458984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 43.0, 727.0, 204.0, 22.0, 10.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4796266555786133, -2.4119467735290527, -2.344266891479492, -2.2765870094299316, -2.208907127380371, -2.1412272453308105, -2.07354736328125, -2.0058674812316895, -1.9381877183914185, -1.870507836341858, -1.8028279542922974, -1.7351480722427368, -1.6674683094024658, -1.5997884273529053, -1.5321085453033447, -1.4644286632537842, -1.3967487812042236, -1.329068899154663, -1.2613890171051025, -1.193709135055542, -1.1260292530059814, -1.058349370956421, -0.9906696081161499, -0.9229897260665894, -0.8553098440170288, -0.7876299619674683, -0.7199500799179077, -0.6522702574729919, -0.5845903754234314, -0.5169104933738708, -0.4492306411266327, -0.38155078887939453, -0.31387102603912354, -0.24619115889072418, -0.17851129174232483, -0.11083142459392548, -0.04315155744552612, 0.024528324604034424, 0.09220817685127258, 0.15988802909851074, 0.2275679111480713, 0.29524779319763184, 0.36292764544487, 0.43060749769210815, 0.4982873797416687, 0.5659672617912292, 0.633647084236145, 0.7013269662857056, 0.7690068483352661, 0.8366867303848267, 0.9043666124343872, 0.972046434879303, 1.0397262573242188, 1.1074061393737793, 1.1750860214233398, 1.2427659034729004, 1.310445785522461, 1.3781256675720215, 1.445805549621582, 1.5134854316711426, 1.5811653137207031, 1.6488451957702637, 1.7165249586105347, 1.7842048406600952, 1.8518847227096558]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 18.0, 19.0, 35.0, 51.0, 77.0, 83.0, 101.0, 133.0, 117.0, 88.0, 77.0, 80.0, 47.0, 26.0, 18.0, 10.0, 11.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6839224696159363, -0.6592913269996643, -0.6346602439880371, -0.6100291013717651, -0.5853979587554932, -0.5607668161392212, -0.5361356735229492, -0.511504590511322, -0.48687344789505005, -0.4622423052787781, -0.4376111924648285, -0.4129800796508789, -0.38834893703460693, -0.36371779441833496, -0.3390866816043854, -0.3144555687904358, -0.2898244261741638, -0.26519328355789185, -0.24056217074394226, -0.21593104302883148, -0.1912999153137207, -0.16666878759860992, -0.14203765988349915, -0.11740653216838837, -0.09277540445327759, -0.06814427673816681, -0.04351314902305603, -0.01888202130794525, 0.005749106407165527, 0.030380234122276306, 0.055011361837387085, 0.07964248955249786, 0.10427355766296387, 0.12890468537807465, 0.15353581309318542, 0.1781669408082962, 0.20279806852340698, 0.22742919623851776, 0.25206032395362854, 0.2766914367675781, 0.3013225793838501, 0.32595372200012207, 0.35058483481407166, 0.37521594762802124, 0.3998470902442932, 0.4244782328605652, 0.44910934567451477, 0.47374045848846436, 0.49837160110473633, 0.5230027437210083, 0.5476338863372803, 0.5722649693489075, 0.5968961119651794, 0.6215272545814514, 0.6461583375930786, 0.6707894802093506, 0.6954206228256226, 0.7200517654418945, 0.7446829080581665, 0.7693139910697937, 0.7939451336860657, 0.8185762763023376, 0.8432073593139648, 0.8678385019302368, 0.8924696445465088]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 5.0, 12.0, 12.0, 14.0, 17.0, 21.0, 24.0, 33.0, 35.0, 62.0, 75.0, 82.0, 129.0, 170.0, 243.0, 363.0, 599.0, 1193.0, 2539.0, 7032.0, 23074.0, 97187.0, 587006.0, 259177.0, 47967.0, 13022.0, 4314.0, 1749.0, 812.0, 458.0, 308.0, 208.0, 146.0, 105.0, 84.0, 67.0, 44.0, 34.0, 30.0, 28.0, 22.0, 13.0, 12.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1522216796875, -0.1471080780029297, -0.14199447631835938, -0.13688087463378906, -0.13176727294921875, -0.12665367126464844, -0.12154006958007812, -0.11642646789550781, -0.1113128662109375, -0.10619926452636719, -0.10108566284179688, -0.09597206115722656, -0.09085845947265625, -0.08574485778808594, -0.08063125610351562, -0.07551765441894531, -0.070404052734375, -0.06529045104980469, -0.060176849365234375, -0.05506324768066406, -0.04994964599609375, -0.04483604431152344, -0.039722442626953125, -0.03460884094238281, -0.0294952392578125, -0.024381637573242188, -0.019268035888671875, -0.014154434204101562, -0.00904083251953125, -0.0039272308349609375, 0.001186370849609375, 0.0062999725341796875, 0.01141357421875, 0.016527175903320312, 0.021640777587890625, 0.026754379272460938, 0.03186798095703125, 0.03698158264160156, 0.042095184326171875, 0.04720878601074219, 0.0523223876953125, 0.05743598937988281, 0.06254959106445312, 0.06766319274902344, 0.07277679443359375, 0.07789039611816406, 0.08300399780273438, 0.08811759948730469, 0.093231201171875, 0.09834480285644531, 0.10345840454101562, 0.10857200622558594, 0.11368560791015625, 0.11879920959472656, 0.12391281127929688, 0.1290264129638672, 0.1341400146484375, 0.1392536163330078, 0.14436721801757812, 0.14948081970214844, 0.15459442138671875, 0.15970802307128906, 0.16482162475585938, 0.1699352264404297, 0.175048828125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 9.0, 17.0, 27.0, 36.0, 52.0, 70.0, 73.0, 95.0, 103.0, 116.0, 79.0, 81.0, 73.0, 59.0, 37.0, 27.0, 14.0, 7.0, 9.0, 10.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039703369140625, -0.03791189193725586, -0.03612041473388672, -0.03432893753051758, -0.03253746032714844, -0.030745983123779297, -0.028954505920410156, -0.027163028717041016, -0.025371551513671875, -0.023580074310302734, -0.021788597106933594, -0.019997119903564453, -0.018205642700195312, -0.016414165496826172, -0.014622688293457031, -0.01283121109008789, -0.01103973388671875, -0.00924825668334961, -0.007456779479980469, -0.005665302276611328, -0.0038738250732421875, -0.002082347869873047, -0.00029087066650390625, 0.0015006065368652344, 0.003292083740234375, 0.005083560943603516, 0.006875038146972656, 0.008666515350341797, 0.010457992553710938, 0.012249469757080078, 0.014040946960449219, 0.01583242416381836, 0.0176239013671875, 0.01941537857055664, 0.02120685577392578, 0.022998332977294922, 0.024789810180664062, 0.026581287384033203, 0.028372764587402344, 0.030164241790771484, 0.031955718994140625, 0.033747196197509766, 0.035538673400878906, 0.03733015060424805, 0.03912162780761719, 0.04091310501098633, 0.04270458221435547, 0.04449605941772461, 0.04628753662109375, 0.04807901382446289, 0.04987049102783203, 0.05166196823120117, 0.05345344543457031, 0.05524492263793945, 0.057036399841308594, 0.058827877044677734, 0.060619354248046875, 0.062410831451416016, 0.06420230865478516, 0.0659937858581543, 0.06778526306152344, 0.06957674026489258, 0.07136821746826172, 0.07315969467163086, 0.074951171875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 12.0, 7.0, 14.0, 22.0, 31.0, 45.0, 66.0, 99.0, 186.0, 489.0, 1665.0, 8648.0, 112215.0, 862262.0, 55109.0, 5588.0, 1241.0, 410.0, 167.0, 93.0, 49.0, 40.0, 23.0, 12.0, 12.0, 10.0, 11.0, 2.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.280517578125, -0.2730140686035156, -0.26551055908203125, -0.2580070495605469, -0.2505035400390625, -0.24300003051757812, -0.23549652099609375, -0.22799301147460938, -0.220489501953125, -0.21298599243164062, -0.20548248291015625, -0.19797897338867188, -0.1904754638671875, -0.18297195434570312, -0.17546844482421875, -0.16796493530273438, -0.16046142578125, -0.15295791625976562, -0.14545440673828125, -0.13795089721679688, -0.1304473876953125, -0.12294387817382812, -0.11544036865234375, -0.10793685913085938, -0.100433349609375, -0.09292984008789062, -0.08542633056640625, -0.07792282104492188, -0.0704193115234375, -0.06291580200195312, -0.05541229248046875, -0.047908782958984375, -0.0404052734375, -0.032901763916015625, -0.02539825439453125, -0.017894744873046875, -0.0103912353515625, -0.002887725830078125, 0.00461578369140625, 0.012119293212890625, 0.019622802734375, 0.027126312255859375, 0.03462982177734375, 0.042133331298828125, 0.0496368408203125, 0.057140350341796875, 0.06464385986328125, 0.07214736938476562, 0.07965087890625, 0.08715438842773438, 0.09465789794921875, 0.10216140747070312, 0.1096649169921875, 0.11716842651367188, 0.12467193603515625, 0.13217544555664062, 0.139678955078125, 0.14718246459960938, 0.15468597412109375, 0.16218948364257812, 0.1696929931640625, 0.17719650268554688, 0.18470001220703125, 0.19220352172851562, 0.19970703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 5.0, 12.0, 10.0, 21.0, 15.0, 27.0, 28.0, 35.0, 44.0, 31.0, 53.0, 68.0, 55.0, 69.0, 49.0, 69.0, 51.0, 55.0, 63.0, 51.0, 31.0, 34.0, 18.0, 27.0, 18.0, 14.0, 9.0, 4.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.174072265625, -0.16942787170410156, -0.16478347778320312, -0.1601390838623047, -0.15549468994140625, -0.1508502960205078, -0.14620590209960938, -0.14156150817871094, -0.1369171142578125, -0.13227272033691406, -0.12762832641601562, -0.12298393249511719, -0.11833953857421875, -0.11369514465332031, -0.10905075073242188, -0.10440635681152344, -0.099761962890625, -0.09511756896972656, -0.09047317504882812, -0.08582878112792969, -0.08118438720703125, -0.07653999328613281, -0.07189559936523438, -0.06725120544433594, -0.0626068115234375, -0.05796241760253906, -0.053318023681640625, -0.04867362976074219, -0.04402923583984375, -0.03938484191894531, -0.034740447998046875, -0.030096054077148438, -0.02545166015625, -0.020807266235351562, -0.016162872314453125, -0.011518478393554688, -0.00687408447265625, -0.0022296905517578125, 0.002414703369140625, 0.0070590972900390625, 0.0117034912109375, 0.016347885131835938, 0.020992279052734375, 0.025636672973632812, 0.03028106689453125, 0.03492546081542969, 0.039569854736328125, 0.04421424865722656, 0.048858642578125, 0.05350303649902344, 0.058147430419921875, 0.06279182434082031, 0.06743621826171875, 0.07208061218261719, 0.07672500610351562, 0.08136940002441406, 0.0860137939453125, 0.09065818786621094, 0.09530258178710938, 0.09994697570800781, 0.10459136962890625, 0.10923576354980469, 0.11388015747070312, 0.11852455139160156, 0.1231689453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 9.0, 1.0, 7.0, 5.0, 8.0, 6.0, 11.0, 29.0, 31.0, 50.0, 83.0, 124.0, 213.0, 415.0, 810.0, 1741.0, 4306.0, 14108.0, 96045.0, 766018.0, 138286.0, 17344.0, 4945.0, 1926.0, 923.0, 431.0, 262.0, 136.0, 99.0, 51.0, 41.0, 23.0, 15.0, 15.0, 9.0, 2.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06695556640625, -0.0648345947265625, -0.062713623046875, -0.0605926513671875, -0.0584716796875, -0.0563507080078125, -0.054229736328125, -0.0521087646484375, -0.04998779296875, -0.0478668212890625, -0.045745849609375, -0.0436248779296875, -0.04150390625, -0.0393829345703125, -0.037261962890625, -0.0351409912109375, -0.03302001953125, -0.0308990478515625, -0.028778076171875, -0.0266571044921875, -0.0245361328125, -0.0224151611328125, -0.020294189453125, -0.0181732177734375, -0.01605224609375, -0.0139312744140625, -0.011810302734375, -0.0096893310546875, -0.007568359375, -0.0054473876953125, -0.003326416015625, -0.0012054443359375, 0.00091552734375, 0.0030364990234375, 0.005157470703125, 0.0072784423828125, 0.0093994140625, 0.0115203857421875, 0.013641357421875, 0.0157623291015625, 0.01788330078125, 0.0200042724609375, 0.022125244140625, 0.0242462158203125, 0.0263671875, 0.0284881591796875, 0.030609130859375, 0.0327301025390625, 0.03485107421875, 0.0369720458984375, 0.039093017578125, 0.0412139892578125, 0.0433349609375, 0.0454559326171875, 0.047576904296875, 0.0496978759765625, 0.05181884765625, 0.0539398193359375, 0.056060791015625, 0.0581817626953125, 0.060302734375, 0.0624237060546875, 0.064544677734375, 0.0666656494140625, 0.06878662109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 5.0, 10.0, 11.0, 21.0, 29.0, 41.0, 58.0, 74.0, 82.0, 105.0, 103.0, 106.0, 94.0, 69.0, 57.0, 54.0, 27.0, 22.0, 12.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1086463928222656e-05, -1.0747462511062622e-05, -1.0408461093902588e-05, -1.0069459676742554e-05, -9.73045825958252e-06, -9.391456842422485e-06, -9.052455425262451e-06, -8.713454008102417e-06, -8.374452590942383e-06, -8.035451173782349e-06, -7.696449756622314e-06, -7.35744833946228e-06, -7.018446922302246e-06, -6.679445505142212e-06, -6.340444087982178e-06, -6.0014426708221436e-06, -5.662441253662109e-06, -5.323439836502075e-06, -4.984438419342041e-06, -4.645437002182007e-06, -4.306435585021973e-06, -3.9674341678619385e-06, -3.6284327507019043e-06, -3.28943133354187e-06, -2.950429916381836e-06, -2.6114284992218018e-06, -2.2724270820617676e-06, -1.9334256649017334e-06, -1.5944242477416992e-06, -1.255422830581665e-06, -9.164214134216309e-07, -5.774199962615967e-07, -2.384185791015625e-07, 1.0058283805847168e-07, 4.3958425521850586e-07, 7.7858567237854e-07, 1.1175870895385742e-06, 1.4565885066986084e-06, 1.7955899238586426e-06, 2.1345913410186768e-06, 2.473592758178711e-06, 2.812594175338745e-06, 3.1515955924987793e-06, 3.4905970096588135e-06, 3.829598426818848e-06, 4.168599843978882e-06, 4.507601261138916e-06, 4.84660267829895e-06, 5.185604095458984e-06, 5.5246055126190186e-06, 5.863606929779053e-06, 6.202608346939087e-06, 6.541609764099121e-06, 6.880611181259155e-06, 7.2196125984191895e-06, 7.558614015579224e-06, 7.897615432739258e-06, 8.236616849899292e-06, 8.575618267059326e-06, 8.91461968421936e-06, 9.253621101379395e-06, 9.592622518539429e-06, 9.931623935699463e-06, 1.0270625352859497e-05, 1.0609626770019531e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 7.0, 10.0, 12.0, 27.0, 31.0, 80.0, 123.0, 277.0, 599.0, 1814.0, 7148.0, 52646.0, 786949.0, 180246.0, 13877.0, 3008.0, 889.0, 376.0, 171.0, 100.0, 57.0, 36.0, 24.0, 13.0, 8.0, 5.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06585693359375, -0.0632944107055664, -0.06073188781738281, -0.05816936492919922, -0.055606842041015625, -0.05304431915283203, -0.05048179626464844, -0.047919273376464844, -0.04535675048828125, -0.042794227600097656, -0.04023170471191406, -0.03766918182373047, -0.035106658935546875, -0.03254413604736328, -0.029981613159179688, -0.027419090270996094, -0.0248565673828125, -0.022294044494628906, -0.019731521606445312, -0.01716899871826172, -0.014606475830078125, -0.012043952941894531, -0.009481430053710938, -0.006918907165527344, -0.00435638427734375, -0.0017938613891601562, 0.0007686614990234375, 0.0033311843872070312, 0.005893707275390625, 0.008456230163574219, 0.011018753051757812, 0.013581275939941406, 0.016143798828125, 0.018706321716308594, 0.021268844604492188, 0.02383136749267578, 0.026393890380859375, 0.02895641326904297, 0.03151893615722656, 0.034081459045410156, 0.03664398193359375, 0.039206504821777344, 0.04176902770996094, 0.04433155059814453, 0.046894073486328125, 0.04945659637451172, 0.05201911926269531, 0.054581642150878906, 0.0571441650390625, 0.059706687927246094, 0.06226921081542969, 0.06483173370361328, 0.06739425659179688, 0.06995677947998047, 0.07251930236816406, 0.07508182525634766, 0.07764434814453125, 0.08020687103271484, 0.08276939392089844, 0.08533191680908203, 0.08789443969726562, 0.09045696258544922, 0.09301948547363281, 0.0955820083618164, 0.09814453125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 19.0, 30.0, 59.0, 104.0, 130.0, 153.0, 154.0, 110.0, 59.0, 51.0, 32.0, 27.0, 12.0, 11.0, 4.0, 7.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054290771484375, -0.05232858657836914, -0.05036640167236328, -0.04840421676635742, -0.04644203186035156, -0.0444798469543457, -0.042517662048339844, -0.040555477142333984, -0.038593292236328125, -0.036631107330322266, -0.034668922424316406, -0.03270673751831055, -0.030744552612304688, -0.028782367706298828, -0.02682018280029297, -0.02485799789428711, -0.02289581298828125, -0.02093362808227539, -0.01897144317626953, -0.017009258270263672, -0.015047073364257812, -0.013084888458251953, -0.011122703552246094, -0.009160518646240234, -0.007198333740234375, -0.005236148834228516, -0.0032739639282226562, -0.0013117790222167969, 0.0006504058837890625, 0.002612590789794922, 0.004574775695800781, 0.006536960601806641, 0.0084991455078125, 0.01046133041381836, 0.012423515319824219, 0.014385700225830078, 0.016347885131835938, 0.018310070037841797, 0.020272254943847656, 0.022234439849853516, 0.024196624755859375, 0.026158809661865234, 0.028120994567871094, 0.030083179473876953, 0.03204536437988281, 0.03400754928588867, 0.03596973419189453, 0.03793191909790039, 0.03989410400390625, 0.04185628890991211, 0.04381847381591797, 0.04578065872192383, 0.04774284362792969, 0.04970502853393555, 0.051667213439941406, 0.053629398345947266, 0.055591583251953125, 0.057553768157958984, 0.059515953063964844, 0.0614781379699707, 0.06344032287597656, 0.06540250778198242, 0.06736469268798828, 0.06932687759399414, 0.0712890625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 10.0, 46.0, 250.0, 532.0, 136.0, 24.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2018861770629883, -2.1359713077545166, -2.070056200027466, -2.004141330718994, -1.9382262229919434, -1.8723113536834717, -1.8063963651657104, -1.7404813766479492, -1.674566388130188, -1.6086513996124268, -1.5427364110946655, -1.4768214225769043, -1.4109065532684326, -1.3449914455413818, -1.2790765762329102, -1.213161587715149, -1.1472465991973877, -1.0813316106796265, -1.0154166221618652, -0.9495016932487488, -0.8835867047309875, -0.8176717162132263, -0.7517567873001099, -0.6858417987823486, -0.6199268102645874, -0.5540118217468262, -0.48809686303138733, -0.4221819043159485, -0.35626691579818726, -0.290351927280426, -0.22443696856498718, -0.15852200984954834, -0.09260702133178711, -0.026692047715187073, 0.039222925901412964, 0.105137899518013, 0.17105287313461304, 0.23696786165237427, 0.3028828203678131, 0.36879777908325195, 0.4347127676010132, 0.5006277561187744, 0.5665427446365356, 0.6324576735496521, 0.6983726620674133, 0.7642876505851746, 0.830202579498291, 0.8961175680160522, 0.9620325565338135, 1.0279475450515747, 1.093862533569336, 1.1597775220870972, 1.2256925106048584, 1.29160737991333, 1.3575223684310913, 1.4234373569488525, 1.4893523454666138, 1.555267333984375, 1.6211823225021362, 1.6870973110198975, 1.7530121803283691, 1.81892728805542, 1.8848421573638916, 1.9507571458816528, 2.016672134399414]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 10.0, 10.0, 7.0, 14.0, 20.0, 26.0, 29.0, 31.0, 37.0, 38.0, 51.0, 50.0, 53.0, 62.0, 52.0, 60.0, 70.0, 38.0, 49.0, 44.0, 45.0, 37.0, 25.0, 30.0, 17.0, 18.0, 17.0, 15.0, 6.0, 5.0, 9.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6999630928039551, -0.6768515706062317, -0.6537399888038635, -0.6306284666061401, -0.607516884803772, -0.5844053626060486, -0.5612938404083252, -0.538182258605957, -0.5150706768035889, -0.4919591248035431, -0.4688475728034973, -0.4457360506057739, -0.42262446880340576, -0.3995129466056824, -0.3764013946056366, -0.3532898426055908, -0.33017832040786743, -0.30706676840782166, -0.2839552164077759, -0.2608436942100525, -0.23773212730884552, -0.21462057530879974, -0.19150903820991516, -0.16839748620986938, -0.1452859342098236, -0.12217438220977783, -0.09906283766031265, -0.07595129311084747, -0.0528397411108017, -0.02972818911075592, -0.006616652011871338, 0.01649489998817444, 0.03960639238357544, 0.06271794438362122, 0.0858294889330864, 0.10894103348255157, 0.13205258548259735, 0.15516413748264313, 0.1782756745815277, 0.2013872265815735, 0.22449877858161926, 0.24761033058166504, 0.2707218825817108, 0.2938334345817566, 0.31694495677948, 0.34005653858184814, 0.36316806077957153, 0.3862796127796173, 0.4093911647796631, 0.43250271677970886, 0.45561426877975464, 0.478725790977478, 0.5018373727798462, 0.5249488949775696, 0.548060417175293, 0.5711719989776611, 0.5942835807800293, 0.6173951029777527, 0.6405066847801208, 0.6636182069778442, 0.6867297887802124, 0.7098413109779358, 0.7329528331756592, 0.7560644149780273, 0.7791759371757507]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 8.0, 2.0, 9.0, 11.0, 17.0, 28.0, 41.0, 82.0, 177.0, 331.0, 760.0, 1923.0, 6832.0, 37432.0, 2419214.0, 1680965.0, 34500.0, 6855.0, 2421.0, 1089.0, 564.0, 346.0, 180.0, 148.0, 94.0, 64.0, 46.0, 43.0, 26.0, 22.0, 8.0, 10.0, 8.0, 10.0, 4.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1590576171875, -0.15110206604003906, -0.14314651489257812, -0.1351909637451172, -0.12723541259765625, -0.11927986145019531, -0.11132431030273438, -0.10336875915527344, -0.0954132080078125, -0.08745765686035156, -0.07950210571289062, -0.07154655456542969, -0.06359100341796875, -0.05563545227050781, -0.047679901123046875, -0.03972434997558594, -0.031768798828125, -0.023813247680664062, -0.015857696533203125, -0.007902145385742188, 5.340576171875e-05, 0.008008956909179688, 0.015964508056640625, 0.023920059204101562, 0.0318756103515625, 0.03983116149902344, 0.047786712646484375, 0.05574226379394531, 0.06369781494140625, 0.07165336608886719, 0.07960891723632812, 0.08756446838378906, 0.09552001953125, 0.10347557067871094, 0.11143112182617188, 0.11938667297363281, 0.12734222412109375, 0.1352977752685547, 0.14325332641601562, 0.15120887756347656, 0.1591644287109375, 0.16711997985839844, 0.17507553100585938, 0.1830310821533203, 0.19098663330078125, 0.1989421844482422, 0.20689773559570312, 0.21485328674316406, 0.222808837890625, 0.23076438903808594, 0.23871994018554688, 0.2466754913330078, 0.25463104248046875, 0.2625865936279297, 0.2705421447753906, 0.27849769592285156, 0.2864532470703125, 0.29440879821777344, 0.3023643493652344, 0.3103199005126953, 0.31827545166015625, 0.3262310028076172, 0.3341865539550781, 0.34214210510253906, 0.35009765625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 10.0, 16.0, 33.0, 41.0, 59.0, 80.0, 80.0, 87.0, 107.0, 102.0, 93.0, 80.0, 64.0, 45.0, 33.0, 27.0, 13.0, 5.0, 7.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0394287109375, -0.037619590759277344, -0.03581047058105469, -0.03400135040283203, -0.032192230224609375, -0.03038311004638672, -0.028573989868164062, -0.026764869689941406, -0.02495574951171875, -0.023146629333496094, -0.021337509155273438, -0.01952838897705078, -0.017719268798828125, -0.01591014862060547, -0.014101028442382812, -0.012291908264160156, -0.0104827880859375, -0.008673667907714844, -0.0068645477294921875, -0.005055427551269531, -0.003246307373046875, -0.0014371871948242188, 0.0003719329833984375, 0.0021810531616210938, 0.00399017333984375, 0.005799293518066406, 0.0076084136962890625, 0.009417533874511719, 0.011226654052734375, 0.013035774230957031, 0.014844894409179688, 0.016654014587402344, 0.018463134765625, 0.020272254943847656, 0.022081375122070312, 0.02389049530029297, 0.025699615478515625, 0.02750873565673828, 0.029317855834960938, 0.031126976013183594, 0.03293609619140625, 0.034745216369628906, 0.03655433654785156, 0.03836345672607422, 0.040172576904296875, 0.04198169708251953, 0.04379081726074219, 0.045599937438964844, 0.0474090576171875, 0.049218177795410156, 0.05102729797363281, 0.05283641815185547, 0.054645538330078125, 0.05645465850830078, 0.05826377868652344, 0.060072898864746094, 0.06188201904296875, 0.0636911392211914, 0.06550025939941406, 0.06730937957763672, 0.06911849975585938, 0.07092761993408203, 0.07273674011230469, 0.07454586029052734, 0.07635498046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 15.0, 18.0, 30.0, 54.0, 71.0, 145.0, 255.0, 1401.0, 4190729.0, 1110.0, 254.0, 94.0, 44.0, 31.0, 23.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.5819015502929688, -2.5251312255859375, -2.4683609008789062, -2.411590576171875, -2.3548202514648438, -2.2980499267578125, -2.2412796020507812, -2.18450927734375, -2.1277389526367188, -2.0709686279296875, -2.0141983032226562, -1.957427978515625, -1.9006576538085938, -1.8438873291015625, -1.7871170043945312, -1.7303466796875, -1.6735763549804688, -1.6168060302734375, -1.5600357055664062, -1.503265380859375, -1.4464950561523438, -1.3897247314453125, -1.3329544067382812, -1.27618408203125, -1.2194137573242188, -1.1626434326171875, -1.1058731079101562, -1.049102783203125, -0.9923324584960938, -0.9355621337890625, -0.8787918090820312, -0.822021484375, -0.7652511596679688, -0.7084808349609375, -0.6517105102539062, -0.594940185546875, -0.5381698608398438, -0.4813995361328125, -0.42462921142578125, -0.36785888671875, -0.31108856201171875, -0.2543182373046875, -0.19754791259765625, -0.140777587890625, -0.08400726318359375, -0.0272369384765625, 0.02953338623046875, 0.0863037109375, 0.14307403564453125, 0.1998443603515625, 0.25661468505859375, 0.313385009765625, 0.37015533447265625, 0.4269256591796875, 0.48369598388671875, 0.54046630859375, 0.5972366333007812, 0.6540069580078125, 0.7107772827148438, 0.767547607421875, 0.8243179321289062, 0.8810882568359375, 0.9378585815429688, 0.99462890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 11.0, 56.0, 3650.0, 352.0, 15.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.458984375, -0.4487285614013672, -0.4384727478027344, -0.42821693420410156, -0.41796112060546875, -0.40770530700683594, -0.3974494934082031, -0.3871936798095703, -0.3769378662109375, -0.3666820526123047, -0.3564262390136719, -0.34617042541503906, -0.33591461181640625, -0.32565879821777344, -0.3154029846191406, -0.3051471710205078, -0.294891357421875, -0.2846355438232422, -0.2743797302246094, -0.26412391662597656, -0.25386810302734375, -0.24361228942871094, -0.23335647583007812, -0.2231006622314453, -0.2128448486328125, -0.2025890350341797, -0.19233322143554688, -0.18207740783691406, -0.17182159423828125, -0.16156578063964844, -0.15130996704101562, -0.1410541534423828, -0.13079833984375, -0.12054252624511719, -0.11028671264648438, -0.10003089904785156, -0.08977508544921875, -0.07951927185058594, -0.06926345825195312, -0.05900764465332031, -0.0487518310546875, -0.03849601745605469, -0.028240203857421875, -0.017984390258789062, -0.00772857666015625, 0.0025272369384765625, 0.012783050537109375, 0.023038864135742188, 0.033294677734375, 0.04355049133300781, 0.053806304931640625, 0.06406211853027344, 0.07431793212890625, 0.08457374572753906, 0.09482955932617188, 0.10508537292480469, 0.1153411865234375, 0.1255970001220703, 0.13585281372070312, 0.14610862731933594, 0.15636444091796875, 0.16662025451660156, 0.17687606811523438, 0.1871318817138672, 0.1973876953125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 972.0, 42.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.570873975753784, -2.4171504974365234, -2.263427257537842, -2.10970401763916, -1.9559805393218994, -1.8022571802139282, -1.648533821105957, -1.4948104619979858, -1.3410871028900146, -1.1873637437820435, -1.0336403846740723, -0.8799170255661011, -0.7261936664581299, -0.5724703073501587, -0.4187469482421875, -0.2650235891342163, -0.11130023002624512, 0.042423129081726074, 0.19614648818969727, 0.34986984729766846, 0.5035932064056396, 0.6573165655136108, 0.811039924621582, 0.9647632837295532, 1.1184866428375244, 1.2722100019454956, 1.4259333610534668, 1.579656720161438, 1.7333800792694092, 1.8871034383773804, 2.0408267974853516, 2.194550037384033, 2.348273754119873, 2.5019969940185547, 2.6557204723358154, 2.809443950653076, 2.963167190551758, 3.1168904304504395, 3.2706139087677, 3.424337387084961, 3.5780606269836426, 3.731783866882324, 3.885507345199585, 4.039230823516846, 4.192954063415527, 4.346677303314209, 4.500400543212891, 4.6541242599487305, 4.807847499847412, 4.961570739746094, 5.115294456481934, 5.269017696380615, 5.422740936279297, 5.5764641761779785, 5.73018741607666, 5.8839111328125, 6.037634372711182, 6.191357612609863, 6.345081329345703, 6.498804569244385, 6.652527809143066, 6.806251049041748, 6.95997428894043, 7.1136980056762695, 7.267421245574951]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 10.0, 7.0, 18.0, 38.0, 68.0, 114.0, 131.0, 146.0, 145.0, 106.0, 117.0, 54.0, 29.0, 16.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.44772499799728394, -0.42949995398521423, -0.41127490997314453, -0.39304986596107483, -0.3748248219490051, -0.3565998077392578, -0.3383747637271881, -0.3201497197151184, -0.3019246757030487, -0.283699631690979, -0.2654745876789093, -0.2472495585680008, -0.2290245145559311, -0.2107994705438614, -0.19257444143295288, -0.17434939742088318, -0.15612435340881348, -0.13789930939674377, -0.11967427283525467, -0.10144923627376556, -0.08322419226169586, -0.06499914824962616, -0.046774111688137054, -0.02854907512664795, -0.010324031114578247, 0.007901009172201157, 0.02612604945898056, 0.044351089745759964, 0.06257613003253937, 0.08080117404460907, 0.09902621060609818, 0.11725124716758728, 0.13547635078430176, 0.15370139479637146, 0.17192643880844116, 0.19015146791934967, 0.20837651193141937, 0.22660155594348907, 0.24482658505439758, 0.2630516290664673, 0.281276673078537, 0.2995017170906067, 0.3177267611026764, 0.3359518051147461, 0.3541768193244934, 0.3724018931388855, 0.3906269073486328, 0.4088519513607025, 0.4270769953727722, 0.4453020393848419, 0.4635270833969116, 0.4817521274089813, 0.499977171421051, 0.5182021856307983, 0.5364272594451904, 0.5546522736549377, 0.5728772878646851, 0.5911023020744324, 0.6093273758888245, 0.6275523900985718, 0.6457774639129639, 0.6640024781227112, 0.6822275519371033, 0.7004525661468506, 0.7186776399612427]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 8.0, 21.0, 17.0, 13.0, 49.0, 62.0, 63.0, 139.0, 202.0, 330.0, 582.0, 1040.0, 2423.0, 6951.0, 24934.0, 130711.0, 638766.0, 194364.0, 33518.0, 8463.0, 2882.0, 1293.0, 617.0, 356.0, 240.0, 153.0, 106.0, 64.0, 45.0, 33.0, 34.0, 22.0, 9.0, 9.0, 8.0, 6.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.109130859375, -0.10486793518066406, -0.10060501098632812, -0.09634208679199219, -0.09207916259765625, -0.08781623840332031, -0.08355331420898438, -0.07929039001464844, -0.0750274658203125, -0.07076454162597656, -0.06650161743164062, -0.06223869323730469, -0.05797576904296875, -0.05371284484863281, -0.049449920654296875, -0.04518699645996094, -0.040924072265625, -0.03666114807128906, -0.032398223876953125, -0.028135299682617188, -0.02387237548828125, -0.019609451293945312, -0.015346527099609375, -0.011083602905273438, -0.0068206787109375, -0.0025577545166015625, 0.001705169677734375, 0.0059680938720703125, 0.01023101806640625, 0.014493942260742188, 0.018756866455078125, 0.023019790649414062, 0.02728271484375, 0.03154563903808594, 0.035808563232421875, 0.04007148742675781, 0.04433441162109375, 0.04859733581542969, 0.052860260009765625, 0.05712318420410156, 0.0613861083984375, 0.06564903259277344, 0.06991195678710938, 0.07417488098144531, 0.07843780517578125, 0.08270072937011719, 0.08696365356445312, 0.09122657775878906, 0.095489501953125, 0.09975242614746094, 0.10401535034179688, 0.10827827453613281, 0.11254119873046875, 0.11680412292480469, 0.12106704711914062, 0.12532997131347656, 0.1295928955078125, 0.13385581970214844, 0.13811874389648438, 0.1423816680908203, 0.14664459228515625, 0.1509075164794922, 0.15517044067382812, 0.15943336486816406, 0.1636962890625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 9.0, 19.0, 23.0, 27.0, 39.0, 62.0, 72.0, 79.0, 106.0, 98.0, 89.0, 91.0, 65.0, 43.0, 61.0, 41.0, 28.0, 12.0, 17.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035247802734375, -0.03370332717895508, -0.032158851623535156, -0.030614376068115234, -0.029069900512695312, -0.02752542495727539, -0.02598094940185547, -0.024436473846435547, -0.022891998291015625, -0.021347522735595703, -0.01980304718017578, -0.01825857162475586, -0.016714096069335938, -0.015169620513916016, -0.013625144958496094, -0.012080669403076172, -0.01053619384765625, -0.008991718292236328, -0.007447242736816406, -0.005902767181396484, -0.0043582916259765625, -0.0028138160705566406, -0.0012693405151367188, 0.0002751350402832031, 0.001819610595703125, 0.003364086151123047, 0.004908561706542969, 0.006453037261962891, 0.007997512817382812, 0.009541988372802734, 0.011086463928222656, 0.012630939483642578, 0.0141754150390625, 0.015719890594482422, 0.017264366149902344, 0.018808841705322266, 0.020353317260742188, 0.02189779281616211, 0.02344226837158203, 0.024986743927001953, 0.026531219482421875, 0.028075695037841797, 0.02962017059326172, 0.03116464614868164, 0.03270912170410156, 0.034253597259521484, 0.035798072814941406, 0.03734254837036133, 0.03888702392578125, 0.04043149948120117, 0.041975975036621094, 0.043520450592041016, 0.04506492614746094, 0.04660940170288086, 0.04815387725830078, 0.0496983528137207, 0.051242828369140625, 0.05278730392456055, 0.05433177947998047, 0.05587625503540039, 0.05742073059082031, 0.058965206146240234, 0.060509681701660156, 0.06205415725708008, 0.0635986328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 4.0, 4.0, 8.0, 12.0, 13.0, 25.0, 34.0, 67.0, 102.0, 199.0, 492.0, 1273.0, 4947.0, 37738.0, 781509.0, 205142.0, 12994.0, 2479.0, 798.0, 330.0, 157.0, 80.0, 47.0, 30.0, 25.0, 11.0, 14.0, 3.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1834716796875, -0.17635154724121094, -0.16923141479492188, -0.1621112823486328, -0.15499114990234375, -0.1478710174560547, -0.14075088500976562, -0.13363075256347656, -0.1265106201171875, -0.11939048767089844, -0.11227035522460938, -0.10515022277832031, -0.09803009033203125, -0.09090995788574219, -0.08378982543945312, -0.07666969299316406, -0.069549560546875, -0.06242942810058594, -0.055309295654296875, -0.04818916320800781, -0.04106903076171875, -0.03394889831542969, -0.026828765869140625, -0.019708633422851562, -0.0125885009765625, -0.0054683685302734375, 0.001651763916015625, 0.008771896362304688, 0.01589202880859375, 0.023012161254882812, 0.030132293701171875, 0.03725242614746094, 0.04437255859375, 0.05149269104003906, 0.058612823486328125, 0.06573295593261719, 0.07285308837890625, 0.07997322082519531, 0.08709335327148438, 0.09421348571777344, 0.1013336181640625, 0.10845375061035156, 0.11557388305664062, 0.12269401550292969, 0.12981414794921875, 0.1369342803955078, 0.14405441284179688, 0.15117454528808594, 0.158294677734375, 0.16541481018066406, 0.17253494262695312, 0.1796550750732422, 0.18677520751953125, 0.1938953399658203, 0.20101547241210938, 0.20813560485839844, 0.2152557373046875, 0.22237586975097656, 0.22949600219726562, 0.2366161346435547, 0.24373626708984375, 0.2508563995361328, 0.2579765319824219, 0.26509666442871094, 0.272216796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 8.0, 12.0, 13.0, 16.0, 25.0, 31.0, 47.0, 57.0, 73.0, 73.0, 93.0, 74.0, 82.0, 71.0, 74.0, 53.0, 50.0, 31.0, 24.0, 24.0, 17.0, 16.0, 5.0, 5.0, 2.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.150146484375, -0.1442432403564453, -0.13833999633789062, -0.13243675231933594, -0.12653350830078125, -0.12063026428222656, -0.11472702026367188, -0.10882377624511719, -0.1029205322265625, -0.09701728820800781, -0.09111404418945312, -0.08521080017089844, -0.07930755615234375, -0.07340431213378906, -0.06750106811523438, -0.06159782409667969, -0.055694580078125, -0.04979133605957031, -0.043888092041015625, -0.03798484802246094, -0.03208160400390625, -0.026178359985351562, -0.020275115966796875, -0.014371871948242188, -0.0084686279296875, -0.0025653839111328125, 0.003337860107421875, 0.009241104125976562, 0.01514434814453125, 0.021047592163085938, 0.026950836181640625, 0.03285408020019531, 0.03875732421875, 0.04466056823730469, 0.050563812255859375, 0.05646705627441406, 0.06237030029296875, 0.06827354431152344, 0.07417678833007812, 0.08008003234863281, 0.0859832763671875, 0.09188652038574219, 0.09778976440429688, 0.10369300842285156, 0.10959625244140625, 0.11549949645996094, 0.12140274047851562, 0.1273059844970703, 0.133209228515625, 0.1391124725341797, 0.14501571655273438, 0.15091896057128906, 0.15682220458984375, 0.16272544860839844, 0.16862869262695312, 0.1745319366455078, 0.1804351806640625, 0.1863384246826172, 0.19224166870117188, 0.19814491271972656, 0.20404815673828125, 0.20995140075683594, 0.21585464477539062, 0.2217578887939453, 0.2276611328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 7.0, 11.0, 23.0, 57.0, 121.0, 266.0, 670.0, 1809.0, 6133.0, 34138.0, 692993.0, 287686.0, 18365.0, 4021.0, 1346.0, 493.0, 209.0, 103.0, 43.0, 33.0, 14.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07879638671875, -0.0760650634765625, -0.073333740234375, -0.0706024169921875, -0.06787109375, -0.0651397705078125, -0.062408447265625, -0.0596771240234375, -0.05694580078125, -0.0542144775390625, -0.051483154296875, -0.0487518310546875, -0.0460205078125, -0.0432891845703125, -0.040557861328125, -0.0378265380859375, -0.03509521484375, -0.0323638916015625, -0.029632568359375, -0.0269012451171875, -0.024169921875, -0.0214385986328125, -0.018707275390625, -0.0159759521484375, -0.01324462890625, -0.0105133056640625, -0.007781982421875, -0.0050506591796875, -0.0023193359375, 0.0004119873046875, 0.003143310546875, 0.0058746337890625, 0.00860595703125, 0.0113372802734375, 0.014068603515625, 0.0167999267578125, 0.01953125, 0.0222625732421875, 0.024993896484375, 0.0277252197265625, 0.03045654296875, 0.0331878662109375, 0.035919189453125, 0.0386505126953125, 0.0413818359375, 0.0441131591796875, 0.046844482421875, 0.0495758056640625, 0.05230712890625, 0.0550384521484375, 0.057769775390625, 0.0605010986328125, 0.063232421875, 0.0659637451171875, 0.068695068359375, 0.0714263916015625, 0.07415771484375, 0.0768890380859375, 0.079620361328125, 0.0823516845703125, 0.0850830078125, 0.0878143310546875, 0.090545654296875, 0.0932769775390625, 0.09600830078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 4.0, 20.0, 17.0, 24.0, 39.0, 48.0, 55.0, 51.0, 81.0, 74.0, 76.0, 97.0, 78.0, 74.0, 69.0, 47.0, 40.0, 30.0, 16.0, 14.0, 8.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.715557098388672e-06, -9.4585120677948e-06, -9.201467037200928e-06, -8.944422006607056e-06, -8.687376976013184e-06, -8.430331945419312e-06, -8.17328691482544e-06, -7.916241884231567e-06, -7.659196853637695e-06, -7.402151823043823e-06, -7.145106792449951e-06, -6.888061761856079e-06, -6.631016731262207e-06, -6.373971700668335e-06, -6.116926670074463e-06, -5.859881639480591e-06, -5.602836608886719e-06, -5.345791578292847e-06, -5.088746547698975e-06, -4.8317015171051025e-06, -4.5746564865112305e-06, -4.317611455917358e-06, -4.060566425323486e-06, -3.8035213947296143e-06, -3.546476364135742e-06, -3.28943133354187e-06, -3.032386302947998e-06, -2.775341272354126e-06, -2.518296241760254e-06, -2.261251211166382e-06, -2.0042061805725098e-06, -1.7471611499786377e-06, -1.4901161193847656e-06, -1.2330710887908936e-06, -9.760260581970215e-07, -7.189810276031494e-07, -4.6193599700927734e-07, -2.0489096641540527e-07, 5.21540641784668e-08, 3.0919909477233887e-07, 5.662441253662109e-07, 8.23289155960083e-07, 1.080334186553955e-06, 1.3373792171478271e-06, 1.5944242477416992e-06, 1.8514692783355713e-06, 2.1085143089294434e-06, 2.3655593395233154e-06, 2.6226043701171875e-06, 2.8796494007110596e-06, 3.1366944313049316e-06, 3.3937394618988037e-06, 3.6507844924926758e-06, 3.907829523086548e-06, 4.16487455368042e-06, 4.421919584274292e-06, 4.678964614868164e-06, 4.936009645462036e-06, 5.193054676055908e-06, 5.45009970664978e-06, 5.707144737243652e-06, 5.964189767837524e-06, 6.2212347984313965e-06, 6.4782798290252686e-06, 6.735324859619141e-06]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 15.0, 24.0, 20.0, 29.0, 50.0, 73.0, 137.0, 220.0, 427.0, 932.0, 2108.0, 6048.0, 21204.0, 125869.0, 679774.0, 173913.0, 26029.0, 6992.0, 2538.0, 996.0, 494.0, 259.0, 132.0, 84.0, 44.0, 31.0, 30.0, 21.0, 14.0, 8.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.059295654296875, -0.057628631591796875, -0.05596160888671875, -0.054294586181640625, -0.0526275634765625, -0.050960540771484375, -0.04929351806640625, -0.047626495361328125, -0.04595947265625, -0.044292449951171875, -0.04262542724609375, -0.040958404541015625, -0.0392913818359375, -0.037624359130859375, -0.03595733642578125, -0.034290313720703125, -0.032623291015625, -0.030956268310546875, -0.02928924560546875, -0.027622222900390625, -0.0259552001953125, -0.024288177490234375, -0.02262115478515625, -0.020954132080078125, -0.019287109375, -0.017620086669921875, -0.01595306396484375, -0.014286041259765625, -0.0126190185546875, -0.010951995849609375, -0.00928497314453125, -0.007617950439453125, -0.005950927734375, -0.004283905029296875, -0.00261688232421875, -0.000949859619140625, 0.0007171630859375, 0.002384185791015625, 0.00405120849609375, 0.005718231201171875, 0.00738525390625, 0.009052276611328125, 0.01071929931640625, 0.012386322021484375, 0.0140533447265625, 0.015720367431640625, 0.01738739013671875, 0.019054412841796875, 0.020721435546875, 0.022388458251953125, 0.02405548095703125, 0.025722503662109375, 0.0273895263671875, 0.029056549072265625, 0.03072357177734375, 0.032390594482421875, 0.0340576171875, 0.035724639892578125, 0.03739166259765625, 0.039058685302734375, 0.0407257080078125, 0.042392730712890625, 0.04405975341796875, 0.045726776123046875, 0.047393798828125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 10.0, 6.0, 8.0, 8.0, 16.0, 14.0, 15.0, 25.0, 32.0, 48.0, 66.0, 92.0, 123.0, 119.0, 104.0, 76.0, 61.0, 52.0, 31.0, 19.0, 16.0, 19.0, 7.0, 8.0, 8.0, 4.0, 6.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0452880859375, -0.043890953063964844, -0.04249382019042969, -0.04109668731689453, -0.039699554443359375, -0.03830242156982422, -0.03690528869628906, -0.035508155822753906, -0.03411102294921875, -0.032713890075683594, -0.03131675720214844, -0.02991962432861328, -0.028522491455078125, -0.02712535858154297, -0.025728225708007812, -0.024331092834472656, -0.0229339599609375, -0.021536827087402344, -0.020139694213867188, -0.01874256134033203, -0.017345428466796875, -0.01594829559326172, -0.014551162719726562, -0.013154029846191406, -0.01175689697265625, -0.010359764099121094, -0.008962631225585938, -0.007565498352050781, -0.006168365478515625, -0.004771232604980469, -0.0033740997314453125, -0.0019769668579101562, -0.000579833984375, 0.0008172988891601562, 0.0022144317626953125, 0.0036115646362304688, 0.005008697509765625, 0.006405830383300781, 0.0078029632568359375, 0.009200096130371094, 0.01059722900390625, 0.011994361877441406, 0.013391494750976562, 0.014788627624511719, 0.016185760498046875, 0.01758289337158203, 0.018980026245117188, 0.020377159118652344, 0.0217742919921875, 0.023171424865722656, 0.024568557739257812, 0.02596569061279297, 0.027362823486328125, 0.02875995635986328, 0.030157089233398438, 0.031554222106933594, 0.03295135498046875, 0.034348487854003906, 0.03574562072753906, 0.03714275360107422, 0.038539886474609375, 0.03993701934814453, 0.04133415222167969, 0.042731285095214844, 0.04412841796875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 19.0, 40.0, 158.0, 439.0, 251.0, 67.0, 20.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7756141424179077, -0.718558669090271, -0.661503255367279, -0.6044478416442871, -0.5473923683166504, -0.49033692479133606, -0.43328148126602173, -0.3762260377407074, -0.31917059421539307, -0.26211515069007874, -0.2050597071647644, -0.14800426363945007, -0.09094882011413574, -0.03389337658882141, 0.02316206693649292, 0.08021751046180725, 0.13727295398712158, 0.1943283975124359, 0.25138384103775024, 0.3084392845630646, 0.3654947280883789, 0.42255017161369324, 0.47960561513900757, 0.5366610288619995, 0.5937165021896362, 0.650771975517273, 0.7078273892402649, 0.7648828029632568, 0.8219382762908936, 0.8789937496185303, 0.9360491633415222, 0.9931045770645142, 1.0501599311828613, 1.107215404510498, 1.1642708778381348, 1.221326231956482, 1.2783817052841187, 1.3354371786117554, 1.3924925327301025, 1.4495480060577393, 1.506603479385376, 1.5636589527130127, 1.6207144260406494, 1.6777697801589966, 1.7348252534866333, 1.79188072681427, 1.8489360809326172, 1.905991554260254, 1.9630470275878906, 2.0201025009155273, 2.077157974243164, 2.134213447570801, 2.1912689208984375, 2.248324155807495, 2.305379629135132, 2.3624351024627686, 2.4194905757904053, 2.476546049118042, 2.5336015224456787, 2.5906569957733154, 2.647712230682373, 2.7047677040100098, 2.7618231773376465, 2.818878650665283, 2.87593412399292]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 2.0, 2.0, 5.0, 2.0, 11.0, 15.0, 11.0, 17.0, 39.0, 29.0, 31.0, 31.0, 32.0, 33.0, 50.0, 43.0, 64.0, 68.0, 64.0, 54.0, 50.0, 49.0, 57.0, 43.0, 42.0, 24.0, 29.0, 22.0, 14.0, 21.0, 13.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6864655613899231, -0.6611626148223877, -0.6358596682548523, -0.6105567216873169, -0.5852538347244263, -0.5599508285522461, -0.5346479415893555, -0.5093449950218201, -0.48404204845428467, -0.45873910188674927, -0.43343615531921387, -0.40813323855400085, -0.38283029198646545, -0.35752734541893005, -0.33222442865371704, -0.30692148208618164, -0.28161853551864624, -0.25631558895111084, -0.23101265728473663, -0.20570972561836243, -0.18040677905082703, -0.15510383248329163, -0.12980090081691742, -0.10449796915054321, -0.07919502258300781, -0.05389208346605301, -0.028589144349098206, -0.003286205232143402, 0.0220167338848114, 0.0473196804523468, 0.07262261211872101, 0.09792554378509521, 0.12322854995727539, 0.1485314965248108, 0.173834428191185, 0.1991373598575592, 0.2244403064250946, 0.24974325299263, 0.275046169757843, 0.3003491163253784, 0.3256520628929138, 0.3509550094604492, 0.3762579560279846, 0.40156087279319763, 0.42686381936073303, 0.45216676592826843, 0.47746968269348145, 0.5027726292610168, 0.5280755758285522, 0.5533785223960876, 0.578681468963623, 0.6039844155311584, 0.6292873620986938, 0.6545902490615845, 0.6798931956291199, 0.7051961421966553, 0.7304990887641907, 0.7558020353317261, 0.7811049818992615, 0.8064079284667969, 0.8317108154296875, 0.8570138216018677, 0.8823167085647583, 0.9076196551322937, 0.9329226016998291]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 3.0, 6.0, 12.0, 23.0, 19.0, 34.0, 61.0, 114.0, 210.0, 317.0, 580.0, 1182.0, 2348.0, 5732.0, 18017.0, 92194.0, 3395255.0, 608657.0, 47498.0, 12013.0, 4671.0, 2251.0, 1174.0, 610.0, 397.0, 264.0, 167.0, 92.0, 109.0, 59.0, 31.0, 33.0, 28.0, 30.0, 14.0, 17.0, 10.0, 8.0, 3.0, 4.0, 3.0, 1.0, 5.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1373291015625, -0.13156509399414062, -0.12580108642578125, -0.12003707885742188, -0.1142730712890625, -0.10850906372070312, -0.10274505615234375, -0.09698104858398438, -0.091217041015625, -0.08545303344726562, -0.07968902587890625, -0.07392501831054688, -0.0681610107421875, -0.062397003173828125, -0.05663299560546875, -0.050868988037109375, -0.04510498046875, -0.039340972900390625, -0.03357696533203125, -0.027812957763671875, -0.0220489501953125, -0.016284942626953125, -0.01052093505859375, -0.004756927490234375, 0.001007080078125, 0.006771087646484375, 0.01253509521484375, 0.018299102783203125, 0.0240631103515625, 0.029827117919921875, 0.03559112548828125, 0.041355133056640625, 0.047119140625, 0.052883148193359375, 0.05864715576171875, 0.06441116333007812, 0.0701751708984375, 0.07593917846679688, 0.08170318603515625, 0.08746719360351562, 0.093231201171875, 0.09899520874023438, 0.10475921630859375, 0.11052322387695312, 0.1162872314453125, 0.12205123901367188, 0.12781524658203125, 0.13357925415039062, 0.13934326171875, 0.14510726928710938, 0.15087127685546875, 0.15663528442382812, 0.1623992919921875, 0.16816329956054688, 0.17392730712890625, 0.17969131469726562, 0.185455322265625, 0.19121932983398438, 0.19698333740234375, 0.20274734497070312, 0.2085113525390625, 0.21427536010742188, 0.22003936767578125, 0.22580337524414062, 0.2315673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 13.0, 21.0, 27.0, 36.0, 46.0, 59.0, 75.0, 86.0, 87.0, 111.0, 92.0, 75.0, 60.0, 42.0, 52.0, 34.0, 29.0, 17.0, 10.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03192138671875, -0.030437469482421875, -0.02895355224609375, -0.027469635009765625, -0.0259857177734375, -0.024501800537109375, -0.02301788330078125, -0.021533966064453125, -0.020050048828125, -0.018566131591796875, -0.01708221435546875, -0.015598297119140625, -0.0141143798828125, -0.012630462646484375, -0.01114654541015625, -0.009662628173828125, -0.0081787109375, -0.006694793701171875, -0.00521087646484375, -0.003726959228515625, -0.0022430419921875, -0.000759124755859375, 0.00072479248046875, 0.002208709716796875, 0.003692626953125, 0.005176544189453125, 0.00666046142578125, 0.008144378662109375, 0.0096282958984375, 0.011112213134765625, 0.01259613037109375, 0.014080047607421875, 0.01556396484375, 0.017047882080078125, 0.01853179931640625, 0.020015716552734375, 0.0214996337890625, 0.022983551025390625, 0.02446746826171875, 0.025951385498046875, 0.027435302734375, 0.028919219970703125, 0.03040313720703125, 0.031887054443359375, 0.0333709716796875, 0.034854888916015625, 0.03633880615234375, 0.037822723388671875, 0.039306640625, 0.040790557861328125, 0.04227447509765625, 0.043758392333984375, 0.0452423095703125, 0.046726226806640625, 0.04821014404296875, 0.049694061279296875, 0.051177978515625, 0.052661895751953125, 0.05414581298828125, 0.055629730224609375, 0.0571136474609375, 0.058597564697265625, 0.06008148193359375, 0.061565399169921875, 0.06304931640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 9.0, 15.0, 18.0, 35.0, 54.0, 114.0, 197.0, 501.0, 1969.0, 11390.0, 1159771.0, 3003429.0, 13437.0, 2238.0, 542.0, 236.0, 121.0, 83.0, 39.0, 30.0, 20.0, 14.0, 7.0, 11.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.43505859375, -0.4229850769042969, -0.41091156005859375, -0.3988380432128906, -0.3867645263671875, -0.3746910095214844, -0.36261749267578125, -0.3505439758300781, -0.338470458984375, -0.3263969421386719, -0.31432342529296875, -0.3022499084472656, -0.2901763916015625, -0.2781028747558594, -0.26602935791015625, -0.2539558410644531, -0.24188232421875, -0.22980880737304688, -0.21773529052734375, -0.20566177368164062, -0.1935882568359375, -0.18151473999023438, -0.16944122314453125, -0.15736770629882812, -0.145294189453125, -0.13322067260742188, -0.12114715576171875, -0.10907363891601562, -0.0970001220703125, -0.08492660522460938, -0.07285308837890625, -0.060779571533203125, -0.0487060546875, -0.036632537841796875, -0.02455902099609375, -0.012485504150390625, -0.0004119873046875, 0.011661529541015625, 0.02373504638671875, 0.035808563232421875, 0.047882080078125, 0.059955596923828125, 0.07202911376953125, 0.08410263061523438, 0.0961761474609375, 0.10824966430664062, 0.12032318115234375, 0.13239669799804688, 0.14447021484375, 0.15654373168945312, 0.16861724853515625, 0.18069076538085938, 0.1927642822265625, 0.20483779907226562, 0.21691131591796875, 0.22898483276367188, 0.241058349609375, 0.2531318664550781, 0.26520538330078125, 0.2772789001464844, 0.2893524169921875, 0.3014259338378906, 0.31349945068359375, 0.3255729675292969, 0.337646484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 10.0, 17.0, 34.0, 76.0, 222.0, 1650.0, 1671.0, 215.0, 78.0, 25.0, 28.0, 9.0, 5.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08203125, -0.07771492004394531, -0.07339859008789062, -0.06908226013183594, -0.06476593017578125, -0.06044960021972656, -0.056133270263671875, -0.05181694030761719, -0.0475006103515625, -0.04318428039550781, -0.038867950439453125, -0.03455162048339844, -0.03023529052734375, -0.025918960571289062, -0.021602630615234375, -0.017286300659179688, -0.012969970703125, -0.008653640747070312, -0.004337310791015625, -2.09808349609375e-05, 0.00429534912109375, 0.008611679077148438, 0.012928009033203125, 0.017244338989257812, 0.0215606689453125, 0.025876998901367188, 0.030193328857421875, 0.03450965881347656, 0.03882598876953125, 0.04314231872558594, 0.047458648681640625, 0.05177497863769531, 0.05609130859375, 0.06040763854980469, 0.06472396850585938, 0.06904029846191406, 0.07335662841796875, 0.07767295837402344, 0.08198928833007812, 0.08630561828613281, 0.0906219482421875, 0.09493827819824219, 0.09925460815429688, 0.10357093811035156, 0.10788726806640625, 0.11220359802246094, 0.11651992797851562, 0.12083625793457031, 0.125152587890625, 0.1294689178466797, 0.13378524780273438, 0.13810157775878906, 0.14241790771484375, 0.14673423767089844, 0.15105056762695312, 0.1553668975830078, 0.1596832275390625, 0.1639995574951172, 0.16831588745117188, 0.17263221740722656, 0.17694854736328125, 0.18126487731933594, 0.18558120727539062, 0.1898975372314453, 0.1942138671875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 11.0, 105.0, 590.0, 264.0, 25.0, 12.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7518150806427002, -1.7065293788909912, -1.6612435579299927, -1.6159578561782837, -1.5706720352172852, -1.5253863334655762, -1.4801006317138672, -1.4348148107528687, -1.3895289897918701, -1.3442432880401611, -1.2989574670791626, -1.2536717653274536, -1.208385944366455, -1.163100242614746, -1.117814540863037, -1.0725287199020386, -1.0272430181503296, -0.9819572567939758, -0.9366714954376221, -0.8913857936859131, -0.8460999727249146, -0.8008142709732056, -0.7555285096168518, -0.710242748260498, -0.6649569869041443, -0.6196712255477905, -0.5743854641914368, -0.529099702835083, -0.48381397128105164, -0.4385282099246979, -0.3932424783706665, -0.34795671701431274, -0.30267083644866943, -0.2573850750923157, -0.2120993286371231, -0.16681358218193054, -0.12152782082557678, -0.07624205946922302, -0.03095632791519165, 0.01432943344116211, 0.05961519479751587, 0.10490094870328903, 0.1501867026090622, 0.19547244906425476, 0.24075821042060852, 0.2860439717769623, 0.33132970333099365, 0.3766154646873474, 0.42190122604370117, 0.46718698740005493, 0.5124727487564087, 0.5577584505081177, 0.6030442714691162, 0.6483299732208252, 0.693615734577179, 0.7389014959335327, 0.7841872572898865, 0.8294730186462402, 0.874758780002594, 0.9200445413589478, 0.9653302431106567, 1.0106160640716553, 1.0559017658233643, 1.1011874675750732, 1.1464732885360718]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 10.0, 11.0, 12.0, 31.0, 26.0, 32.0, 43.0, 49.0, 76.0, 71.0, 68.0, 75.0, 67.0, 71.0, 86.0, 53.0, 49.0, 28.0, 41.0, 25.0, 17.0, 16.0, 9.0, 10.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43587785959243774, -0.4239506125450134, -0.4120233952999115, -0.4000961482524872, -0.38816893100738525, -0.37624168395996094, -0.364314466714859, -0.3523872196674347, -0.34046000242233276, -0.32853275537490845, -0.3166055381298065, -0.3046782910823822, -0.2927510738372803, -0.28082382678985596, -0.26889660954475403, -0.2569693624973297, -0.2450421303510666, -0.23311489820480347, -0.22118766605854034, -0.20926043391227722, -0.1973332017660141, -0.18540596961975098, -0.17347872257232666, -0.16155150532722473, -0.14962425827980042, -0.1376970261335373, -0.12576979398727417, -0.11384256184101105, -0.10191532969474792, -0.0899880975484848, -0.07806085795164108, -0.06613362580537796, -0.054206401109695435, -0.04227916896343231, -0.03035193495452404, -0.01842470094561577, -0.006497468799352646, 0.005429763346910477, 0.017356999218463898, 0.02928423136472702, 0.04121146351099014, 0.053138695657253265, 0.06506592780351639, 0.07699316740036011, 0.08892039954662323, 0.10084763169288635, 0.11277486383914948, 0.1247020959854126, 0.13662932813167572, 0.14855656027793884, 0.16048379242420197, 0.1724110245704651, 0.1843382567167282, 0.19626548886299133, 0.20819273591041565, 0.22011995315551758, 0.2320472002029419, 0.24397443234920502, 0.25590166449546814, 0.26782891154289246, 0.2797561287879944, 0.2916833758354187, 0.30361059308052063, 0.31553784012794495, 0.3274650573730469]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 11.0, 10.0, 9.0, 14.0, 19.0, 20.0, 30.0, 47.0, 47.0, 83.0, 140.0, 199.0, 360.0, 712.0, 1567.0, 4537.0, 17212.0, 96737.0, 578950.0, 291917.0, 41747.0, 9006.0, 2807.0, 1065.0, 488.0, 255.0, 164.0, 125.0, 93.0, 48.0, 29.0, 26.0, 11.0, 9.0, 6.0, 7.0, 6.0, 8.0, 4.0, 7.0, 6.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.14892578125, -0.1445159912109375, -0.140106201171875, -0.1356964111328125, -0.13128662109375, -0.1268768310546875, -0.122467041015625, -0.1180572509765625, -0.1136474609375, -0.1092376708984375, -0.104827880859375, -0.1004180908203125, -0.09600830078125, -0.0915985107421875, -0.087188720703125, -0.0827789306640625, -0.078369140625, -0.0739593505859375, -0.069549560546875, -0.0651397705078125, -0.06072998046875, -0.0563201904296875, -0.051910400390625, -0.0475006103515625, -0.0430908203125, -0.0386810302734375, -0.034271240234375, -0.0298614501953125, -0.02545166015625, -0.0210418701171875, -0.016632080078125, -0.0122222900390625, -0.0078125, -0.0034027099609375, 0.001007080078125, 0.0054168701171875, 0.00982666015625, 0.0142364501953125, 0.018646240234375, 0.0230560302734375, 0.0274658203125, 0.0318756103515625, 0.036285400390625, 0.0406951904296875, 0.04510498046875, 0.0495147705078125, 0.053924560546875, 0.0583343505859375, 0.062744140625, 0.0671539306640625, 0.071563720703125, 0.0759735107421875, 0.08038330078125, 0.0847930908203125, 0.089202880859375, 0.0936126708984375, 0.0980224609375, 0.1024322509765625, 0.106842041015625, 0.1112518310546875, 0.11566162109375, 0.1200714111328125, 0.124481201171875, 0.1288909912109375, 0.13330078125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 10.0, 19.0, 29.0, 39.0, 61.0, 98.0, 102.0, 116.0, 123.0, 113.0, 103.0, 65.0, 44.0, 39.0, 27.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03314208984375, -0.03133201599121094, -0.029521942138671875, -0.027711868286132812, -0.02590179443359375, -0.024091720581054688, -0.022281646728515625, -0.020471572875976562, -0.0186614990234375, -0.016851425170898438, -0.015041351318359375, -0.013231277465820312, -0.01142120361328125, -0.009611129760742188, -0.007801055908203125, -0.0059909820556640625, -0.004180908203125, -0.0023708343505859375, -0.000560760498046875, 0.0012493133544921875, 0.00305938720703125, 0.0048694610595703125, 0.006679534912109375, 0.008489608764648438, 0.0102996826171875, 0.012109756469726562, 0.013919830322265625, 0.015729904174804688, 0.01753997802734375, 0.019350051879882812, 0.021160125732421875, 0.022970199584960938, 0.0247802734375, 0.026590347290039062, 0.028400421142578125, 0.030210494995117188, 0.03202056884765625, 0.03383064270019531, 0.035640716552734375, 0.03745079040527344, 0.0392608642578125, 0.04107093811035156, 0.042881011962890625, 0.04469108581542969, 0.04650115966796875, 0.04831123352050781, 0.050121307373046875, 0.05193138122558594, 0.053741455078125, 0.05555152893066406, 0.057361602783203125, 0.05917167663574219, 0.06098175048828125, 0.06279182434082031, 0.06460189819335938, 0.06641197204589844, 0.0682220458984375, 0.07003211975097656, 0.07184219360351562, 0.07365226745605469, 0.07546234130859375, 0.07727241516113281, 0.07908248901367188, 0.08089256286621094, 0.08270263671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 15.0, 10.0, 10.0, 30.0, 26.0, 51.0, 52.0, 91.0, 152.0, 213.0, 450.0, 797.0, 1681.0, 3437.0, 8299.0, 21653.0, 61662.0, 192623.0, 398569.0, 236800.0, 77174.0, 26366.0, 10178.0, 4250.0, 1850.0, 876.0, 485.0, 248.0, 138.0, 100.0, 69.0, 49.0, 41.0, 24.0, 18.0, 16.0, 10.0, 4.0, 8.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.064697265625, -0.06282711029052734, -0.06095695495605469, -0.05908679962158203, -0.057216644287109375, -0.05534648895263672, -0.05347633361816406, -0.051606178283691406, -0.04973602294921875, -0.047865867614746094, -0.04599571228027344, -0.04412555694580078, -0.042255401611328125, -0.04038524627685547, -0.03851509094238281, -0.036644935607910156, -0.0347747802734375, -0.032904624938964844, -0.031034469604492188, -0.02916431427001953, -0.027294158935546875, -0.02542400360107422, -0.023553848266601562, -0.021683692932128906, -0.01981353759765625, -0.017943382263183594, -0.016073226928710938, -0.014203071594238281, -0.012332916259765625, -0.010462760925292969, -0.008592605590820312, -0.006722450256347656, -0.004852294921875, -0.0029821395874023438, -0.0011119842529296875, 0.0007581710815429688, 0.002628326416015625, 0.004498481750488281, 0.0063686370849609375, 0.008238792419433594, 0.01010894775390625, 0.011979103088378906, 0.013849258422851562, 0.01571941375732422, 0.017589569091796875, 0.01945972442626953, 0.021329879760742188, 0.023200035095214844, 0.0250701904296875, 0.026940345764160156, 0.028810501098632812, 0.03068065643310547, 0.032550811767578125, 0.03442096710205078, 0.03629112243652344, 0.038161277770996094, 0.04003143310546875, 0.041901588439941406, 0.04377174377441406, 0.04564189910888672, 0.047512054443359375, 0.04938220977783203, 0.05125236511230469, 0.053122520446777344, 0.05499267578125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 4.0, 10.0, 12.0, 8.0, 17.0, 15.0, 14.0, 27.0, 26.0, 33.0, 34.0, 49.0, 36.0, 49.0, 46.0, 42.0, 43.0, 51.0, 47.0, 50.0, 41.0, 55.0, 43.0, 37.0, 41.0, 24.0, 28.0, 25.0, 19.0, 15.0, 13.0, 12.0, 3.0, 12.0, 8.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.09017753601074219, -0.08715438842773438, -0.08413124084472656, -0.08110809326171875, -0.07808494567871094, -0.07506179809570312, -0.07203865051269531, -0.0690155029296875, -0.06599235534667969, -0.06296920776367188, -0.05994606018066406, -0.05692291259765625, -0.05389976501464844, -0.050876617431640625, -0.04785346984863281, -0.044830322265625, -0.04180717468261719, -0.038784027099609375, -0.03576087951660156, -0.03273773193359375, -0.029714584350585938, -0.026691436767578125, -0.023668289184570312, -0.0206451416015625, -0.017621994018554688, -0.014598846435546875, -0.011575698852539062, -0.00855255126953125, -0.0055294036865234375, -0.002506256103515625, 0.0005168914794921875, 0.0035400390625, 0.0065631866455078125, 0.009586334228515625, 0.012609481811523438, 0.01563262939453125, 0.018655776977539062, 0.021678924560546875, 0.024702072143554688, 0.0277252197265625, 0.030748367309570312, 0.033771514892578125, 0.03679466247558594, 0.03981781005859375, 0.04284095764160156, 0.045864105224609375, 0.04888725280761719, 0.051910400390625, 0.05493354797363281, 0.057956695556640625, 0.06097984313964844, 0.06400299072265625, 0.06702613830566406, 0.07004928588867188, 0.07307243347167969, 0.0760955810546875, 0.07911872863769531, 0.08214187622070312, 0.08516502380371094, 0.08818817138671875, 0.09121131896972656, 0.09423446655273438, 0.09725761413574219, 0.10028076171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 10.0, 12.0, 16.0, 15.0, 37.0, 46.0, 55.0, 78.0, 128.0, 165.0, 298.0, 449.0, 746.0, 1249.0, 2197.0, 4171.0, 8436.0, 19639.0, 58071.0, 219985.0, 447418.0, 197441.0, 52949.0, 18027.0, 7657.0, 3922.0, 2079.0, 1210.0, 736.0, 465.0, 296.0, 172.0, 105.0, 82.0, 61.0, 28.0, 25.0, 16.0, 13.0, 8.0, 9.0, 13.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.029205322265625, -0.028305530548095703, -0.027405738830566406, -0.02650594711303711, -0.025606155395507812, -0.024706363677978516, -0.02380657196044922, -0.022906780242919922, -0.022006988525390625, -0.021107196807861328, -0.02020740509033203, -0.019307613372802734, -0.018407821655273438, -0.01750802993774414, -0.016608238220214844, -0.015708446502685547, -0.01480865478515625, -0.013908863067626953, -0.013009071350097656, -0.01210927963256836, -0.011209487915039062, -0.010309696197509766, -0.009409904479980469, -0.008510112762451172, -0.007610321044921875, -0.006710529327392578, -0.005810737609863281, -0.004910945892333984, -0.0040111541748046875, -0.0031113624572753906, -0.0022115707397460938, -0.0013117790222167969, -0.0004119873046875, 0.0004878044128417969, 0.0013875961303710938, 0.0022873878479003906, 0.0031871795654296875, 0.004086971282958984, 0.004986763000488281, 0.005886554718017578, 0.006786346435546875, 0.007686138153076172, 0.008585929870605469, 0.009485721588134766, 0.010385513305664062, 0.01128530502319336, 0.012185096740722656, 0.013084888458251953, 0.01398468017578125, 0.014884471893310547, 0.015784263610839844, 0.01668405532836914, 0.017583847045898438, 0.018483638763427734, 0.01938343048095703, 0.020283222198486328, 0.021183013916015625, 0.022082805633544922, 0.02298259735107422, 0.023882389068603516, 0.024782180786132812, 0.02568197250366211, 0.026581764221191406, 0.027481555938720703, 0.02838134765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 13.0, 19.0, 18.0, 33.0, 35.0, 44.0, 52.0, 47.0, 81.0, 82.0, 74.0, 65.0, 81.0, 53.0, 81.0, 52.0, 27.0, 38.0, 31.0, 13.0, 13.0, 14.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.5367431640625e-06, -9.318813681602478e-06, -9.100884199142456e-06, -8.882954716682434e-06, -8.665025234222412e-06, -8.44709575176239e-06, -8.229166269302368e-06, -8.011236786842346e-06, -7.793307304382324e-06, -7.575377821922302e-06, -7.35744833946228e-06, -7.139518857002258e-06, -6.921589374542236e-06, -6.703659892082214e-06, -6.485730409622192e-06, -6.26780092716217e-06, -6.0498714447021484e-06, -5.8319419622421265e-06, -5.6140124797821045e-06, -5.3960829973220825e-06, -5.1781535148620605e-06, -4.9602240324020386e-06, -4.742294549942017e-06, -4.524365067481995e-06, -4.306435585021973e-06, -4.088506102561951e-06, -3.870576620101929e-06, -3.6526471376419067e-06, -3.4347176551818848e-06, -3.216788172721863e-06, -2.998858690261841e-06, -2.780929207801819e-06, -2.562999725341797e-06, -2.345070242881775e-06, -2.127140760421753e-06, -1.909211277961731e-06, -1.691281795501709e-06, -1.473352313041687e-06, -1.255422830581665e-06, -1.037493348121643e-06, -8.195638656616211e-07, -6.016343832015991e-07, -3.8370490074157715e-07, -1.6577541828155518e-07, 5.21540641784668e-08, 2.7008354663848877e-07, 4.880130290985107e-07, 7.059425115585327e-07, 9.238719940185547e-07, 1.1418014764785767e-06, 1.3597309589385986e-06, 1.5776604413986206e-06, 1.7955899238586426e-06, 2.0135194063186646e-06, 2.2314488887786865e-06, 2.4493783712387085e-06, 2.6673078536987305e-06, 2.8852373361587524e-06, 3.1031668186187744e-06, 3.3210963010787964e-06, 3.5390257835388184e-06, 3.7569552659988403e-06, 3.974884748458862e-06, 4.192814230918884e-06, 4.410743713378906e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 7.0, 7.0, 7.0, 22.0, 54.0, 146.0, 329.0, 1003.0, 3510.0, 18281.0, 230976.0, 721277.0, 62158.0, 7890.0, 1908.0, 613.0, 196.0, 91.0, 38.0, 18.0, 11.0, 8.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07232666015625, -0.07021617889404297, -0.06810569763183594, -0.0659952163696289, -0.06388473510742188, -0.061774253845214844, -0.05966377258300781, -0.05755329132080078, -0.05544281005859375, -0.05333232879638672, -0.05122184753417969, -0.049111366271972656, -0.047000885009765625, -0.044890403747558594, -0.04277992248535156, -0.04066944122314453, -0.0385589599609375, -0.03644847869873047, -0.03433799743652344, -0.032227516174316406, -0.030117034912109375, -0.028006553649902344, -0.025896072387695312, -0.02378559112548828, -0.02167510986328125, -0.01956462860107422, -0.017454147338867188, -0.015343666076660156, -0.013233184814453125, -0.011122703552246094, -0.009012222290039062, -0.006901741027832031, -0.004791259765625, -0.0026807785034179688, -0.0005702972412109375, 0.0015401840209960938, 0.003650665283203125, 0.005761146545410156, 0.007871627807617188, 0.009982109069824219, 0.01209259033203125, 0.014203071594238281, 0.016313552856445312, 0.018424034118652344, 0.020534515380859375, 0.022644996643066406, 0.024755477905273438, 0.02686595916748047, 0.0289764404296875, 0.03108692169189453, 0.03319740295410156, 0.035307884216308594, 0.037418365478515625, 0.039528846740722656, 0.04163932800292969, 0.04374980926513672, 0.04586029052734375, 0.04797077178955078, 0.05008125305175781, 0.052191734313964844, 0.054302215576171875, 0.056412696838378906, 0.05852317810058594, 0.06063365936279297, 0.062744140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 5.0, 5.0, 8.0, 15.0, 15.0, 26.0, 40.0, 48.0, 57.0, 81.0, 102.0, 123.0, 105.0, 98.0, 74.0, 49.0, 44.0, 22.0, 21.0, 13.0, 15.0, 6.0, 11.0, 2.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.042816162109375, -0.04162168502807617, -0.040427207946777344, -0.039232730865478516, -0.03803825378417969, -0.03684377670288086, -0.03564929962158203, -0.0344548225402832, -0.033260345458984375, -0.03206586837768555, -0.03087139129638672, -0.02967691421508789, -0.028482437133789062, -0.027287960052490234, -0.026093482971191406, -0.024899005889892578, -0.02370452880859375, -0.022510051727294922, -0.021315574645996094, -0.020121097564697266, -0.018926620483398438, -0.01773214340209961, -0.01653766632080078, -0.015343189239501953, -0.014148712158203125, -0.012954235076904297, -0.011759757995605469, -0.01056528091430664, -0.009370803833007812, -0.008176326751708984, -0.006981849670410156, -0.005787372589111328, -0.0045928955078125, -0.003398418426513672, -0.0022039413452148438, -0.0010094642639160156, 0.0001850128173828125, 0.0013794898986816406, 0.0025739669799804688, 0.003768444061279297, 0.004962921142578125, 0.006157398223876953, 0.007351875305175781, 0.00854635238647461, 0.009740829467773438, 0.010935306549072266, 0.012129783630371094, 0.013324260711669922, 0.01451873779296875, 0.015713214874267578, 0.016907691955566406, 0.018102169036865234, 0.019296646118164062, 0.02049112319946289, 0.02168560028076172, 0.022880077362060547, 0.024074554443359375, 0.025269031524658203, 0.02646350860595703, 0.02765798568725586, 0.028852462768554688, 0.030046939849853516, 0.031241416931152344, 0.03243589401245117, 0.03363037109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 15.0, 30.0, 36.0, 55.0, 71.0, 135.0, 139.0, 147.0, 118.0, 78.0, 62.0, 35.0, 20.0, 22.0, 12.0, 3.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62468421459198, -0.6097890138626099, -0.5948938131332397, -0.5799986124038696, -0.5651034116744995, -0.5502082109451294, -0.5353130102157593, -0.5204178094863892, -0.5055226683616638, -0.4906274676322937, -0.4757322669029236, -0.46083706617355347, -0.44594189524650574, -0.4310466945171356, -0.4161514937877655, -0.4012562930583954, -0.3863610625267029, -0.37146586179733276, -0.35657066106796265, -0.34167546033859253, -0.3267802894115448, -0.3118850886821747, -0.29698988795280457, -0.28209468722343445, -0.2671995162963867, -0.2523043155670166, -0.23740912973880768, -0.22251392900943756, -0.20761872828006744, -0.19272354245185852, -0.1778283417224884, -0.1629331409931183, -0.14803794026374817, -0.13314273953437805, -0.11824754625558853, -0.10335235297679901, -0.0884571522474289, -0.07356195896863937, -0.058666765689849854, -0.043771564960479736, -0.028876371681690216, -0.013981175608932972, 0.0009140204638242722, 0.01580921560525894, 0.03070441260933876, 0.04559960961341858, 0.0604948028922081, 0.07539000362157822, 0.09028519690036774, 0.10518039017915726, 0.12007559090852737, 0.1349707841873169, 0.149865984916687, 0.16476118564605713, 0.17965637147426605, 0.19455157220363617, 0.2094467580318451, 0.2243419587612152, 0.23923714458942413, 0.25413233041763306, 0.2690275311470032, 0.2839227318763733, 0.2988179326057434, 0.3137131333351135, 0.32860833406448364]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 4.0, 8.0, 6.0, 8.0, 18.0, 10.0, 22.0, 18.0, 22.0, 24.0, 21.0, 32.0, 39.0, 45.0, 48.0, 35.0, 37.0, 44.0, 35.0, 44.0, 54.0, 32.0, 46.0, 38.0, 34.0, 42.0, 34.0, 27.0, 29.0, 19.0, 19.0, 12.0, 16.0, 15.0, 8.0, 10.0, 6.0, 10.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5149874091148376, -0.4998050630092621, -0.4846227467060089, -0.46944040060043335, -0.4542580544948578, -0.4390757083892822, -0.42389339208602905, -0.4087110459804535, -0.39352869987487793, -0.37834635376930237, -0.3631640374660492, -0.34798169136047363, -0.33279934525489807, -0.3176169991493225, -0.30243468284606934, -0.2872523367404938, -0.2720699906349182, -0.25688764452934265, -0.24170531332492828, -0.22652298212051392, -0.21134063601493835, -0.196158304810524, -0.18097597360610962, -0.16579362750053406, -0.15061131119728088, -0.13542897999286652, -0.12024663388729095, -0.10506430268287659, -0.08988195657730103, -0.07469962537288666, -0.05951728671789169, -0.04433494806289673, -0.029152601957321167, -0.013970264233648777, 0.001212073490023613, 0.01639441028237343, 0.03157674893736839, 0.04675908386707306, 0.061941422522068024, 0.07712376117706299, 0.09230609983205795, 0.10748843848705292, 0.12267077714204788, 0.13785311579704285, 0.15303544700145721, 0.16821777820587158, 0.18340012431144714, 0.1985824704170227, 0.21376480162143707, 0.22894713282585144, 0.244129478931427, 0.25931182503700256, 0.27449414134025574, 0.2896764874458313, 0.30485883355140686, 0.3200411796569824, 0.3352234959602356, 0.35040584206581116, 0.36558815836906433, 0.3807705044746399, 0.39595285058021545, 0.411135196685791, 0.4263175129890442, 0.44149985909461975, 0.4566822052001953]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 16.0, 24.0, 47.0, 102.0, 203.0, 545.0, 2167.0, 17963.0, 3656058.0, 503071.0, 10871.0, 1950.0, 607.0, 266.0, 163.0, 82.0, 50.0, 35.0, 17.0, 8.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.1343669891357422, -0.12725448608398438, -0.12014198303222656, -0.11302947998046875, -0.10591697692871094, -0.09880447387695312, -0.09169197082519531, -0.0845794677734375, -0.07746696472167969, -0.07035446166992188, -0.06324195861816406, -0.05612945556640625, -0.04901695251464844, -0.041904449462890625, -0.03479194641113281, -0.027679443359375, -0.020566940307617188, -0.013454437255859375, -0.0063419342041015625, 0.00077056884765625, 0.007883071899414062, 0.014995574951171875, 0.022108078002929688, 0.0292205810546875, 0.03633308410644531, 0.043445587158203125, 0.05055809020996094, 0.05767059326171875, 0.06478309631347656, 0.07189559936523438, 0.07900810241699219, 0.08612060546875, 0.09323310852050781, 0.10034561157226562, 0.10745811462402344, 0.11457061767578125, 0.12168312072753906, 0.12879562377929688, 0.1359081268310547, 0.1430206298828125, 0.1501331329345703, 0.15724563598632812, 0.16435813903808594, 0.17147064208984375, 0.17858314514160156, 0.18569564819335938, 0.1928081512451172, 0.199920654296875, 0.2070331573486328, 0.21414566040039062, 0.22125816345214844, 0.22837066650390625, 0.23548316955566406, 0.24259567260742188, 0.2497081756591797, 0.2568206787109375, 0.2639331817626953, 0.2710456848144531, 0.27815818786621094, 0.28527069091796875, 0.29238319396972656, 0.2994956970214844, 0.3066082000732422, 0.313720703125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 11.0, 22.0, 36.0, 58.0, 95.0, 98.0, 110.0, 108.0, 118.0, 104.0, 74.0, 58.0, 39.0, 28.0, 16.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0311737060546875, -0.02940678596496582, -0.02763986587524414, -0.02587294578552246, -0.02410602569580078, -0.0223391056060791, -0.020572185516357422, -0.018805265426635742, -0.017038345336914062, -0.015271425247192383, -0.013504505157470703, -0.011737585067749023, -0.009970664978027344, -0.008203744888305664, -0.006436824798583984, -0.004669904708862305, -0.002902984619140625, -0.0011360645294189453, 0.0006308555603027344, 0.002397775650024414, 0.004164695739746094, 0.0059316158294677734, 0.007698535919189453, 0.009465456008911133, 0.011232376098632812, 0.012999296188354492, 0.014766216278076172, 0.01653313636779785, 0.01830005645751953, 0.02006697654724121, 0.02183389663696289, 0.02360081672668457, 0.02536773681640625, 0.02713465690612793, 0.02890157699584961, 0.03066849708557129, 0.03243541717529297, 0.03420233726501465, 0.03596925735473633, 0.03773617744445801, 0.03950309753417969, 0.04127001762390137, 0.04303693771362305, 0.04480385780334473, 0.046570777893066406, 0.048337697982788086, 0.050104618072509766, 0.051871538162231445, 0.053638458251953125, 0.055405378341674805, 0.057172298431396484, 0.058939218521118164, 0.060706138610839844, 0.06247305870056152, 0.0642399787902832, 0.06600689888000488, 0.06777381896972656, 0.06954073905944824, 0.07130765914916992, 0.0730745792388916, 0.07484149932861328, 0.07660841941833496, 0.07837533950805664, 0.08014225959777832, 0.0819091796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 3.0, 20.0, 18.0, 36.0, 73.0, 127.0, 213.0, 387.0, 754.0, 2646.0, 16982.0, 2755543.0, 1400020.0, 13914.0, 2159.0, 696.0, 307.0, 171.0, 74.0, 57.0, 32.0, 17.0, 8.0, 7.0, 6.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1866455078125, -0.1809844970703125, -0.175323486328125, -0.1696624755859375, -0.16400146484375, -0.1583404541015625, -0.152679443359375, -0.1470184326171875, -0.141357421875, -0.1356964111328125, -0.130035400390625, -0.1243743896484375, -0.11871337890625, -0.1130523681640625, -0.107391357421875, -0.1017303466796875, -0.0960693359375, -0.0904083251953125, -0.084747314453125, -0.0790863037109375, -0.07342529296875, -0.0677642822265625, -0.062103271484375, -0.0564422607421875, -0.05078125, -0.0451202392578125, -0.039459228515625, -0.0337982177734375, -0.02813720703125, -0.0224761962890625, -0.016815185546875, -0.0111541748046875, -0.0054931640625, 0.0001678466796875, 0.005828857421875, 0.0114898681640625, 0.01715087890625, 0.0228118896484375, 0.028472900390625, 0.0341339111328125, 0.039794921875, 0.0454559326171875, 0.051116943359375, 0.0567779541015625, 0.06243896484375, 0.0680999755859375, 0.073760986328125, 0.0794219970703125, 0.0850830078125, 0.0907440185546875, 0.096405029296875, 0.1020660400390625, 0.10772705078125, 0.1133880615234375, 0.119049072265625, 0.1247100830078125, 0.13037109375, 0.1360321044921875, 0.141693115234375, 0.1473541259765625, 0.15301513671875, 0.1586761474609375, 0.164337158203125, 0.1699981689453125, 0.1756591796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 12.0, 12.0, 17.0, 29.0, 68.0, 162.0, 476.0, 2035.0, 853.0, 236.0, 78.0, 43.0, 18.0, 11.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07098388671875, -0.06924104690551758, -0.06749820709228516, -0.06575536727905273, -0.06401252746582031, -0.06226968765258789, -0.06052684783935547, -0.05878400802612305, -0.057041168212890625, -0.0552983283996582, -0.05355548858642578, -0.05181264877319336, -0.05006980895996094, -0.048326969146728516, -0.046584129333496094, -0.04484128952026367, -0.04309844970703125, -0.04135560989379883, -0.039612770080566406, -0.037869930267333984, -0.03612709045410156, -0.03438425064086914, -0.03264141082763672, -0.030898571014404297, -0.029155731201171875, -0.027412891387939453, -0.02567005157470703, -0.02392721176147461, -0.022184371948242188, -0.020441532135009766, -0.018698692321777344, -0.016955852508544922, -0.0152130126953125, -0.013470172882080078, -0.011727333068847656, -0.009984493255615234, -0.008241653442382812, -0.006498813629150391, -0.004755973815917969, -0.003013134002685547, -0.001270294189453125, 0.0004725456237792969, 0.0022153854370117188, 0.003958225250244141, 0.0057010650634765625, 0.007443904876708984, 0.009186744689941406, 0.010929584503173828, 0.01267242431640625, 0.014415264129638672, 0.016158103942871094, 0.017900943756103516, 0.019643783569335938, 0.02138662338256836, 0.02312946319580078, 0.024872303009033203, 0.026615142822265625, 0.028357982635498047, 0.03010082244873047, 0.03184366226196289, 0.03358650207519531, 0.035329341888427734, 0.037072181701660156, 0.03881502151489258, 0.040557861328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 12.0, 112.0, 559.0, 286.0, 26.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0172717571258545, -0.9903963208198547, -0.9635208249092102, -0.9366453886032104, -0.9097698926925659, -0.8828944563865662, -0.8560190200805664, -0.8291435241699219, -0.8022680282592773, -0.7753925919532776, -0.7485170960426331, -0.7216416597366333, -0.6947661638259888, -0.667890727519989, -0.6410152912139893, -0.6141397953033447, -0.587264358997345, -0.5603889226913452, -0.5335134267807007, -0.5066379904747009, -0.4797624945640564, -0.45288705825805664, -0.4260115921497345, -0.39913612604141235, -0.3722606599330902, -0.34538519382476807, -0.3185097277164459, -0.2916342616081238, -0.264758825302124, -0.23788334429264069, -0.21100789308547974, -0.1841324269771576, -0.15725690126419067, -0.13038143515586853, -0.10350597649812698, -0.07663051784038544, -0.04975505173206329, -0.02287958562374115, 0.0039958655834198, 0.030871331691741943, 0.05774679780006409, 0.08462226390838623, 0.11149772256612778, 0.13837318122386932, 0.16524864733219147, 0.1921241134405136, 0.21899956464767456, 0.2458750307559967, 0.27275049686431885, 0.299625962972641, 0.32650142908096313, 0.3533768653869629, 0.3802523612976074, 0.4071277976036072, 0.4340032637119293, 0.46087872982025146, 0.4877541959285736, 0.5146296620368958, 0.5415050983428955, 0.56838059425354, 0.5952560305595398, 0.6221315264701843, 0.6490069627761841, 0.6758824586868286, 0.7027578949928284]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 15.0, 14.0, 16.0, 20.0, 25.0, 27.0, 48.0, 48.0, 41.0, 42.0, 58.0, 62.0, 64.0, 54.0, 56.0, 47.0, 61.0, 38.0, 48.0, 45.0, 32.0, 26.0, 18.0, 19.0, 10.0, 17.0, 6.0, 9.0, 7.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.17846620082855225, -0.17318670451641083, -0.1679072082042694, -0.162627711892128, -0.15734821557998657, -0.15206871926784515, -0.14678922295570374, -0.14150971174240112, -0.1362302303314209, -0.13095073401927948, -0.12567123770713806, -0.12039174139499664, -0.11511224508285522, -0.1098327487707138, -0.10455324500799179, -0.09927374869585037, -0.09399424493312836, -0.08871474862098694, -0.08343525230884552, -0.0781557559967041, -0.07287625968456268, -0.06759676337242126, -0.06231725960969925, -0.05703776329755783, -0.05175826698541641, -0.046478770673274994, -0.041199274361133575, -0.03591977432370186, -0.03064027801156044, -0.02536078169941902, -0.020081281661987305, -0.014801785349845886, -0.009522289037704468, -0.004242791794240475, 0.0010367054492235184, 0.006316203624010086, 0.011595699936151505, 0.016875196248292923, 0.02215469628572464, 0.02743419259786606, 0.03271368891000748, 0.037993185222148895, 0.043272681534290314, 0.04855218157172203, 0.05383167788386345, 0.05911117419600487, 0.06439067423343658, 0.069670170545578, 0.07494966685771942, 0.08022916316986084, 0.08550865948200226, 0.09078815579414368, 0.0960676521062851, 0.10134714841842651, 0.10662665218114853, 0.11190614849328995, 0.11718564480543137, 0.12246514111757278, 0.1277446448802948, 0.13302414119243622, 0.13830363750457764, 0.14358313381671906, 0.14886263012886047, 0.1541421264410019, 0.1594216227531433]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 9.0, 12.0, 11.0, 17.0, 27.0, 28.0, 41.0, 58.0, 85.0, 134.0, 257.0, 498.0, 1151.0, 2851.0, 9470.0, 45900.0, 316158.0, 552431.0, 95178.0, 16704.0, 4355.0, 1628.0, 676.0, 379.0, 179.0, 87.0, 62.0, 45.0, 32.0, 25.0, 17.0, 12.0, 11.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1080322265625, -0.10433197021484375, -0.1006317138671875, -0.09693145751953125, -0.093231201171875, -0.08953094482421875, -0.0858306884765625, -0.08213043212890625, -0.07843017578125, -0.07472991943359375, -0.0710296630859375, -0.06732940673828125, -0.063629150390625, -0.05992889404296875, -0.0562286376953125, -0.05252838134765625, -0.048828125, -0.04512786865234375, -0.0414276123046875, -0.03772735595703125, -0.034027099609375, -0.03032684326171875, -0.0266265869140625, -0.02292633056640625, -0.01922607421875, -0.01552581787109375, -0.0118255615234375, -0.00812530517578125, -0.004425048828125, -0.00072479248046875, 0.0029754638671875, 0.00667572021484375, 0.0103759765625, 0.01407623291015625, 0.0177764892578125, 0.02147674560546875, 0.025177001953125, 0.02887725830078125, 0.0325775146484375, 0.03627777099609375, 0.03997802734375, 0.04367828369140625, 0.0473785400390625, 0.05107879638671875, 0.054779052734375, 0.05847930908203125, 0.0621795654296875, 0.06587982177734375, 0.069580078125, 0.07328033447265625, 0.0769805908203125, 0.08068084716796875, 0.084381103515625, 0.08808135986328125, 0.0917816162109375, 0.09548187255859375, 0.09918212890625, 0.10288238525390625, 0.1065826416015625, 0.11028289794921875, 0.113983154296875, 0.11768341064453125, 0.1213836669921875, 0.12508392333984375, 0.1287841796875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 13.0, 20.0, 26.0, 39.0, 57.0, 85.0, 104.0, 106.0, 103.0, 112.0, 101.0, 71.0, 50.0, 33.0, 37.0, 18.0, 11.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0281524658203125, -0.026543378829956055, -0.02493429183959961, -0.023325204849243164, -0.02171611785888672, -0.020107030868530273, -0.018497943878173828, -0.016888856887817383, -0.015279769897460938, -0.013670682907104492, -0.012061595916748047, -0.010452508926391602, -0.008843421936035156, -0.007234334945678711, -0.005625247955322266, -0.00401616096496582, -0.002407073974609375, -0.0007979869842529297, 0.0008111000061035156, 0.002420186996459961, 0.004029273986816406, 0.0056383609771728516, 0.007247447967529297, 0.008856534957885742, 0.010465621948242188, 0.012074708938598633, 0.013683795928955078, 0.015292882919311523, 0.01690196990966797, 0.018511056900024414, 0.02012014389038086, 0.021729230880737305, 0.02333831787109375, 0.024947404861450195, 0.02655649185180664, 0.028165578842163086, 0.02977466583251953, 0.03138375282287598, 0.03299283981323242, 0.03460192680358887, 0.03621101379394531, 0.03782010078430176, 0.0394291877746582, 0.04103827476501465, 0.042647361755371094, 0.04425644874572754, 0.045865535736083984, 0.04747462272644043, 0.049083709716796875, 0.05069279670715332, 0.052301883697509766, 0.05391097068786621, 0.055520057678222656, 0.0571291446685791, 0.05873823165893555, 0.06034731864929199, 0.06195640563964844, 0.06356549263000488, 0.06517457962036133, 0.06678366661071777, 0.06839275360107422, 0.07000184059143066, 0.07161092758178711, 0.07322001457214355, 0.0748291015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 8.0, 11.0, 2.0, 14.0, 5.0, 18.0, 23.0, 33.0, 37.0, 56.0, 71.0, 111.0, 131.0, 217.0, 351.0, 645.0, 1316.0, 2758.0, 6040.0, 15148.0, 41453.0, 130103.0, 369886.0, 319766.0, 103469.0, 33991.0, 12618.0, 5161.0, 2352.0, 1140.0, 630.0, 342.0, 215.0, 131.0, 72.0, 58.0, 50.0, 33.0, 23.0, 18.0, 11.0, 12.0, 11.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.05712890625, -0.05539274215698242, -0.053656578063964844, -0.051920413970947266, -0.05018424987792969, -0.04844808578491211, -0.04671192169189453, -0.04497575759887695, -0.043239593505859375, -0.0415034294128418, -0.03976726531982422, -0.03803110122680664, -0.03629493713378906, -0.034558773040771484, -0.032822608947753906, -0.031086444854736328, -0.02935028076171875, -0.027614116668701172, -0.025877952575683594, -0.024141788482666016, -0.022405624389648438, -0.02066946029663086, -0.01893329620361328, -0.017197132110595703, -0.015460968017578125, -0.013724803924560547, -0.011988639831542969, -0.01025247573852539, -0.008516311645507812, -0.006780147552490234, -0.005043983459472656, -0.003307819366455078, -0.0015716552734375, 0.00016450881958007812, 0.0019006729125976562, 0.0036368370056152344, 0.0053730010986328125, 0.007109165191650391, 0.008845329284667969, 0.010581493377685547, 0.012317657470703125, 0.014053821563720703, 0.01578998565673828, 0.01752614974975586, 0.019262313842773438, 0.020998477935791016, 0.022734642028808594, 0.024470806121826172, 0.02620697021484375, 0.027943134307861328, 0.029679298400878906, 0.031415462493896484, 0.03315162658691406, 0.03488779067993164, 0.03662395477294922, 0.0383601188659668, 0.040096282958984375, 0.04183244705200195, 0.04356861114501953, 0.04530477523803711, 0.04704093933105469, 0.048777103424072266, 0.050513267517089844, 0.05224943161010742, 0.053985595703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 6.0, 4.0, 6.0, 4.0, 5.0, 6.0, 11.0, 9.0, 10.0, 20.0, 6.0, 17.0, 27.0, 34.0, 39.0, 20.0, 36.0, 35.0, 24.0, 45.0, 40.0, 31.0, 39.0, 50.0, 46.0, 50.0, 33.0, 39.0, 40.0, 31.0, 19.0, 42.0, 23.0, 24.0, 32.0, 15.0, 14.0, 16.0, 11.0, 9.0, 14.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07672119140625, -0.07416439056396484, -0.07160758972167969, -0.06905078887939453, -0.06649398803710938, -0.06393718719482422, -0.06138038635253906, -0.058823585510253906, -0.05626678466796875, -0.053709983825683594, -0.05115318298339844, -0.04859638214111328, -0.046039581298828125, -0.04348278045654297, -0.04092597961425781, -0.038369178771972656, -0.0358123779296875, -0.033255577087402344, -0.030698776245117188, -0.02814197540283203, -0.025585174560546875, -0.02302837371826172, -0.020471572875976562, -0.017914772033691406, -0.01535797119140625, -0.012801170349121094, -0.010244369506835938, -0.007687568664550781, -0.005130767822265625, -0.0025739669799804688, -1.71661376953125e-05, 0.0025396347045898438, 0.005096435546875, 0.007653236389160156, 0.010210037231445312, 0.012766838073730469, 0.015323638916015625, 0.01788043975830078, 0.020437240600585938, 0.022994041442871094, 0.02555084228515625, 0.028107643127441406, 0.030664443969726562, 0.03322124481201172, 0.035778045654296875, 0.03833484649658203, 0.04089164733886719, 0.043448448181152344, 0.0460052490234375, 0.048562049865722656, 0.05111885070800781, 0.05367565155029297, 0.056232452392578125, 0.05878925323486328, 0.06134605407714844, 0.0639028549194336, 0.06645965576171875, 0.0690164566040039, 0.07157325744628906, 0.07413005828857422, 0.07668685913085938, 0.07924365997314453, 0.08180046081542969, 0.08435726165771484, 0.0869140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 6.0, 2.0, 11.0, 11.0, 13.0, 27.0, 48.0, 58.0, 85.0, 156.0, 308.0, 531.0, 1229.0, 3033.0, 9729.0, 50346.0, 411492.0, 490302.0, 63505.0, 11469.0, 3462.0, 1393.0, 600.0, 273.0, 184.0, 90.0, 64.0, 39.0, 24.0, 19.0, 12.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 5.0, 0.0, 4.0], "bins": [-0.04931640625, -0.04811525344848633, -0.046914100646972656, -0.045712947845458984, -0.04451179504394531, -0.04331064224243164, -0.04210948944091797, -0.0409083366394043, -0.039707183837890625, -0.03850603103637695, -0.03730487823486328, -0.03610372543334961, -0.03490257263183594, -0.033701419830322266, -0.032500267028808594, -0.03129911422729492, -0.03009796142578125, -0.028896808624267578, -0.027695655822753906, -0.026494503021240234, -0.025293350219726562, -0.02409219741821289, -0.02289104461669922, -0.021689891815185547, -0.020488739013671875, -0.019287586212158203, -0.01808643341064453, -0.01688528060913086, -0.015684127807617188, -0.014482975006103516, -0.013281822204589844, -0.012080669403076172, -0.0108795166015625, -0.009678363800048828, -0.008477210998535156, -0.007276058197021484, -0.0060749053955078125, -0.004873752593994141, -0.0036725997924804688, -0.002471446990966797, -0.001270294189453125, -6.914138793945312e-05, 0.0011320114135742188, 0.0023331642150878906, 0.0035343170166015625, 0.004735469818115234, 0.005936622619628906, 0.007137775421142578, 0.00833892822265625, 0.009540081024169922, 0.010741233825683594, 0.011942386627197266, 0.013143539428710938, 0.01434469223022461, 0.015545845031738281, 0.016746997833251953, 0.017948150634765625, 0.019149303436279297, 0.02035045623779297, 0.02155160903930664, 0.022752761840820312, 0.023953914642333984, 0.025155067443847656, 0.026356220245361328, 0.027557373046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 2.0, 8.0, 4.0, 13.0, 13.0, 8.0, 16.0, 22.0, 21.0, 17.0, 46.0, 40.0, 54.0, 67.0, 51.0, 73.0, 67.0, 61.0, 37.0, 58.0, 49.0, 44.0, 44.0, 35.0, 28.0, 24.0, 16.0, 20.0, 11.0, 12.0, 9.0, 6.0, 7.0, 4.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.377696990966797e-06, -6.203539669513702e-06, -6.029382348060608e-06, -5.8552250266075134e-06, -5.681067705154419e-06, -5.5069103837013245e-06, -5.33275306224823e-06, -5.1585957407951355e-06, -4.984438419342041e-06, -4.8102810978889465e-06, -4.636123776435852e-06, -4.4619664549827576e-06, -4.287809133529663e-06, -4.113651812076569e-06, -3.939494490623474e-06, -3.7653371691703796e-06, -3.591179847717285e-06, -3.4170225262641907e-06, -3.242865204811096e-06, -3.0687078833580017e-06, -2.8945505619049072e-06, -2.7203932404518127e-06, -2.5462359189987183e-06, -2.3720785975456238e-06, -2.1979212760925293e-06, -2.023763954639435e-06, -1.8496066331863403e-06, -1.6754493117332458e-06, -1.5012919902801514e-06, -1.3271346688270569e-06, -1.1529773473739624e-06, -9.78820025920868e-07, -8.046627044677734e-07, -6.30505383014679e-07, -4.5634806156158447e-07, -2.8219074010849e-07, -1.0803341865539551e-07, 6.612390279769897e-08, 2.4028122425079346e-07, 4.1443854570388794e-07, 5.885958671569824e-07, 7.627531886100769e-07, 9.369105100631714e-07, 1.1110678315162659e-06, 1.2852251529693604e-06, 1.4593824744224548e-06, 1.6335397958755493e-06, 1.8076971173286438e-06, 1.9818544387817383e-06, 2.1560117602348328e-06, 2.3301690816879272e-06, 2.5043264031410217e-06, 2.678483724594116e-06, 2.8526410460472107e-06, 3.026798367500305e-06, 3.2009556889533997e-06, 3.375113010406494e-06, 3.5492703318595886e-06, 3.723427653312683e-06, 3.897584974765778e-06, 4.071742296218872e-06, 4.2458996176719666e-06, 4.420056939125061e-06, 4.5942142605781555e-06, 4.76837158203125e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 13.0, 12.0, 16.0, 23.0, 27.0, 36.0, 55.0, 49.0, 118.0, 169.0, 211.0, 297.0, 445.0, 728.0, 1113.0, 1868.0, 3310.0, 6267.0, 14097.0, 37172.0, 124942.0, 372829.0, 326684.0, 100983.0, 31382.0, 12141.0, 5773.0, 3067.0, 1644.0, 1005.0, 658.0, 421.0, 275.0, 178.0, 149.0, 109.0, 65.0, 53.0, 48.0, 30.0, 14.0, 14.0, 11.0, 7.0, 10.0, 5.0, 5.0, 0.0, 5.0, 5.0, 1.0, 4.0, 1.0], "bins": [-0.0240936279296875, -0.023361682891845703, -0.022629737854003906, -0.02189779281616211, -0.021165847778320312, -0.020433902740478516, -0.01970195770263672, -0.018970012664794922, -0.018238067626953125, -0.017506122589111328, -0.01677417755126953, -0.016042232513427734, -0.015310287475585938, -0.01457834243774414, -0.013846397399902344, -0.013114452362060547, -0.01238250732421875, -0.011650562286376953, -0.010918617248535156, -0.01018667221069336, -0.009454727172851562, -0.008722782135009766, -0.007990837097167969, -0.007258892059326172, -0.006526947021484375, -0.005795001983642578, -0.005063056945800781, -0.004331111907958984, -0.0035991668701171875, -0.0028672218322753906, -0.0021352767944335938, -0.0014033317565917969, -0.00067138671875, 6.0558319091796875e-05, 0.0007925033569335938, 0.0015244483947753906, 0.0022563934326171875, 0.0029883384704589844, 0.0037202835083007812, 0.004452228546142578, 0.005184173583984375, 0.005916118621826172, 0.006648063659667969, 0.007380008697509766, 0.008111953735351562, 0.00884389877319336, 0.009575843811035156, 0.010307788848876953, 0.01103973388671875, 0.011771678924560547, 0.012503623962402344, 0.01323556900024414, 0.013967514038085938, 0.014699459075927734, 0.015431404113769531, 0.016163349151611328, 0.016895294189453125, 0.017627239227294922, 0.01835918426513672, 0.019091129302978516, 0.019823074340820312, 0.02055501937866211, 0.021286964416503906, 0.022018909454345703, 0.0227508544921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 3.0, 11.0, 11.0, 9.0, 18.0, 16.0, 20.0, 20.0, 27.0, 36.0, 42.0, 48.0, 52.0, 72.0, 57.0, 73.0, 72.0, 71.0, 46.0, 50.0, 48.0, 32.0, 30.0, 23.0, 20.0, 17.0, 19.0, 9.0, 4.0, 7.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.023590087890625, -0.022815704345703125, -0.02204132080078125, -0.021266937255859375, -0.0204925537109375, -0.019718170166015625, -0.01894378662109375, -0.018169403076171875, -0.01739501953125, -0.016620635986328125, -0.01584625244140625, -0.015071868896484375, -0.0142974853515625, -0.013523101806640625, -0.01274871826171875, -0.011974334716796875, -0.011199951171875, -0.010425567626953125, -0.00965118408203125, -0.008876800537109375, -0.0081024169921875, -0.007328033447265625, -0.00655364990234375, -0.005779266357421875, -0.0050048828125, -0.004230499267578125, -0.00345611572265625, -0.002681732177734375, -0.0019073486328125, -0.001132965087890625, -0.00035858154296875, 0.000415802001953125, 0.001190185546875, 0.001964569091796875, 0.00273895263671875, 0.003513336181640625, 0.0042877197265625, 0.005062103271484375, 0.00583648681640625, 0.006610870361328125, 0.00738525390625, 0.008159637451171875, 0.00893402099609375, 0.009708404541015625, 0.0104827880859375, 0.011257171630859375, 0.01203155517578125, 0.012805938720703125, 0.013580322265625, 0.014354705810546875, 0.01512908935546875, 0.015903472900390625, 0.0166778564453125, 0.017452239990234375, 0.01822662353515625, 0.019001007080078125, 0.019775390625, 0.020549774169921875, 0.02132415771484375, 0.022098541259765625, 0.0228729248046875, 0.023647308349609375, 0.02442169189453125, 0.025196075439453125, 0.025970458984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 11.0, 36.0, 93.0, 296.0, 345.0, 169.0, 35.0, 13.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4185125827789307, -1.379377841949463, -1.3402432203292847, -1.301108479499817, -1.2619738578796387, -1.222839117050171, -1.1837043762207031, -1.144569754600525, -1.1054350137710571, -1.0663002729415894, -1.0271656513214111, -0.9880309104919434, -0.9488962292671204, -0.9097615480422974, -0.8706268668174744, -0.8314921855926514, -0.7923575043678284, -0.7532228231430054, -0.7140881419181824, -0.6749534606933594, -0.6358187198638916, -0.5966840386390686, -0.5575493574142456, -0.5184146165847778, -0.4792799651622772, -0.4401452839374542, -0.40101057291030884, -0.36187589168548584, -0.32274121046066284, -0.28360649943351746, -0.24447181820869446, -0.20533710718154907, -0.16620242595672607, -0.12706772983074188, -0.08793304115533829, -0.04879835247993469, -0.0096636563539505, 0.02947103977203369, 0.06860572099685669, 0.10774043202400208, 0.14687511324882507, 0.18600980937480927, 0.22514450550079346, 0.26427918672561646, 0.30341386795043945, 0.34254857897758484, 0.38168326020240784, 0.4208179712295532, 0.4599526524543762, 0.4990873336791992, 0.5382220149040222, 0.5773566961288452, 0.616491436958313, 0.655626118183136, 0.694760799407959, 0.7338955402374268, 0.773030161857605, 0.812164843082428, 0.851299524307251, 0.8904342651367188, 0.9295689463615417, 0.9687036275863647, 1.007838249206543, 1.0469729900360107, 1.0861077308654785]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 9.0, 8.0, 13.0, 14.0, 13.0, 13.0, 18.0, 20.0, 24.0, 28.0, 32.0, 36.0, 30.0, 28.0, 29.0, 42.0, 32.0, 40.0, 56.0, 32.0, 56.0, 44.0, 37.0, 38.0, 36.0, 28.0, 22.0, 27.0, 24.0, 24.0, 22.0, 15.0, 22.0, 18.0, 12.0, 6.0, 12.0, 3.0, 6.0, 4.0, 0.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.4656888246536255, -0.4523487985134125, -0.43900877237319946, -0.42566874623298645, -0.41232872009277344, -0.3989886939525604, -0.3856486678123474, -0.372308611869812, -0.3589686155319214, -0.3456285893917084, -0.33228856325149536, -0.31894853711128235, -0.30560851097106934, -0.2922684848308563, -0.2789284586906433, -0.2655884027481079, -0.2522483766078949, -0.23890835046768188, -0.22556832432746887, -0.21222829818725586, -0.19888827204704285, -0.18554824590682983, -0.17220820486545563, -0.15886817872524261, -0.1455281525850296, -0.1321881264448166, -0.11884810030460358, -0.10550806671380997, -0.09216804057359695, -0.07882801443338394, -0.06548798084259033, -0.05214795470237732, -0.03880792856216431, -0.025467900559306145, -0.012127872556447983, 0.0012121573090553284, 0.014552183449268341, 0.027892209589481354, 0.04123224318027496, 0.054572269320487976, 0.06791229546070099, 0.081252321600914, 0.09459234774112701, 0.10793238133192062, 0.12127240747213364, 0.13461244106292725, 0.14795246720314026, 0.16129249334335327, 0.17463251948356628, 0.1879725456237793, 0.2013125717639923, 0.21465259790420532, 0.22799262404441833, 0.24133265018463135, 0.25467270612716675, 0.2680127024650574, 0.2813527584075928, 0.2946927845478058, 0.3080328106880188, 0.3213728368282318, 0.3347128629684448, 0.34805288910865784, 0.36139291524887085, 0.37473297119140625, 0.3880729675292969]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 12.0, 14.0, 40.0, 54.0, 138.0, 334.0, 903.0, 3327.0, 16838.0, 345713.0, 3770234.0, 46769.0, 6840.0, 1843.0, 626.0, 257.0, 134.0, 75.0, 53.0, 20.0, 21.0, 10.0, 9.0, 6.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2021484375, -0.19685935974121094, -0.19157028198242188, -0.1862812042236328, -0.18099212646484375, -0.1757030487060547, -0.17041397094726562, -0.16512489318847656, -0.1598358154296875, -0.15454673767089844, -0.14925765991210938, -0.1439685821533203, -0.13867950439453125, -0.1333904266357422, -0.12810134887695312, -0.12281227111816406, -0.117523193359375, -0.11223411560058594, -0.10694503784179688, -0.10165596008300781, -0.09636688232421875, -0.09107780456542969, -0.08578872680664062, -0.08049964904785156, -0.0752105712890625, -0.06992149353027344, -0.06463241577148438, -0.05934333801269531, -0.05405426025390625, -0.04876518249511719, -0.043476104736328125, -0.03818702697753906, -0.03289794921875, -0.027608871459960938, -0.022319793701171875, -0.017030715942382812, -0.01174163818359375, -0.0064525604248046875, -0.001163482666015625, 0.0041255950927734375, 0.0094146728515625, 0.014703750610351562, 0.019992828369140625, 0.025281906127929688, 0.03057098388671875, 0.03586006164550781, 0.041149139404296875, 0.04643821716308594, 0.051727294921875, 0.05701637268066406, 0.062305450439453125, 0.06759452819824219, 0.07288360595703125, 0.07817268371582031, 0.08346176147460938, 0.08875083923339844, 0.0940399169921875, 0.09932899475097656, 0.10461807250976562, 0.10990715026855469, 0.11519622802734375, 0.12048530578613281, 0.12577438354492188, 0.13106346130371094, 0.1363525390625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 9.0, 26.0, 30.0, 52.0, 65.0, 82.0, 96.0, 105.0, 88.0, 97.0, 87.0, 75.0, 39.0, 56.0, 32.0, 29.0, 12.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031158447265625, -0.029558658599853516, -0.02795886993408203, -0.026359081268310547, -0.024759292602539062, -0.023159503936767578, -0.021559715270996094, -0.01995992660522461, -0.018360137939453125, -0.01676034927368164, -0.015160560607910156, -0.013560771942138672, -0.011960983276367188, -0.010361194610595703, -0.008761405944824219, -0.007161617279052734, -0.00556182861328125, -0.003962039947509766, -0.0023622512817382812, -0.0007624626159667969, 0.0008373260498046875, 0.002437114715576172, 0.004036903381347656, 0.005636692047119141, 0.007236480712890625, 0.00883626937866211, 0.010436058044433594, 0.012035846710205078, 0.013635635375976562, 0.015235424041748047, 0.01683521270751953, 0.018435001373291016, 0.0200347900390625, 0.021634578704833984, 0.02323436737060547, 0.024834156036376953, 0.026433944702148438, 0.028033733367919922, 0.029633522033691406, 0.03123331069946289, 0.032833099365234375, 0.03443288803100586, 0.036032676696777344, 0.03763246536254883, 0.03923225402832031, 0.0408320426940918, 0.04243183135986328, 0.044031620025634766, 0.04563140869140625, 0.047231197357177734, 0.04883098602294922, 0.0504307746887207, 0.05203056335449219, 0.05363035202026367, 0.055230140686035156, 0.05682992935180664, 0.058429718017578125, 0.06002950668334961, 0.061629295349121094, 0.06322908401489258, 0.06482887268066406, 0.06642866134643555, 0.06802845001220703, 0.06962823867797852, 0.07122802734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 7.0, 12.0, 17.0, 29.0, 51.0, 125.0, 277.0, 701.0, 1872.0, 7459.0, 58638.0, 3671825.0, 427866.0, 19862.0, 3679.0, 1078.0, 441.0, 172.0, 77.0, 43.0, 21.0, 7.0, 10.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1212158203125, -0.11700248718261719, -0.11278915405273438, -0.10857582092285156, -0.10436248779296875, -0.10014915466308594, -0.09593582153320312, -0.09172248840332031, -0.0875091552734375, -0.08329582214355469, -0.07908248901367188, -0.07486915588378906, -0.07065582275390625, -0.06644248962402344, -0.062229156494140625, -0.05801582336425781, -0.053802490234375, -0.04958915710449219, -0.045375823974609375, -0.04116249084472656, -0.03694915771484375, -0.03273582458496094, -0.028522491455078125, -0.024309158325195312, -0.0200958251953125, -0.015882492065429688, -0.011669158935546875, -0.0074558258056640625, -0.00324249267578125, 0.0009708404541015625, 0.005184173583984375, 0.009397506713867188, 0.01361083984375, 0.017824172973632812, 0.022037506103515625, 0.026250839233398438, 0.03046417236328125, 0.03467750549316406, 0.038890838623046875, 0.04310417175292969, 0.0473175048828125, 0.05153083801269531, 0.055744171142578125, 0.05995750427246094, 0.06417083740234375, 0.06838417053222656, 0.07259750366210938, 0.07681083679199219, 0.081024169921875, 0.08523750305175781, 0.08945083618164062, 0.09366416931152344, 0.09787750244140625, 0.10209083557128906, 0.10630416870117188, 0.11051750183105469, 0.1147308349609375, 0.11894416809082031, 0.12315750122070312, 0.12737083435058594, 0.13158416748046875, 0.13579750061035156, 0.14001083374023438, 0.1442241668701172, 0.1484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 5.0, 13.0, 21.0, 40.0, 80.0, 126.0, 325.0, 895.0, 1623.0, 488.0, 188.0, 85.0, 58.0, 33.0, 25.0, 9.0, 10.0, 7.0, 5.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.061614990234375, -0.060085296630859375, -0.05855560302734375, -0.057025909423828125, -0.0554962158203125, -0.053966522216796875, -0.05243682861328125, -0.050907135009765625, -0.04937744140625, -0.047847747802734375, -0.04631805419921875, -0.044788360595703125, -0.0432586669921875, -0.041728973388671875, -0.04019927978515625, -0.038669586181640625, -0.037139892578125, -0.035610198974609375, -0.03408050537109375, -0.032550811767578125, -0.0310211181640625, -0.029491424560546875, -0.02796173095703125, -0.026432037353515625, -0.02490234375, -0.023372650146484375, -0.02184295654296875, -0.020313262939453125, -0.0187835693359375, -0.017253875732421875, -0.01572418212890625, -0.014194488525390625, -0.012664794921875, -0.011135101318359375, -0.00960540771484375, -0.008075714111328125, -0.0065460205078125, -0.005016326904296875, -0.00348663330078125, -0.001956939697265625, -0.00042724609375, 0.001102447509765625, 0.00263214111328125, 0.004161834716796875, 0.0056915283203125, 0.007221221923828125, 0.00875091552734375, 0.010280609130859375, 0.011810302734375, 0.013339996337890625, 0.01486968994140625, 0.016399383544921875, 0.0179290771484375, 0.019458770751953125, 0.02098846435546875, 0.022518157958984375, 0.0240478515625, 0.025577545166015625, 0.02710723876953125, 0.028636932373046875, 0.0301666259765625, 0.031696319580078125, 0.03322601318359375, 0.034755706787109375, 0.036285400390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 13.0, 56.0, 294.0, 441.0, 165.0, 23.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7182180881500244, -0.695995032787323, -0.6737719774246216, -0.6515489220619202, -0.6293258666992188, -0.6071028113365173, -0.5848797559738159, -0.5626567006111145, -0.5404336452484131, -0.5182105898857117, -0.49598753452301025, -0.47376447916030884, -0.4515414237976074, -0.429318368434906, -0.4070953130722046, -0.3848722577095032, -0.36264923214912415, -0.34042617678642273, -0.3182031214237213, -0.2959800660610199, -0.2737570106983185, -0.25153395533561707, -0.22931091487407684, -0.20708785951137543, -0.184864804148674, -0.1626417487859726, -0.14041869342327118, -0.11819564551115036, -0.09597259014844894, -0.07374953478574753, -0.05152648687362671, -0.029303431510925293, -0.007080376148223877, 0.01514267735183239, 0.03736573085188866, 0.059588782489299774, 0.08181183785200119, 0.1040348932147026, 0.12625794112682343, 0.14848099648952484, 0.17070405185222626, 0.19292710721492767, 0.2151501625776291, 0.2373732030391693, 0.2595962584018707, 0.28181931376457214, 0.30404236912727356, 0.326265424489975, 0.3484884798526764, 0.3707115352153778, 0.3929345905780792, 0.41515764594078064, 0.43738070130348206, 0.45960375666618347, 0.4818267822265625, 0.5040498375892639, 0.5262728929519653, 0.5484959483146667, 0.5707190036773682, 0.5929420590400696, 0.615165114402771, 0.6373881697654724, 0.6596112251281738, 0.6818342804908752, 0.7040573358535767]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 14.0, 16.0, 16.0, 34.0, 25.0, 52.0, 39.0, 44.0, 50.0, 55.0, 72.0, 60.0, 66.0, 61.0, 55.0, 58.0, 48.0, 53.0, 47.0, 41.0, 21.0, 20.0, 12.0, 15.0, 5.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.198777437210083, -0.19283360242843628, -0.18688976764678955, -0.18094593286514282, -0.1750021129846573, -0.16905827820301056, -0.16311444342136383, -0.1571706086397171, -0.15122678875923157, -0.14528295397758484, -0.1393391191959381, -0.13339528441429138, -0.12745146453380585, -0.12150762975215912, -0.11556379497051239, -0.10961996018886566, -0.10367612540721893, -0.0977322906255722, -0.09178846329450607, -0.08584462851285934, -0.07990080118179321, -0.07395696640014648, -0.06801313161849976, -0.062069300562143326, -0.056125469505786896, -0.050181638449430466, -0.044237807393074036, -0.03829397261142731, -0.03235014155507088, -0.026406310498714447, -0.02046247571706772, -0.014518644660711288, -0.008574813604354858, -0.0026309816166758537, 0.003312850371003151, 0.00925668329000473, 0.01520051434636116, 0.02114434540271759, 0.02708818018436432, 0.03303201124072075, 0.03897584229707718, 0.04491967335343361, 0.05086350440979004, 0.05680733919143677, 0.0627511739730835, 0.06869500130414963, 0.07463883608579636, 0.08058266341686249, 0.08652649819850922, 0.09247033298015594, 0.09841416031122208, 0.1043579950928688, 0.11030182242393494, 0.11624565720558167, 0.1221894919872284, 0.12813332676887512, 0.13407716155052185, 0.14002099633216858, 0.1459648311138153, 0.15190866589546204, 0.15785248577594757, 0.1637963205575943, 0.16974015533924103, 0.17568399012088776, 0.1816278100013733]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 10.0, 8.0, 7.0, 14.0, 18.0, 40.0, 43.0, 84.0, 128.0, 240.0, 496.0, 1053.0, 2696.0, 8326.0, 37761.0, 302162.0, 596829.0, 78073.0, 13841.0, 3893.0, 1437.0, 632.0, 334.0, 154.0, 105.0, 61.0, 40.0, 25.0, 14.0, 4.0, 12.0, 4.0, 4.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.137939453125, -0.13378334045410156, -0.12962722778320312, -0.1254711151123047, -0.12131500244140625, -0.11715888977050781, -0.11300277709960938, -0.10884666442871094, -0.1046905517578125, -0.10053443908691406, -0.09637832641601562, -0.09222221374511719, -0.08806610107421875, -0.08390998840332031, -0.07975387573242188, -0.07559776306152344, -0.071441650390625, -0.06728553771972656, -0.06312942504882812, -0.05897331237792969, -0.05481719970703125, -0.05066108703613281, -0.046504974365234375, -0.04234886169433594, -0.0381927490234375, -0.03403663635253906, -0.029880523681640625, -0.025724411010742188, -0.02156829833984375, -0.017412185668945312, -0.013256072998046875, -0.009099960327148438, -0.00494384765625, -0.0007877349853515625, 0.003368377685546875, 0.0075244903564453125, 0.01168060302734375, 0.015836715698242188, 0.019992828369140625, 0.024148941040039062, 0.0283050537109375, 0.03246116638183594, 0.036617279052734375, 0.04077339172363281, 0.04492950439453125, 0.04908561706542969, 0.053241729736328125, 0.05739784240722656, 0.061553955078125, 0.06571006774902344, 0.06986618041992188, 0.07402229309082031, 0.07817840576171875, 0.08233451843261719, 0.08649063110351562, 0.09064674377441406, 0.0948028564453125, 0.09895896911621094, 0.10311508178710938, 0.10727119445800781, 0.11142730712890625, 0.11558341979980469, 0.11973953247070312, 0.12389564514160156, 0.1280517578125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 11.0, 18.0, 28.0, 41.0, 55.0, 54.0, 81.0, 83.0, 97.0, 93.0, 84.0, 92.0, 73.0, 50.0, 42.0, 40.0, 22.0, 10.0, 8.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02899169921875, -0.027495384216308594, -0.025999069213867188, -0.02450275421142578, -0.023006439208984375, -0.02151012420654297, -0.020013809204101562, -0.018517494201660156, -0.01702117919921875, -0.015524864196777344, -0.014028549194335938, -0.012532234191894531, -0.011035919189453125, -0.009539604187011719, -0.008043289184570312, -0.006546974182128906, -0.0050506591796875, -0.0035543441772460938, -0.0020580291748046875, -0.0005617141723632812, 0.000934600830078125, 0.0024309158325195312, 0.0039272308349609375, 0.005423545837402344, 0.00691986083984375, 0.008416175842285156, 0.009912490844726562, 0.011408805847167969, 0.012905120849609375, 0.014401435852050781, 0.015897750854492188, 0.017394065856933594, 0.018890380859375, 0.020386695861816406, 0.021883010864257812, 0.02337932586669922, 0.024875640869140625, 0.02637195587158203, 0.027868270874023438, 0.029364585876464844, 0.03086090087890625, 0.032357215881347656, 0.03385353088378906, 0.03534984588623047, 0.036846160888671875, 0.03834247589111328, 0.03983879089355469, 0.041335105895996094, 0.0428314208984375, 0.044327735900878906, 0.04582405090332031, 0.04732036590576172, 0.048816680908203125, 0.05031299591064453, 0.05180931091308594, 0.053305625915527344, 0.05480194091796875, 0.056298255920410156, 0.05779457092285156, 0.05929088592529297, 0.060787200927734375, 0.06228351593017578, 0.06377983093261719, 0.0652761459350586, 0.0667724609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 4.0, 3.0, 10.0, 8.0, 16.0, 10.0, 14.0, 13.0, 14.0, 30.0, 32.0, 55.0, 59.0, 96.0, 134.0, 197.0, 391.0, 819.0, 1774.0, 4756.0, 15514.0, 60646.0, 308179.0, 504028.0, 113149.0, 25951.0, 7598.0, 2642.0, 1063.0, 497.0, 262.0, 177.0, 113.0, 70.0, 57.0, 41.0, 31.0, 26.0, 15.0, 14.0, 10.0, 6.0, 9.0, 3.0, 8.0, 2.0, 6.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.07952880859375, -0.0772695541381836, -0.07501029968261719, -0.07275104522705078, -0.07049179077148438, -0.06823253631591797, -0.06597328186035156, -0.06371402740478516, -0.06145477294921875, -0.059195518493652344, -0.05693626403808594, -0.05467700958251953, -0.052417755126953125, -0.05015850067138672, -0.04789924621582031, -0.045639991760253906, -0.0433807373046875, -0.041121482849121094, -0.03886222839355469, -0.03660297393798828, -0.034343719482421875, -0.03208446502685547, -0.029825210571289062, -0.027565956115722656, -0.02530670166015625, -0.023047447204589844, -0.020788192749023438, -0.01852893829345703, -0.016269683837890625, -0.014010429382324219, -0.011751174926757812, -0.009491920471191406, -0.007232666015625, -0.004973411560058594, -0.0027141571044921875, -0.00045490264892578125, 0.001804351806640625, 0.004063606262207031, 0.0063228607177734375, 0.008582115173339844, 0.01084136962890625, 0.013100624084472656, 0.015359878540039062, 0.01761913299560547, 0.019878387451171875, 0.02213764190673828, 0.024396896362304688, 0.026656150817871094, 0.0289154052734375, 0.031174659729003906, 0.03343391418457031, 0.03569316864013672, 0.037952423095703125, 0.04021167755126953, 0.04247093200683594, 0.044730186462402344, 0.04698944091796875, 0.049248695373535156, 0.05150794982910156, 0.05376720428466797, 0.056026458740234375, 0.05828571319580078, 0.06054496765136719, 0.0628042221069336, 0.0650634765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 3.0, 6.0, 4.0, 12.0, 12.0, 14.0, 22.0, 24.0, 21.0, 28.0, 28.0, 41.0, 38.0, 49.0, 48.0, 43.0, 63.0, 50.0, 64.0, 47.0, 50.0, 41.0, 55.0, 43.0, 21.0, 34.0, 28.0, 25.0, 19.0, 15.0, 8.0, 11.0, 9.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10809326171875, -0.10470199584960938, -0.10131072998046875, -0.09791946411132812, -0.0945281982421875, -0.09113693237304688, -0.08774566650390625, -0.08435440063476562, -0.080963134765625, -0.07757186889648438, -0.07418060302734375, -0.07078933715820312, -0.0673980712890625, -0.06400680541992188, -0.06061553955078125, -0.057224273681640625, -0.0538330078125, -0.050441741943359375, -0.04705047607421875, -0.043659210205078125, -0.0402679443359375, -0.036876678466796875, -0.03348541259765625, -0.030094146728515625, -0.026702880859375, -0.023311614990234375, -0.01992034912109375, -0.016529083251953125, -0.0131378173828125, -0.009746551513671875, -0.00635528564453125, -0.002964019775390625, 0.00042724609375, 0.003818511962890625, 0.00720977783203125, 0.010601043701171875, 0.0139923095703125, 0.017383575439453125, 0.02077484130859375, 0.024166107177734375, 0.027557373046875, 0.030948638916015625, 0.03433990478515625, 0.037731170654296875, 0.0411224365234375, 0.044513702392578125, 0.04790496826171875, 0.051296234130859375, 0.0546875, 0.058078765869140625, 0.06147003173828125, 0.06486129760742188, 0.0682525634765625, 0.07164382934570312, 0.07503509521484375, 0.07842636108398438, 0.081817626953125, 0.08520889282226562, 0.08860015869140625, 0.09199142456054688, 0.0953826904296875, 0.09877395629882812, 0.10216522216796875, 0.10555648803710938, 0.10894775390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 30.0, 30.0, 82.0, 200.0, 423.0, 1356.0, 15895.0, 974036.0, 53449.0, 2101.0, 533.0, 217.0, 104.0, 55.0, 19.0, 8.0, 9.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1171875, -0.11370277404785156, -0.11021804809570312, -0.10673332214355469, -0.10324859619140625, -0.09976387023925781, -0.09627914428710938, -0.09279441833496094, -0.0893096923828125, -0.08582496643066406, -0.08234024047851562, -0.07885551452636719, -0.07537078857421875, -0.07188606262207031, -0.06840133666992188, -0.06491661071777344, -0.061431884765625, -0.05794715881347656, -0.054462432861328125, -0.05097770690917969, -0.04749298095703125, -0.04400825500488281, -0.040523529052734375, -0.03703880310058594, -0.0335540771484375, -0.030069351196289062, -0.026584625244140625, -0.023099899291992188, -0.01961517333984375, -0.016130447387695312, -0.012645721435546875, -0.009160995483398438, -0.00567626953125, -0.0021915435791015625, 0.001293182373046875, 0.0047779083251953125, 0.00826263427734375, 0.011747360229492188, 0.015232086181640625, 0.018716812133789062, 0.0222015380859375, 0.025686264038085938, 0.029170989990234375, 0.03265571594238281, 0.03614044189453125, 0.03962516784667969, 0.043109893798828125, 0.04659461975097656, 0.050079345703125, 0.05356407165527344, 0.057048797607421875, 0.06053352355957031, 0.06401824951171875, 0.06750297546386719, 0.07098770141601562, 0.07447242736816406, 0.0779571533203125, 0.08144187927246094, 0.08492660522460938, 0.08841133117675781, 0.09189605712890625, 0.09538078308105469, 0.09886550903320312, 0.10235023498535156, 0.1058349609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 5.0, 5.0, 9.0, 9.0, 28.0, 18.0, 19.0, 27.0, 36.0, 42.0, 41.0, 80.0, 78.0, 53.0, 62.0, 92.0, 62.0, 48.0, 52.0, 63.0, 39.0, 32.0, 40.0, 17.0, 5.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-06, -5.168840289115906e-06, -4.973262548446655e-06, -4.777684807777405e-06, -4.582107067108154e-06, -4.386529326438904e-06, -4.190951585769653e-06, -3.995373845100403e-06, -3.7997961044311523e-06, -3.604218363761902e-06, -3.4086406230926514e-06, -3.213062882423401e-06, -3.0174851417541504e-06, -2.8219074010849e-06, -2.6263296604156494e-06, -2.430751919746399e-06, -2.2351741790771484e-06, -2.039596438407898e-06, -1.8440186977386475e-06, -1.648440957069397e-06, -1.4528632164001465e-06, -1.257285475730896e-06, -1.0617077350616455e-06, -8.66129994392395e-07, -6.705522537231445e-07, -4.7497451305389404e-07, -2.7939677238464355e-07, -8.381903171539307e-08, 1.1175870895385742e-07, 3.073364496231079e-07, 5.029141902923584e-07, 6.984919309616089e-07, 8.940696716308594e-07, 1.0896474123001099e-06, 1.2852251529693604e-06, 1.4808028936386108e-06, 1.6763806343078613e-06, 1.8719583749771118e-06, 2.0675361156463623e-06, 2.263113856315613e-06, 2.4586915969848633e-06, 2.6542693376541138e-06, 2.8498470783233643e-06, 3.0454248189926147e-06, 3.2410025596618652e-06, 3.4365803003311157e-06, 3.632158041000366e-06, 3.827735781669617e-06, 4.023313522338867e-06, 4.218891263008118e-06, 4.414469003677368e-06, 4.610046744346619e-06, 4.805624485015869e-06, 5.00120222568512e-06, 5.19677996635437e-06, 5.392357707023621e-06, 5.587935447692871e-06, 5.783513188362122e-06, 5.979090929031372e-06, 6.1746686697006226e-06, 6.370246410369873e-06, 6.5658241510391235e-06, 6.761401891708374e-06, 6.9569796323776245e-06, 7.152557373046875e-06]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 8.0, 12.0, 28.0, 57.0, 137.0, 320.0, 1545.0, 22940.0, 940554.0, 79405.0, 2723.0, 479.0, 187.0, 93.0, 32.0, 15.0, 11.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.065673828125, -0.06263923645019531, -0.059604644775390625, -0.05657005310058594, -0.05353546142578125, -0.05050086975097656, -0.047466278076171875, -0.04443168640136719, -0.0413970947265625, -0.03836250305175781, -0.035327911376953125, -0.03229331970214844, -0.02925872802734375, -0.026224136352539062, -0.023189544677734375, -0.020154953002929688, -0.017120361328125, -0.014085769653320312, -0.011051177978515625, -0.008016586303710938, -0.00498199462890625, -0.0019474029541015625, 0.001087188720703125, 0.0041217803955078125, 0.0071563720703125, 0.010190963745117188, 0.013225555419921875, 0.016260147094726562, 0.01929473876953125, 0.022329330444335938, 0.025363922119140625, 0.028398513793945312, 0.03143310546875, 0.03446769714355469, 0.037502288818359375, 0.04053688049316406, 0.04357147216796875, 0.04660606384277344, 0.049640655517578125, 0.05267524719238281, 0.0557098388671875, 0.05874443054199219, 0.061779022216796875, 0.06481361389160156, 0.06784820556640625, 0.07088279724121094, 0.07391738891601562, 0.07695198059082031, 0.079986572265625, 0.08302116394042969, 0.08605575561523438, 0.08909034729003906, 0.09212493896484375, 0.09515953063964844, 0.09819412231445312, 0.10122871398925781, 0.1042633056640625, 0.10729789733886719, 0.11033248901367188, 0.11336708068847656, 0.11640167236328125, 0.11943626403808594, 0.12247085571289062, 0.1255054473876953, 0.1285400390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 12.0, 5.0, 19.0, 28.0, 63.0, 114.0, 160.0, 211.0, 164.0, 103.0, 68.0, 30.0, 16.0, 14.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04278564453125, -0.040340423583984375, -0.03789520263671875, -0.035449981689453125, -0.0330047607421875, -0.030559539794921875, -0.02811431884765625, -0.025669097900390625, -0.023223876953125, -0.020778656005859375, -0.01833343505859375, -0.015888214111328125, -0.0134429931640625, -0.010997772216796875, -0.00855255126953125, -0.006107330322265625, -0.003662109375, -0.001216888427734375, 0.00122833251953125, 0.003673553466796875, 0.0061187744140625, 0.008563995361328125, 0.01100921630859375, 0.013454437255859375, 0.015899658203125, 0.018344879150390625, 0.02079010009765625, 0.023235321044921875, 0.0256805419921875, 0.028125762939453125, 0.03057098388671875, 0.033016204833984375, 0.03546142578125, 0.037906646728515625, 0.04035186767578125, 0.042797088623046875, 0.0452423095703125, 0.047687530517578125, 0.05013275146484375, 0.052577972412109375, 0.055023193359375, 0.057468414306640625, 0.05991363525390625, 0.062358856201171875, 0.0648040771484375, 0.06724929809570312, 0.06969451904296875, 0.07213973999023438, 0.0745849609375, 0.07703018188476562, 0.07947540283203125, 0.08192062377929688, 0.0843658447265625, 0.08681106567382812, 0.08925628662109375, 0.09170150756835938, 0.094146728515625, 0.09659194946289062, 0.09903717041015625, 0.10148239135742188, 0.1039276123046875, 0.10637283325195312, 0.10881805419921875, 0.11126327514648438, 0.11370849609375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 18.0, 39.0, 241.0, 508.0, 176.0, 22.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.541692018508911, -2.487039089202881, -2.4323861598968506, -2.377732992172241, -2.323080062866211, -2.2684271335601807, -2.2137742042541504, -2.159121036529541, -2.1044681072235107, -2.0498151779174805, -1.9951621294021606, -1.9405092000961304, -1.8858561515808105, -1.8312032222747803, -1.7765501737594604, -1.7218972444534302, -1.6672441959381104, -1.61259126663208, -1.5579382181167603, -1.50328528881073, -1.4486322402954102, -1.3939793109893799, -1.33932626247406, -1.2846733331680298, -1.2300204038619995, -1.1753674745559692, -1.1207144260406494, -1.0660614967346191, -1.0114084482192993, -0.956755518913269, -0.9021024703979492, -0.847449541091919, -0.7927964329719543, -0.7381434440612793, -0.6834904551506042, -0.6288374662399292, -0.5741844773292542, -0.5195314884185791, -0.46487852931022644, -0.4102255403995514, -0.35557255148887634, -0.3009195625782013, -0.24626657366752625, -0.1916135996580124, -0.13696061074733734, -0.08230763673782349, -0.027654647827148438, 0.02699834108352661, 0.08165132999420166, 0.1363043189048767, 0.19095730781555176, 0.2456102818250656, 0.30026328563690186, 0.3549162447452545, 0.40956923365592957, 0.4642222225666046, 0.518875241279602, 0.5735282301902771, 0.6281812191009521, 0.6828342080116272, 0.7374871969223022, 0.7921401262283325, 0.8467931747436523, 0.9014461040496826, 0.9560990929603577]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 8.0, 6.0, 12.0, 14.0, 13.0, 19.0, 24.0, 22.0, 38.0, 29.0, 35.0, 41.0, 47.0, 42.0, 60.0, 44.0, 46.0, 55.0, 39.0, 35.0, 49.0, 42.0, 44.0, 41.0, 43.0, 26.0, 18.0, 28.0, 20.0, 8.0, 10.0, 15.0, 10.0, 4.0, 2.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5508550405502319, -0.5348794460296631, -0.5189037919044495, -0.5029281973838806, -0.486952543258667, -0.47097694873809814, -0.4550013244152069, -0.4390257000923157, -0.42305007576942444, -0.4070744514465332, -0.39109882712364197, -0.37512320280075073, -0.3591476082801819, -0.34317195415496826, -0.3271963596343994, -0.3112207353115082, -0.29524511098861694, -0.2792694866657257, -0.2632938623428345, -0.24731825292110443, -0.2313426285982132, -0.21536700427532196, -0.19939139485359192, -0.18341577053070068, -0.16744014620780945, -0.1514645218849182, -0.13548889756202698, -0.11951328814029694, -0.1035376638174057, -0.08756203949451447, -0.07158642262220383, -0.05561080574989319, -0.03963512182235718, -0.02365950122475624, -0.007683880627155304, 0.008291739970445633, 0.02426736056804657, 0.040242984890937805, 0.056218601763248444, 0.07219421863555908, 0.08816984295845032, 0.10414546728134155, 0.12012108415365219, 0.13609670102596283, 0.15207232534885406, 0.1680479496717453, 0.18402355909347534, 0.19999918341636658, 0.2159748077392578, 0.23195043206214905, 0.24792605638504028, 0.2639016807079315, 0.27987730503082275, 0.2958528995513916, 0.31182852387428284, 0.3278041481971741, 0.3437797725200653, 0.35975539684295654, 0.3757310211658478, 0.391706645488739, 0.40768224000930786, 0.4236578941345215, 0.43963348865509033, 0.45560911297798157, 0.4715847373008728]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 15.0, 22.0, 39.0, 48.0, 73.0, 149.0, 322.0, 677.0, 1471.0, 3532.0, 11384.0, 63202.0, 3617098.0, 454786.0, 29644.0, 7083.0, 2506.0, 1075.0, 489.0, 266.0, 133.0, 76.0, 48.0, 42.0, 23.0, 12.0, 11.0, 12.0, 6.0, 6.0, 5.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08038330078125, -0.07700824737548828, -0.07363319396972656, -0.07025814056396484, -0.06688308715820312, -0.0635080337524414, -0.06013298034667969, -0.05675792694091797, -0.05338287353515625, -0.05000782012939453, -0.04663276672363281, -0.043257713317871094, -0.039882659912109375, -0.036507606506347656, -0.03313255310058594, -0.02975749969482422, -0.0263824462890625, -0.02300739288330078, -0.019632339477539062, -0.016257286071777344, -0.012882232666015625, -0.009507179260253906, -0.0061321258544921875, -0.0027570724487304688, 0.00061798095703125, 0.003993034362792969, 0.0073680877685546875, 0.010743141174316406, 0.014118194580078125, 0.017493247985839844, 0.020868301391601562, 0.02424335479736328, 0.027618408203125, 0.03099346160888672, 0.03436851501464844, 0.037743568420410156, 0.041118621826171875, 0.044493675231933594, 0.04786872863769531, 0.05124378204345703, 0.05461883544921875, 0.05799388885498047, 0.06136894226074219, 0.0647439956665039, 0.06811904907226562, 0.07149410247802734, 0.07486915588378906, 0.07824420928955078, 0.0816192626953125, 0.08499431610107422, 0.08836936950683594, 0.09174442291259766, 0.09511947631835938, 0.0984945297241211, 0.10186958312988281, 0.10524463653564453, 0.10861968994140625, 0.11199474334716797, 0.11536979675292969, 0.1187448501586914, 0.12211990356445312, 0.12549495697021484, 0.12887001037597656, 0.13224506378173828, 0.1356201171875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 9.0, 18.0, 26.0, 41.0, 55.0, 74.0, 81.0, 91.0, 93.0, 98.0, 90.0, 84.0, 63.0, 61.0, 44.0, 22.0, 20.0, 12.0, 5.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03167724609375, -0.03009796142578125, -0.0285186767578125, -0.02693939208984375, -0.025360107421875, -0.02378082275390625, -0.0222015380859375, -0.02062225341796875, -0.01904296875, -0.01746368408203125, -0.0158843994140625, -0.01430511474609375, -0.012725830078125, -0.01114654541015625, -0.0095672607421875, -0.00798797607421875, -0.00640869140625, -0.00482940673828125, -0.0032501220703125, -0.00167083740234375, -9.1552734375e-05, 0.00148773193359375, 0.0030670166015625, 0.00464630126953125, 0.0062255859375, 0.00780487060546875, 0.0093841552734375, 0.01096343994140625, 0.012542724609375, 0.01412200927734375, 0.0157012939453125, 0.01728057861328125, 0.01885986328125, 0.02043914794921875, 0.0220184326171875, 0.02359771728515625, 0.025177001953125, 0.02675628662109375, 0.0283355712890625, 0.02991485595703125, 0.031494140625, 0.03307342529296875, 0.0346527099609375, 0.03623199462890625, 0.037811279296875, 0.03939056396484375, 0.0409698486328125, 0.04254913330078125, 0.04412841796875, 0.04570770263671875, 0.0472869873046875, 0.04886627197265625, 0.050445556640625, 0.05202484130859375, 0.0536041259765625, 0.05518341064453125, 0.0567626953125, 0.05834197998046875, 0.0599212646484375, 0.06150054931640625, 0.063079833984375, 0.06465911865234375, 0.0662384033203125, 0.06781768798828125, 0.06939697265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 6.0, 16.0, 19.0, 31.0, 53.0, 95.0, 150.0, 240.0, 438.0, 824.0, 1798.0, 5451.0, 28889.0, 1034281.0, 3073756.0, 38063.0, 6493.0, 1910.0, 853.0, 375.0, 219.0, 119.0, 65.0, 47.0, 30.0, 25.0, 10.0, 5.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.138671875, -0.13482666015625, -0.1309814453125, -0.12713623046875, -0.123291015625, -0.11944580078125, -0.1156005859375, -0.11175537109375, -0.10791015625, -0.10406494140625, -0.1002197265625, -0.09637451171875, -0.092529296875, -0.08868408203125, -0.0848388671875, -0.08099365234375, -0.0771484375, -0.07330322265625, -0.0694580078125, -0.06561279296875, -0.061767578125, -0.05792236328125, -0.0540771484375, -0.05023193359375, -0.04638671875, -0.04254150390625, -0.0386962890625, -0.03485107421875, -0.031005859375, -0.02716064453125, -0.0233154296875, -0.01947021484375, -0.015625, -0.01177978515625, -0.0079345703125, -0.00408935546875, -0.000244140625, 0.00360107421875, 0.0074462890625, 0.01129150390625, 0.01513671875, 0.01898193359375, 0.0228271484375, 0.02667236328125, 0.030517578125, 0.03436279296875, 0.0382080078125, 0.04205322265625, 0.0458984375, 0.04974365234375, 0.0535888671875, 0.05743408203125, 0.061279296875, 0.06512451171875, 0.0689697265625, 0.07281494140625, 0.07666015625, 0.08050537109375, 0.0843505859375, 0.08819580078125, 0.092041015625, 0.09588623046875, 0.0997314453125, 0.10357666015625, 0.107421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 10.0, 2.0, 17.0, 27.0, 41.0, 71.0, 228.0, 1168.0, 1908.0, 340.0, 119.0, 67.0, 30.0, 13.0, 10.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0792236328125, -0.07750511169433594, -0.07578659057617188, -0.07406806945800781, -0.07234954833984375, -0.07063102722167969, -0.06891250610351562, -0.06719398498535156, -0.0654754638671875, -0.06375694274902344, -0.062038421630859375, -0.06031990051269531, -0.05860137939453125, -0.05688285827636719, -0.055164337158203125, -0.05344581604003906, -0.051727294921875, -0.05000877380371094, -0.048290252685546875, -0.04657173156738281, -0.04485321044921875, -0.04313468933105469, -0.041416168212890625, -0.03969764709472656, -0.0379791259765625, -0.03626060485839844, -0.034542083740234375, -0.03282356262207031, -0.03110504150390625, -0.029386520385742188, -0.027667999267578125, -0.025949478149414062, -0.02423095703125, -0.022512435913085938, -0.020793914794921875, -0.019075393676757812, -0.01735687255859375, -0.015638351440429688, -0.013919830322265625, -0.012201309204101562, -0.0104827880859375, -0.008764266967773438, -0.007045745849609375, -0.0053272247314453125, -0.00360870361328125, -0.0018901824951171875, -0.000171661376953125, 0.0015468597412109375, 0.003265380859375, 0.0049839019775390625, 0.006702423095703125, 0.008420944213867188, 0.01013946533203125, 0.011857986450195312, 0.013576507568359375, 0.015295028686523438, 0.0170135498046875, 0.018732070922851562, 0.020450592041015625, 0.022169113159179688, 0.02388763427734375, 0.025606155395507812, 0.027324676513671875, 0.029043197631835938, 0.03076171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 60.0, 325.0, 438.0, 137.0, 16.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5238268375396729, -0.5045003890991211, -0.48517388105392456, -0.4658474028110504, -0.44652092456817627, -0.4271944761276245, -0.40786799788475037, -0.3885415196418762, -0.3692150413990021, -0.34988856315612793, -0.3305620849132538, -0.31123560667037964, -0.2919091582298279, -0.27258265018463135, -0.2532562017440796, -0.23392972350120544, -0.2146032452583313, -0.19527676701545715, -0.175950288772583, -0.15662382543087006, -0.1372973471879959, -0.11797086894512177, -0.09864439815282822, -0.07931792736053467, -0.05999144911766052, -0.040664974600076675, -0.02133850008249283, -0.0020120255649089813, 0.017314448952674866, 0.03664092719554901, 0.05596739798784256, 0.07529386878013611, 0.09462034702301025, 0.1139468252658844, 0.13327330350875854, 0.1525997668504715, 0.17192624509334564, 0.1912527233362198, 0.21057918667793274, 0.22990566492080688, 0.24923214316368103, 0.2685586214065552, 0.2878850996494293, 0.30721157789230347, 0.3265380263328552, 0.34586453437805176, 0.3651909828186035, 0.38451746106147766, 0.4038439393043518, 0.42317041754722595, 0.4424968957901001, 0.46182337403297424, 0.4811498522758484, 0.5004763007164001, 0.5198028087615967, 0.5391292572021484, 0.5584557056427002, 0.577782154083252, 0.5971086621284485, 0.6164351105690002, 0.6357616186141968, 0.6550880670547485, 0.6744145750999451, 0.6937410235404968, 0.7130675315856934]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 9.0, 11.0, 17.0, 33.0, 37.0, 45.0, 49.0, 59.0, 75.0, 71.0, 100.0, 88.0, 69.0, 62.0, 70.0, 47.0, 40.0, 28.0, 23.0, 19.0, 17.0, 9.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.21144795417785645, -0.2060057371854782, -0.20056352019309998, -0.19512128829956055, -0.1896790713071823, -0.18423685431480408, -0.17879462242126465, -0.1733524054288864, -0.16791018843650818, -0.16246797144412994, -0.1570257544517517, -0.15158352255821228, -0.14614130556583405, -0.1406990885734558, -0.13525685667991638, -0.12981463968753815, -0.12437242269515991, -0.11893020570278168, -0.11348798125982285, -0.10804575681686401, -0.10260353982448578, -0.09716132283210754, -0.09171909838914871, -0.08627687394618988, -0.08083465695381165, -0.07539243996143341, -0.06995021551847458, -0.06450799107551575, -0.05906577408313751, -0.05362355336546898, -0.048181332647800446, -0.04273911193013191, -0.03729689121246338, -0.031854670494794846, -0.026412449777126312, -0.02097022905945778, -0.015528008341789246, -0.010085787624120712, -0.004643566906452179, 0.0007986538112163544, 0.006240874528884888, 0.011683095246553421, 0.017125315964221954, 0.022567536681890488, 0.02800975739955902, 0.033451978117227554, 0.03889419883489609, 0.04433641955256462, 0.049778640270233154, 0.05522086098790169, 0.06066308170557022, 0.06610530614852905, 0.07154752314090729, 0.07698974013328552, 0.08243196457624435, 0.08787418901920319, 0.09331640601158142, 0.09875862300395966, 0.10420084744691849, 0.10964307188987732, 0.11508528888225555, 0.12052750587463379, 0.12596973776817322, 0.13141195476055145, 0.1368541717529297]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 6.0, 10.0, 10.0, 23.0, 28.0, 36.0, 63.0, 107.0, 181.0, 333.0, 712.0, 1798.0, 5375.0, 23055.0, 154103.0, 633158.0, 191959.0, 27756.0, 6244.0, 1962.0, 789.0, 356.0, 185.0, 108.0, 65.0, 45.0, 31.0, 19.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0904541015625, -0.08704757690429688, -0.08364105224609375, -0.08023452758789062, -0.0768280029296875, -0.07342147827148438, -0.07001495361328125, -0.06660842895507812, -0.063201904296875, -0.059795379638671875, -0.05638885498046875, -0.052982330322265625, -0.0495758056640625, -0.046169281005859375, -0.04276275634765625, -0.039356231689453125, -0.03594970703125, -0.032543182373046875, -0.02913665771484375, -0.025730133056640625, -0.0223236083984375, -0.018917083740234375, -0.01551055908203125, -0.012104034423828125, -0.008697509765625, -0.005290985107421875, -0.00188446044921875, 0.001522064208984375, 0.0049285888671875, 0.008335113525390625, 0.01174163818359375, 0.015148162841796875, 0.0185546875, 0.021961212158203125, 0.02536773681640625, 0.028774261474609375, 0.0321807861328125, 0.035587310791015625, 0.03899383544921875, 0.042400360107421875, 0.045806884765625, 0.049213409423828125, 0.05261993408203125, 0.056026458740234375, 0.0594329833984375, 0.06283950805664062, 0.06624603271484375, 0.06965255737304688, 0.07305908203125, 0.07646560668945312, 0.07987213134765625, 0.08327865600585938, 0.0866851806640625, 0.09009170532226562, 0.09349822998046875, 0.09690475463867188, 0.100311279296875, 0.10371780395507812, 0.10712432861328125, 0.11053085327148438, 0.1139373779296875, 0.11734390258789062, 0.12075042724609375, 0.12415695190429688, 0.1275634765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 11.0, 11.0, 19.0, 45.0, 38.0, 79.0, 60.0, 73.0, 84.0, 94.0, 98.0, 82.0, 69.0, 63.0, 54.0, 44.0, 23.0, 18.0, 13.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030426025390625, -0.02895975112915039, -0.02749347686767578, -0.026027202606201172, -0.024560928344726562, -0.023094654083251953, -0.021628379821777344, -0.020162105560302734, -0.018695831298828125, -0.017229557037353516, -0.015763282775878906, -0.014297008514404297, -0.012830734252929688, -0.011364459991455078, -0.009898185729980469, -0.00843191146850586, -0.00696563720703125, -0.005499362945556641, -0.004033088684082031, -0.002566814422607422, -0.0011005401611328125, 0.0003657341003417969, 0.0018320083618164062, 0.0032982826232910156, 0.004764556884765625, 0.006230831146240234, 0.007697105407714844, 0.009163379669189453, 0.010629653930664062, 0.012095928192138672, 0.013562202453613281, 0.01502847671508789, 0.0164947509765625, 0.01796102523803711, 0.01942729949951172, 0.020893573760986328, 0.022359848022460938, 0.023826122283935547, 0.025292396545410156, 0.026758670806884766, 0.028224945068359375, 0.029691219329833984, 0.031157493591308594, 0.0326237678527832, 0.03409004211425781, 0.03555631637573242, 0.03702259063720703, 0.03848886489868164, 0.03995513916015625, 0.04142141342163086, 0.04288768768310547, 0.04435396194458008, 0.04582023620605469, 0.0472865104675293, 0.048752784729003906, 0.050219058990478516, 0.051685333251953125, 0.053151607513427734, 0.054617881774902344, 0.05608415603637695, 0.05755043029785156, 0.05901670455932617, 0.06048297882080078, 0.06194925308227539, 0.06341552734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 5.0, 4.0, 12.0, 13.0, 10.0, 17.0, 27.0, 23.0, 39.0, 52.0, 83.0, 136.0, 203.0, 405.0, 1245.0, 4032.0, 16476.0, 81739.0, 405892.0, 426153.0, 87995.0, 17437.0, 4240.0, 1295.0, 435.0, 211.0, 101.0, 75.0, 41.0, 45.0, 31.0, 22.0, 16.0, 4.0, 8.0, 9.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0809326171875, -0.07868576049804688, -0.07643890380859375, -0.07419204711914062, -0.0719451904296875, -0.06969833374023438, -0.06745147705078125, -0.06520462036132812, -0.062957763671875, -0.060710906982421875, -0.05846405029296875, -0.056217193603515625, -0.0539703369140625, -0.051723480224609375, -0.04947662353515625, -0.047229766845703125, -0.04498291015625, -0.042736053466796875, -0.04048919677734375, -0.038242340087890625, -0.0359954833984375, -0.033748626708984375, -0.03150177001953125, -0.029254913330078125, -0.027008056640625, -0.024761199951171875, -0.02251434326171875, -0.020267486572265625, -0.0180206298828125, -0.015773773193359375, -0.01352691650390625, -0.011280059814453125, -0.009033203125, -0.006786346435546875, -0.00453948974609375, -0.002292633056640625, -4.57763671875e-05, 0.002201080322265625, 0.00444793701171875, 0.006694793701171875, 0.008941650390625, 0.011188507080078125, 0.01343536376953125, 0.015682220458984375, 0.0179290771484375, 0.020175933837890625, 0.02242279052734375, 0.024669647216796875, 0.02691650390625, 0.029163360595703125, 0.03141021728515625, 0.033657073974609375, 0.0359039306640625, 0.038150787353515625, 0.04039764404296875, 0.042644500732421875, 0.044891357421875, 0.047138214111328125, 0.04938507080078125, 0.051631927490234375, 0.0538787841796875, 0.056125640869140625, 0.05837249755859375, 0.060619354248046875, 0.0628662109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 5.0, 12.0, 12.0, 12.0, 15.0, 10.0, 13.0, 21.0, 33.0, 36.0, 38.0, 52.0, 40.0, 47.0, 38.0, 58.0, 57.0, 49.0, 57.0, 46.0, 32.0, 44.0, 52.0, 26.0, 28.0, 24.0, 26.0, 26.0, 23.0, 21.0, 12.0, 6.0, 6.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10137939453125, -0.09833240509033203, -0.09528541564941406, -0.0922384262084961, -0.08919143676757812, -0.08614444732666016, -0.08309745788574219, -0.08005046844482422, -0.07700347900390625, -0.07395648956298828, -0.07090950012207031, -0.06786251068115234, -0.06481552124023438, -0.061768531799316406, -0.05872154235839844, -0.05567455291748047, -0.0526275634765625, -0.04958057403564453, -0.04653358459472656, -0.043486595153808594, -0.040439605712890625, -0.037392616271972656, -0.03434562683105469, -0.03129863739013672, -0.02825164794921875, -0.02520465850830078, -0.022157669067382812, -0.019110679626464844, -0.016063690185546875, -0.013016700744628906, -0.009969711303710938, -0.006922721862792969, -0.003875732421875, -0.0008287429809570312, 0.0022182464599609375, 0.005265235900878906, 0.008312225341796875, 0.011359214782714844, 0.014406204223632812, 0.01745319366455078, 0.02050018310546875, 0.02354717254638672, 0.026594161987304688, 0.029641151428222656, 0.032688140869140625, 0.035735130310058594, 0.03878211975097656, 0.04182910919189453, 0.0448760986328125, 0.04792308807373047, 0.05097007751464844, 0.054017066955566406, 0.057064056396484375, 0.060111045837402344, 0.06315803527832031, 0.06620502471923828, 0.06925201416015625, 0.07229900360107422, 0.07534599304199219, 0.07839298248291016, 0.08143997192382812, 0.0844869613647461, 0.08753395080566406, 0.09058094024658203, 0.0936279296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 7.0, 4.0, 12.0, 14.0, 27.0, 38.0, 40.0, 53.0, 62.0, 96.0, 128.0, 222.0, 362.0, 632.0, 1641.0, 4532.0, 16759.0, 100799.0, 649621.0, 232352.0, 29634.0, 7024.0, 2218.0, 912.0, 457.0, 282.0, 177.0, 114.0, 89.0, 63.0, 46.0, 35.0, 19.0, 19.0, 11.0, 10.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.0482177734375, -0.046866416931152344, -0.04551506042480469, -0.04416370391845703, -0.042812347412109375, -0.04146099090576172, -0.04010963439941406, -0.038758277893066406, -0.03740692138671875, -0.036055564880371094, -0.03470420837402344, -0.03335285186767578, -0.032001495361328125, -0.03065013885498047, -0.029298782348632812, -0.027947425842285156, -0.0265960693359375, -0.025244712829589844, -0.023893356323242188, -0.02254199981689453, -0.021190643310546875, -0.01983928680419922, -0.018487930297851562, -0.017136573791503906, -0.01578521728515625, -0.014433860778808594, -0.013082504272460938, -0.011731147766113281, -0.010379791259765625, -0.009028434753417969, -0.0076770782470703125, -0.006325721740722656, -0.004974365234375, -0.0036230087280273438, -0.0022716522216796875, -0.0009202957153320312, 0.000431060791015625, 0.0017824172973632812, 0.0031337738037109375, 0.004485130310058594, 0.00583648681640625, 0.007187843322753906, 0.008539199829101562, 0.009890556335449219, 0.011241912841796875, 0.012593269348144531, 0.013944625854492188, 0.015295982360839844, 0.0166473388671875, 0.017998695373535156, 0.019350051879882812, 0.02070140838623047, 0.022052764892578125, 0.02340412139892578, 0.024755477905273438, 0.026106834411621094, 0.02745819091796875, 0.028809547424316406, 0.030160903930664062, 0.03151226043701172, 0.032863616943359375, 0.03421497344970703, 0.03556632995605469, 0.036917686462402344, 0.03826904296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 6.0, 10.0, 19.0, 30.0, 48.0, 68.0, 91.0, 118.0, 118.0, 121.0, 100.0, 95.0, 58.0, 44.0, 33.0, 22.0, 12.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3828277587890625e-05, -1.3453885912895203e-05, -1.307949423789978e-05, -1.2705102562904358e-05, -1.2330710887908936e-05, -1.1956319212913513e-05, -1.158192753791809e-05, -1.1207535862922668e-05, -1.0833144187927246e-05, -1.0458752512931824e-05, -1.0084360837936401e-05, -9.709969162940979e-06, -9.335577487945557e-06, -8.961185812950134e-06, -8.586794137954712e-06, -8.21240246295929e-06, -7.838010787963867e-06, -7.463619112968445e-06, -7.0892274379730225e-06, -6.7148357629776e-06, -6.340444087982178e-06, -5.966052412986755e-06, -5.591660737991333e-06, -5.217269062995911e-06, -4.842877388000488e-06, -4.468485713005066e-06, -4.0940940380096436e-06, -3.719702363014221e-06, -3.345310688018799e-06, -2.9709190130233765e-06, -2.596527338027954e-06, -2.2221356630325317e-06, -1.8477439880371094e-06, -1.473352313041687e-06, -1.0989606380462646e-06, -7.245689630508423e-07, -3.501772880554199e-07, 2.421438694000244e-08, 3.986060619354248e-07, 7.729977369308472e-07, 1.1473894119262695e-06, 1.521781086921692e-06, 1.8961727619171143e-06, 2.2705644369125366e-06, 2.644956111907959e-06, 3.0193477869033813e-06, 3.3937394618988037e-06, 3.768131136894226e-06, 4.1425228118896484e-06, 4.516914486885071e-06, 4.891306161880493e-06, 5.2656978368759155e-06, 5.640089511871338e-06, 6.01448118686676e-06, 6.388872861862183e-06, 6.763264536857605e-06, 7.137656211853027e-06, 7.51204788684845e-06, 7.886439561843872e-06, 8.260831236839294e-06, 8.635222911834717e-06, 9.00961458683014e-06, 9.384006261825562e-06, 9.758397936820984e-06, 1.0132789611816406e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 13.0, 13.0, 38.0, 50.0, 126.0, 261.0, 624.0, 1568.0, 5339.0, 32401.0, 514530.0, 457324.0, 28719.0, 4972.0, 1487.0, 565.0, 265.0, 114.0, 69.0, 32.0, 14.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0703125, -0.06846094131469727, -0.06660938262939453, -0.0647578239440918, -0.06290626525878906, -0.06105470657348633, -0.059203147888183594, -0.05735158920288086, -0.055500030517578125, -0.05364847183227539, -0.051796913146972656, -0.04994535446166992, -0.04809379577636719, -0.04624223709106445, -0.04439067840576172, -0.042539119720458984, -0.04068756103515625, -0.038836002349853516, -0.03698444366455078, -0.03513288497924805, -0.03328132629394531, -0.03142976760864258, -0.029578208923339844, -0.02772665023803711, -0.025875091552734375, -0.02402353286743164, -0.022171974182128906, -0.020320415496826172, -0.018468856811523438, -0.016617298126220703, -0.014765739440917969, -0.012914180755615234, -0.0110626220703125, -0.009211063385009766, -0.007359504699707031, -0.005507946014404297, -0.0036563873291015625, -0.0018048286437988281, 4.673004150390625e-05, 0.0018982887268066406, 0.003749847412109375, 0.005601406097412109, 0.007452964782714844, 0.009304523468017578, 0.011156082153320312, 0.013007640838623047, 0.014859199523925781, 0.016710758209228516, 0.01856231689453125, 0.020413875579833984, 0.02226543426513672, 0.024116992950439453, 0.025968551635742188, 0.027820110321044922, 0.029671669006347656, 0.03152322769165039, 0.033374786376953125, 0.03522634506225586, 0.037077903747558594, 0.03892946243286133, 0.04078102111816406, 0.0426325798034668, 0.04448413848876953, 0.046335697174072266, 0.048187255859375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 14.0, 12.0, 17.0, 21.0, 35.0, 36.0, 57.0, 94.0, 91.0, 115.0, 113.0, 108.0, 78.0, 50.0, 58.0, 23.0, 23.0, 15.0, 10.0, 10.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0430908203125, -0.041660308837890625, -0.04022979736328125, -0.038799285888671875, -0.0373687744140625, -0.035938262939453125, -0.03450775146484375, -0.033077239990234375, -0.031646728515625, -0.030216217041015625, -0.02878570556640625, -0.027355194091796875, -0.0259246826171875, -0.024494171142578125, -0.02306365966796875, -0.021633148193359375, -0.02020263671875, -0.018772125244140625, -0.01734161376953125, -0.015911102294921875, -0.0144805908203125, -0.013050079345703125, -0.01161956787109375, -0.010189056396484375, -0.008758544921875, -0.007328033447265625, -0.00589752197265625, -0.004467010498046875, -0.0030364990234375, -0.001605987548828125, -0.00017547607421875, 0.001255035400390625, 0.002685546875, 0.004116058349609375, 0.00554656982421875, 0.006977081298828125, 0.0084075927734375, 0.009838104248046875, 0.01126861572265625, 0.012699127197265625, 0.014129638671875, 0.015560150146484375, 0.01699066162109375, 0.018421173095703125, 0.0198516845703125, 0.021282196044921875, 0.02271270751953125, 0.024143218994140625, 0.02557373046875, 0.027004241943359375, 0.02843475341796875, 0.029865264892578125, 0.0312957763671875, 0.032726287841796875, 0.03415679931640625, 0.035587310791015625, 0.037017822265625, 0.038448333740234375, 0.03987884521484375, 0.041309356689453125, 0.0427398681640625, 0.044170379638671875, 0.04560089111328125, 0.047031402587890625, 0.0484619140625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 13.0, 96.0, 493.0, 364.0, 37.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01871395111084, -2.951430082321167, -2.884146213531494, -2.8168623447418213, -2.7495784759521484, -2.6822946071624756, -2.6150107383728027, -2.54772686958313, -2.480443000793457, -2.413159132003784, -2.3458752632141113, -2.2785913944244385, -2.2113075256347656, -2.1440236568450928, -2.07673978805542, -2.009455919265747, -1.9421720504760742, -1.8748881816864014, -1.8076043128967285, -1.7403204441070557, -1.6730365753173828, -1.60575270652771, -1.538468837738037, -1.4711849689483643, -1.4039011001586914, -1.3366172313690186, -1.2693333625793457, -1.2020494937896729, -1.134765625, -1.0674817562103271, -1.0001978874206543, -0.9329140186309814, -0.8656302690505981, -0.7983464002609253, -0.7310625314712524, -0.6637786626815796, -0.5964947938919067, -0.5292109251022339, -0.46192705631256104, -0.3946431875228882, -0.32735931873321533, -0.2600754499435425, -0.19279158115386963, -0.12550771236419678, -0.058223843574523926, 0.009060025215148926, 0.07634389400482178, 0.14362776279449463, 0.21091163158416748, 0.27819550037384033, 0.3454793691635132, 0.41276323795318604, 0.4800471067428589, 0.5473309755325317, 0.6146148443222046, 0.6818987131118774, 0.7491825819015503, 0.8164664506912231, 0.883750319480896, 0.9510341882705688, 1.0183180570602417, 1.0856019258499146, 1.1528857946395874, 1.2201696634292603, 1.287453532218933]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 4.0, 3.0, 3.0, 9.0, 10.0, 12.0, 19.0, 13.0, 16.0, 28.0, 29.0, 28.0, 32.0, 33.0, 27.0, 48.0, 43.0, 43.0, 41.0, 48.0, 46.0, 39.0, 31.0, 52.0, 38.0, 34.0, 34.0, 34.0, 21.0, 36.0, 22.0, 16.0, 19.0, 18.0, 17.0, 13.0, 7.0, 7.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4139711856842041, -0.40111014246940613, -0.38824912905693054, -0.37538808584213257, -0.362527072429657, -0.349666029214859, -0.33680498600006104, -0.32394397258758545, -0.31108295917510986, -0.2982219159603119, -0.2853609025478363, -0.27249985933303833, -0.25963884592056274, -0.24677780270576477, -0.233916774392128, -0.2210557460784912, -0.20819470286369324, -0.19533367455005646, -0.18247264623641968, -0.1696116030216217, -0.15675058960914612, -0.14388954639434814, -0.13102851808071136, -0.11816748976707458, -0.1053064614534378, -0.09244543313980103, -0.07958440482616425, -0.06672336906194687, -0.05386234074831009, -0.04100131243467331, -0.028140276670455933, -0.015279248356819153, -0.002418220043182373, 0.010442810133099556, 0.023303840309381485, 0.03616487234830856, 0.04902590066194534, 0.06188692897558212, 0.0747479647397995, 0.08760899305343628, 0.10047002136707306, 0.11333104968070984, 0.12619207799434662, 0.1390531063079834, 0.15191414952278137, 0.16477516293525696, 0.17763620615005493, 0.1904972344636917, 0.2033582627773285, 0.21621929109096527, 0.22908031940460205, 0.24194136261940002, 0.2548023760318756, 0.2676634192466736, 0.28052443265914917, 0.29338547587394714, 0.3062465190887451, 0.3191075623035431, 0.3319685757160187, 0.34482961893081665, 0.35769063234329224, 0.3705516755580902, 0.3834127187728882, 0.39627373218536377, 0.40913474559783936]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 4.0, 1.0, 7.0, 4.0, 5.0, 10.0, 15.0, 24.0, 46.0, 81.0, 115.0, 168.0, 306.0, 574.0, 1141.0, 2548.0, 6274.0, 20460.0, 142539.0, 3887758.0, 105083.0, 17236.0, 5315.0, 2249.0, 1053.0, 557.0, 252.0, 164.0, 97.0, 56.0, 30.0, 26.0, 21.0, 17.0, 9.0, 10.0, 6.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083251953125, -0.07970046997070312, -0.07614898681640625, -0.07259750366210938, -0.0690460205078125, -0.06549453735351562, -0.06194305419921875, -0.058391571044921875, -0.054840087890625, -0.051288604736328125, -0.04773712158203125, -0.044185638427734375, -0.0406341552734375, -0.037082672119140625, -0.03353118896484375, -0.029979705810546875, -0.02642822265625, -0.022876739501953125, -0.01932525634765625, -0.015773773193359375, -0.0122222900390625, -0.008670806884765625, -0.00511932373046875, -0.001567840576171875, 0.001983642578125, 0.005535125732421875, 0.00908660888671875, 0.012638092041015625, 0.0161895751953125, 0.019741058349609375, 0.02329254150390625, 0.026844024658203125, 0.0303955078125, 0.033946990966796875, 0.03749847412109375, 0.041049957275390625, 0.0446014404296875, 0.048152923583984375, 0.05170440673828125, 0.055255889892578125, 0.058807373046875, 0.062358856201171875, 0.06591033935546875, 0.06946182250976562, 0.0730133056640625, 0.07656478881835938, 0.08011627197265625, 0.08366775512695312, 0.08721923828125, 0.09077072143554688, 0.09432220458984375, 0.09787368774414062, 0.1014251708984375, 0.10497665405273438, 0.10852813720703125, 0.11207962036132812, 0.115631103515625, 0.11918258666992188, 0.12273406982421875, 0.12628555297851562, 0.1298370361328125, 0.13338851928710938, 0.13694000244140625, 0.14049148559570312, 0.14404296875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 7.0, 15.0, 9.0, 31.0, 29.0, 50.0, 57.0, 65.0, 71.0, 83.0, 87.0, 88.0, 84.0, 68.0, 67.0, 47.0, 35.0, 35.0, 29.0, 21.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0303802490234375, -0.02899336814880371, -0.027606487274169922, -0.026219606399536133, -0.024832725524902344, -0.023445844650268555, -0.022058963775634766, -0.020672082901000977, -0.019285202026367188, -0.0178983211517334, -0.01651144027709961, -0.01512455940246582, -0.013737678527832031, -0.012350797653198242, -0.010963916778564453, -0.009577035903930664, -0.008190155029296875, -0.006803274154663086, -0.005416393280029297, -0.004029512405395508, -0.0026426315307617188, -0.0012557506561279297, 0.00013113021850585938, 0.0015180110931396484, 0.0029048919677734375, 0.0042917728424072266, 0.005678653717041016, 0.007065534591674805, 0.008452415466308594, 0.009839296340942383, 0.011226177215576172, 0.012613058090209961, 0.01399993896484375, 0.015386819839477539, 0.016773700714111328, 0.018160581588745117, 0.019547462463378906, 0.020934343338012695, 0.022321224212646484, 0.023708105087280273, 0.025094985961914062, 0.02648186683654785, 0.02786874771118164, 0.02925562858581543, 0.03064250946044922, 0.03202939033508301, 0.0334162712097168, 0.034803152084350586, 0.036190032958984375, 0.037576913833618164, 0.03896379470825195, 0.04035067558288574, 0.04173755645751953, 0.04312443733215332, 0.04451131820678711, 0.0458981990814209, 0.04728507995605469, 0.04867196083068848, 0.050058841705322266, 0.051445722579956055, 0.052832603454589844, 0.05421948432922363, 0.05560636520385742, 0.05699324607849121, 0.058380126953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 13.0, 28.0, 59.0, 89.0, 235.0, 534.0, 1321.0, 3929.0, 16762.0, 473893.0, 3663500.0, 26035.0, 5102.0, 1616.0, 634.0, 246.0, 137.0, 67.0, 31.0, 15.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.1981525421142578, -0.19281387329101562, -0.18747520446777344, -0.18213653564453125, -0.17679786682128906, -0.17145919799804688, -0.1661205291748047, -0.1607818603515625, -0.1554431915283203, -0.15010452270507812, -0.14476585388183594, -0.13942718505859375, -0.13408851623535156, -0.12874984741210938, -0.12341117858886719, -0.118072509765625, -0.11273384094238281, -0.10739517211914062, -0.10205650329589844, -0.09671783447265625, -0.09137916564941406, -0.08604049682617188, -0.08070182800292969, -0.0753631591796875, -0.07002449035644531, -0.06468582153320312, -0.05934715270996094, -0.05400848388671875, -0.04866981506347656, -0.043331146240234375, -0.03799247741699219, -0.03265380859375, -0.027315139770507812, -0.021976470947265625, -0.016637802124023438, -0.01129913330078125, -0.0059604644775390625, -0.000621795654296875, 0.0047168731689453125, 0.0100555419921875, 0.015394210815429688, 0.020732879638671875, 0.026071548461914062, 0.03141021728515625, 0.03674888610839844, 0.042087554931640625, 0.04742622375488281, 0.052764892578125, 0.05810356140136719, 0.06344223022460938, 0.06878089904785156, 0.07411956787109375, 0.07945823669433594, 0.08479690551757812, 0.09013557434082031, 0.0954742431640625, 0.10081291198730469, 0.10615158081054688, 0.11149024963378906, 0.11682891845703125, 0.12216758728027344, 0.12750625610351562, 0.1328449249267578, 0.13818359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 3.0, 13.0, 7.0, 16.0, 25.0, 48.0, 87.0, 295.0, 2294.0, 929.0, 184.0, 67.0, 45.0, 13.0, 14.0, 6.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06304931640625, -0.061383724212646484, -0.05971813201904297, -0.05805253982543945, -0.05638694763183594, -0.05472135543823242, -0.053055763244628906, -0.05139017105102539, -0.049724578857421875, -0.04805898666381836, -0.046393394470214844, -0.04472780227661133, -0.04306221008300781, -0.0413966178894043, -0.03973102569580078, -0.038065433502197266, -0.03639984130859375, -0.034734249114990234, -0.03306865692138672, -0.0314030647277832, -0.029737472534179688, -0.028071880340576172, -0.026406288146972656, -0.02474069595336914, -0.023075103759765625, -0.02140951156616211, -0.019743919372558594, -0.018078327178955078, -0.016412734985351562, -0.014747142791748047, -0.013081550598144531, -0.011415958404541016, -0.0097503662109375, -0.008084774017333984, -0.006419181823730469, -0.004753589630126953, -0.0030879974365234375, -0.0014224052429199219, 0.00024318695068359375, 0.0019087791442871094, 0.003574371337890625, 0.005239963531494141, 0.006905555725097656, 0.008571147918701172, 0.010236740112304688, 0.011902332305908203, 0.013567924499511719, 0.015233516693115234, 0.01689910888671875, 0.018564701080322266, 0.02023029327392578, 0.021895885467529297, 0.023561477661132812, 0.025227069854736328, 0.026892662048339844, 0.02855825424194336, 0.030223846435546875, 0.03188943862915039, 0.033555030822753906, 0.03522062301635742, 0.03688621520996094, 0.03855180740356445, 0.04021739959716797, 0.041882991790771484, 0.043548583984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 9.0, 19.0, 82.0, 296.0, 422.0, 141.0, 26.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7699598073959351, -0.7533004283905029, -0.736640989780426, -0.7199816107749939, -0.703322172164917, -0.6866627931594849, -0.670003354549408, -0.6533439755439758, -0.6366845369338989, -0.6200251579284668, -0.6033657193183899, -0.5867063403129578, -0.5700469017028809, -0.5533875226974487, -0.5367280840873718, -0.5200687050819397, -0.5034093260765076, -0.48674991726875305, -0.47009050846099854, -0.453431099653244, -0.4367716908454895, -0.4201123118400574, -0.40345290303230286, -0.38679349422454834, -0.3701340854167938, -0.3534746766090393, -0.3368152678012848, -0.3201558589935303, -0.30349647998809814, -0.28683704137802124, -0.2701776623725891, -0.2535182535648346, -0.23685887455940247, -0.22019946575164795, -0.20354005694389343, -0.1868806630373001, -0.1702212542295456, -0.15356184542179108, -0.13690245151519775, -0.12024304270744324, -0.10358363389968872, -0.0869242250919342, -0.07026482373476028, -0.053605418652296066, -0.03694601356983185, -0.02028660476207733, -0.003627203404903412, 0.013032197952270508, 0.029691606760025024, 0.04635101184248924, 0.06301041692495346, 0.07966981828212738, 0.0963292270898819, 0.11298863589763641, 0.12964802980422974, 0.14630743861198425, 0.16296684741973877, 0.1796262562274933, 0.1962856650352478, 0.21294505894184113, 0.22960446774959564, 0.24626387655735016, 0.2629232704639435, 0.279582679271698, 0.2962420880794525]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 4.0, 3.0, 8.0, 7.0, 7.0, 10.0, 17.0, 23.0, 45.0, 38.0, 47.0, 52.0, 64.0, 76.0, 90.0, 100.0, 89.0, 73.0, 64.0, 44.0, 44.0, 31.0, 33.0, 13.0, 11.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.20926189422607422, -0.2038784921169281, -0.19849509000778198, -0.19311168789863586, -0.18772828578948975, -0.18234488368034363, -0.1769614815711975, -0.1715780794620514, -0.16619467735290527, -0.16081127524375916, -0.15542787313461304, -0.15004447102546692, -0.1446610689163208, -0.13927766680717468, -0.13389426469802856, -0.12851086258888245, -0.12312746047973633, -0.11774405837059021, -0.11236065626144409, -0.10697725415229797, -0.10159385204315186, -0.09621044993400574, -0.09082704782485962, -0.0854436457157135, -0.08006024360656738, -0.07467684149742126, -0.06929343938827515, -0.06391003727912903, -0.05852663516998291, -0.05314323306083679, -0.047759830951690674, -0.042376428842544556, -0.03699302673339844, -0.03160962462425232, -0.0262262225151062, -0.020842820405960083, -0.015459418296813965, -0.010076016187667847, -0.0046926140785217285, 0.0006907880306243896, 0.006074190139770508, 0.011457592248916626, 0.016840994358062744, 0.022224396467208862, 0.02760779857635498, 0.0329912006855011, 0.03837460279464722, 0.043758004903793335, 0.04914140701293945, 0.05452480912208557, 0.05990821123123169, 0.06529161334037781, 0.07067501544952393, 0.07605841755867004, 0.08144181966781616, 0.08682522177696228, 0.0922086238861084, 0.09759202599525452, 0.10297542810440063, 0.10835883021354675, 0.11374223232269287, 0.11912563443183899, 0.12450903654098511, 0.12989243865013123, 0.13527584075927734]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 13.0, 13.0, 13.0, 16.0, 23.0, 29.0, 57.0, 89.0, 111.0, 182.0, 253.0, 448.0, 750.0, 1437.0, 2885.0, 6828.0, 18150.0, 56381.0, 196473.0, 439031.0, 225714.0, 64732.0, 20417.0, 7572.0, 3289.0, 1536.0, 752.0, 453.0, 306.0, 184.0, 114.0, 79.0, 41.0, 46.0, 32.0, 27.0, 16.0, 10.0, 7.0, 7.0, 5.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0762939453125, -0.0740203857421875, -0.071746826171875, -0.0694732666015625, -0.06719970703125, -0.0649261474609375, -0.062652587890625, -0.0603790283203125, -0.05810546875, -0.0558319091796875, -0.053558349609375, -0.0512847900390625, -0.04901123046875, -0.0467376708984375, -0.044464111328125, -0.0421905517578125, -0.0399169921875, -0.0376434326171875, -0.035369873046875, -0.0330963134765625, -0.03082275390625, -0.0285491943359375, -0.026275634765625, -0.0240020751953125, -0.021728515625, -0.0194549560546875, -0.017181396484375, -0.0149078369140625, -0.01263427734375, -0.0103607177734375, -0.008087158203125, -0.0058135986328125, -0.0035400390625, -0.0012664794921875, 0.001007080078125, 0.0032806396484375, 0.00555419921875, 0.0078277587890625, 0.010101318359375, 0.0123748779296875, 0.0146484375, 0.0169219970703125, 0.019195556640625, 0.0214691162109375, 0.02374267578125, 0.0260162353515625, 0.028289794921875, 0.0305633544921875, 0.0328369140625, 0.0351104736328125, 0.037384033203125, 0.0396575927734375, 0.04193115234375, 0.0442047119140625, 0.046478271484375, 0.0487518310546875, 0.051025390625, 0.0532989501953125, 0.055572509765625, 0.0578460693359375, 0.06011962890625, 0.0623931884765625, 0.064666748046875, 0.0669403076171875, 0.0692138671875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 5.0, 16.0, 15.0, 27.0, 31.0, 35.0, 61.0, 67.0, 64.0, 59.0, 97.0, 84.0, 83.0, 69.0, 51.0, 64.0, 34.0, 47.0, 27.0, 18.0, 22.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03271484375, -0.03130626678466797, -0.029897689819335938, -0.028489112854003906, -0.027080535888671875, -0.025671958923339844, -0.024263381958007812, -0.02285480499267578, -0.02144622802734375, -0.02003765106201172, -0.018629074096679688, -0.017220497131347656, -0.015811920166015625, -0.014403343200683594, -0.012994766235351562, -0.011586189270019531, -0.0101776123046875, -0.008769035339355469, -0.0073604583740234375, -0.005951881408691406, -0.004543304443359375, -0.0031347274780273438, -0.0017261505126953125, -0.00031757354736328125, 0.00109100341796875, 0.0024995803833007812, 0.0039081573486328125, 0.005316734313964844, 0.006725311279296875, 0.008133888244628906, 0.009542465209960938, 0.010951042175292969, 0.012359619140625, 0.013768196105957031, 0.015176773071289062, 0.016585350036621094, 0.017993927001953125, 0.019402503967285156, 0.020811080932617188, 0.02221965789794922, 0.02362823486328125, 0.02503681182861328, 0.026445388793945312, 0.027853965759277344, 0.029262542724609375, 0.030671119689941406, 0.03207969665527344, 0.03348827362060547, 0.0348968505859375, 0.03630542755126953, 0.03771400451660156, 0.039122581481933594, 0.040531158447265625, 0.041939735412597656, 0.04334831237792969, 0.04475688934326172, 0.04616546630859375, 0.04757404327392578, 0.04898262023925781, 0.050391197204589844, 0.051799774169921875, 0.053208351135253906, 0.05461692810058594, 0.05602550506591797, 0.05743408203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 8.0, 10.0, 5.0, 10.0, 17.0, 16.0, 16.0, 24.0, 39.0, 52.0, 62.0, 67.0, 117.0, 152.0, 254.0, 350.0, 681.0, 1446.0, 3597.0, 10024.0, 34410.0, 144538.0, 484918.0, 278122.0, 63132.0, 16517.0, 5553.0, 2082.0, 940.0, 467.0, 309.0, 175.0, 110.0, 75.0, 68.0, 39.0, 35.0, 30.0, 21.0, 15.0, 15.0, 10.0, 10.0, 6.0, 9.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.059783935546875, -0.057627201080322266, -0.05547046661376953, -0.0533137321472168, -0.05115699768066406, -0.04900026321411133, -0.046843528747558594, -0.04468679428100586, -0.042530059814453125, -0.04037332534790039, -0.038216590881347656, -0.03605985641479492, -0.03390312194824219, -0.03174638748168945, -0.02958965301513672, -0.027432918548583984, -0.02527618408203125, -0.023119449615478516, -0.02096271514892578, -0.018805980682373047, -0.016649246215820312, -0.014492511749267578, -0.012335777282714844, -0.01017904281616211, -0.008022308349609375, -0.005865573883056641, -0.0037088394165039062, -0.0015521049499511719, 0.0006046295166015625, 0.002761363983154297, 0.004918098449707031, 0.007074832916259766, 0.0092315673828125, 0.011388301849365234, 0.013545036315917969, 0.015701770782470703, 0.017858505249023438, 0.020015239715576172, 0.022171974182128906, 0.02432870864868164, 0.026485443115234375, 0.02864217758178711, 0.030798912048339844, 0.03295564651489258, 0.03511238098144531, 0.03726911544799805, 0.03942584991455078, 0.041582584381103516, 0.04373931884765625, 0.045896053314208984, 0.04805278778076172, 0.05020952224731445, 0.05236625671386719, 0.05452299118041992, 0.056679725646972656, 0.05883646011352539, 0.060993194580078125, 0.06314992904663086, 0.0653066635131836, 0.06746339797973633, 0.06962013244628906, 0.0717768669128418, 0.07393360137939453, 0.07609033584594727, 0.0782470703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 7.0, 6.0, 7.0, 15.0, 15.0, 15.0, 18.0, 23.0, 25.0, 19.0, 25.0, 28.0, 31.0, 36.0, 41.0, 30.0, 56.0, 43.0, 37.0, 54.0, 36.0, 42.0, 43.0, 33.0, 41.0, 33.0, 25.0, 34.0, 27.0, 33.0, 20.0, 16.0, 12.0, 16.0, 13.0, 5.0, 7.0, 8.0, 4.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.09710693359375, -0.09401702880859375, -0.0909271240234375, -0.08783721923828125, -0.084747314453125, -0.08165740966796875, -0.0785675048828125, -0.07547760009765625, -0.0723876953125, -0.06929779052734375, -0.0662078857421875, -0.06311798095703125, -0.060028076171875, -0.05693817138671875, -0.0538482666015625, -0.05075836181640625, -0.04766845703125, -0.04457855224609375, -0.0414886474609375, -0.03839874267578125, -0.035308837890625, -0.03221893310546875, -0.0291290283203125, -0.02603912353515625, -0.02294921875, -0.01985931396484375, -0.0167694091796875, -0.01367950439453125, -0.010589599609375, -0.00749969482421875, -0.0044097900390625, -0.00131988525390625, 0.00177001953125, 0.00485992431640625, 0.0079498291015625, 0.01103973388671875, 0.014129638671875, 0.01721954345703125, 0.0203094482421875, 0.02339935302734375, 0.0264892578125, 0.02957916259765625, 0.0326690673828125, 0.03575897216796875, 0.038848876953125, 0.04193878173828125, 0.0450286865234375, 0.04811859130859375, 0.05120849609375, 0.05429840087890625, 0.0573883056640625, 0.06047821044921875, 0.063568115234375, 0.06665802001953125, 0.0697479248046875, 0.07283782958984375, 0.075927734375, 0.07901763916015625, 0.0821075439453125, 0.08519744873046875, 0.088287353515625, 0.09137725830078125, 0.0944671630859375, 0.09755706787109375, 0.10064697265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 16.0, 29.0, 41.0, 66.0, 120.0, 174.0, 408.0, 882.0, 2418.0, 10178.0, 70800.0, 598037.0, 323226.0, 33276.0, 5873.0, 1608.0, 665.0, 310.0, 172.0, 101.0, 51.0, 38.0, 13.0, 16.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03887939453125, -0.037575721740722656, -0.03627204895019531, -0.03496837615966797, -0.033664703369140625, -0.03236103057861328, -0.031057357788085938, -0.029753684997558594, -0.02845001220703125, -0.027146339416503906, -0.025842666625976562, -0.02453899383544922, -0.023235321044921875, -0.02193164825439453, -0.020627975463867188, -0.019324302673339844, -0.0180206298828125, -0.016716957092285156, -0.015413284301757812, -0.014109611511230469, -0.012805938720703125, -0.011502265930175781, -0.010198593139648438, -0.008894920349121094, -0.00759124755859375, -0.006287574768066406, -0.0049839019775390625, -0.0036802291870117188, -0.002376556396484375, -0.0010728836059570312, 0.0002307891845703125, 0.0015344619750976562, 0.002838134765625, 0.004141807556152344, 0.0054454803466796875, 0.006749153137207031, 0.008052825927734375, 0.009356498718261719, 0.010660171508789062, 0.011963844299316406, 0.01326751708984375, 0.014571189880371094, 0.015874862670898438, 0.01717853546142578, 0.018482208251953125, 0.01978588104248047, 0.021089553833007812, 0.022393226623535156, 0.0236968994140625, 0.025000572204589844, 0.026304244995117188, 0.02760791778564453, 0.028911590576171875, 0.03021526336669922, 0.03151893615722656, 0.032822608947753906, 0.03412628173828125, 0.035429954528808594, 0.03673362731933594, 0.03803730010986328, 0.039340972900390625, 0.04064464569091797, 0.04194831848144531, 0.043251991271972656, 0.0445556640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 12.0, 9.0, 12.0, 21.0, 15.0, 26.0, 37.0, 35.0, 48.0, 54.0, 46.0, 63.0, 56.0, 43.0, 75.0, 56.0, 57.0, 53.0, 25.0, 43.0, 38.0, 23.0, 20.0, 23.0, 10.0, 20.0, 9.0, 5.0, 13.0, 8.0, 4.0, 6.0, 3.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.708766937255859e-06, -4.550442099571228e-06, -4.392117261886597e-06, -4.233792424201965e-06, -4.075467586517334e-06, -3.917142748832703e-06, -3.7588179111480713e-06, -3.60049307346344e-06, -3.4421682357788086e-06, -3.2838433980941772e-06, -3.125518560409546e-06, -2.9671937227249146e-06, -2.808868885040283e-06, -2.650544047355652e-06, -2.4922192096710205e-06, -2.333894371986389e-06, -2.175569534301758e-06, -2.0172446966171265e-06, -1.8589198589324951e-06, -1.7005950212478638e-06, -1.5422701835632324e-06, -1.383945345878601e-06, -1.2256205081939697e-06, -1.0672956705093384e-06, -9.08970832824707e-07, -7.506459951400757e-07, -5.923211574554443e-07, -4.33996319770813e-07, -2.7567148208618164e-07, -1.1734664440155029e-07, 4.0978193283081055e-08, 1.993030309677124e-07, 3.5762786865234375e-07, 5.159527063369751e-07, 6.742775440216064e-07, 8.326023817062378e-07, 9.909272193908691e-07, 1.1492520570755005e-06, 1.3075768947601318e-06, 1.4659017324447632e-06, 1.6242265701293945e-06, 1.7825514078140259e-06, 1.9408762454986572e-06, 2.0992010831832886e-06, 2.25752592086792e-06, 2.4158507585525513e-06, 2.5741755962371826e-06, 2.732500433921814e-06, 2.8908252716064453e-06, 3.0491501092910767e-06, 3.207474946975708e-06, 3.3657997846603394e-06, 3.5241246223449707e-06, 3.682449460029602e-06, 3.840774297714233e-06, 3.999099135398865e-06, 4.157423973083496e-06, 4.3157488107681274e-06, 4.474073648452759e-06, 4.63239848613739e-06, 4.7907233238220215e-06, 4.949048161506653e-06, 5.107372999191284e-06, 5.2656978368759155e-06, 5.424022674560547e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 1.0, 8.0, 8.0, 18.0, 17.0, 48.0, 120.0, 339.0, 1487.0, 19481.0, 667361.0, 348370.0, 9834.0, 1018.0, 263.0, 105.0, 37.0, 20.0, 12.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050384521484375, -0.04797220230102539, -0.04555988311767578, -0.04314756393432617, -0.04073524475097656, -0.03832292556762695, -0.035910606384277344, -0.033498287200927734, -0.031085968017578125, -0.028673648834228516, -0.026261329650878906, -0.023849010467529297, -0.021436691284179688, -0.019024372100830078, -0.01661205291748047, -0.01419973373413086, -0.01178741455078125, -0.00937509536743164, -0.006962776184082031, -0.004550457000732422, -0.0021381378173828125, 0.0002741813659667969, 0.0026865005493164062, 0.005098819732666016, 0.007511138916015625, 0.009923458099365234, 0.012335777282714844, 0.014748096466064453, 0.017160415649414062, 0.019572734832763672, 0.02198505401611328, 0.02439737319946289, 0.0268096923828125, 0.02922201156616211, 0.03163433074951172, 0.03404664993286133, 0.03645896911621094, 0.03887128829956055, 0.041283607482910156, 0.043695926666259766, 0.046108245849609375, 0.048520565032958984, 0.050932884216308594, 0.0533452033996582, 0.05575752258300781, 0.05816984176635742, 0.06058216094970703, 0.06299448013305664, 0.06540679931640625, 0.06781911849975586, 0.07023143768310547, 0.07264375686645508, 0.07505607604980469, 0.0774683952331543, 0.0798807144165039, 0.08229303359985352, 0.08470535278320312, 0.08711767196655273, 0.08952999114990234, 0.09194231033325195, 0.09435462951660156, 0.09676694869995117, 0.09917926788330078, 0.10159158706665039, 0.10400390625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 6.0, 7.0, 12.0, 11.0, 12.0, 9.0, 27.0, 18.0, 47.0, 41.0, 43.0, 45.0, 78.0, 60.0, 50.0, 85.0, 72.0, 69.0, 40.0, 42.0, 45.0, 40.0, 25.0, 23.0, 22.0, 11.0, 14.0, 10.0, 10.0, 4.0, 1.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0255126953125, -0.024693012237548828, -0.023873329162597656, -0.023053646087646484, -0.022233963012695312, -0.02141427993774414, -0.02059459686279297, -0.019774913787841797, -0.018955230712890625, -0.018135547637939453, -0.01731586456298828, -0.01649618148803711, -0.015676498413085938, -0.014856815338134766, -0.014037132263183594, -0.013217449188232422, -0.01239776611328125, -0.011578083038330078, -0.010758399963378906, -0.009938716888427734, -0.009119033813476562, -0.00829935073852539, -0.007479667663574219, -0.006659984588623047, -0.005840301513671875, -0.005020618438720703, -0.004200935363769531, -0.0033812522888183594, -0.0025615692138671875, -0.0017418861389160156, -0.0009222030639648438, -0.00010251998901367188, 0.0007171630859375, 0.0015368461608886719, 0.0023565292358398438, 0.0031762123107910156, 0.0039958953857421875, 0.004815578460693359, 0.005635261535644531, 0.006454944610595703, 0.007274627685546875, 0.008094310760498047, 0.008913993835449219, 0.00973367691040039, 0.010553359985351562, 0.011373043060302734, 0.012192726135253906, 0.013012409210205078, 0.01383209228515625, 0.014651775360107422, 0.015471458435058594, 0.016291141510009766, 0.017110824584960938, 0.01793050765991211, 0.01875019073486328, 0.019569873809814453, 0.020389556884765625, 0.021209239959716797, 0.02202892303466797, 0.02284860610961914, 0.023668289184570312, 0.024487972259521484, 0.025307655334472656, 0.026127338409423828, 0.026947021484375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 17.0, 43.0, 87.0, 200.0, 260.0, 199.0, 111.0, 47.0, 23.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4193289279937744, -1.3881479501724243, -1.3569669723510742, -1.3257858753204346, -1.2946048974990845, -1.2634239196777344, -1.2322429418563843, -1.2010619640350342, -1.1698808670043945, -1.1386998891830444, -1.1075189113616943, -1.0763378143310547, -1.0451568365097046, -1.0139758586883545, -0.9827948808670044, -0.9516138434410095, -0.9204328656196594, -0.8892518877983093, -0.8580708503723145, -0.8268898725509644, -0.7957088351249695, -0.7645278573036194, -0.7333468198776245, -0.7021658420562744, -0.6709848642349243, -0.6398038864135742, -0.6086228489875793, -0.5774418711662292, -0.5462608337402344, -0.5150798559188843, -0.4838988482952118, -0.4527178406715393, -0.42153674364089966, -0.3903557360172272, -0.3591747283935547, -0.3279937505722046, -0.2968127131462097, -0.2656317353248596, -0.23445072770118713, -0.20326972007751465, -0.17208871245384216, -0.14090770483016968, -0.10972670465707779, -0.0785457044839859, -0.047364696860313416, -0.01618368923664093, 0.014997303485870361, 0.04617831110954285, 0.07735931873321533, 0.10854032635688782, 0.1397213339805603, 0.1709023267030716, 0.20208333432674408, 0.23326434195041656, 0.26444533467292786, 0.29562634229660034, 0.3268073499202728, 0.3579883575439453, 0.3891693651676178, 0.4203503727912903, 0.4515313506126404, 0.48271238803863525, 0.5138933658599854, 0.5450743436813354, 0.5762553811073303]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 9.0, 6.0, 8.0, 16.0, 9.0, 15.0, 14.0, 14.0, 16.0, 22.0, 9.0, 27.0, 24.0, 36.0, 26.0, 33.0, 37.0, 49.0, 32.0, 28.0, 41.0, 50.0, 34.0, 43.0, 45.0, 34.0, 45.0, 25.0, 24.0, 33.0, 28.0, 24.0, 14.0, 15.0, 24.0, 13.0, 16.0, 9.0, 15.0, 8.0, 5.0, 9.0, 3.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4623953700065613, -0.44809389114379883, -0.4337924122810364, -0.4194909334182739, -0.4051894545555115, -0.390887975692749, -0.3765864968299866, -0.36228498816490173, -0.3479835093021393, -0.33368203043937683, -0.3193805515766144, -0.30507907271385193, -0.2907775938510895, -0.27647608518600464, -0.2621746063232422, -0.24787312746047974, -0.23357166349887848, -0.21927018463611603, -0.20496870577335358, -0.19066721200942993, -0.17636573314666748, -0.16206425428390503, -0.14776277542114258, -0.13346129655838013, -0.11915981024503708, -0.10485833138227463, -0.09055684506893158, -0.07625536620616913, -0.06195388361811638, -0.04765240103006363, -0.03335092216730118, -0.01904943585395813, -0.004747956991195679, 0.009553524665534496, 0.02385500632226467, 0.03815648704767227, 0.05245796963572502, 0.06675945222377777, 0.08106093108654022, 0.09536241739988327, 0.10966389626264572, 0.12396537512540817, 0.13826686143875122, 0.15256834030151367, 0.16686981916427612, 0.18117129802703857, 0.19547277688980103, 0.20977427065372467, 0.22407574951648712, 0.23837722837924957, 0.2526787221431732, 0.26698020100593567, 0.2812816798686981, 0.29558315873146057, 0.309884637594223, 0.3241861164569855, 0.3384875953197479, 0.3527890741825104, 0.3670905530452728, 0.3813920319080353, 0.39569351077079773, 0.40999501943588257, 0.424296498298645, 0.43859797716140747, 0.4528994560241699]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 9.0, 20.0, 14.0, 27.0, 48.0, 85.0, 123.0, 197.0, 336.0, 712.0, 1413.0, 2985.0, 7964.0, 32047.0, 3154925.0, 951426.0, 28830.0, 7269.0, 2936.0, 1329.0, 651.0, 380.0, 190.0, 116.0, 74.0, 55.0, 26.0, 29.0, 12.0, 12.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1044921875, -0.10111808776855469, -0.09774398803710938, -0.09436988830566406, -0.09099578857421875, -0.08762168884277344, -0.08424758911132812, -0.08087348937988281, -0.0774993896484375, -0.07412528991699219, -0.07075119018554688, -0.06737709045410156, -0.06400299072265625, -0.06062889099121094, -0.057254791259765625, -0.05388069152832031, -0.050506591796875, -0.04713249206542969, -0.043758392333984375, -0.04038429260253906, -0.03701019287109375, -0.03363609313964844, -0.030261993408203125, -0.026887893676757812, -0.0235137939453125, -0.020139694213867188, -0.016765594482421875, -0.013391494750976562, -0.01001739501953125, -0.0066432952880859375, -0.003269195556640625, 0.0001049041748046875, 0.00347900390625, 0.0068531036376953125, 0.010227203369140625, 0.013601303100585938, 0.01697540283203125, 0.020349502563476562, 0.023723602294921875, 0.027097702026367188, 0.0304718017578125, 0.03384590148925781, 0.037220001220703125, 0.04059410095214844, 0.04396820068359375, 0.04734230041503906, 0.050716400146484375, 0.05409049987792969, 0.057464599609375, 0.06083869934082031, 0.06421279907226562, 0.06758689880371094, 0.07096099853515625, 0.07433509826660156, 0.07770919799804688, 0.08108329772949219, 0.0844573974609375, 0.08783149719238281, 0.09120559692382812, 0.09457969665527344, 0.09795379638671875, 0.10132789611816406, 0.10470199584960938, 0.10807609558105469, 0.1114501953125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 9.0, 8.0, 19.0, 27.0, 35.0, 51.0, 57.0, 62.0, 72.0, 80.0, 85.0, 99.0, 60.0, 62.0, 55.0, 55.0, 44.0, 24.0, 32.0, 16.0, 18.0, 8.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031982421875, -0.030585289001464844, -0.029188156127929688, -0.02779102325439453, -0.026393890380859375, -0.02499675750732422, -0.023599624633789062, -0.022202491760253906, -0.02080535888671875, -0.019408226013183594, -0.018011093139648438, -0.01661396026611328, -0.015216827392578125, -0.013819694519042969, -0.012422561645507812, -0.011025428771972656, -0.0096282958984375, -0.008231163024902344, -0.0068340301513671875, -0.005436897277832031, -0.004039764404296875, -0.0026426315307617188, -0.0012454986572265625, 0.00015163421630859375, 0.00154876708984375, 0.0029458999633789062, 0.0043430328369140625, 0.005740165710449219, 0.007137298583984375, 0.008534431457519531, 0.009931564331054688, 0.011328697204589844, 0.012725830078125, 0.014122962951660156, 0.015520095825195312, 0.01691722869873047, 0.018314361572265625, 0.01971149444580078, 0.021108627319335938, 0.022505760192871094, 0.02390289306640625, 0.025300025939941406, 0.026697158813476562, 0.02809429168701172, 0.029491424560546875, 0.03088855743408203, 0.03228569030761719, 0.033682823181152344, 0.0350799560546875, 0.036477088928222656, 0.03787422180175781, 0.03927135467529297, 0.040668487548828125, 0.04206562042236328, 0.04346275329589844, 0.044859886169433594, 0.04625701904296875, 0.047654151916503906, 0.04905128479003906, 0.05044841766357422, 0.051845550537109375, 0.05324268341064453, 0.05463981628417969, 0.056036949157714844, 0.05743408203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 12.0, 13.0, 22.0, 30.0, 41.0, 80.0, 136.0, 239.0, 426.0, 726.0, 1420.0, 3215.0, 8155.0, 33199.0, 800467.0, 3286307.0, 43003.0, 9663.0, 3596.0, 1600.0, 858.0, 449.0, 256.0, 148.0, 81.0, 43.0, 30.0, 22.0, 12.0, 5.0, 12.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0950927734375, -0.09193038940429688, -0.08876800537109375, -0.08560562133789062, -0.0824432373046875, -0.07928085327148438, -0.07611846923828125, -0.07295608520507812, -0.069793701171875, -0.06663131713867188, -0.06346893310546875, -0.060306549072265625, -0.0571441650390625, -0.053981781005859375, -0.05081939697265625, -0.047657012939453125, -0.04449462890625, -0.041332244873046875, -0.03816986083984375, -0.035007476806640625, -0.0318450927734375, -0.028682708740234375, -0.02552032470703125, -0.022357940673828125, -0.019195556640625, -0.016033172607421875, -0.01287078857421875, -0.009708404541015625, -0.0065460205078125, -0.003383636474609375, -0.00022125244140625, 0.002941131591796875, 0.006103515625, 0.009265899658203125, 0.01242828369140625, 0.015590667724609375, 0.0187530517578125, 0.021915435791015625, 0.02507781982421875, 0.028240203857421875, 0.031402587890625, 0.034564971923828125, 0.03772735595703125, 0.040889739990234375, 0.0440521240234375, 0.047214508056640625, 0.05037689208984375, 0.053539276123046875, 0.05670166015625, 0.059864044189453125, 0.06302642822265625, 0.06618881225585938, 0.0693511962890625, 0.07251358032226562, 0.07567596435546875, 0.07883834838867188, 0.082000732421875, 0.08516311645507812, 0.08832550048828125, 0.09148788452148438, 0.0946502685546875, 0.09781265258789062, 0.10097503662109375, 0.10413742065429688, 0.1072998046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 9.0, 2.0, 9.0, 12.0, 16.0, 25.0, 45.0, 90.0, 286.0, 2779.0, 554.0, 124.0, 45.0, 29.0, 12.0, 9.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0927734375, -0.09078598022460938, -0.08879852294921875, -0.08681106567382812, -0.0848236083984375, -0.08283615112304688, -0.08084869384765625, -0.07886123657226562, -0.076873779296875, -0.07488632202148438, -0.07289886474609375, -0.07091140747070312, -0.0689239501953125, -0.06693649291992188, -0.06494903564453125, -0.06296157836914062, -0.06097412109375, -0.058986663818359375, -0.05699920654296875, -0.055011749267578125, -0.0530242919921875, -0.051036834716796875, -0.04904937744140625, -0.047061920166015625, -0.045074462890625, -0.043087005615234375, -0.04109954833984375, -0.039112091064453125, -0.0371246337890625, -0.035137176513671875, -0.03314971923828125, -0.031162261962890625, -0.0291748046875, -0.027187347412109375, -0.02519989013671875, -0.023212432861328125, -0.0212249755859375, -0.019237518310546875, -0.01725006103515625, -0.015262603759765625, -0.013275146484375, -0.011287689208984375, -0.00930023193359375, -0.007312774658203125, -0.0053253173828125, -0.003337860107421875, -0.00135040283203125, 0.000637054443359375, 0.00262451171875, 0.004611968994140625, 0.00659942626953125, 0.008586883544921875, 0.0105743408203125, 0.012561798095703125, 0.01454925537109375, 0.016536712646484375, 0.018524169921875, 0.020511627197265625, 0.02249908447265625, 0.024486541748046875, 0.0264739990234375, 0.028461456298828125, 0.03044891357421875, 0.032436370849609375, 0.034423828125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 17.0, 227.0, 750.0, 17.0, 3.0], "bins": [-3.605652332305908, -3.5468263626098633, -3.4880003929138184, -3.4291741847991943, -3.3703482151031494, -3.3115222454071045, -3.2526960372924805, -3.1938700675964355, -3.1350440979003906, -3.0762181282043457, -3.017392158508301, -2.9585659503936768, -2.899739980697632, -2.840914011001587, -2.782087802886963, -2.723261833190918, -2.664435863494873, -2.605609893798828, -2.546783924102783, -2.487957715988159, -2.4291317462921143, -2.3703057765960693, -2.3114795684814453, -2.2526535987854004, -2.1938276290893555, -2.1350016593933105, -2.0761756896972656, -2.0173494815826416, -1.9585235118865967, -1.8996975421905518, -1.8408714532852173, -1.7820453643798828, -1.723219394683838, -1.664393424987793, -1.6055673360824585, -1.546741247177124, -1.487915277481079, -1.4290893077850342, -1.3702632188796997, -1.3114371299743652, -1.2526111602783203, -1.1937851905822754, -1.134959101676941, -1.0761330127716064, -1.0173070430755615, -0.9584810137748718, -0.8996549844741821, -0.8408289551734924, -0.7820029258728027, -0.723176896572113, -0.6643508672714233, -0.6055248379707336, -0.546698808670044, -0.48787277936935425, -0.42904675006866455, -0.37022072076797485, -0.31139469146728516, -0.25256866216659546, -0.19374263286590576, -0.13491660356521606, -0.07609057426452637, -0.01726454496383667, 0.04156148433685303, 0.10038751363754272, 0.15921355783939362]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 7.0, 17.0, 23.0, 33.0, 47.0, 58.0, 81.0, 67.0, 89.0, 101.0, 85.0, 74.0, 79.0, 55.0, 46.0, 36.0, 38.0, 21.0, 8.0, 9.0, 3.0, 8.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2488701343536377, -0.24163968861103058, -0.23440924286842346, -0.22717881202697754, -0.21994836628437042, -0.2127179205417633, -0.2054874747991562, -0.19825702905654907, -0.19102659821510315, -0.18379615247249603, -0.17656570672988892, -0.169335275888443, -0.16210483014583588, -0.15487438440322876, -0.14764393866062164, -0.14041349291801453, -0.1331830471754074, -0.1259526014328003, -0.11872216314077377, -0.11149171739816666, -0.10426127910614014, -0.09703083336353302, -0.0898003876209259, -0.08256994187831879, -0.07533950358629227, -0.06810905784368515, -0.06087861955165863, -0.053648173809051514, -0.046417731791734695, -0.03918728977441788, -0.03195684403181076, -0.024726402014493942, -0.017495959997177124, -0.010265517048537731, -0.0030350740998983383, 0.004195369780063629, 0.011425811797380447, 0.018656253814697266, 0.025886699557304382, 0.0331171415746212, 0.04034758359193802, 0.04757802560925484, 0.054808467626571655, 0.06203891336917877, 0.06926935911178589, 0.07649979740381241, 0.08373024314641953, 0.09096068143844604, 0.09819112718105316, 0.10542157292366028, 0.1126520112156868, 0.11988245695829391, 0.12711289525032043, 0.13434334099292755, 0.14157378673553467, 0.14880423247814178, 0.1560346782207489, 0.16326512396335602, 0.17049556970596313, 0.17772600054740906, 0.18495644629001617, 0.1921868920326233, 0.1994173377752304, 0.20664778351783752, 0.21387821435928345]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 3.0, 5.0, 5.0, 6.0, 13.0, 14.0, 27.0, 30.0, 42.0, 88.0, 127.0, 205.0, 419.0, 809.0, 1701.0, 4501.0, 14313.0, 64728.0, 388660.0, 465657.0, 80997.0, 17242.0, 5129.0, 1886.0, 821.0, 439.0, 275.0, 169.0, 87.0, 44.0, 37.0, 21.0, 17.0, 10.0, 11.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09112548828125, -0.08828353881835938, -0.08544158935546875, -0.08259963989257812, -0.0797576904296875, -0.07691574096679688, -0.07407379150390625, -0.07123184204101562, -0.068389892578125, -0.06554794311523438, -0.06270599365234375, -0.059864044189453125, -0.0570220947265625, -0.054180145263671875, -0.05133819580078125, -0.048496246337890625, -0.045654296875, -0.042812347412109375, -0.03997039794921875, -0.037128448486328125, -0.0342864990234375, -0.031444549560546875, -0.02860260009765625, -0.025760650634765625, -0.022918701171875, -0.020076751708984375, -0.01723480224609375, -0.014392852783203125, -0.0115509033203125, -0.008708953857421875, -0.00586700439453125, -0.003025054931640625, -0.00018310546875, 0.002658843994140625, 0.00550079345703125, 0.008342742919921875, 0.0111846923828125, 0.014026641845703125, 0.01686859130859375, 0.019710540771484375, 0.022552490234375, 0.025394439697265625, 0.02823638916015625, 0.031078338623046875, 0.0339202880859375, 0.036762237548828125, 0.03960418701171875, 0.042446136474609375, 0.0452880859375, 0.048130035400390625, 0.05097198486328125, 0.053813934326171875, 0.0566558837890625, 0.059497833251953125, 0.06233978271484375, 0.06518173217773438, 0.068023681640625, 0.07086563110351562, 0.07370758056640625, 0.07654953002929688, 0.0793914794921875, 0.08223342895507812, 0.08507537841796875, 0.08791732788085938, 0.09075927734375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 5.0, 5.0, 8.0, 3.0, 20.0, 19.0, 40.0, 40.0, 43.0, 61.0, 55.0, 68.0, 64.0, 66.0, 77.0, 68.0, 64.0, 70.0, 58.0, 40.0, 29.0, 28.0, 15.0, 11.0, 20.0, 11.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034454345703125, -0.03312206268310547, -0.03178977966308594, -0.030457496643066406, -0.029125213623046875, -0.027792930603027344, -0.026460647583007812, -0.02512836456298828, -0.02379608154296875, -0.02246379852294922, -0.021131515502929688, -0.019799232482910156, -0.018466949462890625, -0.017134666442871094, -0.015802383422851562, -0.014470100402832031, -0.0131378173828125, -0.011805534362792969, -0.010473251342773438, -0.009140968322753906, -0.007808685302734375, -0.006476402282714844, -0.0051441192626953125, -0.0038118362426757812, -0.00247955322265625, -0.0011472702026367188, 0.0001850128173828125, 0.0015172958374023438, 0.002849578857421875, 0.004181861877441406, 0.0055141448974609375, 0.006846427917480469, 0.0081787109375, 0.009510993957519531, 0.010843276977539062, 0.012175559997558594, 0.013507843017578125, 0.014840126037597656, 0.016172409057617188, 0.01750469207763672, 0.01883697509765625, 0.02016925811767578, 0.021501541137695312, 0.022833824157714844, 0.024166107177734375, 0.025498390197753906, 0.026830673217773438, 0.02816295623779297, 0.0294952392578125, 0.03082752227783203, 0.03215980529785156, 0.033492088317871094, 0.034824371337890625, 0.036156654357910156, 0.03748893737792969, 0.03882122039794922, 0.04015350341796875, 0.04148578643798828, 0.04281806945800781, 0.044150352478027344, 0.045482635498046875, 0.046814918518066406, 0.04814720153808594, 0.04947948455810547, 0.050811767578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 1.0, 9.0, 7.0, 17.0, 14.0, 27.0, 22.0, 40.0, 62.0, 66.0, 92.0, 139.0, 201.0, 353.0, 691.0, 1982.0, 7511.0, 41253.0, 397017.0, 530545.0, 54899.0, 9189.0, 2400.0, 873.0, 404.0, 207.0, 130.0, 95.0, 66.0, 72.0, 37.0, 41.0, 24.0, 11.0, 18.0, 16.0, 3.0, 3.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0909423828125, -0.08801555633544922, -0.08508872985839844, -0.08216190338134766, -0.07923507690429688, -0.0763082504272461, -0.07338142395019531, -0.07045459747314453, -0.06752777099609375, -0.06460094451904297, -0.06167411804199219, -0.058747291564941406, -0.055820465087890625, -0.052893638610839844, -0.04996681213378906, -0.04703998565673828, -0.0441131591796875, -0.04118633270263672, -0.03825950622558594, -0.035332679748535156, -0.032405853271484375, -0.029479026794433594, -0.026552200317382812, -0.02362537384033203, -0.02069854736328125, -0.01777172088623047, -0.014844894409179688, -0.011918067932128906, -0.008991241455078125, -0.006064414978027344, -0.0031375885009765625, -0.00021076202392578125, 0.002716064453125, 0.005642890930175781, 0.008569717407226562, 0.011496543884277344, 0.014423370361328125, 0.017350196838378906, 0.020277023315429688, 0.02320384979248047, 0.02613067626953125, 0.02905750274658203, 0.03198432922363281, 0.034911155700683594, 0.037837982177734375, 0.040764808654785156, 0.04369163513183594, 0.04661846160888672, 0.0495452880859375, 0.05247211456298828, 0.05539894104003906, 0.058325767517089844, 0.061252593994140625, 0.0641794204711914, 0.06710624694824219, 0.07003307342529297, 0.07295989990234375, 0.07588672637939453, 0.07881355285644531, 0.0817403793334961, 0.08466720581054688, 0.08759403228759766, 0.09052085876464844, 0.09344768524169922, 0.09637451171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 6.0, 7.0, 10.0, 9.0, 9.0, 13.0, 17.0, 22.0, 21.0, 26.0, 26.0, 39.0, 47.0, 29.0, 46.0, 32.0, 50.0, 46.0, 47.0, 34.0, 48.0, 29.0, 41.0, 42.0, 42.0, 35.0, 28.0, 30.0, 30.0, 21.0, 19.0, 19.0, 16.0, 15.0, 11.0, 12.0, 5.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1112060546875, -0.10784339904785156, -0.10448074340820312, -0.10111808776855469, -0.09775543212890625, -0.09439277648925781, -0.09103012084960938, -0.08766746520996094, -0.0843048095703125, -0.08094215393066406, -0.07757949829101562, -0.07421684265136719, -0.07085418701171875, -0.06749153137207031, -0.06412887573242188, -0.06076622009277344, -0.057403564453125, -0.05404090881347656, -0.050678253173828125, -0.04731559753417969, -0.04395294189453125, -0.04059028625488281, -0.037227630615234375, -0.03386497497558594, -0.0305023193359375, -0.027139663696289062, -0.023777008056640625, -0.020414352416992188, -0.01705169677734375, -0.013689041137695312, -0.010326385498046875, -0.0069637298583984375, -0.00360107421875, -0.0002384185791015625, 0.003124237060546875, 0.0064868927001953125, 0.00984954833984375, 0.013212203979492188, 0.016574859619140625, 0.019937515258789062, 0.0233001708984375, 0.026662826538085938, 0.030025482177734375, 0.03338813781738281, 0.03675079345703125, 0.04011344909667969, 0.043476104736328125, 0.04683876037597656, 0.050201416015625, 0.05356407165527344, 0.056926727294921875, 0.06028938293457031, 0.06365203857421875, 0.06701469421386719, 0.07037734985351562, 0.07374000549316406, 0.0771026611328125, 0.08046531677246094, 0.08382797241210938, 0.08719062805175781, 0.09055328369140625, 0.09391593933105469, 0.09727859497070312, 0.10064125061035156, 0.10400390625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 13.0, 19.0, 15.0, 34.0, 48.0, 110.0, 114.0, 255.0, 537.0, 1142.0, 3140.0, 13649.0, 114509.0, 807799.0, 90483.0, 11666.0, 2861.0, 1058.0, 479.0, 242.0, 132.0, 84.0, 47.0, 29.0, 21.0, 14.0, 13.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05743408203125, -0.055814266204833984, -0.05419445037841797, -0.05257463455200195, -0.05095481872558594, -0.04933500289916992, -0.047715187072753906, -0.04609537124633789, -0.044475555419921875, -0.04285573959350586, -0.041235923767089844, -0.03961610794067383, -0.03799629211425781, -0.0363764762878418, -0.03475666046142578, -0.033136844635009766, -0.03151702880859375, -0.029897212982177734, -0.02827739715576172, -0.026657581329345703, -0.025037765502929688, -0.023417949676513672, -0.021798133850097656, -0.02017831802368164, -0.018558502197265625, -0.01693868637084961, -0.015318870544433594, -0.013699054718017578, -0.012079238891601562, -0.010459423065185547, -0.008839607238769531, -0.007219791412353516, -0.0055999755859375, -0.003980159759521484, -0.0023603439331054688, -0.0007405281066894531, 0.0008792877197265625, 0.002499103546142578, 0.004118919372558594, 0.005738735198974609, 0.007358551025390625, 0.00897836685180664, 0.010598182678222656, 0.012217998504638672, 0.013837814331054688, 0.015457630157470703, 0.01707744598388672, 0.018697261810302734, 0.02031707763671875, 0.021936893463134766, 0.02355670928955078, 0.025176525115966797, 0.026796340942382812, 0.028416156768798828, 0.030035972595214844, 0.03165578842163086, 0.033275604248046875, 0.03489542007446289, 0.036515235900878906, 0.03813505172729492, 0.03975486755371094, 0.04137468338012695, 0.04299449920654297, 0.044614315032958984, 0.046234130859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 11.0, 16.0, 16.0, 29.0, 41.0, 40.0, 47.0, 67.0, 69.0, 92.0, 91.0, 74.0, 62.0, 78.0, 56.0, 53.0, 34.0, 25.0, 31.0, 5.0, 18.0, 6.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.867813110351562e-06, -7.63777643442154e-06, -7.407739758491516e-06, -7.177703082561493e-06, -6.94766640663147e-06, -6.7176297307014465e-06, -6.487593054771423e-06, -6.2575563788414e-06, -6.027519702911377e-06, -5.797483026981354e-06, -5.5674463510513306e-06, -5.337409675121307e-06, -5.107372999191284e-06, -4.877336323261261e-06, -4.647299647331238e-06, -4.417262971401215e-06, -4.187226295471191e-06, -3.957189619541168e-06, -3.727152943611145e-06, -3.497116267681122e-06, -3.2670795917510986e-06, -3.0370429158210754e-06, -2.8070062398910522e-06, -2.576969563961029e-06, -2.346932888031006e-06, -2.1168962121009827e-06, -1.8868595361709595e-06, -1.6568228602409363e-06, -1.426786184310913e-06, -1.1967495083808899e-06, -9.667128324508667e-07, -7.366761565208435e-07, -5.066394805908203e-07, -2.766028046607971e-07, -4.6566128730773926e-08, 1.8347054719924927e-07, 4.1350722312927246e-07, 6.435438990592957e-07, 8.735805749893188e-07, 1.103617250919342e-06, 1.3336539268493652e-06, 1.5636906027793884e-06, 1.7937272787094116e-06, 2.023763954639435e-06, 2.253800630569458e-06, 2.483837306499481e-06, 2.7138739824295044e-06, 2.9439106583595276e-06, 3.1739473342895508e-06, 3.403984010219574e-06, 3.634020686149597e-06, 3.86405736207962e-06, 4.0940940380096436e-06, 4.324130713939667e-06, 4.55416738986969e-06, 4.784204065799713e-06, 5.014240741729736e-06, 5.2442774176597595e-06, 5.474314093589783e-06, 5.704350769519806e-06, 5.934387445449829e-06, 6.164424121379852e-06, 6.3944607973098755e-06, 6.624497473239899e-06, 6.854534149169922e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 8.0, 7.0, 8.0, 21.0, 40.0, 95.0, 175.0, 398.0, 948.0, 2721.0, 11399.0, 104733.0, 814840.0, 97636.0, 11094.0, 2668.0, 958.0, 441.0, 159.0, 98.0, 41.0, 18.0, 13.0, 4.0, 8.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048431396484375, -0.04666948318481445, -0.044907569885253906, -0.04314565658569336, -0.04138374328613281, -0.039621829986572266, -0.03785991668701172, -0.03609800338745117, -0.034336090087890625, -0.03257417678833008, -0.03081226348876953, -0.029050350189208984, -0.027288436889648438, -0.02552652359008789, -0.023764610290527344, -0.022002696990966797, -0.02024078369140625, -0.018478870391845703, -0.016716957092285156, -0.01495504379272461, -0.013193130493164062, -0.011431217193603516, -0.009669303894042969, -0.007907390594482422, -0.006145477294921875, -0.004383563995361328, -0.0026216506958007812, -0.0008597373962402344, 0.0009021759033203125, 0.0026640892028808594, 0.004426002502441406, 0.006187915802001953, 0.0079498291015625, 0.009711742401123047, 0.011473655700683594, 0.01323556900024414, 0.014997482299804688, 0.016759395599365234, 0.01852130889892578, 0.020283222198486328, 0.022045135498046875, 0.023807048797607422, 0.02556896209716797, 0.027330875396728516, 0.029092788696289062, 0.03085470199584961, 0.032616615295410156, 0.0343785285949707, 0.03614044189453125, 0.0379023551940918, 0.039664268493652344, 0.04142618179321289, 0.04318809509277344, 0.044950008392333984, 0.04671192169189453, 0.04847383499145508, 0.050235748291015625, 0.05199766159057617, 0.05375957489013672, 0.055521488189697266, 0.05728340148925781, 0.05904531478881836, 0.060807228088378906, 0.06256914138793945, 0.0643310546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 14.0, 27.0, 65.0, 100.0, 176.0, 194.0, 160.0, 104.0, 55.0, 32.0, 27.0, 6.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05926513671875, -0.057114601135253906, -0.05496406555175781, -0.05281352996826172, -0.050662994384765625, -0.04851245880126953, -0.04636192321777344, -0.044211387634277344, -0.04206085205078125, -0.039910316467285156, -0.03775978088378906, -0.03560924530029297, -0.033458709716796875, -0.03130817413330078, -0.029157638549804688, -0.027007102966308594, -0.0248565673828125, -0.022706031799316406, -0.020555496215820312, -0.01840496063232422, -0.016254425048828125, -0.014103889465332031, -0.011953353881835938, -0.009802818298339844, -0.00765228271484375, -0.005501747131347656, -0.0033512115478515625, -0.0012006759643554688, 0.000949859619140625, 0.0031003952026367188, 0.0052509307861328125, 0.007401466369628906, 0.009552001953125, 0.011702537536621094, 0.013853073120117188, 0.01600360870361328, 0.018154144287109375, 0.02030467987060547, 0.022455215454101562, 0.024605751037597656, 0.02675628662109375, 0.028906822204589844, 0.031057357788085938, 0.03320789337158203, 0.035358428955078125, 0.03750896453857422, 0.03965950012207031, 0.041810035705566406, 0.0439605712890625, 0.046111106872558594, 0.04826164245605469, 0.05041217803955078, 0.052562713623046875, 0.05471324920654297, 0.05686378479003906, 0.059014320373535156, 0.06116485595703125, 0.06331539154052734, 0.06546592712402344, 0.06761646270751953, 0.06976699829101562, 0.07191753387451172, 0.07406806945800781, 0.0762186050415039, 0.078369140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 9.0, 12.0, 26.0, 34.0, 82.0, 162.0, 209.0, 187.0, 132.0, 82.0, 32.0, 19.0, 10.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.593990683555603, -0.5698919296264648, -0.5457931756973267, -0.5216944217681885, -0.49759572744369507, -0.4734969735145569, -0.4493982195854187, -0.4252994656562805, -0.4012007415294647, -0.37710198760032654, -0.35300326347351074, -0.32890450954437256, -0.3048057556152344, -0.2807070314884186, -0.2566082775592804, -0.2325095385313034, -0.20841079950332642, -0.18431206047534943, -0.16021332144737244, -0.13611456751823425, -0.11201582849025726, -0.08791708946228027, -0.06381833553314209, -0.0397195965051651, -0.01562085747718811, 0.008477885276079178, 0.032576628029346466, 0.05667537450790405, 0.08077411353588104, 0.10487285256385803, 0.12897160649299622, 0.1530703455209732, 0.17716902494430542, 0.2012677639722824, 0.2253665030002594, 0.24946525692939758, 0.2735639810562134, 0.29766273498535156, 0.32176148891448975, 0.34586024284362793, 0.3699589669704437, 0.3940577208995819, 0.4181564450263977, 0.4422551989555359, 0.4663539528846741, 0.49045267701148987, 0.5145514011383057, 0.5386501550674438, 0.562748908996582, 0.5868476629257202, 0.6109464168548584, 0.6350451707839966, 0.65914386510849, 0.6832426190376282, 0.7073413729667664, 0.7314401268959045, 0.755538821220398, 0.7796375751495361, 0.8037363290786743, 0.8278350830078125, 0.8519337773323059, 0.8760325312614441, 0.9001312851905823, 0.9242300391197205, 0.9483287930488586]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 11.0, 7.0, 10.0, 5.0, 6.0, 14.0, 13.0, 14.0, 27.0, 20.0, 26.0, 20.0, 30.0, 34.0, 26.0, 42.0, 34.0, 41.0, 42.0, 43.0, 43.0, 35.0, 37.0, 31.0, 38.0, 33.0, 36.0, 32.0, 40.0, 24.0, 24.0, 29.0, 15.0, 12.0, 23.0, 21.0, 9.0, 12.0, 13.0, 8.0, 3.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5212919116020203, -0.5057680010795593, -0.4902441203594208, -0.47472020983695984, -0.4591963291168213, -0.44367241859436035, -0.4281485378742218, -0.41262462735176086, -0.3971007466316223, -0.3815768361091614, -0.3660529553890228, -0.3505290448665619, -0.33500516414642334, -0.3194812536239624, -0.30395737290382385, -0.2884334623813629, -0.27290958166122437, -0.2573856711387634, -0.24186179041862488, -0.22633789479732513, -0.2108139991760254, -0.19529008865356445, -0.1797662079334259, -0.16424229741096497, -0.14871838688850403, -0.13319449126720428, -0.11767059564590454, -0.1021467000246048, -0.08662280440330505, -0.07109890133142471, -0.05557500571012497, -0.040051110088825226, -0.02452722191810608, -0.00900332536548376, 0.0065205711871385574, 0.02204446867108345, 0.037568364292383194, 0.053092263638973236, 0.06861615926027298, 0.08414005488157272, 0.09966395050287247, 0.11518784612417221, 0.13071174919605255, 0.1462356448173523, 0.16175954043865204, 0.17728343605995178, 0.19280733168125153, 0.20833122730255127, 0.223855122923851, 0.23937901854515076, 0.2549029290676117, 0.27042680978775024, 0.2859507203102112, 0.30147460103034973, 0.31699851155281067, 0.3325223922729492, 0.34804630279541016, 0.3635702133178711, 0.37909409403800964, 0.3946180045604706, 0.41014188528060913, 0.42566579580307007, 0.4411896765232086, 0.45671358704566956, 0.4722374677658081]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 16.0, 20.0, 11.0, 22.0, 23.0, 41.0, 73.0, 129.0, 180.0, 261.0, 476.0, 871.0, 2111.0, 7004.0, 134735.0, 4035144.0, 8534.0, 2401.0, 893.0, 502.0, 281.0, 171.0, 119.0, 66.0, 58.0, 33.0, 26.0, 27.0, 18.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.0848388671875, -0.080810546875, -0.0767822265625, -0.07275390625, -0.0687255859375, -0.064697265625, -0.0606689453125, -0.056640625, -0.0526123046875, -0.048583984375, -0.0445556640625, -0.04052734375, -0.0364990234375, -0.032470703125, -0.0284423828125, -0.0244140625, -0.0203857421875, -0.016357421875, -0.0123291015625, -0.00830078125, -0.0042724609375, -0.000244140625, 0.0037841796875, 0.0078125, 0.0118408203125, 0.015869140625, 0.0198974609375, 0.02392578125, 0.0279541015625, 0.031982421875, 0.0360107421875, 0.0400390625, 0.0440673828125, 0.048095703125, 0.0521240234375, 0.05615234375, 0.0601806640625, 0.064208984375, 0.0682373046875, 0.072265625, 0.0762939453125, 0.080322265625, 0.0843505859375, 0.08837890625, 0.0924072265625, 0.096435546875, 0.1004638671875, 0.1044921875, 0.1085205078125, 0.112548828125, 0.1165771484375, 0.12060546875, 0.1246337890625, 0.128662109375, 0.1326904296875, 0.13671875, 0.1407470703125, 0.144775390625, 0.1488037109375, 0.15283203125, 0.1568603515625, 0.160888671875, 0.1649169921875, 0.1689453125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 11.0, 13.0, 23.0, 25.0, 39.0, 54.0, 65.0, 61.0, 68.0, 77.0, 79.0, 83.0, 67.0, 71.0, 66.0, 48.0, 40.0, 27.0, 24.0, 10.0, 15.0, 8.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035308837890625, -0.03381681442260742, -0.032324790954589844, -0.030832767486572266, -0.029340744018554688, -0.02784872055053711, -0.02635669708251953, -0.024864673614501953, -0.023372650146484375, -0.021880626678466797, -0.02038860321044922, -0.01889657974243164, -0.017404556274414062, -0.015912532806396484, -0.014420509338378906, -0.012928485870361328, -0.01143646240234375, -0.009944438934326172, -0.008452415466308594, -0.006960391998291016, -0.0054683685302734375, -0.003976345062255859, -0.0024843215942382812, -0.0009922981262207031, 0.000499725341796875, 0.001991748809814453, 0.0034837722778320312, 0.004975795745849609, 0.0064678192138671875, 0.007959842681884766, 0.009451866149902344, 0.010943889617919922, 0.0124359130859375, 0.013927936553955078, 0.015419960021972656, 0.016911983489990234, 0.018404006958007812, 0.01989603042602539, 0.02138805389404297, 0.022880077362060547, 0.024372100830078125, 0.025864124298095703, 0.02735614776611328, 0.02884817123413086, 0.030340194702148438, 0.031832218170166016, 0.033324241638183594, 0.03481626510620117, 0.03630828857421875, 0.03780031204223633, 0.039292335510253906, 0.040784358978271484, 0.04227638244628906, 0.04376840591430664, 0.04526042938232422, 0.0467524528503418, 0.048244476318359375, 0.04973649978637695, 0.05122852325439453, 0.05272054672241211, 0.05421257019042969, 0.055704593658447266, 0.057196617126464844, 0.05868864059448242, 0.0601806640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 4.0, 9.0, 10.0, 16.0, 20.0, 23.0, 40.0, 62.0, 70.0, 114.0, 155.0, 212.0, 362.0, 601.0, 1053.0, 2081.0, 5984.0, 34175.0, 4102124.0, 36078.0, 6100.0, 2220.0, 1080.0, 592.0, 370.0, 249.0, 148.0, 95.0, 70.0, 36.0, 36.0, 30.0, 17.0, 10.0, 8.0, 9.0, 3.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0703125, -0.06755638122558594, -0.06480026245117188, -0.06204414367675781, -0.05928802490234375, -0.05653190612792969, -0.053775787353515625, -0.05101966857910156, -0.0482635498046875, -0.04550743103027344, -0.042751312255859375, -0.03999519348144531, -0.03723907470703125, -0.03448295593261719, -0.031726837158203125, -0.028970718383789062, -0.026214599609375, -0.023458480834960938, -0.020702362060546875, -0.017946243286132812, -0.01519012451171875, -0.012434005737304688, -0.009677886962890625, -0.0069217681884765625, -0.0041656494140625, -0.0014095306396484375, 0.001346588134765625, 0.0041027069091796875, 0.00685882568359375, 0.009614944458007812, 0.012371063232421875, 0.015127182006835938, 0.01788330078125, 0.020639419555664062, 0.023395538330078125, 0.026151657104492188, 0.02890777587890625, 0.03166389465332031, 0.034420013427734375, 0.03717613220214844, 0.0399322509765625, 0.04268836975097656, 0.045444488525390625, 0.04820060729980469, 0.05095672607421875, 0.05371284484863281, 0.056468963623046875, 0.05922508239746094, 0.061981201171875, 0.06473731994628906, 0.06749343872070312, 0.07024955749511719, 0.07300567626953125, 0.07576179504394531, 0.07851791381835938, 0.08127403259277344, 0.0840301513671875, 0.08678627014160156, 0.08954238891601562, 0.09229850769042969, 0.09505462646484375, 0.09781074523925781, 0.10056686401367188, 0.10332298278808594, 0.1060791015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 11.0, 18.0, 27.0, 77.0, 3608.0, 217.0, 56.0, 16.0, 9.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.018157958984375, -0.017637014389038086, -0.017116069793701172, -0.016595125198364258, -0.016074180603027344, -0.01555323600769043, -0.015032291412353516, -0.014511346817016602, -0.013990402221679688, -0.013469457626342773, -0.01294851303100586, -0.012427568435668945, -0.011906623840332031, -0.011385679244995117, -0.010864734649658203, -0.010343790054321289, -0.009822845458984375, -0.009301900863647461, -0.008780956268310547, -0.008260011672973633, -0.007739067077636719, -0.007218122482299805, -0.006697177886962891, -0.0061762332916259766, -0.0056552886962890625, -0.0051343441009521484, -0.004613399505615234, -0.00409245491027832, -0.0035715103149414062, -0.003050565719604492, -0.002529621124267578, -0.002008676528930664, -0.00148773193359375, -0.0009667873382568359, -0.0004458427429199219, 7.510185241699219e-05, 0.0005960464477539062, 0.0011169910430908203, 0.0016379356384277344, 0.0021588802337646484, 0.0026798248291015625, 0.0032007694244384766, 0.0037217140197753906, 0.004242658615112305, 0.004763603210449219, 0.005284547805786133, 0.005805492401123047, 0.006326436996459961, 0.006847381591796875, 0.007368326187133789, 0.007889270782470703, 0.008410215377807617, 0.008931159973144531, 0.009452104568481445, 0.00997304916381836, 0.010493993759155273, 0.011014938354492188, 0.011535882949829102, 0.012056827545166016, 0.01257777214050293, 0.013098716735839844, 0.013619661331176758, 0.014140605926513672, 0.014661550521850586, 0.0151824951171875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 8.0, 1.0, 7.0, 8.0, 7.0, 13.0, 21.0, 38.0, 36.0, 70.0, 82.0, 85.0, 101.0, 119.0, 122.0, 74.0, 67.0, 49.0, 34.0, 22.0, 19.0, 8.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0473005585372448, -0.045961614698171616, -0.04462267458438873, -0.04328373074531555, -0.04194479063153267, -0.04060584679245949, -0.039266906678676605, -0.037927962839603424, -0.03658902272582054, -0.03525007888674736, -0.03391113877296448, -0.032572194933891296, -0.031233254820108414, -0.029894312843680382, -0.02855537086725235, -0.02721642702817917, -0.025877485051751137, -0.024538543075323105, -0.023199601098895073, -0.02186065912246704, -0.02052171714603901, -0.019182775169610977, -0.017843831330537796, -0.016504891216754913, -0.015165948309004307, -0.013827006332576275, -0.012488064356148243, -0.011149121448397636, -0.009810179471969604, -0.008471237495541573, -0.007132295519113541, -0.005793353542685509, -0.004454411566257477, -0.003115469589829445, -0.0017765273805707693, -0.00043758517131209373, 0.0009013568051159382, 0.00224029878154397, 0.0035792412236332893, 0.004918183200061321, 0.006257125176489353, 0.007596067152917385, 0.008935009129345417, 0.010273952037096024, 0.011612894013524055, 0.012951835989952087, 0.01429077796638012, 0.01562971994280815, 0.016968661919236183, 0.018307603895664215, 0.019646545872092247, 0.02098548784852028, 0.02232442982494831, 0.023663371801376343, 0.025002315640449524, 0.026341255754232407, 0.027680199593305588, 0.02901914156973362, 0.03035808354616165, 0.03169702738523483, 0.033035967499017715, 0.0343749113380909, 0.03571385145187378, 0.03705279529094696, 0.03839173540472984]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 17.0, 12.0, 15.0, 8.0, 19.0, 17.0, 23.0, 33.0, 24.0, 40.0, 36.0, 35.0, 30.0, 30.0, 31.0, 41.0, 47.0, 32.0, 38.0, 41.0, 48.0, 49.0, 28.0, 36.0, 30.0, 33.0, 24.0, 23.0, 19.0, 21.0, 19.0, 16.0, 19.0, 13.0, 5.0, 8.0, 10.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.02288973331451416, -0.02215542271733284, -0.02142111398279667, -0.020686805248260498, -0.019952494651079178, -0.019218184053897858, -0.018483875319361687, -0.017749566584825516, -0.017015255987644196, -0.016280945390462875, -0.015546636655926704, -0.014812326990067959, -0.014078017324209213, -0.013343707658350468, -0.012609397992491722, -0.011875088326632977, -0.011140778660774231, -0.010406468994915485, -0.00967215932905674, -0.008937849663197994, -0.008203539997339249, -0.007469230331480503, -0.0067349206656217575, -0.006000610999763012, -0.005266301333904266, -0.004531991668045521, -0.003797682002186775, -0.0030633723363280296, -0.002329062670469284, -0.0015947530046105385, -0.0008604433387517929, -0.00012613367289304733, 0.0006081759929656982, 0.0013424856588244438, 0.0020767953246831894, 0.002811104990541935, 0.0035454146564006805, 0.004279724322259426, 0.005014033988118172, 0.005748343653976917, 0.006482653319835663, 0.007216962985694408, 0.007951272651553154, 0.0086855823174119, 0.009419891983270645, 0.01015420164912939, 0.010888511314988136, 0.011622820980846882, 0.012357130646705627, 0.013091440312564373, 0.013825749978423119, 0.014560059644281864, 0.01529436931014061, 0.01602867990732193, 0.0167629886418581, 0.017497297376394272, 0.018231607973575592, 0.018965918570756912, 0.019700227305293083, 0.020434536039829254, 0.021168846637010574, 0.021903157234191895, 0.022637465968728065, 0.023371774703264236, 0.024106085300445557]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 9.0, 14.0, 19.0, 36.0, 66.0, 94.0, 161.0, 267.0, 493.0, 1026.0, 2353.0, 6582.0, 22259.0, 88294.0, 354772.0, 418966.0, 112303.0, 27580.0, 7940.0, 2781.0, 1160.0, 582.0, 337.0, 158.0, 101.0, 65.0, 37.0, 27.0, 18.0, 12.0, 5.0, 8.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0693359375, -0.06710529327392578, -0.06487464904785156, -0.06264400482177734, -0.060413360595703125, -0.058182716369628906, -0.05595207214355469, -0.05372142791748047, -0.05149078369140625, -0.04926013946533203, -0.04702949523925781, -0.044798851013183594, -0.042568206787109375, -0.040337562561035156, -0.03810691833496094, -0.03587627410888672, -0.0336456298828125, -0.03141498565673828, -0.029184341430664062, -0.026953697204589844, -0.024723052978515625, -0.022492408752441406, -0.020261764526367188, -0.01803112030029297, -0.01580047607421875, -0.013569831848144531, -0.011339187622070312, -0.009108543395996094, -0.006877899169921875, -0.004647254943847656, -0.0024166107177734375, -0.00018596649169921875, 0.002044677734375, 0.004275321960449219, 0.0065059661865234375, 0.008736610412597656, 0.010967254638671875, 0.013197898864746094, 0.015428543090820312, 0.01765918731689453, 0.01988983154296875, 0.02212047576904297, 0.024351119995117188, 0.026581764221191406, 0.028812408447265625, 0.031043052673339844, 0.03327369689941406, 0.03550434112548828, 0.0377349853515625, 0.03996562957763672, 0.04219627380371094, 0.044426918029785156, 0.046657562255859375, 0.048888206481933594, 0.05111885070800781, 0.05334949493408203, 0.05558013916015625, 0.05781078338623047, 0.06004142761230469, 0.062272071838378906, 0.06450271606445312, 0.06673336029052734, 0.06896400451660156, 0.07119464874267578, 0.07342529296875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 11.0, 18.0, 25.0, 33.0, 38.0, 46.0, 52.0, 69.0, 68.0, 74.0, 71.0, 69.0, 74.0, 65.0, 62.0, 46.0, 44.0, 41.0, 23.0, 20.0, 10.0, 11.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035308837890625, -0.03382587432861328, -0.03234291076660156, -0.030859947204589844, -0.029376983642578125, -0.027894020080566406, -0.026411056518554688, -0.02492809295654297, -0.02344512939453125, -0.02196216583251953, -0.020479202270507812, -0.018996238708496094, -0.017513275146484375, -0.016030311584472656, -0.014547348022460938, -0.013064384460449219, -0.0115814208984375, -0.010098457336425781, -0.008615493774414062, -0.007132530212402344, -0.005649566650390625, -0.004166603088378906, -0.0026836395263671875, -0.0012006759643554688, 0.00028228759765625, 0.0017652511596679688, 0.0032482147216796875, 0.004731178283691406, 0.006214141845703125, 0.007697105407714844, 0.009180068969726562, 0.010663032531738281, 0.01214599609375, 0.013628959655761719, 0.015111923217773438, 0.016594886779785156, 0.018077850341796875, 0.019560813903808594, 0.021043777465820312, 0.02252674102783203, 0.02400970458984375, 0.02549266815185547, 0.026975631713867188, 0.028458595275878906, 0.029941558837890625, 0.031424522399902344, 0.03290748596191406, 0.03439044952392578, 0.0358734130859375, 0.03735637664794922, 0.03883934020996094, 0.040322303771972656, 0.041805267333984375, 0.043288230895996094, 0.04477119445800781, 0.04625415802001953, 0.04773712158203125, 0.04922008514404297, 0.05070304870605469, 0.052186012268066406, 0.053668975830078125, 0.055151939392089844, 0.05663490295410156, 0.05811786651611328, 0.059600830078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 1.0, 9.0, 8.0, 7.0, 14.0, 19.0, 22.0, 33.0, 43.0, 54.0, 71.0, 100.0, 172.0, 253.0, 539.0, 1595.0, 8456.0, 82074.0, 764830.0, 171398.0, 14718.0, 2448.0, 711.0, 325.0, 191.0, 122.0, 82.0, 70.0, 43.0, 32.0, 21.0, 31.0, 16.0, 11.0, 12.0, 12.0, 5.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.111083984375, -0.10778141021728516, -0.10447883605957031, -0.10117626190185547, -0.09787368774414062, -0.09457111358642578, -0.09126853942871094, -0.0879659652709961, -0.08466339111328125, -0.0813608169555664, -0.07805824279785156, -0.07475566864013672, -0.07145309448242188, -0.06815052032470703, -0.06484794616699219, -0.061545372009277344, -0.0582427978515625, -0.054940223693847656, -0.05163764953613281, -0.04833507537841797, -0.045032501220703125, -0.04172992706298828, -0.03842735290527344, -0.035124778747558594, -0.03182220458984375, -0.028519630432128906, -0.025217056274414062, -0.02191448211669922, -0.018611907958984375, -0.015309333801269531, -0.012006759643554688, -0.008704185485839844, -0.005401611328125, -0.0020990371704101562, 0.0012035369873046875, 0.004506111145019531, 0.007808685302734375, 0.011111259460449219, 0.014413833618164062, 0.017716407775878906, 0.02101898193359375, 0.024321556091308594, 0.027624130249023438, 0.03092670440673828, 0.034229278564453125, 0.03753185272216797, 0.04083442687988281, 0.044137001037597656, 0.0474395751953125, 0.050742149353027344, 0.05404472351074219, 0.05734729766845703, 0.060649871826171875, 0.06395244598388672, 0.06725502014160156, 0.0705575942993164, 0.07386016845703125, 0.0771627426147461, 0.08046531677246094, 0.08376789093017578, 0.08707046508789062, 0.09037303924560547, 0.09367561340332031, 0.09697818756103516, 0.10028076171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 11.0, 11.0, 8.0, 7.0, 12.0, 25.0, 18.0, 35.0, 31.0, 26.0, 25.0, 36.0, 35.0, 47.0, 41.0, 44.0, 41.0, 46.0, 45.0, 49.0, 37.0, 46.0, 36.0, 47.0, 41.0, 33.0, 19.0, 25.0, 15.0, 15.0, 15.0, 15.0, 9.0, 16.0, 5.0, 8.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.113525390625, -0.11011123657226562, -0.10669708251953125, -0.10328292846679688, -0.0998687744140625, -0.09645462036132812, -0.09304046630859375, -0.08962631225585938, -0.086212158203125, -0.08279800415039062, -0.07938385009765625, -0.07596969604492188, -0.0725555419921875, -0.06914138793945312, -0.06572723388671875, -0.062313079833984375, -0.05889892578125, -0.055484771728515625, -0.05207061767578125, -0.048656463623046875, -0.0452423095703125, -0.041828155517578125, -0.03841400146484375, -0.034999847412109375, -0.031585693359375, -0.028171539306640625, -0.02475738525390625, -0.021343231201171875, -0.0179290771484375, -0.014514923095703125, -0.01110076904296875, -0.007686614990234375, -0.0042724609375, -0.000858306884765625, 0.00255584716796875, 0.005970001220703125, 0.0093841552734375, 0.012798309326171875, 0.01621246337890625, 0.019626617431640625, 0.023040771484375, 0.026454925537109375, 0.02986907958984375, 0.033283233642578125, 0.0366973876953125, 0.040111541748046875, 0.04352569580078125, 0.046939849853515625, 0.05035400390625, 0.053768157958984375, 0.05718231201171875, 0.060596466064453125, 0.0640106201171875, 0.06742477416992188, 0.07083892822265625, 0.07425308227539062, 0.077667236328125, 0.08108139038085938, 0.08449554443359375, 0.08790969848632812, 0.0913238525390625, 0.09473800659179688, 0.09815216064453125, 0.10156631469726562, 0.10498046875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 16.0, 16.0, 30.0, 35.0, 62.0, 113.0, 185.0, 390.0, 716.0, 1764.0, 5117.0, 18522.0, 104801.0, 713356.0, 167740.0, 25270.0, 6396.0, 2174.0, 883.0, 451.0, 200.0, 112.0, 64.0, 52.0, 22.0, 25.0, 8.0, 9.0, 11.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0404052734375, -0.039301395416259766, -0.03819751739501953, -0.0370936393737793, -0.03598976135253906, -0.03488588333129883, -0.033782005310058594, -0.03267812728881836, -0.031574249267578125, -0.03047037124633789, -0.029366493225097656, -0.028262615203857422, -0.027158737182617188, -0.026054859161376953, -0.02495098114013672, -0.023847103118896484, -0.02274322509765625, -0.021639347076416016, -0.02053546905517578, -0.019431591033935547, -0.018327713012695312, -0.017223834991455078, -0.016119956970214844, -0.01501607894897461, -0.013912200927734375, -0.01280832290649414, -0.011704444885253906, -0.010600566864013672, -0.009496688842773438, -0.008392810821533203, -0.007288932800292969, -0.006185054779052734, -0.0050811767578125, -0.003977298736572266, -0.0028734207153320312, -0.0017695426940917969, -0.0006656646728515625, 0.0004382133483886719, 0.0015420913696289062, 0.0026459693908691406, 0.003749847412109375, 0.004853725433349609, 0.005957603454589844, 0.007061481475830078, 0.008165359497070312, 0.009269237518310547, 0.010373115539550781, 0.011476993560791016, 0.01258087158203125, 0.013684749603271484, 0.014788627624511719, 0.015892505645751953, 0.016996383666992188, 0.018100261688232422, 0.019204139709472656, 0.02030801773071289, 0.021411895751953125, 0.02251577377319336, 0.023619651794433594, 0.024723529815673828, 0.025827407836914062, 0.026931285858154297, 0.02803516387939453, 0.029139041900634766, 0.030242919921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 4.0, 14.0, 11.0, 13.0, 31.0, 34.0, 49.0, 70.0, 88.0, 103.0, 112.0, 84.0, 79.0, 77.0, 50.0, 45.0, 33.0, 26.0, 19.0, 13.0, 6.0, 11.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.079673767089844e-06, -5.815178155899048e-06, -5.550682544708252e-06, -5.286186933517456e-06, -5.02169132232666e-06, -4.757195711135864e-06, -4.492700099945068e-06, -4.2282044887542725e-06, -3.9637088775634766e-06, -3.6992132663726807e-06, -3.4347176551818848e-06, -3.170222043991089e-06, -2.905726432800293e-06, -2.641230821609497e-06, -2.376735210418701e-06, -2.1122395992279053e-06, -1.8477439880371094e-06, -1.5832483768463135e-06, -1.3187527656555176e-06, -1.0542571544647217e-06, -7.897615432739258e-07, -5.252659320831299e-07, -2.60770320892334e-07, 3.725290298461914e-09, 2.682209014892578e-07, 5.327165126800537e-07, 7.972121238708496e-07, 1.0617077350616455e-06, 1.3262033462524414e-06, 1.5906989574432373e-06, 1.8551945686340332e-06, 2.119690179824829e-06, 2.384185791015625e-06, 2.648681402206421e-06, 2.913177013397217e-06, 3.1776726245880127e-06, 3.4421682357788086e-06, 3.7066638469696045e-06, 3.9711594581604e-06, 4.235655069351196e-06, 4.500150680541992e-06, 4.764646291732788e-06, 5.029141902923584e-06, 5.29363751411438e-06, 5.558133125305176e-06, 5.822628736495972e-06, 6.087124347686768e-06, 6.3516199588775635e-06, 6.616115570068359e-06, 6.880611181259155e-06, 7.145106792449951e-06, 7.409602403640747e-06, 7.674098014831543e-06, 7.938593626022339e-06, 8.203089237213135e-06, 8.46758484840393e-06, 8.732080459594727e-06, 8.996576070785522e-06, 9.261071681976318e-06, 9.525567293167114e-06, 9.79006290435791e-06, 1.0054558515548706e-05, 1.0319054126739502e-05, 1.0583549737930298e-05, 1.0848045349121094e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 5.0, 8.0, 17.0, 17.0, 23.0, 38.0, 55.0, 79.0, 97.0, 202.0, 312.0, 525.0, 876.0, 1701.0, 3724.0, 8408.0, 23096.0, 81239.0, 374565.0, 419880.0, 91297.0, 25132.0, 9172.0, 3834.0, 1894.0, 938.0, 516.0, 325.0, 186.0, 113.0, 77.0, 51.0, 26.0, 27.0, 26.0, 21.0, 12.0, 9.0, 4.0, 4.0, 5.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02496337890625, -0.02420783042907715, -0.023452281951904297, -0.022696733474731445, -0.021941184997558594, -0.021185636520385742, -0.02043008804321289, -0.01967453956604004, -0.018918991088867188, -0.018163442611694336, -0.017407894134521484, -0.016652345657348633, -0.01589679718017578, -0.01514124870300293, -0.014385700225830078, -0.013630151748657227, -0.012874603271484375, -0.012119054794311523, -0.011363506317138672, -0.01060795783996582, -0.009852409362792969, -0.009096860885620117, -0.008341312408447266, -0.007585763931274414, -0.0068302154541015625, -0.006074666976928711, -0.005319118499755859, -0.004563570022583008, -0.0038080215454101562, -0.0030524730682373047, -0.002296924591064453, -0.0015413761138916016, -0.00078582763671875, -3.0279159545898438e-05, 0.0007252693176269531, 0.0014808177947998047, 0.0022363662719726562, 0.002991914749145508, 0.0037474632263183594, 0.004503011703491211, 0.0052585601806640625, 0.006014108657836914, 0.006769657135009766, 0.007525205612182617, 0.008280754089355469, 0.00903630256652832, 0.009791851043701172, 0.010547399520874023, 0.011302947998046875, 0.012058496475219727, 0.012814044952392578, 0.01356959342956543, 0.014325141906738281, 0.015080690383911133, 0.015836238861083984, 0.016591787338256836, 0.017347335815429688, 0.01810288429260254, 0.01885843276977539, 0.019613981246948242, 0.020369529724121094, 0.021125078201293945, 0.021880626678466797, 0.02263617515563965, 0.0233917236328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 9.0, 4.0, 6.0, 14.0, 10.0, 13.0, 22.0, 14.0, 32.0, 23.0, 26.0, 38.0, 54.0, 66.0, 72.0, 90.0, 86.0, 84.0, 66.0, 42.0, 53.0, 29.0, 29.0, 26.0, 18.0, 15.0, 9.0, 14.0, 8.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0271148681640625, -0.02626657485961914, -0.02541828155517578, -0.024569988250732422, -0.023721694946289062, -0.022873401641845703, -0.022025108337402344, -0.021176815032958984, -0.020328521728515625, -0.019480228424072266, -0.018631935119628906, -0.017783641815185547, -0.016935348510742188, -0.016087055206298828, -0.015238761901855469, -0.01439046859741211, -0.01354217529296875, -0.01269388198852539, -0.011845588684082031, -0.010997295379638672, -0.010149002075195312, -0.009300708770751953, -0.008452415466308594, -0.007604122161865234, -0.006755828857421875, -0.005907535552978516, -0.005059242248535156, -0.004210948944091797, -0.0033626556396484375, -0.002514362335205078, -0.0016660690307617188, -0.0008177757263183594, 3.0517578125e-05, 0.0008788108825683594, 0.0017271041870117188, 0.002575397491455078, 0.0034236907958984375, 0.004271984100341797, 0.005120277404785156, 0.005968570709228516, 0.006816864013671875, 0.007665157318115234, 0.008513450622558594, 0.009361743927001953, 0.010210037231445312, 0.011058330535888672, 0.011906623840332031, 0.01275491714477539, 0.01360321044921875, 0.01445150375366211, 0.015299797058105469, 0.016148090362548828, 0.016996383666992188, 0.017844676971435547, 0.018692970275878906, 0.019541263580322266, 0.020389556884765625, 0.021237850189208984, 0.022086143493652344, 0.022934436798095703, 0.023782730102539062, 0.024631023406982422, 0.02547931671142578, 0.02632761001586914, 0.0271759033203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 9.0, 25.0, 47.0, 88.0, 169.0, 218.0, 207.0, 141.0, 51.0, 21.0, 12.0, 12.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.158263921737671, -1.133397102355957, -1.1085302829742432, -1.0836634635925293, -1.0587966442108154, -1.0339298248291016, -1.0090630054473877, -0.9841962456703186, -0.9593294262886047, -0.9344626069068909, -0.909595787525177, -0.8847289681434631, -0.8598621487617493, -0.8349953889846802, -0.8101285696029663, -0.7852617502212524, -0.7603949308395386, -0.7355281114578247, -0.7106612920761108, -0.685794472694397, -0.6609276533126831, -0.6360608339309692, -0.6111940145492554, -0.5863272547721863, -0.5614603757858276, -0.5365935564041138, -0.5117267370223999, -0.48685991764068604, -0.46199312806129456, -0.4371263086795807, -0.4122594892978668, -0.38739269971847534, -0.3625258803367615, -0.3376590609550476, -0.31279224157333374, -0.2879254221916199, -0.2630586326122284, -0.23819181323051453, -0.21332499384880066, -0.18845818936824799, -0.16359136998653412, -0.13872455060482025, -0.11385774612426758, -0.08899092674255371, -0.06412411481142044, -0.03925730288028717, -0.014390483498573303, 0.01047632098197937, 0.03534314036369324, 0.06020995229482651, 0.08507676422595978, 0.10994358360767365, 0.13481038808822632, 0.15967720746994019, 0.18454402685165405, 0.20941083133220673, 0.2342776507139206, 0.25914445519447327, 0.28401127457618713, 0.308878093957901, 0.33374491333961487, 0.35861170291900635, 0.3834785223007202, 0.4083453416824341, 0.43321216106414795]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 8.0, 13.0, 12.0, 16.0, 14.0, 22.0, 23.0, 27.0, 27.0, 31.0, 33.0, 42.0, 47.0, 49.0, 47.0, 56.0, 62.0, 59.0, 44.0, 51.0, 37.0, 47.0, 37.0, 28.0, 28.0, 22.0, 18.0, 15.0, 17.0, 14.0, 9.0, 13.0, 11.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.564853310585022, -0.5463145971298218, -0.5277758240699768, -0.5092371106147766, -0.49069836735725403, -0.47215962409973145, -0.45362088084220886, -0.4350821375846863, -0.4165434241294861, -0.3980046808719635, -0.3794659376144409, -0.3609272241592407, -0.34238848090171814, -0.32384973764419556, -0.305310994386673, -0.2867722511291504, -0.2682335078716278, -0.24969476461410522, -0.23115603625774384, -0.21261729300022125, -0.19407856464385986, -0.17553982138633728, -0.1570010781288147, -0.1384623497724533, -0.11992360651493073, -0.10138487070798874, -0.08284613490104675, -0.06430739164352417, -0.045768655836582184, -0.027229920029640198, -0.008691176772117615, 0.009847551584243774, 0.028386294841766357, 0.046925030648708344, 0.06546376645565033, 0.08400250971317291, 0.1025412455201149, 0.12107998132705688, 0.13961872458457947, 0.15815745294094086, 0.17669619619846344, 0.19523493945598602, 0.2137736678123474, 0.23231241106987, 0.2508511543273926, 0.2693898677825928, 0.28792864084243774, 0.30646735429763794, 0.3250060975551605, 0.3435448408126831, 0.3620835840702057, 0.38062232732772827, 0.39916104078292847, 0.41769978404045105, 0.43623852729797363, 0.45477724075317383, 0.4733160138130188, 0.4918547570705414, 0.510393500328064, 0.5289322137832642, 0.5474709868431091, 0.5660097002983093, 0.5845484733581543, 0.6030871868133545, 0.6216259002685547]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 11.0, 31.0, 35.0, 77.0, 161.0, 321.0, 804.0, 2099.0, 8665.0, 4036084.0, 136054.0, 6760.0, 1806.0, 695.0, 331.0, 138.0, 96.0, 39.0, 21.0, 16.0, 6.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10430908203125, -0.10043621063232422, -0.09656333923339844, -0.09269046783447266, -0.08881759643554688, -0.0849447250366211, -0.08107185363769531, -0.07719898223876953, -0.07332611083984375, -0.06945323944091797, -0.06558036804199219, -0.061707496643066406, -0.057834625244140625, -0.053961753845214844, -0.05008888244628906, -0.04621601104736328, -0.0423431396484375, -0.03847026824951172, -0.03459739685058594, -0.030724525451660156, -0.026851654052734375, -0.022978782653808594, -0.019105911254882812, -0.015233039855957031, -0.01136016845703125, -0.007487297058105469, -0.0036144256591796875, 0.00025844573974609375, 0.004131317138671875, 0.008004188537597656, 0.011877059936523438, 0.01574993133544922, 0.019622802734375, 0.02349567413330078, 0.027368545532226562, 0.031241416931152344, 0.035114288330078125, 0.038987159729003906, 0.04286003112792969, 0.04673290252685547, 0.05060577392578125, 0.05447864532470703, 0.05835151672363281, 0.062224388122558594, 0.06609725952148438, 0.06997013092041016, 0.07384300231933594, 0.07771587371826172, 0.0815887451171875, 0.08546161651611328, 0.08933448791503906, 0.09320735931396484, 0.09708023071289062, 0.1009531021118164, 0.10482597351074219, 0.10869884490966797, 0.11257171630859375, 0.11644458770751953, 0.12031745910644531, 0.1241903305053711, 0.12806320190429688, 0.13193607330322266, 0.13580894470214844, 0.13968181610107422, 0.1435546875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 17.0, 17.0, 25.0, 30.0, 44.0, 56.0, 76.0, 78.0, 66.0, 71.0, 75.0, 77.0, 71.0, 59.0, 60.0, 44.0, 36.0, 24.0, 16.0, 12.0, 13.0, 5.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035369873046875, -0.03383970260620117, -0.032309532165527344, -0.030779361724853516, -0.029249191284179688, -0.02771902084350586, -0.02618885040283203, -0.024658679962158203, -0.023128509521484375, -0.021598339080810547, -0.02006816864013672, -0.01853799819946289, -0.017007827758789062, -0.015477657318115234, -0.013947486877441406, -0.012417316436767578, -0.01088714599609375, -0.009356975555419922, -0.007826805114746094, -0.006296634674072266, -0.0047664642333984375, -0.0032362937927246094, -0.0017061233520507812, -0.00017595291137695312, 0.001354217529296875, 0.002884387969970703, 0.004414558410644531, 0.005944728851318359, 0.0074748992919921875, 0.009005069732666016, 0.010535240173339844, 0.012065410614013672, 0.0135955810546875, 0.015125751495361328, 0.016655921936035156, 0.018186092376708984, 0.019716262817382812, 0.02124643325805664, 0.02277660369873047, 0.024306774139404297, 0.025836944580078125, 0.027367115020751953, 0.02889728546142578, 0.03042745590209961, 0.03195762634277344, 0.033487796783447266, 0.035017967224121094, 0.03654813766479492, 0.03807830810546875, 0.03960847854614258, 0.041138648986816406, 0.042668819427490234, 0.04419898986816406, 0.04572916030883789, 0.04725933074951172, 0.04878950119018555, 0.050319671630859375, 0.0518498420715332, 0.05338001251220703, 0.05491018295288086, 0.05644035339355469, 0.057970523834228516, 0.059500694274902344, 0.06103086471557617, 0.06256103515625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 6.0, 14.0, 14.0, 32.0, 44.0, 56.0, 51.0, 88.0, 126.0, 168.0, 238.0, 305.0, 420.0, 670.0, 1136.0, 2040.0, 4709.0, 14832.0, 94549.0, 4012911.0, 44071.0, 9710.0, 3615.0, 1628.0, 939.0, 515.0, 377.0, 269.0, 196.0, 144.0, 115.0, 84.0, 64.0, 38.0, 24.0, 14.0, 16.0, 22.0, 7.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043670654296875, -0.0421295166015625, -0.04058837890625, -0.0390472412109375, -0.037506103515625, -0.0359649658203125, -0.034423828125, -0.0328826904296875, -0.031341552734375, -0.0298004150390625, -0.02825927734375, -0.0267181396484375, -0.025177001953125, -0.0236358642578125, -0.0220947265625, -0.0205535888671875, -0.019012451171875, -0.0174713134765625, -0.01593017578125, -0.0143890380859375, -0.012847900390625, -0.0113067626953125, -0.009765625, -0.0082244873046875, -0.006683349609375, -0.0051422119140625, -0.00360107421875, -0.0020599365234375, -0.000518798828125, 0.0010223388671875, 0.0025634765625, 0.0041046142578125, 0.005645751953125, 0.0071868896484375, 0.00872802734375, 0.0102691650390625, 0.011810302734375, 0.0133514404296875, 0.014892578125, 0.0164337158203125, 0.017974853515625, 0.0195159912109375, 0.02105712890625, 0.0225982666015625, 0.024139404296875, 0.0256805419921875, 0.0272216796875, 0.0287628173828125, 0.030303955078125, 0.0318450927734375, 0.03338623046875, 0.0349273681640625, 0.036468505859375, 0.0380096435546875, 0.03955078125, 0.0410919189453125, 0.042633056640625, 0.0441741943359375, 0.04571533203125, 0.0472564697265625, 0.048797607421875, 0.0503387451171875, 0.0518798828125, 0.0534210205078125, 0.054962158203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 17.0, 21.0, 30.0, 75.0, 166.0, 3560.0, 114.0, 30.0, 15.0, 9.0, 6.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01377105712890625, -0.013316988945007324, -0.012862920761108398, -0.012408852577209473, -0.011954784393310547, -0.011500716209411621, -0.011046648025512695, -0.01059257984161377, -0.010138511657714844, -0.009684443473815918, -0.009230375289916992, -0.008776307106018066, -0.00832223892211914, -0.007868170738220215, -0.007414102554321289, -0.006960034370422363, -0.0065059661865234375, -0.006051898002624512, -0.005597829818725586, -0.00514376163482666, -0.004689693450927734, -0.004235625267028809, -0.003781557083129883, -0.003327488899230957, -0.0028734207153320312, -0.0024193525314331055, -0.0019652843475341797, -0.001511216163635254, -0.0010571479797363281, -0.0006030797958374023, -0.00014901161193847656, 0.0003050565719604492, 0.000759124755859375, 0.0012131929397583008, 0.0016672611236572266, 0.0021213293075561523, 0.002575397491455078, 0.003029465675354004, 0.0034835338592529297, 0.0039376020431518555, 0.004391670227050781, 0.004845738410949707, 0.005299806594848633, 0.005753874778747559, 0.006207942962646484, 0.00666201114654541, 0.007116079330444336, 0.007570147514343262, 0.008024215698242188, 0.008478283882141113, 0.008932352066040039, 0.009386420249938965, 0.00984048843383789, 0.010294556617736816, 0.010748624801635742, 0.011202692985534668, 0.011656761169433594, 0.01211082935333252, 0.012564897537231445, 0.013018965721130371, 0.013473033905029297, 0.013927102088928223, 0.014381170272827148, 0.014835238456726074, 0.015289306640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 7.0, 14.0, 35.0, 43.0, 61.0, 81.0, 131.0, 111.0, 131.0, 105.0, 69.0, 71.0, 46.0, 32.0, 21.0, 13.0, 8.0, 8.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042052026838064194, -0.0405997671186924, -0.0391475073993206, -0.037695251405239105, -0.03624299168586731, -0.034790731966495514, -0.03333847224712372, -0.03188621252775192, -0.030433954671025276, -0.02898169495165348, -0.027529437094926834, -0.02607717737555504, -0.024624917656183243, -0.023172659799456596, -0.0217204000800848, -0.020268142223358154, -0.01881588250398636, -0.017363622784614563, -0.015911364927887917, -0.014459105208516121, -0.0130068464204669, -0.011554587632417679, -0.010102327913045883, -0.008650069124996662, -0.007197810336947441, -0.00574555154889822, -0.004293292295187712, -0.0028410330414772034, -0.0013887742534279823, 6.348453462123871e-05, 0.0015157442539930344, 0.0029680030420422554, 0.004420265555381775, 0.005872524343430996, 0.007324783597141504, 0.008777042850852013, 0.010229301638901234, 0.011681560426950455, 0.01313382014632225, 0.014586078934371471, 0.016038337722420692, 0.017490597441792488, 0.018942855298519135, 0.02039511501789093, 0.021847374737262726, 0.023299632593989372, 0.024751892313361168, 0.026204150170087814, 0.02765640988945961, 0.029108669608831406, 0.030560927465558052, 0.0320131853222847, 0.033465445041656494, 0.03491770476102829, 0.036369964480400085, 0.03782222419977188, 0.03927448391914368, 0.04072674363851547, 0.04217900335788727, 0.043631263077259064, 0.04508351907134056, 0.04653577879071236, 0.04798803851008415, 0.04944029822945595, 0.050892554223537445]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 9.0, 7.0, 5.0, 11.0, 10.0, 13.0, 17.0, 19.0, 23.0, 24.0, 21.0, 32.0, 37.0, 47.0, 41.0, 36.0, 54.0, 53.0, 55.0, 44.0, 46.0, 38.0, 39.0, 53.0, 31.0, 32.0, 32.0, 25.0, 27.0, 22.0, 16.0, 7.0, 18.0, 14.0, 4.0, 7.0, 8.0, 6.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.023328185081481934, -0.022642087191343307, -0.02195599116384983, -0.021269895136356354, -0.020583797246217728, -0.0198976993560791, -0.019211603328585625, -0.018525507301092148, -0.01783940941095352, -0.017153311520814896, -0.01646721549332142, -0.015781119465827942, -0.015095021575689316, -0.014408924616873264, -0.013722827658057213, -0.013036730699241161, -0.01235063374042511, -0.011664536781609058, -0.010978439822793007, -0.010292342863976955, -0.009606245905160904, -0.008920148946344852, -0.008234051987528801, -0.0075479550287127495, -0.006861858069896698, -0.0061757611110806465, -0.005489664152264595, -0.0048035671934485435, -0.004117470234632492, -0.0034313732758164406, -0.002745276317000389, -0.0020591793581843376, -0.0013730823993682861, -0.0006869854405522346, -8.884817361831665e-07, 0.0006852084770798683, 0.0013713054358959198, 0.0020574023947119713, 0.0027434993535280228, 0.0034295963123440742, 0.004115693271160126, 0.004801790229976177, 0.005487887188792229, 0.00617398414760828, 0.006860081106424332, 0.007546178065240383, 0.008232275024056435, 0.008918371982872486, 0.009604468941688538, 0.010290565900504589, 0.01097666285932064, 0.011662759818136692, 0.012348856776952744, 0.013034953735768795, 0.013721050694584846, 0.014407147653400898, 0.01509324461221695, 0.015779342502355576, 0.016465438529849052, 0.01715153455734253, 0.017837632447481155, 0.01852373033761978, 0.01920982636511326, 0.019895922392606735, 0.02058202028274536]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 25.0, 36.0, 58.0, 118.0, 225.0, 509.0, 1035.0, 3196.0, 12610.0, 80593.0, 574495.0, 325288.0, 39451.0, 7286.0, 2111.0, 797.0, 324.0, 157.0, 96.0, 52.0, 27.0, 21.0, 16.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0767822265625, -0.07355880737304688, -0.07033538818359375, -0.06711196899414062, -0.0638885498046875, -0.060665130615234375, -0.05744171142578125, -0.054218292236328125, -0.050994873046875, -0.047771453857421875, -0.04454803466796875, -0.041324615478515625, -0.0381011962890625, -0.034877777099609375, -0.03165435791015625, -0.028430938720703125, -0.02520751953125, -0.021984100341796875, -0.01876068115234375, -0.015537261962890625, -0.0123138427734375, -0.009090423583984375, -0.00586700439453125, -0.002643585205078125, 0.000579833984375, 0.003803253173828125, 0.00702667236328125, 0.010250091552734375, 0.0134735107421875, 0.016696929931640625, 0.01992034912109375, 0.023143768310546875, 0.0263671875, 0.029590606689453125, 0.03281402587890625, 0.036037445068359375, 0.0392608642578125, 0.042484283447265625, 0.04570770263671875, 0.048931121826171875, 0.052154541015625, 0.055377960205078125, 0.05860137939453125, 0.061824798583984375, 0.0650482177734375, 0.06827163696289062, 0.07149505615234375, 0.07471847534179688, 0.07794189453125, 0.08116531372070312, 0.08438873291015625, 0.08761215209960938, 0.0908355712890625, 0.09405899047851562, 0.09728240966796875, 0.10050582885742188, 0.103729248046875, 0.10695266723632812, 0.11017608642578125, 0.11339950561523438, 0.1166229248046875, 0.11984634399414062, 0.12306976318359375, 0.12629318237304688, 0.1295166015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 11.0, 8.0, 14.0, 25.0, 38.0, 46.0, 50.0, 65.0, 82.0, 67.0, 70.0, 77.0, 63.0, 68.0, 70.0, 65.0, 42.0, 39.0, 24.0, 28.0, 12.0, 11.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035552978515625, -0.03402900695800781, -0.032505035400390625, -0.030981063842773438, -0.02945709228515625, -0.027933120727539062, -0.026409149169921875, -0.024885177612304688, -0.0233612060546875, -0.021837234497070312, -0.020313262939453125, -0.018789291381835938, -0.01726531982421875, -0.015741348266601562, -0.014217376708984375, -0.012693405151367188, -0.01116943359375, -0.009645462036132812, -0.008121490478515625, -0.0065975189208984375, -0.00507354736328125, -0.0035495758056640625, -0.002025604248046875, -0.0005016326904296875, 0.0010223388671875, 0.0025463104248046875, 0.004070281982421875, 0.0055942535400390625, 0.00711822509765625, 0.008642196655273438, 0.010166168212890625, 0.011690139770507812, 0.013214111328125, 0.014738082885742188, 0.016262054443359375, 0.017786026000976562, 0.01930999755859375, 0.020833969116210938, 0.022357940673828125, 0.023881912231445312, 0.0254058837890625, 0.026929855346679688, 0.028453826904296875, 0.029977798461914062, 0.03150177001953125, 0.03302574157714844, 0.034549713134765625, 0.03607368469238281, 0.03759765625, 0.03912162780761719, 0.040645599365234375, 0.04216957092285156, 0.04369354248046875, 0.04521751403808594, 0.046741485595703125, 0.04826545715332031, 0.0497894287109375, 0.05131340026855469, 0.052837371826171875, 0.05436134338378906, 0.05588531494140625, 0.05740928649902344, 0.058933258056640625, 0.06045722961425781, 0.061981201171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 8.0, 8.0, 10.0, 14.0, 14.0, 32.0, 41.0, 75.0, 78.0, 125.0, 178.0, 377.0, 980.0, 4441.0, 39025.0, 692981.0, 288698.0, 17397.0, 2635.0, 648.0, 291.0, 155.0, 113.0, 54.0, 45.0, 33.0, 24.0, 21.0, 10.0, 7.0, 15.0, 2.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10333251953125, -0.0998687744140625, -0.096405029296875, -0.0929412841796875, -0.0894775390625, -0.0860137939453125, -0.082550048828125, -0.0790863037109375, -0.07562255859375, -0.0721588134765625, -0.068695068359375, -0.0652313232421875, -0.061767578125, -0.0583038330078125, -0.054840087890625, -0.0513763427734375, -0.04791259765625, -0.0444488525390625, -0.040985107421875, -0.0375213623046875, -0.0340576171875, -0.0305938720703125, -0.027130126953125, -0.0236663818359375, -0.02020263671875, -0.0167388916015625, -0.013275146484375, -0.0098114013671875, -0.00634765625, -0.0028839111328125, 0.000579833984375, 0.0040435791015625, 0.00750732421875, 0.0109710693359375, 0.014434814453125, 0.0178985595703125, 0.0213623046875, 0.0248260498046875, 0.028289794921875, 0.0317535400390625, 0.03521728515625, 0.0386810302734375, 0.042144775390625, 0.0456085205078125, 0.049072265625, 0.0525360107421875, 0.055999755859375, 0.0594635009765625, 0.06292724609375, 0.0663909912109375, 0.069854736328125, 0.0733184814453125, 0.0767822265625, 0.0802459716796875, 0.083709716796875, 0.0871734619140625, 0.09063720703125, 0.0941009521484375, 0.097564697265625, 0.1010284423828125, 0.1044921875, 0.1079559326171875, 0.111419677734375, 0.1148834228515625, 0.11834716796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 6.0, 2.0, 6.0, 8.0, 8.0, 12.0, 10.0, 19.0, 13.0, 23.0, 23.0, 37.0, 40.0, 36.0, 24.0, 35.0, 34.0, 43.0, 37.0, 47.0, 34.0, 39.0, 53.0, 37.0, 44.0, 29.0, 43.0, 33.0, 24.0, 37.0, 24.0, 36.0, 19.0, 11.0, 13.0, 13.0, 13.0, 5.0, 7.0, 7.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.10302734375, -0.09991836547851562, -0.09680938720703125, -0.09370040893554688, -0.0905914306640625, -0.08748245239257812, -0.08437347412109375, -0.08126449584960938, -0.078155517578125, -0.07504653930664062, -0.07193756103515625, -0.06882858276367188, -0.0657196044921875, -0.06261062622070312, -0.05950164794921875, -0.056392669677734375, -0.05328369140625, -0.050174713134765625, -0.04706573486328125, -0.043956756591796875, -0.0408477783203125, -0.037738800048828125, -0.03462982177734375, -0.031520843505859375, -0.028411865234375, -0.025302886962890625, -0.02219390869140625, -0.019084930419921875, -0.0159759521484375, -0.012866973876953125, -0.00975799560546875, -0.006649017333984375, -0.0035400390625, -0.000431060791015625, 0.00267791748046875, 0.005786895751953125, 0.0088958740234375, 0.012004852294921875, 0.01511383056640625, 0.018222808837890625, 0.021331787109375, 0.024440765380859375, 0.02754974365234375, 0.030658721923828125, 0.0337677001953125, 0.036876678466796875, 0.03998565673828125, 0.043094635009765625, 0.04620361328125, 0.049312591552734375, 0.05242156982421875, 0.055530548095703125, 0.0586395263671875, 0.061748504638671875, 0.06485748291015625, 0.06796646118164062, 0.071075439453125, 0.07418441772460938, 0.07729339599609375, 0.08040237426757812, 0.0835113525390625, 0.08662033081054688, 0.08972930908203125, 0.09283828735351562, 0.095947265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 5.0, 6.0, 8.0, 8.0, 22.0, 18.0, 43.0, 77.0, 155.0, 231.0, 598.0, 1527.0, 5410.0, 30722.0, 363630.0, 589479.0, 46081.0, 7326.0, 1902.0, 676.0, 266.0, 146.0, 78.0, 41.0, 29.0, 16.0, 12.0, 19.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.034515380859375, -0.033472537994384766, -0.03242969512939453, -0.0313868522644043, -0.030344009399414062, -0.029301166534423828, -0.028258323669433594, -0.02721548080444336, -0.026172637939453125, -0.02512979507446289, -0.024086952209472656, -0.023044109344482422, -0.022001266479492188, -0.020958423614501953, -0.01991558074951172, -0.018872737884521484, -0.01782989501953125, -0.016787052154541016, -0.01574420928955078, -0.014701366424560547, -0.013658523559570312, -0.012615680694580078, -0.011572837829589844, -0.01052999496459961, -0.009487152099609375, -0.00844430923461914, -0.007401466369628906, -0.006358623504638672, -0.0053157806396484375, -0.004272937774658203, -0.0032300949096679688, -0.0021872520446777344, -0.0011444091796875, -0.00010156631469726562, 0.0009412765502929688, 0.001984119415283203, 0.0030269622802734375, 0.004069805145263672, 0.005112648010253906, 0.006155490875244141, 0.007198333740234375, 0.00824117660522461, 0.009284019470214844, 0.010326862335205078, 0.011369705200195312, 0.012412548065185547, 0.013455390930175781, 0.014498233795166016, 0.01554107666015625, 0.016583919525146484, 0.01762676239013672, 0.018669605255126953, 0.019712448120117188, 0.020755290985107422, 0.021798133850097656, 0.02284097671508789, 0.023883819580078125, 0.02492666244506836, 0.025969505310058594, 0.027012348175048828, 0.028055191040039062, 0.029098033905029297, 0.03014087677001953, 0.031183719635009766, 0.0322265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 7.0, 14.0, 15.0, 19.0, 22.0, 49.0, 50.0, 45.0, 77.0, 69.0, 83.0, 105.0, 75.0, 52.0, 86.0, 59.0, 31.0, 43.0, 29.0, 12.0, 15.0, 9.0, 6.0, 7.0, 2.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.424022674560547e-06, -5.22565096616745e-06, -5.027279257774353e-06, -4.828907549381256e-06, -4.630535840988159e-06, -4.432164132595062e-06, -4.233792424201965e-06, -4.035420715808868e-06, -3.8370490074157715e-06, -3.6386772990226746e-06, -3.4403055906295776e-06, -3.2419338822364807e-06, -3.043562173843384e-06, -2.845190465450287e-06, -2.64681875705719e-06, -2.448447048664093e-06, -2.250075340270996e-06, -2.051703631877899e-06, -1.8533319234848022e-06, -1.6549602150917053e-06, -1.4565885066986084e-06, -1.2582167983055115e-06, -1.0598450899124146e-06, -8.614733815193176e-07, -6.631016731262207e-07, -4.647299647331238e-07, -2.6635825634002686e-07, -6.798654794692993e-08, 1.30385160446167e-07, 3.287568688392639e-07, 5.271285772323608e-07, 7.255002856254578e-07, 9.238719940185547e-07, 1.1222437024116516e-06, 1.3206154108047485e-06, 1.5189871191978455e-06, 1.7173588275909424e-06, 1.9157305359840393e-06, 2.1141022443771362e-06, 2.312473952770233e-06, 2.51084566116333e-06, 2.709217369556427e-06, 2.907589077949524e-06, 3.105960786342621e-06, 3.3043324947357178e-06, 3.5027042031288147e-06, 3.7010759115219116e-06, 3.8994476199150085e-06, 4.0978193283081055e-06, 4.296191036701202e-06, 4.494562745094299e-06, 4.692934453487396e-06, 4.891306161880493e-06, 5.08967787027359e-06, 5.288049578666687e-06, 5.486421287059784e-06, 5.684792995452881e-06, 5.883164703845978e-06, 6.081536412239075e-06, 6.279908120632172e-06, 6.4782798290252686e-06, 6.6766515374183655e-06, 6.875023245811462e-06, 7.073394954204559e-06, 7.271766662597656e-06]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 13.0, 16.0, 18.0, 33.0, 52.0, 105.0, 130.0, 221.0, 398.0, 772.0, 1661.0, 5358.0, 24029.0, 195413.0, 683802.0, 113485.0, 15984.0, 4082.0, 1447.0, 658.0, 332.0, 179.0, 127.0, 65.0, 52.0, 34.0, 26.0, 15.0, 12.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.033203125, -0.03226470947265625, -0.0313262939453125, -0.03038787841796875, -0.029449462890625, -0.02851104736328125, -0.0275726318359375, -0.02663421630859375, -0.02569580078125, -0.02475738525390625, -0.0238189697265625, -0.02288055419921875, -0.021942138671875, -0.02100372314453125, -0.0200653076171875, -0.01912689208984375, -0.0181884765625, -0.01725006103515625, -0.0163116455078125, -0.01537322998046875, -0.014434814453125, -0.01349639892578125, -0.0125579833984375, -0.01161956787109375, -0.01068115234375, -0.00974273681640625, -0.0088043212890625, -0.00786590576171875, -0.006927490234375, -0.00598907470703125, -0.0050506591796875, -0.00411224365234375, -0.003173828125, -0.00223541259765625, -0.0012969970703125, -0.00035858154296875, 0.000579833984375, 0.00151824951171875, 0.0024566650390625, 0.00339508056640625, 0.00433349609375, 0.00527191162109375, 0.0062103271484375, 0.00714874267578125, 0.008087158203125, 0.00902557373046875, 0.0099639892578125, 0.01090240478515625, 0.0118408203125, 0.01277923583984375, 0.0137176513671875, 0.01465606689453125, 0.015594482421875, 0.01653289794921875, 0.0174713134765625, 0.01840972900390625, 0.01934814453125, 0.02028656005859375, 0.0212249755859375, 0.02216339111328125, 0.023101806640625, 0.02404022216796875, 0.0249786376953125, 0.02591705322265625, 0.02685546875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 11.0, 25.0, 48.0, 61.0, 104.0, 158.0, 185.0, 137.0, 115.0, 75.0, 30.0, 25.0, 11.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0557861328125, -0.053826332092285156, -0.05186653137207031, -0.04990673065185547, -0.047946929931640625, -0.04598712921142578, -0.04402732849121094, -0.042067527770996094, -0.04010772705078125, -0.038147926330566406, -0.03618812561035156, -0.03422832489013672, -0.032268524169921875, -0.03030872344970703, -0.028348922729492188, -0.026389122009277344, -0.0244293212890625, -0.022469520568847656, -0.020509719848632812, -0.01854991912841797, -0.016590118408203125, -0.014630317687988281, -0.012670516967773438, -0.010710716247558594, -0.00875091552734375, -0.006791114807128906, -0.0048313140869140625, -0.0028715133666992188, -0.000911712646484375, 0.0010480880737304688, 0.0030078887939453125, 0.004967689514160156, 0.006927490234375, 0.008887290954589844, 0.010847091674804688, 0.012806892395019531, 0.014766693115234375, 0.01672649383544922, 0.018686294555664062, 0.020646095275878906, 0.02260589599609375, 0.024565696716308594, 0.026525497436523438, 0.02848529815673828, 0.030445098876953125, 0.03240489959716797, 0.03436470031738281, 0.036324501037597656, 0.0382843017578125, 0.040244102478027344, 0.04220390319824219, 0.04416370391845703, 0.046123504638671875, 0.04808330535888672, 0.05004310607910156, 0.052002906799316406, 0.05396270751953125, 0.055922508239746094, 0.05788230895996094, 0.05984210968017578, 0.061801910400390625, 0.06376171112060547, 0.06572151184082031, 0.06768131256103516, 0.06964111328125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 13.0, 28.0, 74.0, 178.0, 258.0, 242.0, 128.0, 59.0, 10.0, 10.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5753464698791504, -1.5437520742416382, -1.5121577978134155, -1.4805634021759033, -1.4489690065383911, -1.4173747301101685, -1.3857803344726562, -1.354185938835144, -1.3225916624069214, -1.2909972667694092, -1.2594029903411865, -1.2278085947036743, -1.196214199066162, -1.1646199226379395, -1.1330255270004272, -1.101431131362915, -1.0698368549346924, -1.0382424592971802, -1.0066481828689575, -0.9750537872314453, -0.9434594511985779, -0.9118651151657104, -0.8802707195281982, -0.8486763834953308, -0.8170819282531738, -0.7854875922203064, -0.7538931965827942, -0.7222988605499268, -0.6907045245170593, -0.6591101884841919, -0.6275157928466797, -0.5959214568138123, -0.5643270611763, -0.5327327251434326, -0.5011383295059204, -0.469543993473053, -0.43794965744018555, -0.4063552916049957, -0.3747609257698059, -0.3431665897369385, -0.31157222390174866, -0.27997785806655884, -0.2483835220336914, -0.2167891561985016, -0.18519480526447296, -0.15360045433044434, -0.12200608849525452, -0.09041173756122589, -0.058817386627197266, -0.02722303196787834, 0.004371322691440582, 0.035965681076049805, 0.06756003201007843, 0.09915438294410706, 0.13074874877929688, 0.1623430997133255, 0.19393745064735413, 0.22553180158138275, 0.2571261525154114, 0.2887205183506012, 0.320314884185791, 0.35190922021865845, 0.38350358605384827, 0.4150979518890381, 0.4466922879219055]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 8.0, 6.0, 4.0, 11.0, 10.0, 14.0, 15.0, 20.0, 22.0, 16.0, 30.0, 24.0, 23.0, 35.0, 35.0, 22.0, 53.0, 48.0, 42.0, 55.0, 44.0, 41.0, 48.0, 43.0, 46.0, 42.0, 23.0, 41.0, 30.0, 19.0, 21.0, 18.0, 18.0, 8.0, 12.0, 9.0, 9.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 4.0], "bins": [-0.5901949405670166, -0.5741485953330994, -0.5581021904945374, -0.5420558452606201, -0.5260095000267029, -0.5099631547927856, -0.49391674995422363, -0.4778704047203064, -0.4618240296840668, -0.44577765464782715, -0.4297313094139099, -0.4136849343776703, -0.39763855934143066, -0.3815922141075134, -0.3655458390712738, -0.3494994640350342, -0.33345311880111694, -0.3174067437648773, -0.3013603985309601, -0.28531402349472046, -0.2692676782608032, -0.2532213032245636, -0.23717492818832397, -0.22112856805324554, -0.20508220791816711, -0.18903584778308868, -0.17298948764801025, -0.15694311261177063, -0.1408967524766922, -0.12485039234161377, -0.10880402475595474, -0.09275765717029572, -0.07671123743057251, -0.06066487357020378, -0.04461850970983505, -0.028572145849466324, -0.012525781989097595, 0.003520578145980835, 0.019566945731639862, 0.03561331331729889, 0.05165967345237732, 0.06770603358745575, 0.08375240117311478, 0.0997987687587738, 0.11584512889385223, 0.13189148902893066, 0.1479378640651703, 0.16398422420024872, 0.18003058433532715, 0.19607694447040558, 0.212123304605484, 0.22816967964172363, 0.24421603977680206, 0.2602623999118805, 0.2763087749481201, 0.29235512018203735, 0.308401495218277, 0.3244478702545166, 0.34049421548843384, 0.35654059052467346, 0.3725869655609131, 0.3886333107948303, 0.40467968583106995, 0.42072606086730957, 0.4367724061012268]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 10.0, 13.0, 17.0, 29.0, 42.0, 52.0, 69.0, 158.0, 483.0, 2588.0, 4155622.0, 33090.0, 1447.0, 325.0, 131.0, 72.0, 45.0, 32.0, 22.0, 18.0, 4.0, 5.0, 9.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15966796875, -0.15201187133789062, -0.14435577392578125, -0.13669967651367188, -0.1290435791015625, -0.12138748168945312, -0.11373138427734375, -0.10607528686523438, -0.098419189453125, -0.09076309204101562, -0.08310699462890625, -0.07545089721679688, -0.0677947998046875, -0.060138702392578125, -0.05248260498046875, -0.044826507568359375, -0.03717041015625, -0.029514312744140625, -0.02185821533203125, -0.014202117919921875, -0.0065460205078125, 0.001110076904296875, 0.00876617431640625, 0.016422271728515625, 0.024078369140625, 0.031734466552734375, 0.03939056396484375, 0.047046661376953125, 0.0547027587890625, 0.062358856201171875, 0.07001495361328125, 0.07767105102539062, 0.0853271484375, 0.09298324584960938, 0.10063934326171875, 0.10829544067382812, 0.1159515380859375, 0.12360763549804688, 0.13126373291015625, 0.13891983032226562, 0.146575927734375, 0.15423202514648438, 0.16188812255859375, 0.16954421997070312, 0.1772003173828125, 0.18485641479492188, 0.19251251220703125, 0.20016860961914062, 0.20782470703125, 0.21548080444335938, 0.22313690185546875, 0.23079299926757812, 0.2384490966796875, 0.24610519409179688, 0.25376129150390625, 0.2614173889160156, 0.269073486328125, 0.2767295837402344, 0.28438568115234375, 0.2920417785644531, 0.2996978759765625, 0.3073539733886719, 0.31501007080078125, 0.3226661682128906, 0.330322265625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 7.0, 5.0, 13.0, 21.0, 27.0, 44.0, 42.0, 58.0, 73.0, 74.0, 75.0, 69.0, 65.0, 69.0, 61.0, 70.0, 46.0, 34.0, 37.0, 27.0, 27.0, 15.0, 17.0, 3.0, 6.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0352783203125, -0.0338129997253418, -0.032347679138183594, -0.03088235855102539, -0.029417037963867188, -0.027951717376708984, -0.02648639678955078, -0.025021076202392578, -0.023555755615234375, -0.022090435028076172, -0.02062511444091797, -0.019159793853759766, -0.017694473266601562, -0.01622915267944336, -0.014763832092285156, -0.013298511505126953, -0.01183319091796875, -0.010367870330810547, -0.008902549743652344, -0.007437229156494141, -0.0059719085693359375, -0.004506587982177734, -0.0030412673950195312, -0.0015759468078613281, -0.000110626220703125, 0.0013546943664550781, 0.0028200149536132812, 0.004285335540771484, 0.0057506561279296875, 0.007215976715087891, 0.008681297302246094, 0.010146617889404297, 0.0116119384765625, 0.013077259063720703, 0.014542579650878906, 0.01600790023803711, 0.017473220825195312, 0.018938541412353516, 0.02040386199951172, 0.021869182586669922, 0.023334503173828125, 0.024799823760986328, 0.02626514434814453, 0.027730464935302734, 0.029195785522460938, 0.03066110610961914, 0.032126426696777344, 0.03359174728393555, 0.03505706787109375, 0.03652238845825195, 0.037987709045410156, 0.03945302963256836, 0.04091835021972656, 0.042383670806884766, 0.04384899139404297, 0.04531431198120117, 0.046779632568359375, 0.04824495315551758, 0.04971027374267578, 0.051175594329833984, 0.05264091491699219, 0.05410623550415039, 0.055571556091308594, 0.0570368766784668, 0.058502197265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 4.0, 1.0, 9.0, 9.0, 13.0, 22.0, 39.0, 51.0, 65.0, 86.0, 113.0, 178.0, 227.0, 299.0, 553.0, 1016.0, 2199.0, 8459.0, 4020870.0, 148689.0, 6843.0, 2012.0, 885.0, 514.0, 303.0, 240.0, 157.0, 119.0, 88.0, 60.0, 39.0, 28.0, 36.0, 22.0, 10.0, 4.0, 9.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.089111328125, -0.08632087707519531, -0.08353042602539062, -0.08073997497558594, -0.07794952392578125, -0.07515907287597656, -0.07236862182617188, -0.06957817077636719, -0.0667877197265625, -0.06399726867675781, -0.061206817626953125, -0.05841636657714844, -0.05562591552734375, -0.05283546447753906, -0.050045013427734375, -0.04725456237792969, -0.044464111328125, -0.04167366027832031, -0.038883209228515625, -0.03609275817871094, -0.03330230712890625, -0.030511856079101562, -0.027721405029296875, -0.024930953979492188, -0.0221405029296875, -0.019350051879882812, -0.016559600830078125, -0.013769149780273438, -0.01097869873046875, -0.008188247680664062, -0.005397796630859375, -0.0026073455810546875, 0.00018310546875, 0.0029735565185546875, 0.005764007568359375, 0.008554458618164062, 0.01134490966796875, 0.014135360717773438, 0.016925811767578125, 0.019716262817382812, 0.0225067138671875, 0.025297164916992188, 0.028087615966796875, 0.030878067016601562, 0.03366851806640625, 0.03645896911621094, 0.039249420166015625, 0.04203987121582031, 0.044830322265625, 0.04762077331542969, 0.050411224365234375, 0.05320167541503906, 0.05599212646484375, 0.05878257751464844, 0.061573028564453125, 0.06436347961425781, 0.0671539306640625, 0.06994438171386719, 0.07273483276367188, 0.07552528381347656, 0.07831573486328125, 0.08110618591308594, 0.08389663696289062, 0.08668708801269531, 0.0894775390625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 38.0, 3783.0, 193.0, 28.0, 13.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0308990478515625, -0.029830217361450195, -0.02876138687133789, -0.027692556381225586, -0.02662372589111328, -0.025554895401000977, -0.024486064910888672, -0.023417234420776367, -0.022348403930664062, -0.021279573440551758, -0.020210742950439453, -0.01914191246032715, -0.018073081970214844, -0.01700425148010254, -0.015935420989990234, -0.01486659049987793, -0.013797760009765625, -0.01272892951965332, -0.011660099029541016, -0.010591268539428711, -0.009522438049316406, -0.008453607559204102, -0.007384777069091797, -0.006315946578979492, -0.0052471160888671875, -0.004178285598754883, -0.003109455108642578, -0.0020406246185302734, -0.0009717941284179688, 9.703636169433594e-05, 0.0011658668518066406, 0.0022346973419189453, 0.00330352783203125, 0.004372358322143555, 0.005441188812255859, 0.006510019302368164, 0.007578849792480469, 0.008647680282592773, 0.009716510772705078, 0.010785341262817383, 0.011854171752929688, 0.012923002243041992, 0.013991832733154297, 0.015060663223266602, 0.016129493713378906, 0.01719832420349121, 0.018267154693603516, 0.01933598518371582, 0.020404815673828125, 0.02147364616394043, 0.022542476654052734, 0.02361130714416504, 0.024680137634277344, 0.02574896812438965, 0.026817798614501953, 0.027886629104614258, 0.028955459594726562, 0.030024290084838867, 0.031093120574951172, 0.03216195106506348, 0.03323078155517578, 0.034299612045288086, 0.03536844253540039, 0.036437273025512695, 0.037506103515625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 10.0, 17.0, 58.0, 210.0, 364.0, 232.0, 73.0, 28.0, 18.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1842198669910431, -0.17964476346969604, -0.175069659948349, -0.17049455642700195, -0.1659194529056549, -0.16134434938430786, -0.15676924586296082, -0.15219414234161377, -0.14761903882026672, -0.14304393529891968, -0.13846883177757263, -0.13389372825622559, -0.12931862473487854, -0.1247435212135315, -0.12016841024160385, -0.1155933067202568, -0.11101819574832916, -0.10644309222698212, -0.10186798870563507, -0.09729288518428802, -0.09271778166294098, -0.08814267814159393, -0.08356756716966629, -0.07899246364831924, -0.0744173601269722, -0.06984225660562515, -0.0652671530842781, -0.06069204583764076, -0.056116942316293716, -0.05154183879494667, -0.046966731548309326, -0.04239162802696228, -0.03781653195619583, -0.033241428434848785, -0.02866632305085659, -0.024091217666864395, -0.01951611414551735, -0.014941010624170303, -0.010365905240178108, -0.005790799856185913, -0.0012156963348388672, 0.0033594081178307533, 0.007934512570500374, 0.012509617023169994, 0.017084721475839615, 0.02165982499718666, 0.026234930381178856, 0.03081003576517105, 0.0353851392865181, 0.03996024280786514, 0.04453534632921219, 0.04911045357584953, 0.05368555709719658, 0.058260660618543625, 0.06283576786518097, 0.06741087138652802, 0.07198597490787506, 0.0765610784292221, 0.08113618195056915, 0.0857112854719162, 0.09028638899326324, 0.09486149251461029, 0.09943660348653793, 0.10401170700788498, 0.10858681052923203]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 8.0, 15.0, 16.0, 13.0, 19.0, 16.0, 26.0, 27.0, 29.0, 28.0, 37.0, 56.0, 39.0, 45.0, 36.0, 28.0, 37.0, 49.0, 50.0, 36.0, 39.0, 40.0, 31.0, 32.0, 40.0, 31.0, 28.0, 21.0, 26.0, 18.0, 14.0, 14.0, 8.0, 3.0, 7.0, 7.0, 7.0, 5.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03635615110397339, -0.03526175767183304, -0.03416736051440239, -0.03307296335697174, -0.03197856992483139, -0.03088417463004589, -0.02978977933526039, -0.02869538404047489, -0.027600988745689392, -0.026506593450903893, -0.025412198156118393, -0.024317802861332893, -0.023223407566547394, -0.022129012271761894, -0.021034616976976395, -0.019940221682190895, -0.018845826387405396, -0.017751431092619896, -0.016657035797834396, -0.015562640503048897, -0.014468245208263397, -0.013373849913477898, -0.012279454618692398, -0.011185059323906898, -0.010090664029121399, -0.0089962687343359, -0.0079018734395504, -0.0068074781447649, -0.005713082849979401, -0.004618687555193901, -0.0035242922604084015, -0.002429896965622902, -0.0013355016708374023, -0.00024110637605190277, 0.0008532889187335968, 0.0019476842135190964, 0.003042079508304596, 0.0041364748030900955, 0.005230870097875595, 0.006325265392661095, 0.007419660687446594, 0.008514055982232094, 0.009608451277017593, 0.010702846571803093, 0.011797241866588593, 0.012891637161374092, 0.013986032456159592, 0.015080427750945091, 0.01617482304573059, 0.01726921834051609, 0.01836361363530159, 0.01945800893008709, 0.02055240422487259, 0.02164679951965809, 0.022741194814443588, 0.023835590109229088, 0.024929985404014587, 0.026024380698800087, 0.027118775993585587, 0.028213171288371086, 0.029307566583156586, 0.030401961877942085, 0.031496357172727585, 0.032590754330158234, 0.033685147762298584]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 14.0, 18.0, 15.0, 31.0, 47.0, 51.0, 78.0, 135.0, 187.0, 269.0, 430.0, 700.0, 1244.0, 2147.0, 5234.0, 17921.0, 136704.0, 723469.0, 131584.0, 17799.0, 5071.0, 2184.0, 1197.0, 710.0, 454.0, 247.0, 198.0, 121.0, 75.0, 54.0, 30.0, 28.0, 22.0, 8.0, 16.0, 15.0, 9.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.10028076171875, -0.09709644317626953, -0.09391212463378906, -0.0907278060913086, -0.08754348754882812, -0.08435916900634766, -0.08117485046386719, -0.07799053192138672, -0.07480621337890625, -0.07162189483642578, -0.06843757629394531, -0.06525325775146484, -0.062068939208984375, -0.058884620666503906, -0.05570030212402344, -0.05251598358154297, -0.0493316650390625, -0.04614734649658203, -0.04296302795410156, -0.039778709411621094, -0.036594390869140625, -0.033410072326660156, -0.030225753784179688, -0.02704143524169922, -0.02385711669921875, -0.02067279815673828, -0.017488479614257812, -0.014304161071777344, -0.011119842529296875, -0.007935523986816406, -0.0047512054443359375, -0.0015668869018554688, 0.001617431640625, 0.004801750183105469, 0.007986068725585938, 0.011170387268066406, 0.014354705810546875, 0.017539024353027344, 0.020723342895507812, 0.02390766143798828, 0.02709197998046875, 0.03027629852294922, 0.03346061706542969, 0.036644935607910156, 0.039829254150390625, 0.043013572692871094, 0.04619789123535156, 0.04938220977783203, 0.0525665283203125, 0.05575084686279297, 0.05893516540527344, 0.062119483947753906, 0.06530380249023438, 0.06848812103271484, 0.07167243957519531, 0.07485675811767578, 0.07804107666015625, 0.08122539520263672, 0.08440971374511719, 0.08759403228759766, 0.09077835083007812, 0.0939626693725586, 0.09714698791503906, 0.10033130645751953, 0.103515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 6.0, 8.0, 6.0, 9.0, 21.0, 27.0, 48.0, 35.0, 59.0, 67.0, 59.0, 81.0, 78.0, 77.0, 46.0, 74.0, 58.0, 49.0, 42.0, 42.0, 21.0, 25.0, 25.0, 14.0, 5.0, 8.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03607177734375, -0.03458118438720703, -0.03309059143066406, -0.031599998474121094, -0.030109405517578125, -0.028618812561035156, -0.027128219604492188, -0.02563762664794922, -0.02414703369140625, -0.02265644073486328, -0.021165847778320312, -0.019675254821777344, -0.018184661865234375, -0.016694068908691406, -0.015203475952148438, -0.013712882995605469, -0.0122222900390625, -0.010731697082519531, -0.009241104125976562, -0.007750511169433594, -0.006259918212890625, -0.004769325256347656, -0.0032787322998046875, -0.0017881393432617188, -0.00029754638671875, 0.0011930465698242188, 0.0026836395263671875, 0.004174232482910156, 0.005664825439453125, 0.007155418395996094, 0.008646011352539062, 0.010136604309082031, 0.011627197265625, 0.013117790222167969, 0.014608383178710938, 0.016098976135253906, 0.017589569091796875, 0.019080162048339844, 0.020570755004882812, 0.02206134796142578, 0.02355194091796875, 0.02504253387451172, 0.026533126831054688, 0.028023719787597656, 0.029514312744140625, 0.031004905700683594, 0.03249549865722656, 0.03398609161376953, 0.0354766845703125, 0.03696727752685547, 0.03845787048339844, 0.039948463439941406, 0.041439056396484375, 0.042929649353027344, 0.04442024230957031, 0.04591083526611328, 0.04740142822265625, 0.04889202117919922, 0.05038261413574219, 0.051873207092285156, 0.053363800048828125, 0.054854393005371094, 0.05634498596191406, 0.05783557891845703, 0.059326171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 14.0, 12.0, 17.0, 26.0, 45.0, 59.0, 118.0, 165.0, 287.0, 499.0, 870.0, 1860.0, 5130.0, 34722.0, 842636.0, 146587.0, 9929.0, 2774.0, 1229.0, 603.0, 340.0, 230.0, 137.0, 74.0, 62.0, 39.0, 25.0, 20.0, 11.0, 11.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1416015625, -0.13752269744873047, -0.13344383239746094, -0.1293649673461914, -0.12528610229492188, -0.12120723724365234, -0.11712837219238281, -0.11304950714111328, -0.10897064208984375, -0.10489177703857422, -0.10081291198730469, -0.09673404693603516, -0.09265518188476562, -0.0885763168334961, -0.08449745178222656, -0.08041858673095703, -0.0763397216796875, -0.07226085662841797, -0.06818199157714844, -0.0641031265258789, -0.060024261474609375, -0.055945396423339844, -0.05186653137207031, -0.04778766632080078, -0.04370880126953125, -0.03962993621826172, -0.03555107116699219, -0.031472206115722656, -0.027393341064453125, -0.023314476013183594, -0.019235610961914062, -0.015156745910644531, -0.011077880859375, -0.006999015808105469, -0.0029201507568359375, 0.0011587142944335938, 0.005237579345703125, 0.009316444396972656, 0.013395309448242188, 0.01747417449951172, 0.02155303955078125, 0.02563190460205078, 0.029710769653320312, 0.033789634704589844, 0.037868499755859375, 0.041947364807128906, 0.04602622985839844, 0.05010509490966797, 0.0541839599609375, 0.05826282501220703, 0.06234169006347656, 0.0664205551147461, 0.07049942016601562, 0.07457828521728516, 0.07865715026855469, 0.08273601531982422, 0.08681488037109375, 0.09089374542236328, 0.09497261047363281, 0.09905147552490234, 0.10313034057617188, 0.1072092056274414, 0.11128807067871094, 0.11536693572998047, 0.11944580078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 12.0, 17.0, 15.0, 17.0, 21.0, 25.0, 25.0, 38.0, 44.0, 34.0, 50.0, 50.0, 54.0, 42.0, 51.0, 41.0, 57.0, 45.0, 42.0, 36.0, 29.0, 40.0, 25.0, 30.0, 26.0, 27.0, 17.0, 14.0, 20.0, 9.0, 9.0, 5.0, 9.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1295166015625, -0.12566089630126953, -0.12180519104003906, -0.1179494857788086, -0.11409378051757812, -0.11023807525634766, -0.10638236999511719, -0.10252666473388672, -0.09867095947265625, -0.09481525421142578, -0.09095954895019531, -0.08710384368896484, -0.08324813842773438, -0.0793924331665039, -0.07553672790527344, -0.07168102264404297, -0.0678253173828125, -0.06396961212158203, -0.06011390686035156, -0.056258201599121094, -0.052402496337890625, -0.048546791076660156, -0.04469108581542969, -0.04083538055419922, -0.03697967529296875, -0.03312397003173828, -0.029268264770507812, -0.025412559509277344, -0.021556854248046875, -0.017701148986816406, -0.013845443725585938, -0.009989738464355469, -0.006134033203125, -0.0022783279418945312, 0.0015773773193359375, 0.005433082580566406, 0.009288787841796875, 0.013144493103027344, 0.017000198364257812, 0.02085590362548828, 0.02471160888671875, 0.02856731414794922, 0.03242301940917969, 0.036278724670410156, 0.040134429931640625, 0.043990135192871094, 0.04784584045410156, 0.05170154571533203, 0.0555572509765625, 0.05941295623779297, 0.06326866149902344, 0.0671243667602539, 0.07098007202148438, 0.07483577728271484, 0.07869148254394531, 0.08254718780517578, 0.08640289306640625, 0.09025859832763672, 0.09411430358886719, 0.09797000885009766, 0.10182571411132812, 0.1056814193725586, 0.10953712463378906, 0.11339282989501953, 0.11724853515625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 5.0, 10.0, 10.0, 10.0, 22.0, 30.0, 36.0, 56.0, 83.0, 109.0, 156.0, 278.0, 477.0, 942.0, 1902.0, 5014.0, 21210.0, 381189.0, 599451.0, 27319.0, 5787.0, 2121.0, 929.0, 551.0, 272.0, 200.0, 118.0, 78.0, 45.0, 40.0, 17.0, 20.0, 19.0, 12.0, 7.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032012939453125, -0.03091144561767578, -0.029809951782226562, -0.028708457946777344, -0.027606964111328125, -0.026505470275878906, -0.025403976440429688, -0.02430248260498047, -0.02320098876953125, -0.02209949493408203, -0.020998001098632812, -0.019896507263183594, -0.018795013427734375, -0.017693519592285156, -0.016592025756835938, -0.015490531921386719, -0.0143890380859375, -0.013287544250488281, -0.012186050415039062, -0.011084556579589844, -0.009983062744140625, -0.008881568908691406, -0.0077800750732421875, -0.006678581237792969, -0.00557708740234375, -0.004475593566894531, -0.0033740997314453125, -0.0022726058959960938, -0.001171112060546875, -6.961822509765625e-05, 0.0010318756103515625, 0.0021333694458007812, 0.00323486328125, 0.004336357116699219, 0.0054378509521484375, 0.006539344787597656, 0.007640838623046875, 0.008742332458496094, 0.009843826293945312, 0.010945320129394531, 0.01204681396484375, 0.013148307800292969, 0.014249801635742188, 0.015351295471191406, 0.016452789306640625, 0.017554283142089844, 0.018655776977539062, 0.01975727081298828, 0.0208587646484375, 0.02196025848388672, 0.023061752319335938, 0.024163246154785156, 0.025264739990234375, 0.026366233825683594, 0.027467727661132812, 0.02856922149658203, 0.02967071533203125, 0.03077220916748047, 0.03187370300292969, 0.032975196838378906, 0.034076690673828125, 0.035178184509277344, 0.03627967834472656, 0.03738117218017578, 0.038482666015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 10.0, 16.0, 21.0, 32.0, 54.0, 51.0, 59.0, 79.0, 67.0, 110.0, 81.0, 91.0, 89.0, 53.0, 56.0, 34.0, 34.0, 11.0, 8.0, 6.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.616115570068359e-06, -6.401911377906799e-06, -6.187707185745239e-06, -5.973502993583679e-06, -5.759298801422119e-06, -5.545094609260559e-06, -5.330890417098999e-06, -5.116686224937439e-06, -4.902482032775879e-06, -4.688277840614319e-06, -4.474073648452759e-06, -4.259869456291199e-06, -4.045665264129639e-06, -3.831461071968079e-06, -3.6172568798065186e-06, -3.4030526876449585e-06, -3.1888484954833984e-06, -2.9746443033218384e-06, -2.7604401111602783e-06, -2.5462359189987183e-06, -2.332031726837158e-06, -2.117827534675598e-06, -1.903623342514038e-06, -1.689419150352478e-06, -1.475214958190918e-06, -1.261010766029358e-06, -1.0468065738677979e-06, -8.326023817062378e-07, -6.183981895446777e-07, -4.041939973831177e-07, -1.8998980522155762e-07, 2.421438694000244e-08, 2.384185791015625e-07, 4.5262277126312256e-07, 6.668269634246826e-07, 8.810311555862427e-07, 1.0952353477478027e-06, 1.3094395399093628e-06, 1.5236437320709229e-06, 1.737847924232483e-06, 1.952052116394043e-06, 2.166256308555603e-06, 2.380460500717163e-06, 2.594664692878723e-06, 2.808868885040283e-06, 3.0230730772018433e-06, 3.2372772693634033e-06, 3.4514814615249634e-06, 3.6656856536865234e-06, 3.8798898458480835e-06, 4.0940940380096436e-06, 4.308298230171204e-06, 4.522502422332764e-06, 4.736706614494324e-06, 4.950910806655884e-06, 5.165114998817444e-06, 5.379319190979004e-06, 5.593523383140564e-06, 5.807727575302124e-06, 6.021931767463684e-06, 6.236135959625244e-06, 6.450340151786804e-06, 6.664544343948364e-06, 6.878748536109924e-06, 7.092952728271484e-06]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 8.0, 7.0, 15.0, 22.0, 31.0, 42.0, 64.0, 121.0, 185.0, 319.0, 659.0, 1515.0, 3926.0, 23212.0, 885294.0, 121338.0, 7554.0, 2195.0, 928.0, 430.0, 262.0, 139.0, 76.0, 56.0, 38.0, 29.0, 21.0, 16.0, 11.0, 4.0, 9.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0521240234375, -0.05024433135986328, -0.04836463928222656, -0.046484947204589844, -0.044605255126953125, -0.042725563049316406, -0.04084587097167969, -0.03896617889404297, -0.03708648681640625, -0.03520679473876953, -0.03332710266113281, -0.031447410583496094, -0.029567718505859375, -0.027688026428222656, -0.025808334350585938, -0.02392864227294922, -0.0220489501953125, -0.02016925811767578, -0.018289566040039062, -0.016409873962402344, -0.014530181884765625, -0.012650489807128906, -0.010770797729492188, -0.008891105651855469, -0.00701141357421875, -0.005131721496582031, -0.0032520294189453125, -0.0013723373413085938, 0.000507354736328125, 0.0023870468139648438, 0.0042667388916015625, 0.006146430969238281, 0.008026123046875, 0.009905815124511719, 0.011785507202148438, 0.013665199279785156, 0.015544891357421875, 0.017424583435058594, 0.019304275512695312, 0.02118396759033203, 0.02306365966796875, 0.02494335174560547, 0.026823043823242188, 0.028702735900878906, 0.030582427978515625, 0.032462120056152344, 0.03434181213378906, 0.03622150421142578, 0.0381011962890625, 0.03998088836669922, 0.04186058044433594, 0.043740272521972656, 0.045619964599609375, 0.047499656677246094, 0.04937934875488281, 0.05125904083251953, 0.05313873291015625, 0.05501842498779297, 0.05689811706542969, 0.058777809143066406, 0.060657501220703125, 0.06253719329833984, 0.06441688537597656, 0.06629657745361328, 0.06817626953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 7.0, 5.0, 12.0, 12.0, 26.0, 86.0, 283.0, 358.0, 125.0, 45.0, 11.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07916259765625, -0.07559680938720703, -0.07203102111816406, -0.0684652328491211, -0.06489944458007812, -0.061333656311035156, -0.05776786804199219, -0.05420207977294922, -0.05063629150390625, -0.04707050323486328, -0.04350471496582031, -0.039938926696777344, -0.036373138427734375, -0.032807350158691406, -0.029241561889648438, -0.02567577362060547, -0.0221099853515625, -0.01854419708251953, -0.014978408813476562, -0.011412620544433594, -0.007846832275390625, -0.004281044006347656, -0.0007152557373046875, 0.0028505325317382812, 0.00641632080078125, 0.009982109069824219, 0.013547897338867188, 0.017113685607910156, 0.020679473876953125, 0.024245262145996094, 0.027811050415039062, 0.03137683868408203, 0.034942626953125, 0.03850841522216797, 0.04207420349121094, 0.045639991760253906, 0.049205780029296875, 0.052771568298339844, 0.05633735656738281, 0.05990314483642578, 0.06346893310546875, 0.06703472137451172, 0.07060050964355469, 0.07416629791259766, 0.07773208618164062, 0.0812978744506836, 0.08486366271972656, 0.08842945098876953, 0.0919952392578125, 0.09556102752685547, 0.09912681579589844, 0.1026926040649414, 0.10625839233398438, 0.10982418060302734, 0.11338996887207031, 0.11695575714111328, 0.12052154541015625, 0.12408733367919922, 0.1276531219482422, 0.13121891021728516, 0.13478469848632812, 0.1383504867553711, 0.14191627502441406, 0.14548206329345703, 0.1490478515625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 13.0, 16.0, 41.0, 55.0, 76.0, 109.0, 147.0, 105.0, 112.0, 90.0, 49.0, 48.0, 35.0, 28.0, 18.0, 17.0, 10.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.549359142780304, -0.5338426828384399, -0.5183262228965759, -0.5028097033500671, -0.4872932434082031, -0.4717767834663391, -0.4562603235244751, -0.4407438635826111, -0.4252273738384247, -0.40971091389656067, -0.39419442415237427, -0.37867796421051025, -0.36316150426864624, -0.34764501452445984, -0.3321285545825958, -0.3166120648384094, -0.3010956048965454, -0.2855791449546814, -0.270062655210495, -0.254546195268631, -0.23902972042560577, -0.22351324558258057, -0.20799678564071655, -0.19248031079769135, -0.17696383595466614, -0.16144736111164093, -0.14593088626861572, -0.1304144263267517, -0.1148979514837265, -0.0993814766407013, -0.08386500924825668, -0.06834854185581207, -0.05283209681510925, -0.037315625697374344, -0.021799154579639435, -0.006282683461904526, 0.009233787655830383, 0.02475026249885559, 0.0402667298913002, 0.05578319728374481, 0.07129967212677002, 0.08681614696979523, 0.10233261436223984, 0.11784908175468445, 0.13336555659770966, 0.14888203144073486, 0.16439849138259888, 0.17991496622562408, 0.1954314410686493, 0.2109479159116745, 0.2264643907546997, 0.24198085069656372, 0.25749731063842773, 0.27301380038261414, 0.28853026032447815, 0.30404675006866455, 0.31956321001052856, 0.3350796699523926, 0.350596159696579, 0.366112619638443, 0.3816291093826294, 0.3971455693244934, 0.4126620292663574, 0.42817848920822144, 0.44369497895240784]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 11.0, 13.0, 18.0, 23.0, 23.0, 19.0, 33.0, 34.0, 34.0, 39.0, 43.0, 45.0, 53.0, 52.0, 50.0, 61.0, 59.0, 40.0, 48.0, 43.0, 42.0, 43.0, 37.0, 23.0, 17.0, 19.0, 9.0, 14.0, 12.0, 5.0, 5.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5751937031745911, -0.5555937886238098, -0.5359938144683838, -0.5163938999176025, -0.4967939257621765, -0.4771939814090729, -0.45759403705596924, -0.437994122505188, -0.41839414834976196, -0.3987942039966583, -0.3791942596435547, -0.35959431529045105, -0.3399943709373474, -0.3203944265842438, -0.30079448223114014, -0.2811945676803589, -0.26159462332725525, -0.2419946789741516, -0.22239473462104797, -0.20279479026794434, -0.1831948459148407, -0.16359490156173706, -0.14399497210979462, -0.12439502775669098, -0.10479508340358734, -0.0851951390504837, -0.06559519469738007, -0.045995257794857025, -0.026395313441753387, -0.00679536908864975, 0.012804567813873291, 0.03240451216697693, 0.052004456520080566, 0.0716044008731842, 0.09120434522628784, 0.11080428212881088, 0.13040423393249512, 0.15000417828559875, 0.1696041077375412, 0.18920405209064484, 0.20880399644374847, 0.2284039407968521, 0.24800388514995575, 0.2676038146018982, 0.28720375895500183, 0.30680370330810547, 0.3264036476612091, 0.34600359201431274, 0.3656035363674164, 0.38520348072052, 0.40480342507362366, 0.4244033694267273, 0.44400331377983093, 0.46360325813293457, 0.4832031726837158, 0.5028031468391418, 0.5224030613899231, 0.5420029759407043, 0.5616029500961304, 0.5812028646469116, 0.6008028388023376, 0.6204027533531189, 0.6400027275085449, 0.6596026420593262, 0.6792026162147522]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 6.0, 6.0, 22.0, 27.0, 31.0, 47.0, 74.0, 125.0, 338.0, 1550.0, 66081.0, 4122557.0, 2562.0, 439.0, 153.0, 95.0, 49.0, 37.0, 29.0, 13.0, 10.0, 7.0, 5.0, 2.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1961669921875, -0.18865394592285156, -0.18114089965820312, -0.1736278533935547, -0.16611480712890625, -0.1586017608642578, -0.15108871459960938, -0.14357566833496094, -0.1360626220703125, -0.12854957580566406, -0.12103652954101562, -0.11352348327636719, -0.10601043701171875, -0.09849739074707031, -0.09098434448242188, -0.08347129821777344, -0.075958251953125, -0.06844520568847656, -0.060932159423828125, -0.05341911315917969, -0.04590606689453125, -0.03839302062988281, -0.030879974365234375, -0.023366928100585938, -0.0158538818359375, -0.008340835571289062, -0.000827789306640625, 0.0066852569580078125, 0.01419830322265625, 0.021711349487304688, 0.029224395751953125, 0.03673744201660156, 0.04425048828125, 0.05176353454589844, 0.059276580810546875, 0.06678962707519531, 0.07430267333984375, 0.08181571960449219, 0.08932876586914062, 0.09684181213378906, 0.1043548583984375, 0.11186790466308594, 0.11938095092773438, 0.1268939971923828, 0.13440704345703125, 0.1419200897216797, 0.14943313598632812, 0.15694618225097656, 0.164459228515625, 0.17197227478027344, 0.17948532104492188, 0.1869983673095703, 0.19451141357421875, 0.2020244598388672, 0.20953750610351562, 0.21705055236816406, 0.2245635986328125, 0.23207664489746094, 0.23958969116210938, 0.2471027374267578, 0.25461578369140625, 0.2621288299560547, 0.2696418762207031, 0.27715492248535156, 0.28466796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 6.0, 7.0, 6.0, 13.0, 14.0, 14.0, 29.0, 32.0, 52.0, 63.0, 61.0, 65.0, 84.0, 70.0, 72.0, 50.0, 73.0, 57.0, 42.0, 51.0, 31.0, 35.0, 20.0, 19.0, 12.0, 7.0, 6.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035308837890625, -0.033901214599609375, -0.03249359130859375, -0.031085968017578125, -0.0296783447265625, -0.028270721435546875, -0.02686309814453125, -0.025455474853515625, -0.0240478515625, -0.022640228271484375, -0.02123260498046875, -0.019824981689453125, -0.0184173583984375, -0.017009735107421875, -0.01560211181640625, -0.014194488525390625, -0.012786865234375, -0.011379241943359375, -0.00997161865234375, -0.008563995361328125, -0.0071563720703125, -0.005748748779296875, -0.00434112548828125, -0.002933502197265625, -0.00152587890625, -0.000118255615234375, 0.00128936767578125, 0.002696990966796875, 0.0041046142578125, 0.005512237548828125, 0.00691986083984375, 0.008327484130859375, 0.009735107421875, 0.011142730712890625, 0.01255035400390625, 0.013957977294921875, 0.0153656005859375, 0.016773223876953125, 0.01818084716796875, 0.019588470458984375, 0.02099609375, 0.022403717041015625, 0.02381134033203125, 0.025218963623046875, 0.0266265869140625, 0.028034210205078125, 0.02944183349609375, 0.030849456787109375, 0.032257080078125, 0.033664703369140625, 0.03507232666015625, 0.036479949951171875, 0.0378875732421875, 0.039295196533203125, 0.04070281982421875, 0.042110443115234375, 0.04351806640625, 0.044925689697265625, 0.04633331298828125, 0.047740936279296875, 0.0491485595703125, 0.050556182861328125, 0.05196380615234375, 0.053371429443359375, 0.054779052734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 12.0, 13.0, 18.0, 29.0, 42.0, 35.0, 78.0, 93.0, 136.0, 205.0, 351.0, 576.0, 1304.0, 4508.0, 208036.0, 3970323.0, 5255.0, 1517.0, 658.0, 365.0, 230.0, 142.0, 104.0, 66.0, 53.0, 34.0, 25.0, 18.0, 13.0, 11.0, 5.0, 4.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1947021484375, -0.18944740295410156, -0.18419265747070312, -0.1789379119873047, -0.17368316650390625, -0.1684284210205078, -0.16317367553710938, -0.15791893005371094, -0.1526641845703125, -0.14740943908691406, -0.14215469360351562, -0.1368999481201172, -0.13164520263671875, -0.1263904571533203, -0.12113571166992188, -0.11588096618652344, -0.110626220703125, -0.10537147521972656, -0.10011672973632812, -0.09486198425292969, -0.08960723876953125, -0.08435249328613281, -0.07909774780273438, -0.07384300231933594, -0.0685882568359375, -0.06333351135253906, -0.058078765869140625, -0.05282402038574219, -0.04756927490234375, -0.04231452941894531, -0.037059783935546875, -0.03180503845214844, -0.02655029296875, -0.021295547485351562, -0.016040802001953125, -0.010786056518554688, -0.00553131103515625, -0.0002765655517578125, 0.004978179931640625, 0.010232925415039062, 0.0154876708984375, 0.020742416381835938, 0.025997161865234375, 0.03125190734863281, 0.03650665283203125, 0.04176139831542969, 0.047016143798828125, 0.05227088928222656, 0.057525634765625, 0.06278038024902344, 0.06803512573242188, 0.07328987121582031, 0.07854461669921875, 0.08379936218261719, 0.08905410766601562, 0.09430885314941406, 0.0995635986328125, 0.10481834411621094, 0.11007308959960938, 0.11532783508300781, 0.12058258056640625, 0.1258373260498047, 0.13109207153320312, 0.13634681701660156, 0.1416015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 12.0, 28.0, 158.0, 3792.0, 60.0, 17.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08453369140625, -0.08199787139892578, -0.07946205139160156, -0.07692623138427734, -0.07439041137695312, -0.0718545913696289, -0.06931877136230469, -0.06678295135498047, -0.06424713134765625, -0.06171131134033203, -0.05917549133300781, -0.056639671325683594, -0.054103851318359375, -0.051568031311035156, -0.04903221130371094, -0.04649639129638672, -0.0439605712890625, -0.04142475128173828, -0.03888893127441406, -0.036353111267089844, -0.033817291259765625, -0.031281471252441406, -0.028745651245117188, -0.02620983123779297, -0.02367401123046875, -0.02113819122314453, -0.018602371215820312, -0.016066551208496094, -0.013530731201171875, -0.010994911193847656, -0.008459091186523438, -0.005923271179199219, -0.003387451171875, -0.0008516311645507812, 0.0016841888427734375, 0.004220008850097656, 0.006755828857421875, 0.009291648864746094, 0.011827468872070312, 0.014363288879394531, 0.01689910888671875, 0.01943492889404297, 0.021970748901367188, 0.024506568908691406, 0.027042388916015625, 0.029578208923339844, 0.03211402893066406, 0.03464984893798828, 0.0371856689453125, 0.03972148895263672, 0.04225730895996094, 0.044793128967285156, 0.047328948974609375, 0.049864768981933594, 0.05240058898925781, 0.05493640899658203, 0.05747222900390625, 0.06000804901123047, 0.06254386901855469, 0.0650796890258789, 0.06761550903320312, 0.07015132904052734, 0.07268714904785156, 0.07522296905517578, 0.0777587890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 6.0, 6.0, 13.0, 22.0, 27.0, 43.0, 57.0, 68.0, 122.0, 112.0, 104.0, 109.0, 76.0, 52.0, 44.0, 32.0, 28.0, 21.0, 17.0, 9.0, 9.0, 3.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10873913764953613, -0.1051316112279892, -0.10152409225702286, -0.09791657328605652, -0.09430904686450958, -0.09070152044296265, -0.08709400147199631, -0.08348648250102997, -0.07987895607948303, -0.0762714296579361, -0.07266391068696976, -0.06905639171600342, -0.06544886529445648, -0.061841342598199844, -0.05823381990194321, -0.05462629720568657, -0.05101877450942993, -0.047411251813173294, -0.043803729116916656, -0.04019620642066002, -0.03658868372440338, -0.032981161028146744, -0.029373638331890106, -0.02576611563563347, -0.02215859293937683, -0.018551070243120193, -0.014943547546863556, -0.011336024850606918, -0.007728502154350281, -0.004120979458093643, -0.0005134567618370056, 0.003094065934419632, 0.0067015886306762695, 0.010309111326932907, 0.013916634023189545, 0.017524156719446182, 0.02113167941570282, 0.024739202111959457, 0.028346724808216095, 0.03195424750447273, 0.03556177020072937, 0.03916929289698601, 0.042776815593242645, 0.04638433828949928, 0.04999186098575592, 0.05359938368201256, 0.057206906378269196, 0.06081442907452583, 0.06442195177078247, 0.0680294781923294, 0.07163699716329575, 0.07524451613426208, 0.07885204255580902, 0.08245956897735596, 0.0860670879483223, 0.08967460691928864, 0.09328213334083557, 0.09688965976238251, 0.10049717873334885, 0.10410469770431519, 0.10771222412586212, 0.11131975054740906, 0.1149272695183754, 0.11853478848934174, 0.12214231491088867]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 5.0, 6.0, 13.0, 12.0, 19.0, 24.0, 19.0, 36.0, 42.0, 61.0, 58.0, 59.0, 66.0, 69.0, 59.0, 78.0, 69.0, 58.0, 56.0, 47.0, 35.0, 27.0, 23.0, 14.0, 24.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1327633261680603, -0.12909595668315887, -0.12542858719825745, -0.12176122516393661, -0.11809385567903519, -0.11442648619413376, -0.11075912415981293, -0.1070917546749115, -0.10342438519001007, -0.09975701570510864, -0.09608964622020721, -0.09242228418588638, -0.08875491470098495, -0.08508754521608353, -0.0814201831817627, -0.07775281369686127, -0.07408544421195984, -0.07041807472705841, -0.06675070524215698, -0.06308334320783615, -0.05941597372293472, -0.055748604238033295, -0.052081238478422165, -0.048413872718811035, -0.04474650323390961, -0.04107913374900818, -0.03741176798939705, -0.03374440222978592, -0.03007703274488449, -0.026409665122628212, -0.022742297500371933, -0.019074929878115654, -0.015407562255859375, -0.011740194633603096, -0.008072827011346817, -0.004405459389090538, -0.000738091766834259, 0.00292927585542202, 0.006596643477678299, 0.010264011099934578, 0.013931378722190857, 0.017598746344447136, 0.021266113966703415, 0.024933481588959694, 0.028600849211215973, 0.0322682186961174, 0.03593558445572853, 0.03960295021533966, 0.04327031970024109, 0.04693768918514252, 0.05060505494475365, 0.05427242070436478, 0.057939790189266205, 0.06160715967416763, 0.06527452170848846, 0.06894189119338989, 0.07260926067829132, 0.07627663016319275, 0.07994399964809418, 0.08361136168241501, 0.08727873116731644, 0.09094610065221786, 0.0946134626865387, 0.09828083217144012, 0.10194820165634155]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 12.0, 23.0, 25.0, 58.0, 64.0, 135.0, 222.0, 447.0, 788.0, 1676.0, 3835.0, 10179.0, 29992.0, 108724.0, 415534.0, 350872.0, 86217.0, 24620.0, 8525.0, 3522.0, 1482.0, 706.0, 357.0, 224.0, 114.0, 73.0, 44.0, 14.0, 19.0, 12.0, 3.0, 6.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05035400390625, -0.048333168029785156, -0.04631233215332031, -0.04429149627685547, -0.042270660400390625, -0.04024982452392578, -0.03822898864746094, -0.036208152770996094, -0.03418731689453125, -0.032166481018066406, -0.030145645141601562, -0.02812480926513672, -0.026103973388671875, -0.02408313751220703, -0.022062301635742188, -0.020041465759277344, -0.0180206298828125, -0.015999794006347656, -0.013978958129882812, -0.011958122253417969, -0.009937286376953125, -0.007916450500488281, -0.0058956146240234375, -0.0038747787475585938, -0.00185394287109375, 0.00016689300537109375, 0.0021877288818359375, 0.004208564758300781, 0.006229400634765625, 0.008250236511230469, 0.010271072387695312, 0.012291908264160156, 0.014312744140625, 0.016333580017089844, 0.018354415893554688, 0.02037525177001953, 0.022396087646484375, 0.02441692352294922, 0.026437759399414062, 0.028458595275878906, 0.03047943115234375, 0.032500267028808594, 0.03452110290527344, 0.03654193878173828, 0.038562774658203125, 0.04058361053466797, 0.04260444641113281, 0.044625282287597656, 0.0466461181640625, 0.048666954040527344, 0.05068778991699219, 0.05270862579345703, 0.054729461669921875, 0.05675029754638672, 0.05877113342285156, 0.060791969299316406, 0.06281280517578125, 0.0648336410522461, 0.06685447692871094, 0.06887531280517578, 0.07089614868164062, 0.07291698455810547, 0.07493782043457031, 0.07695865631103516, 0.0789794921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 8.0, 8.0, 8.0, 19.0, 11.0, 26.0, 23.0, 42.0, 52.0, 54.0, 58.0, 79.0, 67.0, 80.0, 59.0, 76.0, 59.0, 52.0, 47.0, 38.0, 34.0, 25.0, 21.0, 19.0, 9.0, 11.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03729248046875, -0.03584480285644531, -0.034397125244140625, -0.03294944763183594, -0.03150177001953125, -0.030054092407226562, -0.028606414794921875, -0.027158737182617188, -0.0257110595703125, -0.024263381958007812, -0.022815704345703125, -0.021368026733398438, -0.01992034912109375, -0.018472671508789062, -0.017024993896484375, -0.015577316284179688, -0.014129638671875, -0.012681961059570312, -0.011234283447265625, -0.009786605834960938, -0.00833892822265625, -0.0068912506103515625, -0.005443572998046875, -0.0039958953857421875, -0.0025482177734375, -0.0011005401611328125, 0.000347137451171875, 0.0017948150634765625, 0.00324249267578125, 0.0046901702880859375, 0.006137847900390625, 0.0075855255126953125, 0.009033203125, 0.010480880737304688, 0.011928558349609375, 0.013376235961914062, 0.01482391357421875, 0.016271591186523438, 0.017719268798828125, 0.019166946411132812, 0.0206146240234375, 0.022062301635742188, 0.023509979248046875, 0.024957656860351562, 0.02640533447265625, 0.027853012084960938, 0.029300689697265625, 0.030748367309570312, 0.032196044921875, 0.03364372253417969, 0.035091400146484375, 0.03653907775878906, 0.03798675537109375, 0.03943443298339844, 0.040882110595703125, 0.04232978820800781, 0.0437774658203125, 0.04522514343261719, 0.046672821044921875, 0.04812049865722656, 0.04956817626953125, 0.05101585388183594, 0.052463531494140625, 0.05391120910644531, 0.05535888671875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 8.0, 10.0, 9.0, 12.0, 18.0, 26.0, 24.0, 37.0, 55.0, 58.0, 96.0, 141.0, 253.0, 377.0, 650.0, 1500.0, 4076.0, 14173.0, 73501.0, 597315.0, 303577.0, 38605.0, 8752.0, 2763.0, 1085.0, 530.0, 284.0, 179.0, 130.0, 84.0, 63.0, 42.0, 30.0, 19.0, 19.0, 12.0, 7.0, 9.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07342529296875, -0.07104301452636719, -0.06866073608398438, -0.06627845764160156, -0.06389617919921875, -0.06151390075683594, -0.059131622314453125, -0.05674934387207031, -0.0543670654296875, -0.05198478698730469, -0.049602508544921875, -0.04722023010253906, -0.04483795166015625, -0.04245567321777344, -0.040073394775390625, -0.03769111633300781, -0.035308837890625, -0.03292655944824219, -0.030544281005859375, -0.028162002563476562, -0.02577972412109375, -0.023397445678710938, -0.021015167236328125, -0.018632888793945312, -0.0162506103515625, -0.013868331909179688, -0.011486053466796875, -0.009103775024414062, -0.00672149658203125, -0.0043392181396484375, -0.001956939697265625, 0.0004253387451171875, 0.0028076171875, 0.0051898956298828125, 0.007572174072265625, 0.009954452514648438, 0.01233673095703125, 0.014719009399414062, 0.017101287841796875, 0.019483566284179688, 0.0218658447265625, 0.024248123168945312, 0.026630401611328125, 0.029012680053710938, 0.03139495849609375, 0.03377723693847656, 0.036159515380859375, 0.03854179382324219, 0.040924072265625, 0.04330635070800781, 0.045688629150390625, 0.04807090759277344, 0.05045318603515625, 0.05283546447753906, 0.055217742919921875, 0.05760002136230469, 0.0599822998046875, 0.06236457824707031, 0.06474685668945312, 0.06712913513183594, 0.06951141357421875, 0.07189369201660156, 0.07427597045898438, 0.07665824890136719, 0.07904052734375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 2.0, 12.0, 14.0, 16.0, 24.0, 27.0, 43.0, 37.0, 46.0, 55.0, 49.0, 60.0, 54.0, 74.0, 58.0, 58.0, 57.0, 58.0, 42.0, 46.0, 39.0, 42.0, 20.0, 16.0, 15.0, 11.0, 11.0, 10.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1883544921875, -0.1832714080810547, -0.17818832397460938, -0.17310523986816406, -0.16802215576171875, -0.16293907165527344, -0.15785598754882812, -0.1527729034423828, -0.1476898193359375, -0.1426067352294922, -0.13752365112304688, -0.13244056701660156, -0.12735748291015625, -0.12227439880371094, -0.11719131469726562, -0.11210823059082031, -0.107025146484375, -0.10194206237792969, -0.09685897827148438, -0.09177589416503906, -0.08669281005859375, -0.08160972595214844, -0.07652664184570312, -0.07144355773925781, -0.0663604736328125, -0.06127738952636719, -0.056194305419921875, -0.05111122131347656, -0.04602813720703125, -0.04094505310058594, -0.035861968994140625, -0.030778884887695312, -0.02569580078125, -0.020612716674804688, -0.015529632568359375, -0.010446548461914062, -0.00536346435546875, -0.0002803802490234375, 0.004802703857421875, 0.009885787963867188, 0.0149688720703125, 0.020051956176757812, 0.025135040283203125, 0.030218124389648438, 0.03530120849609375, 0.04038429260253906, 0.045467376708984375, 0.05055046081542969, 0.055633544921875, 0.06071662902832031, 0.06579971313476562, 0.07088279724121094, 0.07596588134765625, 0.08104896545410156, 0.08613204956054688, 0.09121513366699219, 0.0962982177734375, 0.10138130187988281, 0.10646438598632812, 0.11154747009277344, 0.11663055419921875, 0.12171363830566406, 0.12679672241210938, 0.1318798065185547, 0.136962890625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 15.0, 9.0, 32.0, 40.0, 93.0, 199.0, 427.0, 1381.0, 6951.0, 93508.0, 887052.0, 51865.0, 5109.0, 1142.0, 363.0, 144.0, 84.0, 36.0, 35.0, 19.0, 7.0, 2.0, 8.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04180908203125, -0.04059410095214844, -0.039379119873046875, -0.03816413879394531, -0.03694915771484375, -0.03573417663574219, -0.034519195556640625, -0.03330421447753906, -0.0320892333984375, -0.030874252319335938, -0.029659271240234375, -0.028444290161132812, -0.02722930908203125, -0.026014328002929688, -0.024799346923828125, -0.023584365844726562, -0.022369384765625, -0.021154403686523438, -0.019939422607421875, -0.018724441528320312, -0.01750946044921875, -0.016294479370117188, -0.015079498291015625, -0.013864517211914062, -0.0126495361328125, -0.011434555053710938, -0.010219573974609375, -0.009004592895507812, -0.00778961181640625, -0.0065746307373046875, -0.005359649658203125, -0.0041446685791015625, -0.0029296875, -0.0017147064208984375, -0.000499725341796875, 0.0007152557373046875, 0.00193023681640625, 0.0031452178955078125, 0.004360198974609375, 0.0055751800537109375, 0.0067901611328125, 0.008005142211914062, 0.009220123291015625, 0.010435104370117188, 0.01165008544921875, 0.012865066528320312, 0.014080047607421875, 0.015295028686523438, 0.016510009765625, 0.017724990844726562, 0.018939971923828125, 0.020154953002929688, 0.02136993408203125, 0.022584915161132812, 0.023799896240234375, 0.025014877319335938, 0.0262298583984375, 0.027444839477539062, 0.028659820556640625, 0.029874801635742188, 0.03108978271484375, 0.03230476379394531, 0.033519744873046875, 0.03473472595214844, 0.03594970703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 9.0, 13.0, 15.0, 18.0, 15.0, 35.0, 62.0, 60.0, 77.0, 87.0, 109.0, 104.0, 91.0, 91.0, 63.0, 45.0, 38.0, 24.0, 16.0, 11.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.881092071533203e-06, -8.646398782730103e-06, -8.411705493927002e-06, -8.177012205123901e-06, -7.9423189163208e-06, -7.7076256275177e-06, -7.4729323387146e-06, -7.238239049911499e-06, -7.0035457611083984e-06, -6.768852472305298e-06, -6.534159183502197e-06, -6.299465894699097e-06, -6.064772605895996e-06, -5.8300793170928955e-06, -5.595386028289795e-06, -5.360692739486694e-06, -5.125999450683594e-06, -4.891306161880493e-06, -4.656612873077393e-06, -4.421919584274292e-06, -4.187226295471191e-06, -3.952533006668091e-06, -3.7178397178649902e-06, -3.4831464290618896e-06, -3.248453140258789e-06, -3.0137598514556885e-06, -2.779066562652588e-06, -2.5443732738494873e-06, -2.3096799850463867e-06, -2.074986696243286e-06, -1.8402934074401855e-06, -1.605600118637085e-06, -1.3709068298339844e-06, -1.1362135410308838e-06, -9.015202522277832e-07, -6.668269634246826e-07, -4.3213367462158203e-07, -1.9744038581848145e-07, 3.725290298461914e-08, 2.7194619178771973e-07, 5.066394805908203e-07, 7.413327693939209e-07, 9.760260581970215e-07, 1.210719347000122e-06, 1.4454126358032227e-06, 1.6801059246063232e-06, 1.914799213409424e-06, 2.1494925022125244e-06, 2.384185791015625e-06, 2.6188790798187256e-06, 2.853572368621826e-06, 3.0882656574249268e-06, 3.3229589462280273e-06, 3.557652235031128e-06, 3.7923455238342285e-06, 4.027038812637329e-06, 4.26173210144043e-06, 4.49642539024353e-06, 4.731118679046631e-06, 4.9658119678497314e-06, 5.200505256652832e-06, 5.435198545455933e-06, 5.669891834259033e-06, 5.904585123062134e-06, 6.139278411865234e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 19.0, 27.0, 40.0, 92.0, 181.0, 651.0, 3507.0, 110892.0, 915480.0, 15590.0, 1437.0, 371.0, 133.0, 52.0, 37.0, 22.0, 10.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07757568359375, -0.07560014724731445, -0.0736246109008789, -0.07164907455444336, -0.06967353820800781, -0.06769800186157227, -0.06572246551513672, -0.06374692916870117, -0.061771392822265625, -0.05979585647583008, -0.05782032012939453, -0.055844783782958984, -0.05386924743652344, -0.05189371109008789, -0.049918174743652344, -0.0479426383972168, -0.04596710205078125, -0.0439915657043457, -0.042016029357910156, -0.04004049301147461, -0.03806495666503906, -0.036089420318603516, -0.03411388397216797, -0.03213834762573242, -0.030162811279296875, -0.028187274932861328, -0.02621173858642578, -0.024236202239990234, -0.022260665893554688, -0.02028512954711914, -0.018309593200683594, -0.016334056854248047, -0.0143585205078125, -0.012382984161376953, -0.010407447814941406, -0.00843191146850586, -0.0064563751220703125, -0.004480838775634766, -0.0025053024291992188, -0.0005297660827636719, 0.001445770263671875, 0.003421306610107422, 0.005396842956542969, 0.007372379302978516, 0.009347915649414062, 0.01132345199584961, 0.013298988342285156, 0.015274524688720703, 0.01725006103515625, 0.019225597381591797, 0.021201133728027344, 0.02317667007446289, 0.025152206420898438, 0.027127742767333984, 0.02910327911376953, 0.031078815460205078, 0.033054351806640625, 0.03502988815307617, 0.03700542449951172, 0.038980960845947266, 0.04095649719238281, 0.04293203353881836, 0.044907569885253906, 0.04688310623168945, 0.048858642578125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 8.0, 17.0, 26.0, 65.0, 135.0, 211.0, 227.0, 148.0, 83.0, 34.0, 20.0, 12.0, 8.0, 7.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.11785888671875, -0.11551141738891602, -0.11316394805908203, -0.11081647872924805, -0.10846900939941406, -0.10612154006958008, -0.1037740707397461, -0.10142660140991211, -0.09907913208007812, -0.09673166275024414, -0.09438419342041016, -0.09203672409057617, -0.08968925476074219, -0.0873417854309082, -0.08499431610107422, -0.08264684677124023, -0.08029937744140625, -0.07795190811157227, -0.07560443878173828, -0.0732569694519043, -0.07090950012207031, -0.06856203079223633, -0.06621456146240234, -0.06386709213256836, -0.061519622802734375, -0.05917215347290039, -0.056824684143066406, -0.05447721481323242, -0.05212974548339844, -0.04978227615356445, -0.04743480682373047, -0.045087337493896484, -0.0427398681640625, -0.040392398834228516, -0.03804492950439453, -0.03569746017456055, -0.03334999084472656, -0.031002521514892578, -0.028655052185058594, -0.02630758285522461, -0.023960113525390625, -0.02161264419555664, -0.019265174865722656, -0.016917705535888672, -0.014570236206054688, -0.012222766876220703, -0.009875297546386719, -0.007527828216552734, -0.00518035888671875, -0.0028328895568847656, -0.00048542022705078125, 0.0018620491027832031, 0.0042095184326171875, 0.006556987762451172, 0.008904457092285156, 0.01125192642211914, 0.013599395751953125, 0.01594686508178711, 0.018294334411621094, 0.020641803741455078, 0.022989273071289062, 0.025336742401123047, 0.02768421173095703, 0.030031681060791016, 0.032379150390625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 12.0, 13.0, 17.0, 51.0, 82.0, 142.0, 229.0, 184.0, 139.0, 58.0, 28.0, 21.0, 13.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9361363053321838, -0.9138217568397522, -0.8915072083473206, -0.8691926598548889, -0.8468781113624573, -0.8245635628700256, -0.8022490739822388, -0.7799345254898071, -0.7576199769973755, -0.7353054285049438, -0.7129908800125122, -0.6906763315200806, -0.6683617830276489, -0.6460472345352173, -0.6237326860427856, -0.601418137550354, -0.5791035890579224, -0.5567890405654907, -0.5344744920730591, -0.5121599435806274, -0.4898453950881958, -0.46753084659576416, -0.4452163279056549, -0.42290177941322327, -0.4005872309207916, -0.37827268242836, -0.35595813393592834, -0.3336436152458191, -0.31132906675338745, -0.2890145182609558, -0.26669996976852417, -0.24438542127609253, -0.22207093238830566, -0.19975638389587402, -0.17744183540344238, -0.15512730181217194, -0.1328127533197403, -0.11049820482730865, -0.08818367123603821, -0.06586912274360657, -0.04355457425117493, -0.021240029484033585, 0.0010745152831077576, 0.0233890563249588, 0.04570360481739044, 0.06801815330982208, 0.09033268690109253, 0.11264723539352417, 0.1349617838859558, 0.15727633237838745, 0.1795908808708191, 0.20190541446208954, 0.22421996295452118, 0.24653451144695282, 0.26884904503822327, 0.2911635935306549, 0.31347814202308655, 0.3357926905155182, 0.35810723900794983, 0.3804217576980591, 0.4027363061904907, 0.42505085468292236, 0.447365403175354, 0.46967995166778564, 0.4919945001602173]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 4.0, 12.0, 14.0, 7.0, 7.0, 15.0, 21.0, 17.0, 20.0, 31.0, 26.0, 30.0, 35.0, 34.0, 39.0, 42.0, 34.0, 56.0, 40.0, 51.0, 47.0, 39.0, 30.0, 41.0, 34.0, 34.0, 36.0, 31.0, 32.0, 19.0, 28.0, 20.0, 12.0, 10.0, 10.0, 6.0, 3.0, 8.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5566298365592957, -0.5407960414886475, -0.5249622464179993, -0.5091284513473511, -0.49329468607902527, -0.4774608910083771, -0.46162712574005127, -0.4457933306694031, -0.4299595355987549, -0.4141257405281067, -0.3982919454574585, -0.3824581801891327, -0.3666243851184845, -0.3507905900478363, -0.3349568247795105, -0.3191230297088623, -0.3032892346382141, -0.2874554395675659, -0.2716216444969177, -0.2557878792285919, -0.23995408415794373, -0.22412028908729553, -0.20828650891780853, -0.19245272874832153, -0.17661893367767334, -0.16078513860702515, -0.14495135843753815, -0.12911757826805115, -0.11328378319740295, -0.09744999557733536, -0.08161620795726776, -0.06578242033720016, -0.049948692321777344, -0.03411490470170975, -0.01828111708164215, -0.0024473294615745544, 0.013386458158493042, 0.02922024577856064, 0.045054033398628235, 0.06088782101869583, 0.07672160863876343, 0.09255539625883102, 0.10838918387889862, 0.12422297149896622, 0.1400567591190338, 0.155890554189682, 0.171724334359169, 0.187558114528656, 0.2033919095993042, 0.2192257046699524, 0.2350594848394394, 0.2508932650089264, 0.2667270600795746, 0.2825608551502228, 0.2983946204185486, 0.3142284154891968, 0.33006221055984497, 0.34589600563049316, 0.36172980070114136, 0.37756356596946716, 0.39339736104011536, 0.40923115611076355, 0.42506492137908936, 0.44089871644973755, 0.45673251152038574]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 5.0, 15.0, 14.0, 38.0, 43.0, 87.0, 141.0, 241.0, 534.0, 1306.0, 3307.0, 10519.0, 56237.0, 3644236.0, 443604.0, 24289.0, 5996.0, 2118.0, 726.0, 349.0, 159.0, 90.0, 61.0, 41.0, 29.0, 18.0, 14.0, 9.0, 8.0, 8.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0947265625, -0.09192276000976562, -0.08911895751953125, -0.08631515502929688, -0.0835113525390625, -0.08070755004882812, -0.07790374755859375, -0.07509994506835938, -0.072296142578125, -0.06949234008789062, -0.06668853759765625, -0.06388473510742188, -0.0610809326171875, -0.058277130126953125, -0.05547332763671875, -0.052669525146484375, -0.04986572265625, -0.047061920166015625, -0.04425811767578125, -0.041454315185546875, -0.0386505126953125, -0.035846710205078125, -0.03304290771484375, -0.030239105224609375, -0.027435302734375, -0.024631500244140625, -0.02182769775390625, -0.019023895263671875, -0.0162200927734375, -0.013416290283203125, -0.01061248779296875, -0.007808685302734375, -0.0050048828125, -0.002201080322265625, 0.00060272216796875, 0.003406524658203125, 0.0062103271484375, 0.009014129638671875, 0.01181793212890625, 0.014621734619140625, 0.017425537109375, 0.020229339599609375, 0.02303314208984375, 0.025836944580078125, 0.0286407470703125, 0.031444549560546875, 0.03424835205078125, 0.037052154541015625, 0.03985595703125, 0.042659759521484375, 0.04546356201171875, 0.048267364501953125, 0.0510711669921875, 0.053874969482421875, 0.05667877197265625, 0.059482574462890625, 0.062286376953125, 0.06509017944335938, 0.06789398193359375, 0.07069778442382812, 0.0735015869140625, 0.07630538940429688, 0.07910919189453125, 0.08191299438476562, 0.084716796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 10.0, 11.0, 26.0, 17.0, 40.0, 36.0, 44.0, 51.0, 65.0, 63.0, 85.0, 69.0, 65.0, 65.0, 52.0, 51.0, 51.0, 44.0, 39.0, 30.0, 18.0, 19.0, 16.0, 7.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03619384765625, -0.03489398956298828, -0.03359413146972656, -0.032294273376464844, -0.030994415283203125, -0.029694557189941406, -0.028394699096679688, -0.02709484100341797, -0.02579498291015625, -0.02449512481689453, -0.023195266723632812, -0.021895408630371094, -0.020595550537109375, -0.019295692443847656, -0.017995834350585938, -0.01669597625732422, -0.0153961181640625, -0.014096260070800781, -0.012796401977539062, -0.011496543884277344, -0.010196685791015625, -0.008896827697753906, -0.0075969696044921875, -0.006297111511230469, -0.00499725341796875, -0.0036973953247070312, -0.0023975372314453125, -0.0010976791381835938, 0.000202178955078125, 0.0015020370483398438, 0.0028018951416015625, 0.004101753234863281, 0.005401611328125, 0.006701469421386719, 0.008001327514648438, 0.009301185607910156, 0.010601043701171875, 0.011900901794433594, 0.013200759887695312, 0.014500617980957031, 0.01580047607421875, 0.01710033416748047, 0.018400192260742188, 0.019700050354003906, 0.020999908447265625, 0.022299766540527344, 0.023599624633789062, 0.02489948272705078, 0.0261993408203125, 0.02749919891357422, 0.028799057006835938, 0.030098915100097656, 0.031398773193359375, 0.032698631286621094, 0.03399848937988281, 0.03529834747314453, 0.03659820556640625, 0.03789806365966797, 0.03919792175292969, 0.040497779846191406, 0.041797637939453125, 0.043097496032714844, 0.04439735412597656, 0.04569721221923828, 0.0469970703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 7.0, 2.0, 5.0, 10.0, 16.0, 25.0, 18.0, 56.0, 102.0, 255.0, 842.0, 3529.0, 35141.0, 4042300.0, 103734.0, 6462.0, 1156.0, 339.0, 130.0, 54.0, 37.0, 16.0, 12.0, 9.0, 7.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.14772987365722656, -0.14274978637695312, -0.1377696990966797, -0.13278961181640625, -0.1278095245361328, -0.12282943725585938, -0.11784934997558594, -0.1128692626953125, -0.10788917541503906, -0.10290908813476562, -0.09792900085449219, -0.09294891357421875, -0.08796882629394531, -0.08298873901367188, -0.07800865173339844, -0.073028564453125, -0.06804847717285156, -0.06306838989257812, -0.05808830261230469, -0.05310821533203125, -0.04812812805175781, -0.043148040771484375, -0.03816795349121094, -0.0331878662109375, -0.028207778930664062, -0.023227691650390625, -0.018247604370117188, -0.01326751708984375, -0.008287429809570312, -0.003307342529296875, 0.0016727447509765625, 0.00665283203125, 0.011632919311523438, 0.016613006591796875, 0.021593093872070312, 0.02657318115234375, 0.03155326843261719, 0.036533355712890625, 0.04151344299316406, 0.0464935302734375, 0.05147361755371094, 0.056453704833984375, 0.06143379211425781, 0.06641387939453125, 0.07139396667480469, 0.07637405395507812, 0.08135414123535156, 0.086334228515625, 0.09131431579589844, 0.09629440307617188, 0.10127449035644531, 0.10625457763671875, 0.11123466491699219, 0.11621475219726562, 0.12119483947753906, 0.1261749267578125, 0.13115501403808594, 0.13613510131835938, 0.1411151885986328, 0.14609527587890625, 0.1510753631591797, 0.15605545043945312, 0.16103553771972656, 0.166015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 5.0, 13.0, 17.0, 24.0, 26.0, 40.0, 70.0, 210.0, 977.0, 2027.0, 403.0, 100.0, 42.0, 37.0, 23.0, 12.0, 9.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09222412109375, -0.08907222747802734, -0.08592033386230469, -0.08276844024658203, -0.07961654663085938, -0.07646465301513672, -0.07331275939941406, -0.0701608657836914, -0.06700897216796875, -0.0638570785522461, -0.06070518493652344, -0.05755329132080078, -0.054401397705078125, -0.05124950408935547, -0.04809761047363281, -0.044945716857910156, -0.0417938232421875, -0.038641929626464844, -0.03549003601074219, -0.03233814239501953, -0.029186248779296875, -0.02603435516357422, -0.022882461547851562, -0.019730567932128906, -0.01657867431640625, -0.013426780700683594, -0.010274887084960938, -0.007122993469238281, -0.003971099853515625, -0.0008192062377929688, 0.0023326873779296875, 0.005484580993652344, 0.008636474609375, 0.011788368225097656, 0.014940261840820312, 0.01809215545654297, 0.021244049072265625, 0.02439594268798828, 0.027547836303710938, 0.030699729919433594, 0.03385162353515625, 0.037003517150878906, 0.04015541076660156, 0.04330730438232422, 0.046459197998046875, 0.04961109161376953, 0.05276298522949219, 0.055914878845214844, 0.0590667724609375, 0.062218666076660156, 0.06537055969238281, 0.06852245330810547, 0.07167434692382812, 0.07482624053955078, 0.07797813415527344, 0.0811300277709961, 0.08428192138671875, 0.0874338150024414, 0.09058570861816406, 0.09373760223388672, 0.09688949584960938, 0.10004138946533203, 0.10319328308105469, 0.10634517669677734, 0.1094970703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 9.0, 11.0, 16.0, 38.0, 58.0, 109.0, 201.0, 237.0, 172.0, 82.0, 29.0, 17.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9746444821357727, -0.9533088207244873, -0.9319731593132019, -0.9106374979019165, -0.8893017768859863, -0.8679661154747009, -0.8466304540634155, -0.8252947926521301, -0.8039591312408447, -0.7826234698295593, -0.7612878084182739, -0.7399521470069885, -0.7186164855957031, -0.697280764579773, -0.6759451031684875, -0.6546094417572021, -0.6332737803459167, -0.6119381189346313, -0.590602457523346, -0.5692667961120605, -0.5479310750961304, -0.526595413684845, -0.5052597522735596, -0.48392409086227417, -0.46258842945098877, -0.44125276803970337, -0.41991710662841797, -0.3985814154148102, -0.3772457540035248, -0.3559100925922394, -0.3345744013786316, -0.3132387399673462, -0.2919030785560608, -0.2705674171447754, -0.2492317408323288, -0.2278960645198822, -0.2065604031085968, -0.1852247416973114, -0.1638890653848648, -0.1425533890724182, -0.12121772766113281, -0.09988205879926682, -0.07854638993740082, -0.05721072107553482, -0.03587505221366882, -0.014539383351802826, 0.006796285510063171, 0.028131961822509766, 0.049467623233795166, 0.07080329209566116, 0.09213896095752716, 0.11347462981939316, 0.13481029868125916, 0.15614596009254456, 0.17748163640499115, 0.19881731271743774, 0.22015297412872314, 0.24148863554000854, 0.26282429695129395, 0.28415998816490173, 0.30549564957618713, 0.32683131098747253, 0.3481670022010803, 0.3695026636123657, 0.3908383250236511]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 7.0, 7.0, 5.0, 8.0, 6.0, 12.0, 12.0, 18.0, 11.0, 17.0, 18.0, 22.0, 35.0, 25.0, 31.0, 19.0, 30.0, 45.0, 25.0, 41.0, 34.0, 46.0, 38.0, 42.0, 33.0, 50.0, 29.0, 28.0, 44.0, 32.0, 26.0, 31.0, 14.0, 26.0, 21.0, 18.0, 15.0, 18.0, 13.0, 6.0, 14.0, 5.0, 3.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.22781729698181152, -0.21995075047016144, -0.21208421885967255, -0.20421767234802246, -0.19635114073753357, -0.18848459422588348, -0.1806180477142334, -0.1727515161037445, -0.16488496959209442, -0.15701842308044434, -0.14915189146995544, -0.14128534495830536, -0.13341879844665527, -0.12555226683616638, -0.1176857203245163, -0.10981918126344681, -0.10195264220237732, -0.09408610314130783, -0.08621956408023834, -0.07835301756858826, -0.07048647850751877, -0.06261993944644928, -0.05475339666008949, -0.046886853873729706, -0.03902031481266022, -0.03115377388894558, -0.023287232965230942, -0.015420692041516304, -0.007554151117801666, 0.00031238794326782227, 0.00817893072962761, 0.016045473515987396, 0.023912012577056885, 0.03177855163812637, 0.03964509442448616, 0.04751163721084595, 0.055378176271915436, 0.06324471533298492, 0.07111126184463501, 0.0789778009057045, 0.08684433996677399, 0.09471087902784348, 0.10257741808891296, 0.11044396460056305, 0.11831050366163254, 0.12617704272270203, 0.1340435892343521, 0.1419101357460022, 0.1497766673564911, 0.15764321386814117, 0.16550974547863007, 0.17337629199028015, 0.18124282360076904, 0.18910937011241913, 0.1969759166240692, 0.2048424482345581, 0.2127089947462082, 0.22057554125785828, 0.22844207286834717, 0.23630861937999725, 0.24417516589164734, 0.25204169750213623, 0.2599082291126251, 0.2677747905254364, 0.2756413221359253]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 20.0, 18.0, 20.0, 47.0, 61.0, 116.0, 165.0, 339.0, 608.0, 1199.0, 2933.0, 7255.0, 20937.0, 69278.0, 222220.0, 399518.0, 221101.0, 69115.0, 20999.0, 7251.0, 2719.0, 1267.0, 581.0, 288.0, 179.0, 116.0, 56.0, 45.0, 30.0, 20.0, 12.0, 11.0, 10.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04986572265625, -0.048230648040771484, -0.04659557342529297, -0.04496049880981445, -0.04332542419433594, -0.04169034957885742, -0.040055274963378906, -0.03842020034790039, -0.036785125732421875, -0.03515005111694336, -0.033514976501464844, -0.03187990188598633, -0.030244827270507812, -0.028609752655029297, -0.02697467803955078, -0.025339603424072266, -0.02370452880859375, -0.022069454193115234, -0.02043437957763672, -0.018799304962158203, -0.017164230346679688, -0.015529155731201172, -0.013894081115722656, -0.01225900650024414, -0.010623931884765625, -0.00898885726928711, -0.007353782653808594, -0.005718708038330078, -0.0040836334228515625, -0.002448558807373047, -0.0008134841918945312, 0.0008215904235839844, 0.0024566650390625, 0.004091739654541016, 0.005726814270019531, 0.007361888885498047, 0.008996963500976562, 0.010632038116455078, 0.012267112731933594, 0.01390218734741211, 0.015537261962890625, 0.01717233657836914, 0.018807411193847656, 0.020442485809326172, 0.022077560424804688, 0.023712635040283203, 0.02534770965576172, 0.026982784271240234, 0.02861785888671875, 0.030252933502197266, 0.03188800811767578, 0.0335230827331543, 0.03515815734863281, 0.03679323196411133, 0.038428306579589844, 0.04006338119506836, 0.041698455810546875, 0.04333353042602539, 0.044968605041503906, 0.04660367965698242, 0.04823875427246094, 0.04987382888793945, 0.05150890350341797, 0.053143978118896484, 0.054779052734375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 8.0, 7.0, 9.0, 15.0, 15.0, 18.0, 27.0, 38.0, 39.0, 51.0, 60.0, 54.0, 67.0, 72.0, 60.0, 66.0, 49.0, 63.0, 52.0, 44.0, 44.0, 31.0, 38.0, 17.0, 18.0, 17.0, 5.0, 5.0, 9.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035125732421875, -0.03385019302368164, -0.03257465362548828, -0.03129911422729492, -0.030023574829101562, -0.028748035430908203, -0.027472496032714844, -0.026196956634521484, -0.024921417236328125, -0.023645877838134766, -0.022370338439941406, -0.021094799041748047, -0.019819259643554688, -0.018543720245361328, -0.01726818084716797, -0.01599264144897461, -0.01471710205078125, -0.01344156265258789, -0.012166023254394531, -0.010890483856201172, -0.009614944458007812, -0.008339405059814453, -0.007063865661621094, -0.005788326263427734, -0.004512786865234375, -0.0032372474670410156, -0.0019617080688476562, -0.0006861686706542969, 0.0005893707275390625, 0.0018649101257324219, 0.0031404495239257812, 0.004415988922119141, 0.0056915283203125, 0.006967067718505859, 0.008242607116699219, 0.009518146514892578, 0.010793685913085938, 0.012069225311279297, 0.013344764709472656, 0.014620304107666016, 0.015895843505859375, 0.017171382904052734, 0.018446922302246094, 0.019722461700439453, 0.020998001098632812, 0.022273540496826172, 0.02354907989501953, 0.02482461929321289, 0.02610015869140625, 0.02737569808959961, 0.02865123748779297, 0.029926776885986328, 0.031202316284179688, 0.03247785568237305, 0.033753395080566406, 0.035028934478759766, 0.036304473876953125, 0.037580013275146484, 0.038855552673339844, 0.0401310920715332, 0.04140663146972656, 0.04268217086791992, 0.04395771026611328, 0.04523324966430664, 0.0465087890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 9.0, 5.0, 6.0, 7.0, 9.0, 21.0, 23.0, 37.0, 43.0, 57.0, 98.0, 181.0, 272.0, 426.0, 711.0, 1380.0, 3570.0, 15691.0, 156705.0, 748477.0, 103141.0, 11791.0, 2957.0, 1249.0, 667.0, 370.0, 237.0, 116.0, 82.0, 56.0, 50.0, 35.0, 19.0, 10.0, 10.0, 10.0, 1.0, 5.0, 7.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09515380859375, -0.0924673080444336, -0.08978080749511719, -0.08709430694580078, -0.08440780639648438, -0.08172130584716797, -0.07903480529785156, -0.07634830474853516, -0.07366180419921875, -0.07097530364990234, -0.06828880310058594, -0.06560230255126953, -0.06291580200195312, -0.06022930145263672, -0.05754280090332031, -0.054856300354003906, -0.0521697998046875, -0.049483299255371094, -0.04679679870605469, -0.04411029815673828, -0.041423797607421875, -0.03873729705810547, -0.03605079650878906, -0.033364295959472656, -0.03067779541015625, -0.027991294860839844, -0.025304794311523438, -0.02261829376220703, -0.019931793212890625, -0.01724529266357422, -0.014558792114257812, -0.011872291564941406, -0.009185791015625, -0.006499290466308594, -0.0038127899169921875, -0.0011262893676757812, 0.001560211181640625, 0.004246711730957031, 0.0069332122802734375, 0.009619712829589844, 0.01230621337890625, 0.014992713928222656, 0.017679214477539062, 0.02036571502685547, 0.023052215576171875, 0.02573871612548828, 0.028425216674804688, 0.031111717224121094, 0.0337982177734375, 0.036484718322753906, 0.03917121887207031, 0.04185771942138672, 0.044544219970703125, 0.04723072052001953, 0.04991722106933594, 0.052603721618652344, 0.05529022216796875, 0.057976722717285156, 0.06066322326660156, 0.06334972381591797, 0.06603622436523438, 0.06872272491455078, 0.07140922546386719, 0.0740957260131836, 0.0767822265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 10.0, 8.0, 12.0, 19.0, 13.0, 22.0, 22.0, 29.0, 33.0, 31.0, 35.0, 38.0, 55.0, 50.0, 60.0, 50.0, 50.0, 56.0, 56.0, 34.0, 53.0, 28.0, 33.0, 31.0, 26.0, 25.0, 22.0, 13.0, 27.0, 14.0, 5.0, 8.0, 5.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112548828125, -0.10906410217285156, -0.10557937622070312, -0.10209465026855469, -0.09860992431640625, -0.09512519836425781, -0.09164047241210938, -0.08815574645996094, -0.0846710205078125, -0.08118629455566406, -0.07770156860351562, -0.07421684265136719, -0.07073211669921875, -0.06724739074707031, -0.06376266479492188, -0.06027793884277344, -0.056793212890625, -0.05330848693847656, -0.049823760986328125, -0.04633903503417969, -0.04285430908203125, -0.03936958312988281, -0.035884857177734375, -0.03240013122558594, -0.0289154052734375, -0.025430679321289062, -0.021945953369140625, -0.018461227416992188, -0.01497650146484375, -0.011491775512695312, -0.008007049560546875, -0.0045223236083984375, -0.00103759765625, 0.0024471282958984375, 0.005931854248046875, 0.009416580200195312, 0.01290130615234375, 0.016386032104492188, 0.019870758056640625, 0.023355484008789062, 0.0268402099609375, 0.030324935913085938, 0.033809661865234375, 0.03729438781738281, 0.04077911376953125, 0.04426383972167969, 0.047748565673828125, 0.05123329162597656, 0.054718017578125, 0.05820274353027344, 0.061687469482421875, 0.06517219543457031, 0.06865692138671875, 0.07214164733886719, 0.07562637329101562, 0.07911109924316406, 0.0825958251953125, 0.08608055114746094, 0.08956527709960938, 0.09305000305175781, 0.09653472900390625, 0.10001945495605469, 0.10350418090820312, 0.10698890686035156, 0.1104736328125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 7.0, 7.0, 8.0, 9.0, 17.0, 24.0, 36.0, 41.0, 54.0, 107.0, 186.0, 315.0, 680.0, 1375.0, 3530.0, 13889.0, 240071.0, 753627.0, 25613.0, 5321.0, 1867.0, 803.0, 411.0, 252.0, 130.0, 64.0, 37.0, 19.0, 22.0, 20.0, 13.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0592041015625, -0.05772972106933594, -0.056255340576171875, -0.05478096008300781, -0.05330657958984375, -0.05183219909667969, -0.050357818603515625, -0.04888343811035156, -0.0474090576171875, -0.04593467712402344, -0.044460296630859375, -0.04298591613769531, -0.04151153564453125, -0.04003715515136719, -0.038562774658203125, -0.03708839416503906, -0.035614013671875, -0.03413963317871094, -0.032665252685546875, -0.031190872192382812, -0.02971649169921875, -0.028242111206054688, -0.026767730712890625, -0.025293350219726562, -0.0238189697265625, -0.022344589233398438, -0.020870208740234375, -0.019395828247070312, -0.01792144775390625, -0.016447067260742188, -0.014972686767578125, -0.013498306274414062, -0.01202392578125, -0.010549545288085938, -0.009075164794921875, -0.0076007843017578125, -0.00612640380859375, -0.0046520233154296875, -0.003177642822265625, -0.0017032623291015625, -0.0002288818359375, 0.0012454986572265625, 0.002719879150390625, 0.0041942596435546875, 0.00566864013671875, 0.0071430206298828125, 0.008617401123046875, 0.010091781616210938, 0.011566162109375, 0.013040542602539062, 0.014514923095703125, 0.015989303588867188, 0.01746368408203125, 0.018938064575195312, 0.020412445068359375, 0.021886825561523438, 0.0233612060546875, 0.024835586547851562, 0.026309967041015625, 0.027784347534179688, 0.02925872802734375, 0.030733108520507812, 0.032207489013671875, 0.03368186950683594, 0.03515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 7.0, 27.0, 60.0, 111.0, 183.0, 262.0, 174.0, 86.0, 39.0, 13.0, 10.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2099742889404297e-05, -1.1439435184001923e-05, -1.0779127478599548e-05, -1.0118819773197174e-05, -9.4585120677948e-06, -8.798204362392426e-06, -8.137896656990051e-06, -7.477588951587677e-06, -6.817281246185303e-06, -6.1569735407829285e-06, -5.496665835380554e-06, -4.83635812997818e-06, -4.176050424575806e-06, -3.5157427191734314e-06, -2.855435013771057e-06, -2.195127308368683e-06, -1.5348196029663086e-06, -8.745118975639343e-07, -2.1420419216156006e-07, 4.461035132408142e-07, 1.1064112186431885e-06, 1.7667189240455627e-06, 2.427026629447937e-06, 3.0873343348503113e-06, 3.7476420402526855e-06, 4.40794974565506e-06, 5.068257451057434e-06, 5.728565156459808e-06, 6.388872861862183e-06, 7.049180567264557e-06, 7.709488272666931e-06, 8.369795978069305e-06, 9.03010368347168e-06, 9.690411388874054e-06, 1.0350719094276428e-05, 1.1011026799678802e-05, 1.1671334505081177e-05, 1.2331642210483551e-05, 1.2991949915885925e-05, 1.36522576212883e-05, 1.4312565326690674e-05, 1.4972873032093048e-05, 1.5633180737495422e-05, 1.6293488442897797e-05, 1.695379614830017e-05, 1.7614103853702545e-05, 1.827441155910492e-05, 1.8934719264507294e-05, 1.9595026969909668e-05, 2.0255334675312042e-05, 2.0915642380714417e-05, 2.157595008611679e-05, 2.2236257791519165e-05, 2.289656549692154e-05, 2.3556873202323914e-05, 2.4217180907726288e-05, 2.4877488613128662e-05, 2.5537796318531036e-05, 2.619810402393341e-05, 2.6858411729335785e-05, 2.751871943473816e-05, 2.8179027140140533e-05, 2.8839334845542908e-05, 2.9499642550945282e-05, 3.0159950256347656e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 13.0, 13.0, 21.0, 22.0, 34.0, 46.0, 70.0, 72.0, 128.0, 192.0, 368.0, 667.0, 1487.0, 3492.0, 10677.0, 53411.0, 605699.0, 326378.0, 32628.0, 7734.0, 2680.0, 1228.0, 575.0, 334.0, 185.0, 122.0, 59.0, 55.0, 36.0, 26.0, 21.0, 19.0, 13.0, 6.0, 6.0, 3.0, 6.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.034332275390625, -0.03337526321411133, -0.032418251037597656, -0.031461238861083984, -0.030504226684570312, -0.02954721450805664, -0.02859020233154297, -0.027633190155029297, -0.026676177978515625, -0.025719165802001953, -0.02476215362548828, -0.02380514144897461, -0.022848129272460938, -0.021891117095947266, -0.020934104919433594, -0.019977092742919922, -0.01902008056640625, -0.018063068389892578, -0.017106056213378906, -0.016149044036865234, -0.015192031860351562, -0.01423501968383789, -0.013278007507324219, -0.012320995330810547, -0.011363983154296875, -0.010406970977783203, -0.009449958801269531, -0.00849294662475586, -0.0075359344482421875, -0.006578922271728516, -0.005621910095214844, -0.004664897918701172, -0.0037078857421875, -0.002750873565673828, -0.0017938613891601562, -0.0008368492126464844, 0.0001201629638671875, 0.0010771751403808594, 0.0020341873168945312, 0.002991199493408203, 0.003948211669921875, 0.004905223846435547, 0.005862236022949219, 0.006819248199462891, 0.0077762603759765625, 0.008733272552490234, 0.009690284729003906, 0.010647296905517578, 0.01160430908203125, 0.012561321258544922, 0.013518333435058594, 0.014475345611572266, 0.015432357788085938, 0.01638936996459961, 0.01734638214111328, 0.018303394317626953, 0.019260406494140625, 0.020217418670654297, 0.02117443084716797, 0.02213144302368164, 0.023088455200195312, 0.024045467376708984, 0.025002479553222656, 0.025959491729736328, 0.02691650390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 12.0, 14.0, 28.0, 18.0, 26.0, 30.0, 37.0, 53.0, 59.0, 78.0, 79.0, 75.0, 75.0, 71.0, 72.0, 67.0, 46.0, 30.0, 26.0, 14.0, 25.0, 17.0, 3.0, 4.0, 8.0, 4.0, 2.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.033355712890625, -0.03246879577636719, -0.031581878662109375, -0.030694961547851562, -0.02980804443359375, -0.028921127319335938, -0.028034210205078125, -0.027147293090820312, -0.0262603759765625, -0.025373458862304688, -0.024486541748046875, -0.023599624633789062, -0.02271270751953125, -0.021825790405273438, -0.020938873291015625, -0.020051956176757812, -0.0191650390625, -0.018278121948242188, -0.017391204833984375, -0.016504287719726562, -0.01561737060546875, -0.014730453491210938, -0.013843536376953125, -0.012956619262695312, -0.0120697021484375, -0.011182785034179688, -0.010295867919921875, -0.009408950805664062, -0.00852203369140625, -0.0076351165771484375, -0.006748199462890625, -0.0058612823486328125, -0.004974365234375, -0.0040874481201171875, -0.003200531005859375, -0.0023136138916015625, -0.00142669677734375, -0.0005397796630859375, 0.000347137451171875, 0.0012340545654296875, 0.0021209716796875, 0.0030078887939453125, 0.003894805908203125, 0.0047817230224609375, 0.00566864013671875, 0.0065555572509765625, 0.007442474365234375, 0.008329391479492188, 0.00921630859375, 0.010103225708007812, 0.010990142822265625, 0.011877059936523438, 0.01276397705078125, 0.013650894165039062, 0.014537811279296875, 0.015424728393554688, 0.0163116455078125, 0.017198562622070312, 0.018085479736328125, 0.018972396850585938, 0.01985931396484375, 0.020746231079101562, 0.021633148193359375, 0.022520065307617188, 0.023406982421875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 17.0, 135.0, 495.0, 286.0, 51.0, 12.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9301581382751465, -2.8724172115325928, -2.81467604637146, -2.7569351196289062, -2.6991939544677734, -2.6414530277252197, -2.583712100982666, -2.525970935821533, -2.4682300090789795, -2.410489082336426, -2.352747917175293, -2.2950069904327393, -2.2372658252716064, -2.1795248985290527, -2.12178373336792, -2.064042806625366, -2.0063016414642334, -1.9485605955123901, -1.8908195495605469, -1.8330786228179932, -1.77533757686615, -1.7175965309143066, -1.6598554849624634, -1.6021144390106201, -1.5443735122680664, -1.4866324663162231, -1.4288914203643799, -1.3711504936218262, -1.313409447669983, -1.2556684017181396, -1.1979273557662964, -1.1401863098144531, -1.0824451446533203, -1.024704098701477, -0.9669631123542786, -0.9092220664024353, -0.851481020450592, -0.7937400341033936, -0.7359989881515503, -0.678257942199707, -0.6205170154571533, -0.5627759695053101, -0.5050349831581116, -0.4472939372062683, -0.38955289125442505, -0.3318118751049042, -0.2740708589553833, -0.21632981300354004, -0.15858876705169678, -0.10084773600101471, -0.04310671240091324, 0.014634311199188232, 0.0723753422498703, 0.13011637330055237, 0.18785738945007324, 0.2455984354019165, 0.3033394515514374, 0.36108046770095825, 0.4188215136528015, 0.4765625298023224, 0.5343035459518433, 0.5920445919036865, 0.6497856378555298, 0.707526683807373, 0.7652676701545715]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 9.0, 7.0, 5.0, 10.0, 8.0, 10.0, 20.0, 22.0, 21.0, 13.0, 27.0, 36.0, 34.0, 28.0, 41.0, 40.0, 39.0, 58.0, 60.0, 62.0, 54.0, 39.0, 47.0, 47.0, 42.0, 34.0, 27.0, 24.0, 23.0, 21.0, 15.0, 14.0, 13.0, 13.0, 11.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4282081127166748, -0.41456690430641174, -0.4009256958961487, -0.38728445768356323, -0.37364324927330017, -0.3600020408630371, -0.34636083245277405, -0.332719624042511, -0.31907838582992554, -0.3054371774196625, -0.2917959690093994, -0.27815473079681396, -0.2645135223865509, -0.25087231397628784, -0.23723110556602478, -0.22358989715576172, -0.20994868874549866, -0.1963074803352356, -0.18266625702381134, -0.16902504861354828, -0.15538382530212402, -0.14174261689186096, -0.1281014084815979, -0.11446019262075424, -0.10081897675991058, -0.08717776089906693, -0.07353654503822327, -0.059895336627960205, -0.04625412076711655, -0.03261290490627289, -0.018971696496009827, -0.005330480635166168, 0.00831073522567749, 0.021951949223876, 0.03559316322207451, 0.04923437535762787, 0.06287559121847153, 0.07651680707931519, 0.09015801548957825, 0.1037992313504219, 0.11744044721126556, 0.13108165562152863, 0.14472287893295288, 0.15836408734321594, 0.172005295753479, 0.18564651906490326, 0.19928772747516632, 0.21292895078659058, 0.22657015919685364, 0.2402113676071167, 0.25385257601737976, 0.2674937844276428, 0.28113502264022827, 0.29477623105049133, 0.3084174394607544, 0.32205864787101746, 0.3356998562812805, 0.3493410646915436, 0.36298227310180664, 0.3766235113143921, 0.39026471972465515, 0.4039059281349182, 0.4175471365451813, 0.43118834495544434, 0.4448295831680298]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 6.0, 4.0, 10.0, 15.0, 19.0, 21.0, 22.0, 50.0, 48.0, 69.0, 100.0, 142.0, 196.0, 295.0, 6319.0, 4182907.0, 3044.0, 322.0, 200.0, 146.0, 107.0, 92.0, 34.0, 35.0, 31.0, 17.0, 10.0, 9.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0], "bins": [-0.55224609375, -0.5400943756103516, -0.5279426574707031, -0.5157909393310547, -0.5036392211914062, -0.4914875030517578, -0.4793357849121094, -0.46718406677246094, -0.4550323486328125, -0.44288063049316406, -0.4307289123535156, -0.4185771942138672, -0.40642547607421875, -0.3942737579345703, -0.3821220397949219, -0.36997032165527344, -0.357818603515625, -0.34566688537597656, -0.3335151672363281, -0.3213634490966797, -0.30921173095703125, -0.2970600128173828, -0.2849082946777344, -0.27275657653808594, -0.2606048583984375, -0.24845314025878906, -0.23630142211914062, -0.2241497039794922, -0.21199798583984375, -0.1998462677001953, -0.18769454956054688, -0.17554283142089844, -0.16339111328125, -0.15123939514160156, -0.13908767700195312, -0.1269359588623047, -0.11478424072265625, -0.10263252258300781, -0.09048080444335938, -0.07832908630371094, -0.0661773681640625, -0.05402565002441406, -0.041873931884765625, -0.029722213745117188, -0.01757049560546875, -0.0054187774658203125, 0.006732940673828125, 0.018884658813476562, 0.031036376953125, 0.04318809509277344, 0.055339813232421875, 0.06749153137207031, 0.07964324951171875, 0.09179496765136719, 0.10394668579101562, 0.11609840393066406, 0.1282501220703125, 0.14040184020996094, 0.15255355834960938, 0.1647052764892578, 0.17685699462890625, 0.1890087127685547, 0.20116043090820312, 0.21331214904785156, 0.2254638671875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 4.0, 10.0, 12.0, 15.0, 13.0, 23.0, 28.0, 37.0, 36.0, 58.0, 66.0, 67.0, 55.0, 63.0, 59.0, 64.0, 59.0, 55.0, 50.0, 53.0, 35.0, 26.0, 34.0, 12.0, 14.0, 12.0, 11.0, 5.0, 7.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0347900390625, -0.03355550765991211, -0.03232097625732422, -0.031086444854736328, -0.029851913452148438, -0.028617382049560547, -0.027382850646972656, -0.026148319244384766, -0.024913787841796875, -0.023679256439208984, -0.022444725036621094, -0.021210193634033203, -0.019975662231445312, -0.018741130828857422, -0.01750659942626953, -0.01627206802368164, -0.01503753662109375, -0.01380300521850586, -0.012568473815917969, -0.011333942413330078, -0.010099411010742188, -0.008864879608154297, -0.007630348205566406, -0.006395816802978516, -0.005161285400390625, -0.003926753997802734, -0.0026922225952148438, -0.0014576911926269531, -0.0002231597900390625, 0.0010113716125488281, 0.0022459030151367188, 0.0034804344177246094, 0.0047149658203125, 0.005949497222900391, 0.007184028625488281, 0.008418560028076172, 0.009653091430664062, 0.010887622833251953, 0.012122154235839844, 0.013356685638427734, 0.014591217041015625, 0.015825748443603516, 0.017060279846191406, 0.018294811248779297, 0.019529342651367188, 0.020763874053955078, 0.02199840545654297, 0.02323293685913086, 0.02446746826171875, 0.02570199966430664, 0.02693653106689453, 0.028171062469482422, 0.029405593872070312, 0.030640125274658203, 0.031874656677246094, 0.033109188079833984, 0.034343719482421875, 0.035578250885009766, 0.036812782287597656, 0.03804731369018555, 0.03928184509277344, 0.04051637649536133, 0.04175090789794922, 0.04298543930053711, 0.044219970703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 11.0, 16.0, 23.0, 35.0, 50.0, 127.0, 203.0, 427.0, 943.0, 2586.0, 10485.0, 70981.0, 3757546.0, 320604.0, 23128.0, 4674.0, 1417.0, 516.0, 221.0, 131.0, 64.0, 36.0, 15.0, 13.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0970458984375, -0.094329833984375, -0.09161376953125, -0.088897705078125, -0.086181640625, -0.083465576171875, -0.08074951171875, -0.078033447265625, -0.0753173828125, -0.072601318359375, -0.06988525390625, -0.067169189453125, -0.064453125, -0.061737060546875, -0.05902099609375, -0.056304931640625, -0.0535888671875, -0.050872802734375, -0.04815673828125, -0.045440673828125, -0.042724609375, -0.040008544921875, -0.03729248046875, -0.034576416015625, -0.0318603515625, -0.029144287109375, -0.02642822265625, -0.023712158203125, -0.02099609375, -0.018280029296875, -0.01556396484375, -0.012847900390625, -0.0101318359375, -0.007415771484375, -0.00469970703125, -0.001983642578125, 0.000732421875, 0.003448486328125, 0.00616455078125, 0.008880615234375, 0.0115966796875, 0.014312744140625, 0.01702880859375, 0.019744873046875, 0.0224609375, 0.025177001953125, 0.02789306640625, 0.030609130859375, 0.0333251953125, 0.036041259765625, 0.03875732421875, 0.041473388671875, 0.044189453125, 0.046905517578125, 0.04962158203125, 0.052337646484375, 0.0550537109375, 0.057769775390625, 0.06048583984375, 0.063201904296875, 0.06591796875, 0.068634033203125, 0.07135009765625, 0.074066162109375, 0.0767822265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 7.0, 19.0, 18.0, 23.0, 43.0, 78.0, 179.0, 566.0, 1571.0, 992.0, 302.0, 100.0, 56.0, 30.0, 22.0, 13.0, 11.0, 7.0, 9.0, 5.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0948486328125, -0.09240531921386719, -0.08996200561523438, -0.08751869201660156, -0.08507537841796875, -0.08263206481933594, -0.08018875122070312, -0.07774543762207031, -0.0753021240234375, -0.07285881042480469, -0.07041549682617188, -0.06797218322753906, -0.06552886962890625, -0.06308555603027344, -0.060642242431640625, -0.05819892883300781, -0.055755615234375, -0.05331230163574219, -0.050868988037109375, -0.04842567443847656, -0.04598236083984375, -0.04353904724121094, -0.041095733642578125, -0.03865242004394531, -0.0362091064453125, -0.03376579284667969, -0.031322479248046875, -0.028879165649414062, -0.02643585205078125, -0.023992538452148438, -0.021549224853515625, -0.019105911254882812, -0.01666259765625, -0.014219284057617188, -0.011775970458984375, -0.009332656860351562, -0.00688934326171875, -0.0044460296630859375, -0.002002716064453125, 0.0004405975341796875, 0.0028839111328125, 0.0053272247314453125, 0.007770538330078125, 0.010213851928710938, 0.01265716552734375, 0.015100479125976562, 0.017543792724609375, 0.019987106323242188, 0.022430419921875, 0.024873733520507812, 0.027317047119140625, 0.029760360717773438, 0.03220367431640625, 0.03464698791503906, 0.037090301513671875, 0.03953361511230469, 0.0419769287109375, 0.04442024230957031, 0.046863555908203125, 0.04930686950683594, 0.05175018310546875, 0.05419349670410156, 0.056636810302734375, 0.05908012390136719, 0.0615234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 10.0, 25.0, 97.0, 267.0, 325.0, 162.0, 67.0, 24.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7058895826339722, -0.6779361367225647, -0.6499826312065125, -0.622029185295105, -0.5940756797790527, -0.5661222338676453, -0.5381687879562378, -0.5102152824401855, -0.4822618365287781, -0.4543083608150482, -0.42635488510131836, -0.3984014391899109, -0.37044796347618103, -0.34249448776245117, -0.3145410120487213, -0.28658753633499146, -0.2586340606212616, -0.23068058490753174, -0.20272712409496307, -0.17477364838123322, -0.14682018756866455, -0.11886671185493469, -0.09091323614120483, -0.06295977532863617, -0.03500629961490631, -0.0070528294891119, 0.02090064063668251, 0.04885411262512207, 0.07680758088827133, 0.1047610491514206, 0.13271452486515045, 0.16066798567771912, 0.18862146139144897, 0.21657493710517883, 0.2445283979177475, 0.27248185873031616, 0.300435334444046, 0.3283888101577759, 0.35634228587150574, 0.3842957615852356, 0.41224920749664307, 0.4402026832103729, 0.4681561589241028, 0.49610960483551025, 0.5240631103515625, 0.55201655626297, 0.5799700021743774, 0.6079235076904297, 0.6358770132064819, 0.6638304591178894, 0.6917839646339417, 0.7197374105453491, 0.7476909160614014, 0.7756443619728088, 0.8035978078842163, 0.8315513134002686, 0.859504759311676, 0.8874582052230835, 0.9154117107391357, 0.9433651566505432, 0.9713186621665955, 0.9992721080780029, 1.0272256135940552, 1.0551789999008179, 1.0831325054168701]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 2.0, 10.0, 9.0, 7.0, 17.0, 12.0, 23.0, 18.0, 23.0, 34.0, 38.0, 34.0, 38.0, 57.0, 57.0, 54.0, 57.0, 55.0, 57.0, 59.0, 60.0, 50.0, 41.0, 39.0, 28.0, 31.0, 19.0, 14.0, 15.0, 12.0, 8.0, 11.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.24626260995864868, -0.23725372552871704, -0.2282448410987854, -0.21923595666885376, -0.21022705733776093, -0.20121817290782928, -0.19220928847789764, -0.1832003891468048, -0.17419150471687317, -0.16518262028694153, -0.1561737358570099, -0.14716485142707825, -0.1381559520959854, -0.12914706766605377, -0.12013818323612213, -0.1111292913556099, -0.10212041437625885, -0.09311152994632721, -0.08410263806581497, -0.07509375363588333, -0.0660848617553711, -0.05707597732543945, -0.04806709289550781, -0.039058201014995575, -0.030049316585063934, -0.021040428429841995, -0.012031542137265205, -0.0030226558446884155, 0.0059862323105335236, 0.014995120465755463, 0.024004004895687103, 0.03301289677619934, 0.04202178120613098, 0.05103066936135292, 0.06003955751657486, 0.0690484419465065, 0.07805733382701874, 0.08706621825695038, 0.09607510268688202, 0.10508399456739426, 0.1140928789973259, 0.12310176342725754, 0.13211065530776978, 0.14111953973770142, 0.15012842416763306, 0.1591373085975647, 0.16814619302749634, 0.17715509235858917, 0.1861639767885208, 0.19517286121845245, 0.2041817456483841, 0.21319064497947693, 0.22219952940940857, 0.2312084138393402, 0.24021729826927185, 0.2492261826992035, 0.25823506712913513, 0.2672439515590668, 0.2762528359889984, 0.28526172041893005, 0.2942706048488617, 0.3032795190811157, 0.31228840351104736, 0.321297287940979, 0.33030617237091064]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 6.0, 6.0, 5.0, 9.0, 16.0, 24.0, 41.0, 49.0, 79.0, 133.0, 247.0, 463.0, 916.0, 2069.0, 5519.0, 16903.0, 66098.0, 278818.0, 468489.0, 155275.0, 36366.0, 10446.0, 3567.0, 1460.0, 688.0, 344.0, 187.0, 123.0, 70.0, 40.0, 26.0, 19.0, 14.0, 10.0, 3.0, 7.0, 3.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0587158203125, -0.0565643310546875, -0.054412841796875, -0.0522613525390625, -0.05010986328125, -0.0479583740234375, -0.045806884765625, -0.0436553955078125, -0.04150390625, -0.0393524169921875, -0.037200927734375, -0.0350494384765625, -0.03289794921875, -0.0307464599609375, -0.028594970703125, -0.0264434814453125, -0.0242919921875, -0.0221405029296875, -0.019989013671875, -0.0178375244140625, -0.01568603515625, -0.0135345458984375, -0.011383056640625, -0.0092315673828125, -0.007080078125, -0.0049285888671875, -0.002777099609375, -0.0006256103515625, 0.00152587890625, 0.0036773681640625, 0.005828857421875, 0.0079803466796875, 0.0101318359375, 0.0122833251953125, 0.014434814453125, 0.0165863037109375, 0.01873779296875, 0.0208892822265625, 0.023040771484375, 0.0251922607421875, 0.02734375, 0.0294952392578125, 0.031646728515625, 0.0337982177734375, 0.03594970703125, 0.0381011962890625, 0.040252685546875, 0.0424041748046875, 0.0445556640625, 0.0467071533203125, 0.048858642578125, 0.0510101318359375, 0.05316162109375, 0.0553131103515625, 0.057464599609375, 0.0596160888671875, 0.061767578125, 0.0639190673828125, 0.066070556640625, 0.0682220458984375, 0.07037353515625, 0.0725250244140625, 0.074676513671875, 0.0768280029296875, 0.0789794921875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 4.0, 10.0, 10.0, 14.0, 11.0, 26.0, 26.0, 38.0, 42.0, 59.0, 63.0, 63.0, 60.0, 68.0, 60.0, 67.0, 64.0, 57.0, 52.0, 46.0, 31.0, 32.0, 21.0, 14.0, 14.0, 13.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.036407470703125, -0.035109519958496094, -0.03381156921386719, -0.03251361846923828, -0.031215667724609375, -0.02991771697998047, -0.028619766235351562, -0.027321815490722656, -0.02602386474609375, -0.024725914001464844, -0.023427963256835938, -0.02213001251220703, -0.020832061767578125, -0.01953411102294922, -0.018236160278320312, -0.016938209533691406, -0.0156402587890625, -0.014342308044433594, -0.013044357299804688, -0.011746406555175781, -0.010448455810546875, -0.009150505065917969, -0.007852554321289062, -0.006554603576660156, -0.00525665283203125, -0.003958702087402344, -0.0026607513427734375, -0.0013628005981445312, -6.4849853515625e-05, 0.0012331008911132812, 0.0025310516357421875, 0.0038290023803710938, 0.005126953125, 0.006424903869628906, 0.0077228546142578125, 0.009020805358886719, 0.010318756103515625, 0.011616706848144531, 0.012914657592773438, 0.014212608337402344, 0.01551055908203125, 0.016808509826660156, 0.018106460571289062, 0.01940441131591797, 0.020702362060546875, 0.02200031280517578, 0.023298263549804688, 0.024596214294433594, 0.0258941650390625, 0.027192115783691406, 0.028490066528320312, 0.02978801727294922, 0.031085968017578125, 0.03238391876220703, 0.03368186950683594, 0.034979820251464844, 0.03627777099609375, 0.037575721740722656, 0.03887367248535156, 0.04017162322998047, 0.041469573974609375, 0.04276752471923828, 0.04406547546386719, 0.045363426208496094, 0.046661376953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 11.0, 15.0, 27.0, 45.0, 46.0, 98.0, 182.0, 352.0, 785.0, 2495.0, 13440.0, 190913.0, 775089.0, 56141.0, 6198.0, 1480.0, 558.0, 309.0, 139.0, 85.0, 46.0, 32.0, 17.0, 17.0, 7.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.13818359375, -0.1341543197631836, -0.1301250457763672, -0.12609577178955078, -0.12206649780273438, -0.11803722381591797, -0.11400794982910156, -0.10997867584228516, -0.10594940185546875, -0.10192012786865234, -0.09789085388183594, -0.09386157989501953, -0.08983230590820312, -0.08580303192138672, -0.08177375793457031, -0.0777444839477539, -0.0737152099609375, -0.0696859359741211, -0.06565666198730469, -0.06162738800048828, -0.057598114013671875, -0.05356884002685547, -0.04953956604003906, -0.045510292053222656, -0.04148101806640625, -0.037451744079589844, -0.03342247009277344, -0.02939319610595703, -0.025363922119140625, -0.02133464813232422, -0.017305374145507812, -0.013276100158691406, -0.009246826171875, -0.005217552185058594, -0.0011882781982421875, 0.0028409957885742188, 0.006870269775390625, 0.010899543762207031, 0.014928817749023438, 0.018958091735839844, 0.02298736572265625, 0.027016639709472656, 0.031045913696289062, 0.03507518768310547, 0.039104461669921875, 0.04313373565673828, 0.04716300964355469, 0.051192283630371094, 0.0552215576171875, 0.059250831604003906, 0.06328010559082031, 0.06730937957763672, 0.07133865356445312, 0.07536792755126953, 0.07939720153808594, 0.08342647552490234, 0.08745574951171875, 0.09148502349853516, 0.09551429748535156, 0.09954357147216797, 0.10357284545898438, 0.10760211944580078, 0.11163139343261719, 0.1156606674194336, 0.11968994140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 6.0, 6.0, 10.0, 8.0, 6.0, 9.0, 13.0, 14.0, 10.0, 17.0, 24.0, 18.0, 21.0, 26.0, 29.0, 34.0, 32.0, 48.0, 50.0, 38.0, 44.0, 39.0, 51.0, 41.0, 33.0, 43.0, 36.0, 30.0, 42.0, 29.0, 25.0, 36.0, 13.0, 24.0, 22.0, 9.0, 16.0, 12.0, 8.0, 5.0, 9.0, 3.0, 6.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0], "bins": [-0.10321044921875, -0.10014057159423828, -0.09707069396972656, -0.09400081634521484, -0.09093093872070312, -0.0878610610961914, -0.08479118347167969, -0.08172130584716797, -0.07865142822265625, -0.07558155059814453, -0.07251167297363281, -0.0694417953491211, -0.06637191772460938, -0.06330204010009766, -0.06023216247558594, -0.05716228485107422, -0.0540924072265625, -0.05102252960205078, -0.04795265197753906, -0.044882774353027344, -0.041812896728515625, -0.038743019104003906, -0.03567314147949219, -0.03260326385498047, -0.02953338623046875, -0.02646350860595703, -0.023393630981445312, -0.020323753356933594, -0.017253875732421875, -0.014183998107910156, -0.011114120483398438, -0.008044242858886719, -0.004974365234375, -0.0019044876098632812, 0.0011653900146484375, 0.004235267639160156, 0.007305145263671875, 0.010375022888183594, 0.013444900512695312, 0.01651477813720703, 0.01958465576171875, 0.02265453338623047, 0.025724411010742188, 0.028794288635253906, 0.031864166259765625, 0.034934043884277344, 0.03800392150878906, 0.04107379913330078, 0.0441436767578125, 0.04721355438232422, 0.05028343200683594, 0.053353309631347656, 0.056423187255859375, 0.059493064880371094, 0.06256294250488281, 0.06563282012939453, 0.06870269775390625, 0.07177257537841797, 0.07484245300292969, 0.0779123306274414, 0.08098220825195312, 0.08405208587646484, 0.08712196350097656, 0.09019184112548828, 0.09326171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 15.0, 36.0, 43.0, 49.0, 119.0, 269.0, 884.0, 5360.0, 961747.0, 76082.0, 2914.0, 594.0, 221.0, 109.0, 42.0, 26.0, 10.0, 13.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2685546875, -0.2606201171875, -0.252685546875, -0.2447509765625, -0.23681640625, -0.2288818359375, -0.220947265625, -0.2130126953125, -0.205078125, -0.1971435546875, -0.189208984375, -0.1812744140625, -0.17333984375, -0.1654052734375, -0.157470703125, -0.1495361328125, -0.1416015625, -0.1336669921875, -0.125732421875, -0.1177978515625, -0.10986328125, -0.1019287109375, -0.093994140625, -0.0860595703125, -0.078125, -0.0701904296875, -0.062255859375, -0.0543212890625, -0.04638671875, -0.0384521484375, -0.030517578125, -0.0225830078125, -0.0146484375, -0.0067138671875, 0.001220703125, 0.0091552734375, 0.01708984375, 0.0250244140625, 0.032958984375, 0.0408935546875, 0.048828125, 0.0567626953125, 0.064697265625, 0.0726318359375, 0.08056640625, 0.0885009765625, 0.096435546875, 0.1043701171875, 0.1123046875, 0.1202392578125, 0.128173828125, 0.1361083984375, 0.14404296875, 0.1519775390625, 0.159912109375, 0.1678466796875, 0.17578125, 0.1837158203125, 0.191650390625, 0.1995849609375, 0.20751953125, 0.2154541015625, 0.223388671875, 0.2313232421875, 0.2392578125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 5.0, 5.0, 19.0, 38.0, 87.0, 222.0, 311.0, 163.0, 68.0, 25.0, 17.0, 10.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.0517578125e-05, -2.95126810669899e-05, -2.8507784008979797e-05, -2.7502886950969696e-05, -2.6497989892959595e-05, -2.5493092834949493e-05, -2.4488195776939392e-05, -2.348329871892929e-05, -2.247840166091919e-05, -2.1473504602909088e-05, -2.0468607544898987e-05, -1.9463710486888885e-05, -1.8458813428878784e-05, -1.7453916370868683e-05, -1.644901931285858e-05, -1.544412225484848e-05, -1.4439225196838379e-05, -1.3434328138828278e-05, -1.2429431080818176e-05, -1.1424534022808075e-05, -1.0419636964797974e-05, -9.414739906787872e-06, -8.409842848777771e-06, -7.40494579076767e-06, -6.400048732757568e-06, -5.395151674747467e-06, -4.390254616737366e-06, -3.3853575587272644e-06, -2.380460500717163e-06, -1.3755634427070618e-06, -3.7066638469696045e-07, 6.342306733131409e-07, 1.6391277313232422e-06, 2.6440247893333435e-06, 3.648921847343445e-06, 4.653818905353546e-06, 5.6587159633636475e-06, 6.663613021373749e-06, 7.66851007938385e-06, 8.673407137393951e-06, 9.678304195404053e-06, 1.0683201253414154e-05, 1.1688098311424255e-05, 1.2692995369434357e-05, 1.3697892427444458e-05, 1.470278948545456e-05, 1.570768654346466e-05, 1.6712583601474762e-05, 1.7717480659484863e-05, 1.8722377717494965e-05, 1.9727274775505066e-05, 2.0732171833515167e-05, 2.173706889152527e-05, 2.274196594953537e-05, 2.374686300754547e-05, 2.4751760065555573e-05, 2.5756657123565674e-05, 2.6761554181575775e-05, 2.7766451239585876e-05, 2.8771348297595978e-05, 2.977624535560608e-05, 3.078114241361618e-05, 3.178603947162628e-05, 3.279093652963638e-05, 3.3795833587646484e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 11.0, 12.0, 16.0, 23.0, 37.0, 73.0, 170.0, 375.0, 1238.0, 6216.0, 132390.0, 887531.0, 16932.0, 2400.0, 628.0, 228.0, 103.0, 49.0, 26.0, 21.0, 17.0, 17.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1226806640625, -0.11919784545898438, -0.11571502685546875, -0.11223220825195312, -0.1087493896484375, -0.10526657104492188, -0.10178375244140625, -0.09830093383789062, -0.094818115234375, -0.09133529663085938, -0.08785247802734375, -0.08436965942382812, -0.0808868408203125, -0.07740402221679688, -0.07392120361328125, -0.07043838500976562, -0.06695556640625, -0.06347274780273438, -0.05998992919921875, -0.056507110595703125, -0.0530242919921875, -0.049541473388671875, -0.04605865478515625, -0.042575836181640625, -0.039093017578125, -0.035610198974609375, -0.03212738037109375, -0.028644561767578125, -0.0251617431640625, -0.021678924560546875, -0.01819610595703125, -0.014713287353515625, -0.01123046875, -0.007747650146484375, -0.00426483154296875, -0.000782012939453125, 0.0027008056640625, 0.006183624267578125, 0.00966644287109375, 0.013149261474609375, 0.016632080078125, 0.020114898681640625, 0.02359771728515625, 0.027080535888671875, 0.0305633544921875, 0.034046173095703125, 0.03752899169921875, 0.041011810302734375, 0.04449462890625, 0.047977447509765625, 0.05146026611328125, 0.054943084716796875, 0.0584259033203125, 0.061908721923828125, 0.06539154052734375, 0.06887435913085938, 0.072357177734375, 0.07583999633789062, 0.07932281494140625, 0.08280563354492188, 0.0862884521484375, 0.08977127075195312, 0.09325408935546875, 0.09673690795898438, 0.1002197265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 0.0, 9.0, 5.0, 7.0, 8.0, 21.0, 28.0, 44.0, 92.0, 122.0, 142.0, 170.0, 110.0, 75.0, 58.0, 38.0, 27.0, 13.0, 8.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062469482421875, -0.060259342193603516, -0.05804920196533203, -0.05583906173706055, -0.05362892150878906, -0.05141878128051758, -0.049208641052246094, -0.04699850082397461, -0.044788360595703125, -0.04257822036743164, -0.040368080139160156, -0.03815793991088867, -0.03594779968261719, -0.0337376594543457, -0.03152751922607422, -0.029317378997802734, -0.02710723876953125, -0.024897098541259766, -0.02268695831298828, -0.020476818084716797, -0.018266677856445312, -0.016056537628173828, -0.013846397399902344, -0.01163625717163086, -0.009426116943359375, -0.007215976715087891, -0.005005836486816406, -0.002795696258544922, -0.0005855560302734375, 0.0016245841979980469, 0.0038347244262695312, 0.006044864654541016, 0.0082550048828125, 0.010465145111083984, 0.012675285339355469, 0.014885425567626953, 0.017095565795898438, 0.019305706024169922, 0.021515846252441406, 0.02372598648071289, 0.025936126708984375, 0.02814626693725586, 0.030356407165527344, 0.03256654739379883, 0.03477668762207031, 0.0369868278503418, 0.03919696807861328, 0.041407108306884766, 0.04361724853515625, 0.045827388763427734, 0.04803752899169922, 0.0502476692199707, 0.05245780944824219, 0.05466794967651367, 0.056878089904785156, 0.05908823013305664, 0.061298370361328125, 0.06350851058959961, 0.0657186508178711, 0.06792879104614258, 0.07013893127441406, 0.07234907150268555, 0.07455921173095703, 0.07676935195922852, 0.0789794921875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 21.0, 42.0, 179.0, 496.0, 225.0, 25.0, 9.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.421905517578125, -3.3378658294677734, -3.253826141357422, -3.1697864532470703, -3.0857467651367188, -3.001706838607788, -2.9176671504974365, -2.833627462387085, -2.7495877742767334, -2.665548086166382, -2.5815083980560303, -2.4974687099456787, -2.413428783416748, -2.3293890953063965, -2.245349407196045, -2.1613097190856934, -2.077270030975342, -1.9932303428649902, -1.9091906547546387, -1.8251508474349976, -1.741111159324646, -1.6570714712142944, -1.5730316638946533, -1.4889919757843018, -1.4049522876739502, -1.3209125995635986, -1.236872911453247, -1.152833104133606, -1.0687934160232544, -0.9847537279129028, -0.9007139801979065, -0.8166742324829102, -0.7326343059539795, -0.6485946178436279, -0.5645548701286316, -0.48051515221595764, -0.3964754343032837, -0.31243571639060974, -0.2283959984779358, -0.14435625076293945, -0.06031656265258789, 0.02372315526008606, 0.10776287317276001, 0.19180259108543396, 0.2758423089981079, 0.35988202691078186, 0.4439217448234558, 0.5279614925384521, 0.6120011806488037, 0.6960408687591553, 0.7800806164741516, 0.864120364189148, 0.9481600522994995, 1.032199740409851, 1.1162395477294922, 1.2002792358398438, 1.2843189239501953, 1.3683586120605469, 1.4523983001708984, 1.5364381074905396, 1.6204777956008911, 1.7045174837112427, 1.7885572910308838, 1.8725969791412354, 1.956636667251587]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 10.0, 6.0, 15.0, 24.0, 29.0, 19.0, 25.0, 29.0, 31.0, 50.0, 51.0, 45.0, 50.0, 73.0, 56.0, 70.0, 54.0, 46.0, 45.0, 40.0, 32.0, 39.0, 28.0, 27.0, 19.0, 12.0, 15.0, 11.0, 8.0, 6.0, 5.0, 8.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5406304597854614, -0.5234950184822083, -0.5063595771789551, -0.4892241358757019, -0.47208869457244873, -0.45495325326919556, -0.43781778216362, -0.4206823408603668, -0.40354689955711365, -0.3864114582538605, -0.3692760169506073, -0.3521405756473541, -0.33500510454177856, -0.3178696632385254, -0.3007342219352722, -0.28359878063201904, -0.26646333932876587, -0.2493278980255127, -0.23219245672225952, -0.21505700051784515, -0.19792155921459198, -0.1807861179113388, -0.16365066170692444, -0.14651522040367126, -0.1293797791004181, -0.11224433779716492, -0.09510888904333115, -0.07797344028949738, -0.0608379989862442, -0.04370255768299103, -0.026567108929157257, -0.009431660175323486, 0.007703840732574463, 0.024839285761117935, 0.04197473078966141, 0.05911017581820488, 0.07624562084674835, 0.09338106215000153, 0.1105165109038353, 0.12765195965766907, 0.14478740096092224, 0.16192284226417542, 0.1790582835674286, 0.19619373977184296, 0.21332918107509613, 0.2304646223783493, 0.24760007858276367, 0.26473551988601685, 0.28187096118927, 0.2990064024925232, 0.31614184379577637, 0.33327728509902954, 0.3504127264022827, 0.3675481677055359, 0.38468363881111145, 0.4018190801143646, 0.4189545214176178, 0.43608996272087097, 0.45322540402412415, 0.4703608453273773, 0.4874963164329529, 0.504631757736206, 0.5217671990394592, 0.5389026403427124, 0.5560380816459656]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 15.0, 14.0, 16.0, 30.0, 36.0, 60.0, 95.0, 206.0, 518.0, 2965.0, 39223.0, 3702019.0, 437466.0, 9526.0, 1245.0, 388.0, 174.0, 76.0, 53.0, 34.0, 23.0, 17.0, 16.0, 12.0, 11.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1370849609375, -0.13314247131347656, -0.12919998168945312, -0.1252574920654297, -0.12131500244140625, -0.11737251281738281, -0.11343002319335938, -0.10948753356933594, -0.1055450439453125, -0.10160255432128906, -0.09766006469726562, -0.09371757507324219, -0.08977508544921875, -0.08583259582519531, -0.08189010620117188, -0.07794761657714844, -0.074005126953125, -0.07006263732910156, -0.06612014770507812, -0.06217765808105469, -0.05823516845703125, -0.05429267883300781, -0.050350189208984375, -0.04640769958496094, -0.0424652099609375, -0.03852272033691406, -0.034580230712890625, -0.030637741088867188, -0.02669525146484375, -0.022752761840820312, -0.018810272216796875, -0.014867782592773438, -0.01092529296875, -0.0069828033447265625, -0.003040313720703125, 0.0009021759033203125, 0.00484466552734375, 0.008787155151367188, 0.012729644775390625, 0.016672134399414062, 0.0206146240234375, 0.024557113647460938, 0.028499603271484375, 0.03244209289550781, 0.03638458251953125, 0.04032707214355469, 0.044269561767578125, 0.04821205139160156, 0.052154541015625, 0.05609703063964844, 0.060039520263671875, 0.06398200988769531, 0.06792449951171875, 0.07186698913574219, 0.07580947875976562, 0.07975196838378906, 0.0836944580078125, 0.08763694763183594, 0.09157943725585938, 0.09552192687988281, 0.09946441650390625, 0.10340690612792969, 0.10734939575195312, 0.11129188537597656, 0.115234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 14.0, 14.0, 17.0, 25.0, 25.0, 37.0, 43.0, 48.0, 64.0, 78.0, 53.0, 71.0, 81.0, 69.0, 56.0, 60.0, 50.0, 45.0, 35.0, 18.0, 26.0, 21.0, 14.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03424072265625, -0.03292226791381836, -0.03160381317138672, -0.030285358428955078, -0.028966903686523438, -0.027648448944091797, -0.026329994201660156, -0.025011539459228516, -0.023693084716796875, -0.022374629974365234, -0.021056175231933594, -0.019737720489501953, -0.018419265747070312, -0.017100811004638672, -0.01578235626220703, -0.01446390151977539, -0.01314544677734375, -0.01182699203491211, -0.010508537292480469, -0.009190082550048828, -0.007871627807617188, -0.006553173065185547, -0.005234718322753906, -0.003916263580322266, -0.002597808837890625, -0.0012793540954589844, 3.910064697265625e-05, 0.0013575553894042969, 0.0026760101318359375, 0.003994464874267578, 0.005312919616699219, 0.006631374359130859, 0.0079498291015625, 0.00926828384399414, 0.010586738586425781, 0.011905193328857422, 0.013223648071289062, 0.014542102813720703, 0.015860557556152344, 0.017179012298583984, 0.018497467041015625, 0.019815921783447266, 0.021134376525878906, 0.022452831268310547, 0.023771286010742188, 0.025089740753173828, 0.02640819549560547, 0.02772665023803711, 0.02904510498046875, 0.03036355972290039, 0.03168201446533203, 0.03300046920776367, 0.03431892395019531, 0.03563737869262695, 0.036955833435058594, 0.038274288177490234, 0.039592742919921875, 0.040911197662353516, 0.042229652404785156, 0.0435481071472168, 0.04486656188964844, 0.04618501663208008, 0.04750347137451172, 0.04882192611694336, 0.050140380859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 5.0, 12.0, 24.0, 27.0, 34.0, 53.0, 99.0, 219.0, 642.0, 3485.0, 71533.0, 4073505.0, 41194.0, 2391.0, 525.0, 207.0, 96.0, 70.0, 36.0, 40.0, 19.0, 19.0, 14.0, 13.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2457275390625, -0.23949623107910156, -0.23326492309570312, -0.2270336151123047, -0.22080230712890625, -0.2145709991455078, -0.20833969116210938, -0.20210838317871094, -0.1958770751953125, -0.18964576721191406, -0.18341445922851562, -0.1771831512451172, -0.17095184326171875, -0.1647205352783203, -0.15848922729492188, -0.15225791931152344, -0.146026611328125, -0.13979530334472656, -0.13356399536132812, -0.1273326873779297, -0.12110137939453125, -0.11487007141113281, -0.10863876342773438, -0.10240745544433594, -0.0961761474609375, -0.08994483947753906, -0.08371353149414062, -0.07748222351074219, -0.07125091552734375, -0.06501960754394531, -0.058788299560546875, -0.05255699157714844, -0.04632568359375, -0.04009437561035156, -0.033863067626953125, -0.027631759643554688, -0.02140045166015625, -0.015169143676757812, -0.008937835693359375, -0.0027065277099609375, 0.0035247802734375, 0.009756088256835938, 0.015987396240234375, 0.022218704223632812, 0.02845001220703125, 0.03468132019042969, 0.040912628173828125, 0.04714393615722656, 0.053375244140625, 0.05960655212402344, 0.06583786010742188, 0.07206916809082031, 0.07830047607421875, 0.08453178405761719, 0.09076309204101562, 0.09699440002441406, 0.1032257080078125, 0.10945701599121094, 0.11568832397460938, 0.12191963195800781, 0.12815093994140625, 0.1343822479248047, 0.14061355590820312, 0.14684486389160156, 0.153076171875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 16.0, 19.0, 21.0, 35.0, 71.0, 152.0, 406.0, 1185.0, 1279.0, 464.0, 166.0, 96.0, 55.0, 31.0, 19.0, 15.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.09140872955322266, -0.08790779113769531, -0.08440685272216797, -0.08090591430664062, -0.07740497589111328, -0.07390403747558594, -0.0704030990600586, -0.06690216064453125, -0.0634012222290039, -0.05990028381347656, -0.05639934539794922, -0.052898406982421875, -0.04939746856689453, -0.04589653015136719, -0.042395591735839844, -0.0388946533203125, -0.035393714904785156, -0.03189277648925781, -0.02839183807373047, -0.024890899658203125, -0.02138996124267578, -0.017889022827148438, -0.014388084411621094, -0.01088714599609375, -0.007386207580566406, -0.0038852691650390625, -0.00038433074951171875, 0.003116607666015625, 0.006617546081542969, 0.010118484497070312, 0.013619422912597656, 0.017120361328125, 0.020621299743652344, 0.024122238159179688, 0.02762317657470703, 0.031124114990234375, 0.03462505340576172, 0.03812599182128906, 0.041626930236816406, 0.04512786865234375, 0.048628807067871094, 0.05212974548339844, 0.05563068389892578, 0.059131622314453125, 0.06263256072998047, 0.06613349914550781, 0.06963443756103516, 0.0731353759765625, 0.07663631439208984, 0.08013725280761719, 0.08363819122314453, 0.08713912963867188, 0.09064006805419922, 0.09414100646972656, 0.0976419448852539, 0.10114288330078125, 0.1046438217163086, 0.10814476013183594, 0.11164569854736328, 0.11514663696289062, 0.11864757537841797, 0.12214851379394531, 0.12564945220947266, 0.129150390625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 4.0, 3.0, 9.0, 22.0, 29.0, 45.0, 67.0, 103.0, 150.0, 140.0, 139.0, 74.0, 58.0, 46.0, 27.0, 23.0, 15.0, 11.0, 10.0, 3.0, 2.0, 9.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5232629179954529, -0.5013665556907654, -0.4794701933860779, -0.457573801279068, -0.4356774389743805, -0.413781076669693, -0.3918846845626831, -0.3699883222579956, -0.3480919599533081, -0.3261955976486206, -0.3042992353439331, -0.2824028432369232, -0.2605064809322357, -0.23861011862754822, -0.21671374142169952, -0.19481736421585083, -0.17292100191116333, -0.15102463960647583, -0.12912826240062714, -0.10723189264535904, -0.08533552289009094, -0.06343915313482285, -0.04154278337955475, -0.019646406173706055, 0.0022499561309814453, 0.024146325886249542, 0.04604269564151764, 0.06793906539678574, 0.08983543515205383, 0.11173180490732193, 0.13362817466259003, 0.15552455186843872, 0.17742091417312622, 0.19931727647781372, 0.22121365368366241, 0.2431100308895111, 0.2650063931941986, 0.2869027554988861, 0.308799147605896, 0.3306955099105835, 0.352591872215271, 0.3744882345199585, 0.396384596824646, 0.4182809889316559, 0.4401773512363434, 0.4620737135410309, 0.48397010564804077, 0.5058664679527283, 0.5277628302574158, 0.5496591925621033, 0.5715555548667908, 0.5934519171714783, 0.6153483390808105, 0.637244701385498, 0.6591410636901855, 0.681037425994873, 0.7029337882995605, 0.724830150604248, 0.7467265129089355, 0.768622875213623, 0.7905192375183105, 0.8124156594276428, 0.8343120217323303, 0.8562083840370178, 0.8781047463417053]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 5.0, 6.0, 8.0, 5.0, 11.0, 20.0, 14.0, 15.0, 13.0, 25.0, 19.0, 28.0, 32.0, 36.0, 53.0, 42.0, 46.0, 53.0, 50.0, 55.0, 60.0, 56.0, 47.0, 46.0, 35.0, 38.0, 46.0, 32.0, 20.0, 12.0, 15.0, 11.0, 18.0, 8.0, 4.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39403003454208374, -0.3812677264213562, -0.3685053884983063, -0.35574308037757874, -0.3429807424545288, -0.33021843433380127, -0.31745612621307373, -0.3046937882900238, -0.29193148016929626, -0.2791691720485687, -0.2664068341255188, -0.25364452600479126, -0.24088220298290253, -0.2281198799610138, -0.21535755693912506, -0.20259523391723633, -0.1898329108953476, -0.17707058787345886, -0.16430826485157013, -0.1515459418296814, -0.13878363370895386, -0.12602131068706512, -0.11325898766517639, -0.10049667209386826, -0.08773434907197952, -0.07497202605009079, -0.062209710478782654, -0.04944738745689392, -0.036685068160295486, -0.023922748863697052, -0.011160425841808319, 0.001601889729499817, 0.01436421275138855, 0.027126532047986984, 0.03988885134458542, 0.05265117436647415, 0.06541348993778229, 0.07817581295967102, 0.09093813598155975, 0.10370045155286789, 0.11646277457475662, 0.12922509014606476, 0.1419874131679535, 0.15474973618984222, 0.16751205921173096, 0.1802743673324585, 0.19303670525550842, 0.20579901337623596, 0.2185613363981247, 0.23132365942001343, 0.24408598244190216, 0.2568483054637909, 0.26961061358451843, 0.28237295150756836, 0.2951352596282959, 0.30789756774902344, 0.32065990567207336, 0.3334222137928009, 0.34618455171585083, 0.35894685983657837, 0.3717091977596283, 0.38447150588035583, 0.39723384380340576, 0.4099961519241333, 0.42275846004486084]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 14.0, 19.0, 34.0, 50.0, 61.0, 120.0, 242.0, 333.0, 605.0, 1062.0, 2036.0, 3767.0, 7497.0, 15253.0, 33381.0, 77568.0, 173763.0, 293326.0, 235100.0, 112453.0, 49097.0, 21689.0, 10221.0, 5019.0, 2607.0, 1374.0, 742.0, 422.0, 254.0, 152.0, 88.0, 57.0, 42.0, 24.0, 22.0, 15.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042999267578125, -0.04159975051879883, -0.040200233459472656, -0.038800716400146484, -0.03740119934082031, -0.03600168228149414, -0.03460216522216797, -0.0332026481628418, -0.031803131103515625, -0.030403614044189453, -0.02900409698486328, -0.02760457992553711, -0.026205062866210938, -0.024805545806884766, -0.023406028747558594, -0.022006511688232422, -0.02060699462890625, -0.019207477569580078, -0.017807960510253906, -0.016408443450927734, -0.015008926391601562, -0.01360940933227539, -0.012209892272949219, -0.010810375213623047, -0.009410858154296875, -0.008011341094970703, -0.006611824035644531, -0.005212306976318359, -0.0038127899169921875, -0.0024132728576660156, -0.0010137557983398438, 0.0003857612609863281, 0.0017852783203125, 0.003184795379638672, 0.004584312438964844, 0.005983829498291016, 0.0073833465576171875, 0.00878286361694336, 0.010182380676269531, 0.011581897735595703, 0.012981414794921875, 0.014380931854248047, 0.01578044891357422, 0.01717996597290039, 0.018579483032226562, 0.019979000091552734, 0.021378517150878906, 0.022778034210205078, 0.02417755126953125, 0.025577068328857422, 0.026976585388183594, 0.028376102447509766, 0.029775619506835938, 0.03117513656616211, 0.03257465362548828, 0.03397417068481445, 0.035373687744140625, 0.0367732048034668, 0.03817272186279297, 0.03957223892211914, 0.04097175598144531, 0.042371273040771484, 0.043770790100097656, 0.04517030715942383, 0.04656982421875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 10.0, 11.0, 17.0, 26.0, 21.0, 37.0, 43.0, 45.0, 58.0, 61.0, 71.0, 80.0, 66.0, 76.0, 69.0, 58.0, 65.0, 49.0, 35.0, 37.0, 16.0, 10.0, 11.0, 8.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039825439453125, -0.038361549377441406, -0.03689765930175781, -0.03543376922607422, -0.033969879150390625, -0.03250598907470703, -0.031042098999023438, -0.029578208923339844, -0.02811431884765625, -0.026650428771972656, -0.025186538696289062, -0.02372264862060547, -0.022258758544921875, -0.02079486846923828, -0.019330978393554688, -0.017867088317871094, -0.0164031982421875, -0.014939308166503906, -0.013475418090820312, -0.012011528015136719, -0.010547637939453125, -0.009083747863769531, -0.0076198577880859375, -0.006155967712402344, -0.00469207763671875, -0.0032281875610351562, -0.0017642974853515625, -0.00030040740966796875, 0.001163482666015625, 0.0026273727416992188, 0.0040912628173828125, 0.005555152893066406, 0.00701904296875, 0.008482933044433594, 0.009946823120117188, 0.011410713195800781, 0.012874603271484375, 0.014338493347167969, 0.015802383422851562, 0.017266273498535156, 0.01873016357421875, 0.020194053649902344, 0.021657943725585938, 0.02312183380126953, 0.024585723876953125, 0.02604961395263672, 0.027513504028320312, 0.028977394104003906, 0.0304412841796875, 0.031905174255371094, 0.03336906433105469, 0.03483295440673828, 0.036296844482421875, 0.03776073455810547, 0.03922462463378906, 0.040688514709472656, 0.04215240478515625, 0.043616294860839844, 0.04508018493652344, 0.04654407501220703, 0.048007965087890625, 0.04947185516357422, 0.05093574523925781, 0.052399635314941406, 0.053863525390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 8.0, 11.0, 9.0, 22.0, 23.0, 27.0, 29.0, 35.0, 72.0, 85.0, 110.0, 183.0, 234.0, 376.0, 660.0, 1267.0, 2676.0, 7489.0, 31653.0, 315607.0, 623152.0, 48063.0, 9735.0, 3313.0, 1492.0, 787.0, 472.0, 309.0, 148.0, 130.0, 91.0, 60.0, 56.0, 34.0, 34.0, 16.0, 11.0, 15.0, 10.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.125732421875, -0.12181663513183594, -0.11790084838867188, -0.11398506164550781, -0.11006927490234375, -0.10615348815917969, -0.10223770141601562, -0.09832191467285156, -0.0944061279296875, -0.09049034118652344, -0.08657455444335938, -0.08265876770019531, -0.07874298095703125, -0.07482719421386719, -0.07091140747070312, -0.06699562072753906, -0.063079833984375, -0.05916404724121094, -0.055248260498046875, -0.05133247375488281, -0.04741668701171875, -0.04350090026855469, -0.039585113525390625, -0.03566932678222656, -0.0317535400390625, -0.027837753295898438, -0.023921966552734375, -0.020006179809570312, -0.01609039306640625, -0.012174606323242188, -0.008258819580078125, -0.0043430328369140625, -0.00042724609375, 0.0034885406494140625, 0.007404327392578125, 0.011320114135742188, 0.01523590087890625, 0.019151687622070312, 0.023067474365234375, 0.026983261108398438, 0.0308990478515625, 0.03481483459472656, 0.038730621337890625, 0.04264640808105469, 0.04656219482421875, 0.05047798156738281, 0.054393768310546875, 0.05830955505371094, 0.062225341796875, 0.06614112854003906, 0.07005691528320312, 0.07397270202636719, 0.07788848876953125, 0.08180427551269531, 0.08572006225585938, 0.08963584899902344, 0.0935516357421875, 0.09746742248535156, 0.10138320922851562, 0.10529899597167969, 0.10921478271484375, 0.11313056945800781, 0.11704635620117188, 0.12096214294433594, 0.1248779296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 5.0, 5.0, 7.0, 9.0, 9.0, 11.0, 16.0, 24.0, 15.0, 19.0, 34.0, 33.0, 49.0, 37.0, 50.0, 60.0, 49.0, 46.0, 54.0, 53.0, 54.0, 58.0, 45.0, 44.0, 27.0, 22.0, 31.0, 21.0, 19.0, 15.0, 17.0, 4.0, 10.0, 10.0, 4.0, 8.0, 2.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.148193359375, -0.1439657211303711, -0.1397380828857422, -0.13551044464111328, -0.13128280639648438, -0.12705516815185547, -0.12282752990722656, -0.11859989166259766, -0.11437225341796875, -0.11014461517333984, -0.10591697692871094, -0.10168933868408203, -0.09746170043945312, -0.09323406219482422, -0.08900642395019531, -0.0847787857055664, -0.0805511474609375, -0.0763235092163086, -0.07209587097167969, -0.06786823272705078, -0.06364059448242188, -0.05941295623779297, -0.05518531799316406, -0.050957679748535156, -0.04673004150390625, -0.042502403259277344, -0.03827476501464844, -0.03404712677001953, -0.029819488525390625, -0.02559185028076172, -0.021364212036132812, -0.017136573791503906, -0.012908935546875, -0.008681297302246094, -0.0044536590576171875, -0.00022602081298828125, 0.004001617431640625, 0.008229255676269531, 0.012456893920898438, 0.016684532165527344, 0.02091217041015625, 0.025139808654785156, 0.029367446899414062, 0.03359508514404297, 0.037822723388671875, 0.04205036163330078, 0.04627799987792969, 0.050505638122558594, 0.0547332763671875, 0.058960914611816406, 0.06318855285644531, 0.06741619110107422, 0.07164382934570312, 0.07587146759033203, 0.08009910583496094, 0.08432674407958984, 0.08855438232421875, 0.09278202056884766, 0.09700965881347656, 0.10123729705810547, 0.10546493530273438, 0.10969257354736328, 0.11392021179199219, 0.1181478500366211, 0.12237548828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 9.0, 10.0, 16.0, 18.0, 27.0, 40.0, 62.0, 104.0, 151.0, 247.0, 436.0, 790.0, 1421.0, 2703.0, 5545.0, 12589.0, 46992.0, 907659.0, 45850.0, 12405.0, 5463.0, 2747.0, 1384.0, 754.0, 425.0, 254.0, 145.0, 107.0, 62.0, 40.0, 26.0, 23.0, 10.0, 12.0, 3.0, 9.0, 5.0, 5.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10882568359375, -0.10500621795654297, -0.10118675231933594, -0.0973672866821289, -0.09354782104492188, -0.08972835540771484, -0.08590888977050781, -0.08208942413330078, -0.07826995849609375, -0.07445049285888672, -0.07063102722167969, -0.06681156158447266, -0.06299209594726562, -0.059172630310058594, -0.05535316467285156, -0.05153369903564453, -0.0477142333984375, -0.04389476776123047, -0.04007530212402344, -0.036255836486816406, -0.032436370849609375, -0.028616905212402344, -0.024797439575195312, -0.02097797393798828, -0.01715850830078125, -0.013339042663574219, -0.009519577026367188, -0.005700111389160156, -0.001880645751953125, 0.0019388198852539062, 0.0057582855224609375, 0.009577751159667969, 0.013397216796875, 0.01721668243408203, 0.021036148071289062, 0.024855613708496094, 0.028675079345703125, 0.032494544982910156, 0.03631401062011719, 0.04013347625732422, 0.04395294189453125, 0.04777240753173828, 0.05159187316894531, 0.055411338806152344, 0.059230804443359375, 0.0630502700805664, 0.06686973571777344, 0.07068920135498047, 0.0745086669921875, 0.07832813262939453, 0.08214759826660156, 0.0859670639038086, 0.08978652954101562, 0.09360599517822266, 0.09742546081542969, 0.10124492645263672, 0.10506439208984375, 0.10888385772705078, 0.11270332336425781, 0.11652278900146484, 0.12034225463867188, 0.1241617202758789, 0.12798118591308594, 0.13180065155029297, 0.1356201171875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 0.0, 6.0, 6.0, 6.0, 7.0, 9.0, 20.0, 33.0, 73.0, 212.0, 333.0, 158.0, 46.0, 24.0, 9.0, 11.0, 10.0, 7.0, 4.0, 5.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.869699478149414e-05, -4.728138446807861e-05, -4.5865774154663086e-05, -4.445016384124756e-05, -4.303455352783203e-05, -4.1618943214416504e-05, -4.0203332901000977e-05, -3.878772258758545e-05, -3.737211227416992e-05, -3.5956501960754395e-05, -3.454089164733887e-05, -3.312528133392334e-05, -3.170967102050781e-05, -3.0294060707092285e-05, -2.8878450393676758e-05, -2.746284008026123e-05, -2.6047229766845703e-05, -2.4631619453430176e-05, -2.321600914001465e-05, -2.180039882659912e-05, -2.0384788513183594e-05, -1.8969178199768066e-05, -1.755356788635254e-05, -1.6137957572937012e-05, -1.4722347259521484e-05, -1.3306736946105957e-05, -1.189112663269043e-05, -1.0475516319274902e-05, -9.059906005859375e-06, -7.644295692443848e-06, -6.22868537902832e-06, -4.813075065612793e-06, -3.3974647521972656e-06, -1.9818544387817383e-06, -5.662441253662109e-07, 8.493661880493164e-07, 2.2649765014648438e-06, 3.680586814880371e-06, 5.0961971282958984e-06, 6.511807441711426e-06, 7.927417755126953e-06, 9.34302806854248e-06, 1.0758638381958008e-05, 1.2174248695373535e-05, 1.3589859008789062e-05, 1.500546932220459e-05, 1.6421079635620117e-05, 1.7836689949035645e-05, 1.9252300262451172e-05, 2.06679105758667e-05, 2.2083520889282227e-05, 2.3499131202697754e-05, 2.491474151611328e-05, 2.633035182952881e-05, 2.7745962142944336e-05, 2.9161572456359863e-05, 3.057718276977539e-05, 3.199279308319092e-05, 3.3408403396606445e-05, 3.482401371002197e-05, 3.62396240234375e-05, 3.765523433685303e-05, 3.9070844650268555e-05, 4.048645496368408e-05, 4.190206527709961e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 16.0, 12.0, 25.0, 46.0, 54.0, 118.0, 161.0, 260.0, 452.0, 795.0, 1553.0, 2999.0, 6859.0, 19695.0, 431583.0, 550542.0, 19957.0, 6936.0, 2989.0, 1520.0, 765.0, 446.0, 292.0, 162.0, 83.0, 64.0, 37.0, 22.0, 29.0, 14.0, 17.0, 7.0, 5.0, 10.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.1374378204345703, -0.13339614868164062, -0.12935447692871094, -0.12531280517578125, -0.12127113342285156, -0.11722946166992188, -0.11318778991699219, -0.1091461181640625, -0.10510444641113281, -0.10106277465820312, -0.09702110290527344, -0.09297943115234375, -0.08893775939941406, -0.08489608764648438, -0.08085441589355469, -0.076812744140625, -0.07277107238769531, -0.06872940063476562, -0.06468772888183594, -0.06064605712890625, -0.05660438537597656, -0.052562713623046875, -0.04852104187011719, -0.0444793701171875, -0.04043769836425781, -0.036396026611328125, -0.03235435485839844, -0.02831268310546875, -0.024271011352539062, -0.020229339599609375, -0.016187667846679688, -0.01214599609375, -0.008104324340820312, -0.004062652587890625, -2.09808349609375e-05, 0.00402069091796875, 0.008062362670898438, 0.012104034423828125, 0.016145706176757812, 0.0201873779296875, 0.024229049682617188, 0.028270721435546875, 0.03231239318847656, 0.03635406494140625, 0.04039573669433594, 0.044437408447265625, 0.04847908020019531, 0.052520751953125, 0.05656242370605469, 0.060604095458984375, 0.06464576721191406, 0.06868743896484375, 0.07272911071777344, 0.07677078247070312, 0.08081245422363281, 0.0848541259765625, 0.08889579772949219, 0.09293746948242188, 0.09697914123535156, 0.10102081298828125, 0.10506248474121094, 0.10910415649414062, 0.11314582824707031, 0.1171875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 13.0, 9.0, 8.0, 11.0, 23.0, 51.0, 107.0, 214.0, 233.0, 146.0, 52.0, 23.0, 13.0, 15.0, 8.0, 6.0, 2.0, 12.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09765625, -0.09431838989257812, -0.09098052978515625, -0.08764266967773438, -0.0843048095703125, -0.08096694946289062, -0.07762908935546875, -0.07429122924804688, -0.070953369140625, -0.06761550903320312, -0.06427764892578125, -0.060939788818359375, -0.0576019287109375, -0.054264068603515625, -0.05092620849609375, -0.047588348388671875, -0.04425048828125, -0.040912628173828125, -0.03757476806640625, -0.034236907958984375, -0.0308990478515625, -0.027561187744140625, -0.02422332763671875, -0.020885467529296875, -0.017547607421875, -0.014209747314453125, -0.01087188720703125, -0.007534027099609375, -0.0041961669921875, -0.000858306884765625, 0.00247955322265625, 0.005817413330078125, 0.0091552734375, 0.012493133544921875, 0.01583099365234375, 0.019168853759765625, 0.0225067138671875, 0.025844573974609375, 0.02918243408203125, 0.032520294189453125, 0.035858154296875, 0.039196014404296875, 0.04253387451171875, 0.045871734619140625, 0.0492095947265625, 0.052547454833984375, 0.05588531494140625, 0.059223175048828125, 0.06256103515625, 0.06589889526367188, 0.06923675537109375, 0.07257461547851562, 0.0759124755859375, 0.07925033569335938, 0.08258819580078125, 0.08592605590820312, 0.089263916015625, 0.09260177612304688, 0.09593963623046875, 0.09927749633789062, 0.1026153564453125, 0.10595321655273438, 0.10929107666015625, 0.11262893676757812, 0.115966796875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 10.0, 17.0, 12.0, 31.0, 57.0, 97.0, 192.0, 317.0, 133.0, 75.0, 22.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.337963342666626, -2.2788195610046387, -2.2196755409240723, -2.160531759262085, -2.1013879776000977, -2.0422439575195312, -1.983100175857544, -1.923956274986267, -1.8648123741149902, -1.8056684732437134, -1.7465245723724365, -1.6873807907104492, -1.6282368898391724, -1.5690929889678955, -1.5099492073059082, -1.4508053064346313, -1.3916614055633545, -1.3325175046920776, -1.2733736038208008, -1.2142298221588135, -1.1550859212875366, -1.0959420204162598, -1.0367982387542725, -0.9776543378829956, -0.9185104370117188, -0.8593665361404419, -0.8002226948738098, -0.7410788536071777, -0.6819349527359009, -0.622791051864624, -0.5636472105979919, -0.5045033693313599, -0.44535958766937256, -0.3862157166004181, -0.3270718455314636, -0.26792797446250916, -0.2087841033935547, -0.14964023232460022, -0.09049636125564575, -0.031352490186691284, 0.027791380882263184, 0.08693525195121765, 0.14607912302017212, 0.2052229940891266, 0.26436686515808105, 0.3235107362270355, 0.38265460729599, 0.44179847836494446, 0.5009423494338989, 0.5600862503051758, 0.6192300915718079, 0.6783739328384399, 0.7375178337097168, 0.7966617345809937, 0.8558055758476257, 0.9149494171142578, 0.9740933179855347, 1.0332372188568115, 1.0923810005187988, 1.1515249013900757, 1.2106688022613525, 1.2698127031326294, 1.3289566040039062, 1.3881003856658936, 1.4472442865371704]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 6.0, 2.0, 4.0, 13.0, 6.0, 9.0, 19.0, 20.0, 24.0, 20.0, 29.0, 36.0, 28.0, 38.0, 41.0, 44.0, 63.0, 70.0, 86.0, 80.0, 48.0, 41.0, 40.0, 31.0, 26.0, 21.0, 26.0, 24.0, 15.0, 16.0, 14.0, 12.0, 14.0, 6.0, 8.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.6816900372505188, -0.6606816053390503, -0.6396731734275818, -0.6186647415161133, -0.5976563096046448, -0.5766478776931763, -0.5556395053863525, -0.5346310138702393, -0.5136226415634155, -0.492614209651947, -0.4716057777404785, -0.45059734582901, -0.4295889139175415, -0.408580482006073, -0.3875720798969269, -0.3665636479854584, -0.3455551862716675, -0.324546754360199, -0.30353832244873047, -0.28252989053726196, -0.26152145862579346, -0.24051304161548615, -0.21950462460517883, -0.19849619269371033, -0.17748776078224182, -0.15647932887077332, -0.1354708969593048, -0.1144624799489975, -0.09345404803752899, -0.07244561612606049, -0.051437199115753174, -0.030428767204284668, -0.009420275688171387, 0.01158815249800682, 0.03259658068418503, 0.05360500514507294, 0.07461343705654144, 0.09562186896800995, 0.11663028597831726, 0.13763871788978577, 0.15864714980125427, 0.17965558171272278, 0.20066401362419128, 0.2216724306344986, 0.2426808625459671, 0.2636892795562744, 0.2846977114677429, 0.3057061433792114, 0.32671457529067993, 0.34772300720214844, 0.36873143911361694, 0.38973987102508545, 0.41074830293655396, 0.43175673484802246, 0.4527651369571686, 0.4737735688686371, 0.4947820007801056, 0.5157904028892517, 0.5367988348007202, 0.5578072667121887, 0.5788156986236572, 0.5998241305351257, 0.6208325624465942, 0.6418409943580627, 0.6628494262695312]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 4.0, 5.0, 6.0, 17.0, 9.0, 16.0, 24.0, 22.0, 37.0, 55.0, 72.0, 120.0, 223.0, 458.0, 1339.0, 4300.0, 17378.0, 104006.0, 2399661.0, 1572269.0, 75311.0, 13429.0, 3501.0, 1010.0, 423.0, 198.0, 126.0, 73.0, 48.0, 29.0, 34.0, 18.0, 18.0, 10.0, 9.0, 4.0, 9.0, 2.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07818603515625, -0.07565784454345703, -0.07312965393066406, -0.0706014633178711, -0.06807327270507812, -0.06554508209228516, -0.06301689147949219, -0.06048870086669922, -0.05796051025390625, -0.05543231964111328, -0.05290412902832031, -0.050375938415527344, -0.047847747802734375, -0.045319557189941406, -0.04279136657714844, -0.04026317596435547, -0.0377349853515625, -0.03520679473876953, -0.03267860412597656, -0.030150413513183594, -0.027622222900390625, -0.025094032287597656, -0.022565841674804688, -0.02003765106201172, -0.01750946044921875, -0.014981269836425781, -0.012453079223632812, -0.009924888610839844, -0.007396697998046875, -0.004868507385253906, -0.0023403167724609375, 0.00018787384033203125, 0.002716064453125, 0.005244255065917969, 0.0077724456787109375, 0.010300636291503906, 0.012828826904296875, 0.015357017517089844, 0.017885208129882812, 0.02041339874267578, 0.02294158935546875, 0.02546977996826172, 0.027997970581054688, 0.030526161193847656, 0.033054351806640625, 0.035582542419433594, 0.03811073303222656, 0.04063892364501953, 0.0431671142578125, 0.04569530487060547, 0.04822349548339844, 0.050751686096191406, 0.053279876708984375, 0.055808067321777344, 0.05833625793457031, 0.06086444854736328, 0.06339263916015625, 0.06592082977294922, 0.06844902038574219, 0.07097721099853516, 0.07350540161132812, 0.0760335922241211, 0.07856178283691406, 0.08108997344970703, 0.0836181640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 9.0, 20.0, 15.0, 19.0, 32.0, 51.0, 52.0, 68.0, 61.0, 73.0, 73.0, 79.0, 77.0, 72.0, 80.0, 56.0, 35.0, 35.0, 25.0, 16.0, 9.0, 4.0, 14.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042388916015625, -0.04082059860229492, -0.039252281188964844, -0.037683963775634766, -0.03611564636230469, -0.03454732894897461, -0.03297901153564453, -0.03141069412231445, -0.029842376708984375, -0.028274059295654297, -0.02670574188232422, -0.02513742446899414, -0.023569107055664062, -0.022000789642333984, -0.020432472229003906, -0.018864154815673828, -0.01729583740234375, -0.015727519989013672, -0.014159202575683594, -0.012590885162353516, -0.011022567749023438, -0.00945425033569336, -0.007885932922363281, -0.006317615509033203, -0.004749298095703125, -0.003180980682373047, -0.0016126632690429688, -4.4345855712890625e-05, 0.0015239715576171875, 0.0030922889709472656, 0.004660606384277344, 0.006228923797607422, 0.0077972412109375, 0.009365558624267578, 0.010933876037597656, 0.012502193450927734, 0.014070510864257812, 0.01563882827758789, 0.01720714569091797, 0.018775463104248047, 0.020343780517578125, 0.021912097930908203, 0.02348041534423828, 0.02504873275756836, 0.026617050170898438, 0.028185367584228516, 0.029753684997558594, 0.03132200241088867, 0.03289031982421875, 0.03445863723754883, 0.036026954650878906, 0.037595272064208984, 0.03916358947753906, 0.04073190689086914, 0.04230022430419922, 0.0438685417175293, 0.045436859130859375, 0.04700517654418945, 0.04857349395751953, 0.05014181137084961, 0.05171012878417969, 0.053278446197509766, 0.054846763610839844, 0.05641508102416992, 0.0579833984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 9.0, 6.0, 18.0, 21.0, 29.0, 30.0, 47.0, 65.0, 64.0, 73.0, 134.0, 216.0, 493.0, 2412.0, 48379.0, 4080464.0, 57621.0, 2719.0, 531.0, 287.0, 140.0, 114.0, 92.0, 63.0, 52.0, 41.0, 36.0, 22.0, 21.0, 14.0, 8.0, 16.0, 11.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.314453125, -0.3053436279296875, -0.296234130859375, -0.2871246337890625, -0.27801513671875, -0.2689056396484375, -0.259796142578125, -0.2506866455078125, -0.2415771484375, -0.2324676513671875, -0.223358154296875, -0.2142486572265625, -0.20513916015625, -0.1960296630859375, -0.186920166015625, -0.1778106689453125, -0.168701171875, -0.1595916748046875, -0.150482177734375, -0.1413726806640625, -0.13226318359375, -0.1231536865234375, -0.114044189453125, -0.1049346923828125, -0.0958251953125, -0.0867156982421875, -0.077606201171875, -0.0684967041015625, -0.05938720703125, -0.0502777099609375, -0.041168212890625, -0.0320587158203125, -0.02294921875, -0.0138397216796875, -0.004730224609375, 0.0043792724609375, 0.01348876953125, 0.0225982666015625, 0.031707763671875, 0.0408172607421875, 0.0499267578125, 0.0590362548828125, 0.068145751953125, 0.0772552490234375, 0.08636474609375, 0.0954742431640625, 0.104583740234375, 0.1136932373046875, 0.122802734375, 0.1319122314453125, 0.141021728515625, 0.1501312255859375, 0.15924072265625, 0.1683502197265625, 0.177459716796875, 0.1865692138671875, 0.1956787109375, 0.2047882080078125, 0.213897705078125, 0.2230072021484375, 0.23211669921875, 0.2412261962890625, 0.250335693359375, 0.2594451904296875, 0.2685546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 12.0, 7.0, 13.0, 31.0, 37.0, 41.0, 81.0, 185.0, 399.0, 1042.0, 1159.0, 546.0, 225.0, 116.0, 59.0, 36.0, 21.0, 21.0, 10.0, 15.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0775146484375, -0.0732574462890625, -0.069000244140625, -0.0647430419921875, -0.06048583984375, -0.0562286376953125, -0.051971435546875, -0.0477142333984375, -0.04345703125, -0.0391998291015625, -0.034942626953125, -0.0306854248046875, -0.02642822265625, -0.0221710205078125, -0.017913818359375, -0.0136566162109375, -0.0093994140625, -0.0051422119140625, -0.000885009765625, 0.0033721923828125, 0.00762939453125, 0.0118865966796875, 0.016143798828125, 0.0204010009765625, 0.024658203125, 0.0289154052734375, 0.033172607421875, 0.0374298095703125, 0.04168701171875, 0.0459442138671875, 0.050201416015625, 0.0544586181640625, 0.0587158203125, 0.0629730224609375, 0.067230224609375, 0.0714874267578125, 0.07574462890625, 0.0800018310546875, 0.084259033203125, 0.0885162353515625, 0.0927734375, 0.0970306396484375, 0.101287841796875, 0.1055450439453125, 0.10980224609375, 0.1140594482421875, 0.118316650390625, 0.1225738525390625, 0.1268310546875, 0.1310882568359375, 0.135345458984375, 0.1396026611328125, 0.14385986328125, 0.1481170654296875, 0.152374267578125, 0.1566314697265625, 0.160888671875, 0.1651458740234375, 0.169403076171875, 0.1736602783203125, 0.17791748046875, 0.1821746826171875, 0.186431884765625, 0.1906890869140625, 0.1949462890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 15.0, 13.0, 37.0, 82.0, 156.0, 207.0, 181.0, 123.0, 69.0, 30.0, 25.0, 13.0, 5.0, 9.0, 4.0, 3.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6048109531402588, -1.558512568473816, -1.512214183807373, -1.4659159183502197, -1.4196175336837769, -1.373319149017334, -1.3270208835601807, -1.2807224988937378, -1.234424114227295, -1.188125729560852, -1.1418273448944092, -1.0955290794372559, -1.049230694770813, -1.0029323101043701, -0.956633985042572, -0.9103356599807739, -0.864037275314331, -0.8177388906478882, -0.7714405655860901, -0.725142240524292, -0.6788438558578491, -0.6325454711914062, -0.5862471461296082, -0.5399488210678101, -0.4936504364013672, -0.4473520815372467, -0.4010537266731262, -0.35475537180900574, -0.30845701694488525, -0.26215866208076477, -0.2158603072166443, -0.1695619523525238, -0.12326359748840332, -0.07696524262428284, -0.030666887760162354, 0.01563146710395813, 0.06192982196807861, 0.1082281768321991, 0.15452653169631958, 0.20082488656044006, 0.24712324142456055, 0.29342159628868103, 0.3397199511528015, 0.386018306016922, 0.4323166608810425, 0.47861501574516296, 0.5249133706092834, 0.5712116956710815, 0.6175100803375244, 0.6638084650039673, 0.7101067900657654, 0.7564051151275635, 0.8027034997940063, 0.8490018844604492, 0.8953002095222473, 0.9415985345840454, 0.9878969192504883, 1.0341953039169312, 1.080493688583374, 1.1267919540405273, 1.1730903387069702, 1.219388723373413, 1.2656869888305664, 1.3119853734970093, 1.3582837581634521]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 9.0, 9.0, 5.0, 20.0, 21.0, 14.0, 15.0, 21.0, 17.0, 32.0, 21.0, 45.0, 31.0, 41.0, 39.0, 46.0, 47.0, 47.0, 55.0, 38.0, 51.0, 47.0, 35.0, 41.0, 43.0, 21.0, 37.0, 23.0, 15.0, 20.0, 12.0, 9.0, 10.0, 10.0, 11.0, 4.0, 9.0, 9.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41936206817626953, -0.4051533639431, -0.39094462990760803, -0.3767359256744385, -0.36252719163894653, -0.348318487405777, -0.3341097831726074, -0.3199010491371155, -0.3056923449039459, -0.29148364067077637, -0.2772749066352844, -0.26306620240211487, -0.24885748326778412, -0.23464876413345337, -0.2204400599002838, -0.20623134076595306, -0.19202262163162231, -0.17781390249729156, -0.16360518336296082, -0.14939647912979126, -0.1351877599954605, -0.12097904086112976, -0.10677032917737961, -0.09256161749362946, -0.0783528983592987, -0.06414417922496796, -0.049935467541217804, -0.03572675213217735, -0.021518036723136902, -0.007309317588806152, 0.006899394094944, 0.021108105778694153, 0.0353168249130249, 0.04952554032206535, 0.0637342557311058, 0.07794296741485596, 0.0921516865491867, 0.10636040568351746, 0.12056911736726761, 0.13477782905101776, 0.1489865481853485, 0.16319526731967926, 0.17740398645401, 0.19161269068717957, 0.20582140982151031, 0.22003012895584106, 0.23423883318901062, 0.24844755232334137, 0.2626562714576721, 0.2768649756908417, 0.2910737097263336, 0.3052824139595032, 0.3194911479949951, 0.3336998522281647, 0.34790855646133423, 0.36211729049682617, 0.3763259947299957, 0.3905346989631653, 0.4047434329986572, 0.4189521372318268, 0.43316084146499634, 0.4473695755004883, 0.46157827973365784, 0.4757869839668274, 0.48999571800231934]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 6.0, 13.0, 23.0, 32.0, 43.0, 81.0, 96.0, 152.0, 253.0, 441.0, 596.0, 1055.0, 1822.0, 3172.0, 5869.0, 11175.0, 23658.0, 54282.0, 136681.0, 325792.0, 283577.0, 112345.0, 45378.0, 20219.0, 9657.0, 5122.0, 2789.0, 1607.0, 970.0, 596.0, 347.0, 214.0, 135.0, 105.0, 78.0, 33.0, 47.0, 28.0, 20.0, 9.0, 14.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.0869140625, -0.08455848693847656, -0.08220291137695312, -0.07984733581542969, -0.07749176025390625, -0.07513618469238281, -0.07278060913085938, -0.07042503356933594, -0.0680694580078125, -0.06571388244628906, -0.06335830688476562, -0.06100273132324219, -0.05864715576171875, -0.05629158020019531, -0.053936004638671875, -0.05158042907714844, -0.049224853515625, -0.04686927795410156, -0.044513702392578125, -0.04215812683105469, -0.03980255126953125, -0.03744697570800781, -0.035091400146484375, -0.03273582458496094, -0.0303802490234375, -0.028024673461914062, -0.025669097900390625, -0.023313522338867188, -0.02095794677734375, -0.018602371215820312, -0.016246795654296875, -0.013891220092773438, -0.01153564453125, -0.009180068969726562, -0.006824493408203125, -0.0044689178466796875, -0.00211334228515625, 0.0002422332763671875, 0.002597808837890625, 0.0049533843994140625, 0.0073089599609375, 0.009664535522460938, 0.012020111083984375, 0.014375686645507812, 0.01673126220703125, 0.019086837768554688, 0.021442413330078125, 0.023797988891601562, 0.026153564453125, 0.028509140014648438, 0.030864715576171875, 0.03322029113769531, 0.03557586669921875, 0.03793144226074219, 0.040287017822265625, 0.04264259338378906, 0.0449981689453125, 0.04735374450683594, 0.049709320068359375, 0.05206489562988281, 0.05442047119140625, 0.05677604675292969, 0.059131622314453125, 0.06148719787597656, 0.0638427734375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 12.0, 18.0, 17.0, 27.0, 32.0, 50.0, 49.0, 67.0, 59.0, 88.0, 99.0, 88.0, 67.0, 63.0, 51.0, 51.0, 55.0, 36.0, 16.0, 22.0, 9.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0538330078125, -0.05202293395996094, -0.050212860107421875, -0.04840278625488281, -0.04659271240234375, -0.04478263854980469, -0.042972564697265625, -0.04116249084472656, -0.0393524169921875, -0.03754234313964844, -0.035732269287109375, -0.03392219543457031, -0.03211212158203125, -0.030302047729492188, -0.028491973876953125, -0.026681900024414062, -0.024871826171875, -0.023061752319335938, -0.021251678466796875, -0.019441604614257812, -0.01763153076171875, -0.015821456909179688, -0.014011383056640625, -0.012201309204101562, -0.0103912353515625, -0.008581161499023438, -0.006771087646484375, -0.0049610137939453125, -0.00315093994140625, -0.0013408660888671875, 0.000469207763671875, 0.0022792816162109375, 0.00408935546875, 0.0058994293212890625, 0.007709503173828125, 0.009519577026367188, 0.01132965087890625, 0.013139724731445312, 0.014949798583984375, 0.016759872436523438, 0.0185699462890625, 0.020380020141601562, 0.022190093994140625, 0.024000167846679688, 0.02581024169921875, 0.027620315551757812, 0.029430389404296875, 0.031240463256835938, 0.033050537109375, 0.03486061096191406, 0.036670684814453125, 0.03848075866699219, 0.04029083251953125, 0.04210090637207031, 0.043910980224609375, 0.04572105407714844, 0.0475311279296875, 0.04934120178222656, 0.051151275634765625, 0.05296134948730469, 0.05477142333984375, 0.05658149719238281, 0.058391571044921875, 0.06020164489746094, 0.06201171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 7.0, 18.0, 17.0, 21.0, 21.0, 42.0, 44.0, 90.0, 125.0, 176.0, 323.0, 540.0, 1044.0, 2540.0, 6856.0, 32970.0, 644728.0, 324450.0, 24357.0, 5807.0, 2020.0, 921.0, 534.0, 315.0, 194.0, 102.0, 75.0, 57.0, 50.0, 30.0, 21.0, 9.0, 11.0, 9.0, 9.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.259521484375, -0.2513923645019531, -0.24326324462890625, -0.23513412475585938, -0.2270050048828125, -0.21887588500976562, -0.21074676513671875, -0.20261764526367188, -0.194488525390625, -0.18635940551757812, -0.17823028564453125, -0.17010116577148438, -0.1619720458984375, -0.15384292602539062, -0.14571380615234375, -0.13758468627929688, -0.12945556640625, -0.12132644653320312, -0.11319732666015625, -0.10506820678710938, -0.0969390869140625, -0.08880996704101562, -0.08068084716796875, -0.07255172729492188, -0.064422607421875, -0.056293487548828125, -0.04816436767578125, -0.040035247802734375, -0.0319061279296875, -0.023777008056640625, -0.01564788818359375, -0.007518768310546875, 0.0006103515625, 0.008739471435546875, 0.01686859130859375, 0.024997711181640625, 0.0331268310546875, 0.041255950927734375, 0.04938507080078125, 0.057514190673828125, 0.065643310546875, 0.07377243041992188, 0.08190155029296875, 0.09003067016601562, 0.0981597900390625, 0.10628890991210938, 0.11441802978515625, 0.12254714965820312, 0.13067626953125, 0.13880538940429688, 0.14693450927734375, 0.15506362915039062, 0.1631927490234375, 0.17132186889648438, 0.17945098876953125, 0.18758010864257812, 0.195709228515625, 0.20383834838867188, 0.21196746826171875, 0.22009658813476562, 0.2282257080078125, 0.23635482788085938, 0.24448394775390625, 0.2526130676269531, 0.2607421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 12.0, 7.0, 10.0, 14.0, 20.0, 20.0, 19.0, 34.0, 25.0, 37.0, 35.0, 51.0, 49.0, 45.0, 55.0, 50.0, 53.0, 54.0, 57.0, 54.0, 42.0, 40.0, 36.0, 29.0, 20.0, 22.0, 19.0, 18.0, 12.0, 12.0, 11.0, 13.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.165283203125, -0.16045188903808594, -0.15562057495117188, -0.1507892608642578, -0.14595794677734375, -0.1411266326904297, -0.13629531860351562, -0.13146400451660156, -0.1266326904296875, -0.12180137634277344, -0.11697006225585938, -0.11213874816894531, -0.10730743408203125, -0.10247611999511719, -0.09764480590820312, -0.09281349182128906, -0.087982177734375, -0.08315086364746094, -0.07831954956054688, -0.07348823547363281, -0.06865692138671875, -0.06382560729980469, -0.058994293212890625, -0.05416297912597656, -0.0493316650390625, -0.04450035095214844, -0.039669036865234375, -0.03483772277832031, -0.03000640869140625, -0.025175094604492188, -0.020343780517578125, -0.015512466430664062, -0.01068115234375, -0.0058498382568359375, -0.001018524169921875, 0.0038127899169921875, 0.00864410400390625, 0.013475418090820312, 0.018306732177734375, 0.023138046264648438, 0.0279693603515625, 0.03280067443847656, 0.037631988525390625, 0.04246330261230469, 0.04729461669921875, 0.05212593078613281, 0.056957244873046875, 0.06178855895996094, 0.066619873046875, 0.07145118713378906, 0.07628250122070312, 0.08111381530761719, 0.08594512939453125, 0.09077644348144531, 0.09560775756835938, 0.10043907165527344, 0.1052703857421875, 0.11010169982910156, 0.11493301391601562, 0.11976432800292969, 0.12459564208984375, 0.1294269561767578, 0.13425827026367188, 0.13908958435058594, 0.1439208984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 10.0, 14.0, 17.0, 27.0, 40.0, 53.0, 53.0, 84.0, 102.0, 155.0, 205.0, 283.0, 453.0, 639.0, 956.0, 1381.0, 2242.0, 3889.0, 6871.0, 13337.0, 31602.0, 118145.0, 704482.0, 104205.0, 29690.0, 12701.0, 6550.0, 3729.0, 2295.0, 1407.0, 916.0, 583.0, 414.0, 288.0, 183.0, 141.0, 108.0, 81.0, 62.0, 45.0, 28.0, 21.0, 17.0, 19.0, 6.0, 6.0, 9.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08770751953125, -0.08508682250976562, -0.08246612548828125, -0.07984542846679688, -0.0772247314453125, -0.07460403442382812, -0.07198333740234375, -0.06936264038085938, -0.066741943359375, -0.06412124633789062, -0.06150054931640625, -0.058879852294921875, -0.0562591552734375, -0.053638458251953125, -0.05101776123046875, -0.048397064208984375, -0.0457763671875, -0.043155670166015625, -0.04053497314453125, -0.037914276123046875, -0.0352935791015625, -0.032672882080078125, -0.03005218505859375, -0.027431488037109375, -0.024810791015625, -0.022190093994140625, -0.01956939697265625, -0.016948699951171875, -0.0143280029296875, -0.011707305908203125, -0.00908660888671875, -0.006465911865234375, -0.00384521484375, -0.001224517822265625, 0.00139617919921875, 0.004016876220703125, 0.0066375732421875, 0.009258270263671875, 0.01187896728515625, 0.014499664306640625, 0.017120361328125, 0.019741058349609375, 0.02236175537109375, 0.024982452392578125, 0.0276031494140625, 0.030223846435546875, 0.03284454345703125, 0.035465240478515625, 0.0380859375, 0.040706634521484375, 0.04332733154296875, 0.045948028564453125, 0.0485687255859375, 0.051189422607421875, 0.05381011962890625, 0.056430816650390625, 0.059051513671875, 0.061672210693359375, 0.06429290771484375, 0.06691360473632812, 0.0695343017578125, 0.07215499877929688, 0.07477569580078125, 0.07739639282226562, 0.08001708984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 13.0, 14.0, 21.0, 25.0, 44.0, 190.0, 438.0, 137.0, 31.0, 18.0, 12.0, 6.0, 11.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010228157043457031, -9.921751916408539e-05, -9.615346789360046e-05, -9.308941662311554e-05, -9.002536535263062e-05, -8.696131408214569e-05, -8.389726281166077e-05, -8.083321154117584e-05, -7.776916027069092e-05, -7.4705109000206e-05, -7.164105772972107e-05, -6.857700645923615e-05, -6.551295518875122e-05, -6.24489039182663e-05, -5.938485264778137e-05, -5.632080137729645e-05, -5.3256750106811523e-05, -5.01926988363266e-05, -4.7128647565841675e-05, -4.406459629535675e-05, -4.1000545024871826e-05, -3.79364937543869e-05, -3.487244248390198e-05, -3.180839121341705e-05, -2.874433994293213e-05, -2.5680288672447205e-05, -2.261623740196228e-05, -1.9552186131477356e-05, -1.648813486099243e-05, -1.3424083590507507e-05, -1.0360032320022583e-05, -7.295981049537659e-06, -4.231929779052734e-06, -1.16787850856781e-06, 1.8961727619171143e-06, 4.9602240324020386e-06, 8.024275302886963e-06, 1.1088326573371887e-05, 1.4152377843856812e-05, 1.7216429114341736e-05, 2.028048038482666e-05, 2.3344531655311584e-05, 2.640858292579651e-05, 2.9472634196281433e-05, 3.253668546676636e-05, 3.560073673725128e-05, 3.8664788007736206e-05, 4.172883927822113e-05, 4.4792890548706055e-05, 4.785694181919098e-05, 5.09209930896759e-05, 5.398504436016083e-05, 5.704909563064575e-05, 6.0113146901130676e-05, 6.31771981716156e-05, 6.624124944210052e-05, 6.930530071258545e-05, 7.236935198307037e-05, 7.54334032535553e-05, 7.849745452404022e-05, 8.156150579452515e-05, 8.462555706501007e-05, 8.7689608335495e-05, 9.075365960597992e-05, 9.381771087646484e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 10.0, 18.0, 21.0, 17.0, 36.0, 61.0, 81.0, 132.0, 217.0, 406.0, 789.0, 1658.0, 4163.0, 12552.0, 61421.0, 801641.0, 134829.0, 20152.0, 5907.0, 2229.0, 1001.0, 489.0, 254.0, 161.0, 85.0, 77.0, 40.0, 21.0, 14.0, 14.0, 9.0, 7.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12939453125, -0.12517547607421875, -0.1209564208984375, -0.11673736572265625, -0.112518310546875, -0.10829925537109375, -0.1040802001953125, -0.09986114501953125, -0.09564208984375, -0.09142303466796875, -0.0872039794921875, -0.08298492431640625, -0.078765869140625, -0.07454681396484375, -0.0703277587890625, -0.06610870361328125, -0.0618896484375, -0.05767059326171875, -0.0534515380859375, -0.04923248291015625, -0.045013427734375, -0.04079437255859375, -0.0365753173828125, -0.03235626220703125, -0.02813720703125, -0.02391815185546875, -0.0196990966796875, -0.01548004150390625, -0.011260986328125, -0.00704193115234375, -0.0028228759765625, 0.00139617919921875, 0.005615234375, 0.00983428955078125, 0.0140533447265625, 0.01827239990234375, 0.022491455078125, 0.02671051025390625, 0.0309295654296875, 0.03514862060546875, 0.03936767578125, 0.04358673095703125, 0.0478057861328125, 0.05202484130859375, 0.056243896484375, 0.06046295166015625, 0.0646820068359375, 0.06890106201171875, 0.0731201171875, 0.07733917236328125, 0.0815582275390625, 0.08577728271484375, 0.089996337890625, 0.09421539306640625, 0.0984344482421875, 0.10265350341796875, 0.10687255859375, 0.11109161376953125, 0.1153106689453125, 0.11952972412109375, 0.123748779296875, 0.12796783447265625, 0.1321868896484375, 0.13640594482421875, 0.140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 8.0, 11.0, 17.0, 18.0, 19.0, 34.0, 67.0, 111.0, 165.0, 182.0, 128.0, 55.0, 49.0, 36.0, 27.0, 14.0, 9.0, 14.0, 2.0, 1.0, 4.0, 6.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13623046875, -0.13234901428222656, -0.12846755981445312, -0.12458610534667969, -0.12070465087890625, -0.11682319641113281, -0.11294174194335938, -0.10906028747558594, -0.1051788330078125, -0.10129737854003906, -0.09741592407226562, -0.09353446960449219, -0.08965301513671875, -0.08577156066894531, -0.08189010620117188, -0.07800865173339844, -0.074127197265625, -0.07024574279785156, -0.06636428833007812, -0.06248283386230469, -0.05860137939453125, -0.05471992492675781, -0.050838470458984375, -0.04695701599121094, -0.0430755615234375, -0.03919410705566406, -0.035312652587890625, -0.03143119812011719, -0.02754974365234375, -0.023668289184570312, -0.019786834716796875, -0.015905380249023438, -0.01202392578125, -0.008142471313476562, -0.004261016845703125, -0.0003795623779296875, 0.00350189208984375, 0.0073833465576171875, 0.011264801025390625, 0.015146255493164062, 0.0190277099609375, 0.022909164428710938, 0.026790618896484375, 0.030672073364257812, 0.03455352783203125, 0.03843498229980469, 0.042316436767578125, 0.04619789123535156, 0.050079345703125, 0.05396080017089844, 0.057842254638671875, 0.06172370910644531, 0.06560516357421875, 0.06948661804199219, 0.07336807250976562, 0.07724952697753906, 0.0811309814453125, 0.08501243591308594, 0.08889389038085938, 0.09277534484863281, 0.09665679931640625, 0.10053825378417969, 0.10441970825195312, 0.10830116271972656, 0.1121826171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 6.0, 12.0, 26.0, 35.0, 89.0, 145.0, 250.0, 239.0, 98.0, 47.0, 13.0, 7.0, 8.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.36079740524292, -2.2844762802124023, -2.2081549167633057, -2.131833553314209, -2.0555124282836914, -1.9791911840438843, -1.9028699398040771, -1.82654869556427, -1.750227451324463, -1.6739062070846558, -1.5975849628448486, -1.5212637186050415, -1.4449424743652344, -1.3686212301254272, -1.2922999858856201, -1.215978741645813, -1.1396574974060059, -1.0633362531661987, -0.9870150089263916, -0.9106937646865845, -0.8343725204467773, -0.7580512762069702, -0.6817300319671631, -0.605408787727356, -0.5290875434875488, -0.4527662992477417, -0.37644505500793457, -0.30012381076812744, -0.2238025665283203, -0.14748132228851318, -0.07116007804870605, 0.005161166191101074, 0.0814826488494873, 0.15780389308929443, 0.23412513732910156, 0.3104463815689087, 0.3867676258087158, 0.46308887004852295, 0.5394101142883301, 0.6157313585281372, 0.6920526027679443, 0.7683738470077515, 0.8446950912475586, 0.9210163354873657, 0.9973375797271729, 1.07365882396698, 1.149980068206787, 1.2263013124465942, 1.3026225566864014, 1.3789438009262085, 1.4552650451660156, 1.5315862894058228, 1.6079075336456299, 1.684228777885437, 1.7605500221252441, 1.8368712663650513, 1.9131925106048584, 1.9895137548446655, 2.0658349990844727, 2.1421561241149902, 2.218477487564087, 2.2947988510131836, 2.371119976043701, 2.4474411010742188, 2.5237624645233154]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 14.0, 9.0, 10.0, 23.0, 22.0, 28.0, 36.0, 35.0, 28.0, 42.0, 36.0, 61.0, 89.0, 74.0, 95.0, 55.0, 52.0, 45.0, 50.0, 24.0, 31.0, 27.0, 26.0, 12.0, 11.0, 18.0, 8.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8212839961051941, -0.7960782647132874, -0.7708724737167358, -0.7456667423248291, -0.7204610109329224, -0.6952552795410156, -0.6700495481491089, -0.6448437571525574, -0.6196380257606506, -0.5944322943687439, -0.5692265033721924, -0.5440207719802856, -0.5188150405883789, -0.49360930919647217, -0.46840354800224304, -0.4431977868080139, -0.4179920554161072, -0.39278632402420044, -0.3675805628299713, -0.3423748016357422, -0.31716907024383545, -0.2919633388519287, -0.2667575776576996, -0.24155183136463165, -0.21634608507156372, -0.1911403387784958, -0.16593459248542786, -0.14072884619235992, -0.11552309989929199, -0.09031735360622406, -0.06511160731315613, -0.039905861020088196, -0.014700114727020264, 0.010505631566047668, 0.0357113778591156, 0.06091712415218353, 0.08612287044525146, 0.1113286167383194, 0.13653436303138733, 0.16174010932445526, 0.1869458556175232, 0.21215160191059113, 0.23735734820365906, 0.2625631093978882, 0.2877688407897949, 0.31297457218170166, 0.3381803333759308, 0.3633860945701599, 0.38859182596206665, 0.4137975573539734, 0.4390033185482025, 0.46420907974243164, 0.4894148111343384, 0.5146205425262451, 0.5398262739181519, 0.5650320649147034, 0.5902377963066101, 0.6154435276985168, 0.6406493186950684, 0.6658550500869751, 0.6910607814788818, 0.7162665128707886, 0.7414722442626953, 0.7666780352592468, 0.7918837666511536]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 20.0, 11.0, 18.0, 41.0, 54.0, 79.0, 136.0, 265.0, 508.0, 1062.0, 2646.0, 9242.0, 49876.0, 1611994.0, 2436210.0, 65858.0, 10838.0, 3012.0, 1203.0, 536.0, 257.0, 141.0, 89.0, 44.0, 32.0, 22.0, 20.0, 12.0, 10.0, 8.0, 7.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.113037109375, -0.1090087890625, -0.10498046875, -0.1009521484375, -0.096923828125, -0.0928955078125, -0.0888671875, -0.0848388671875, -0.080810546875, -0.0767822265625, -0.07275390625, -0.0687255859375, -0.064697265625, -0.0606689453125, -0.056640625, -0.0526123046875, -0.048583984375, -0.0445556640625, -0.04052734375, -0.0364990234375, -0.032470703125, -0.0284423828125, -0.0244140625, -0.0203857421875, -0.016357421875, -0.0123291015625, -0.00830078125, -0.0042724609375, -0.000244140625, 0.0037841796875, 0.0078125, 0.0118408203125, 0.015869140625, 0.0198974609375, 0.02392578125, 0.0279541015625, 0.031982421875, 0.0360107421875, 0.0400390625, 0.0440673828125, 0.048095703125, 0.0521240234375, 0.05615234375, 0.0601806640625, 0.064208984375, 0.0682373046875, 0.072265625, 0.0762939453125, 0.080322265625, 0.0843505859375, 0.08837890625, 0.0924072265625, 0.096435546875, 0.1004638671875, 0.1044921875, 0.1085205078125, 0.112548828125, 0.1165771484375, 0.12060546875, 0.1246337890625, 0.128662109375, 0.1326904296875, 0.13671875, 0.1407470703125, 0.144775390625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 12.0, 10.0, 16.0, 29.0, 38.0, 45.0, 60.0, 54.0, 77.0, 96.0, 87.0, 85.0, 82.0, 54.0, 64.0, 45.0, 53.0, 32.0, 15.0, 11.0, 10.0, 6.0, 6.0, 7.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056060791015625, -0.0541081428527832, -0.052155494689941406, -0.05020284652709961, -0.04825019836425781, -0.046297550201416016, -0.04434490203857422, -0.04239225387573242, -0.040439605712890625, -0.03848695755004883, -0.03653430938720703, -0.034581661224365234, -0.03262901306152344, -0.03067636489868164, -0.028723716735839844, -0.026771068572998047, -0.02481842041015625, -0.022865772247314453, -0.020913124084472656, -0.01896047592163086, -0.017007827758789062, -0.015055179595947266, -0.013102531433105469, -0.011149883270263672, -0.009197235107421875, -0.007244586944580078, -0.005291938781738281, -0.0033392906188964844, -0.0013866424560546875, 0.0005660057067871094, 0.0025186538696289062, 0.004471302032470703, 0.0064239501953125, 0.008376598358154297, 0.010329246520996094, 0.01228189468383789, 0.014234542846679688, 0.016187191009521484, 0.01813983917236328, 0.020092487335205078, 0.022045135498046875, 0.023997783660888672, 0.02595043182373047, 0.027903079986572266, 0.029855728149414062, 0.03180837631225586, 0.033761024475097656, 0.03571367263793945, 0.03766632080078125, 0.03961896896362305, 0.041571617126464844, 0.04352426528930664, 0.04547691345214844, 0.047429561614990234, 0.04938220977783203, 0.05133485794067383, 0.053287506103515625, 0.05524015426635742, 0.05719280242919922, 0.059145450592041016, 0.06109809875488281, 0.06305074691772461, 0.0650033950805664, 0.0669560432434082, 0.06890869140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 15.0, 22.0, 19.0, 22.0, 52.0, 55.0, 65.0, 85.0, 110.0, 154.0, 271.0, 520.0, 1521.0, 13209.0, 3748818.0, 420295.0, 6772.0, 1146.0, 388.0, 178.0, 122.0, 125.0, 66.0, 65.0, 32.0, 33.0, 27.0, 21.0, 10.0, 11.0, 13.0, 11.0, 2.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.36181640625, -0.3500938415527344, -0.33837127685546875, -0.3266487121582031, -0.3149261474609375, -0.3032035827636719, -0.29148101806640625, -0.2797584533691406, -0.268035888671875, -0.2563133239746094, -0.24459075927734375, -0.23286819458007812, -0.2211456298828125, -0.20942306518554688, -0.19770050048828125, -0.18597793579101562, -0.17425537109375, -0.16253280639648438, -0.15081024169921875, -0.13908767700195312, -0.1273651123046875, -0.11564254760742188, -0.10391998291015625, -0.09219741821289062, -0.080474853515625, -0.06875228881835938, -0.05702972412109375, -0.045307159423828125, -0.0335845947265625, -0.021862030029296875, -0.01013946533203125, 0.001583099365234375, 0.0133056640625, 0.025028228759765625, 0.03675079345703125, 0.048473358154296875, 0.0601959228515625, 0.07191848754882812, 0.08364105224609375, 0.09536361694335938, 0.107086181640625, 0.11880874633789062, 0.13053131103515625, 0.14225387573242188, 0.1539764404296875, 0.16569900512695312, 0.17742156982421875, 0.18914413452148438, 0.20086669921875, 0.21258926391601562, 0.22431182861328125, 0.23603439331054688, 0.2477569580078125, 0.2594795227050781, 0.27120208740234375, 0.2829246520996094, 0.294647216796875, 0.3063697814941406, 0.31809234619140625, 0.3298149108886719, 0.3415374755859375, 0.3532600402832031, 0.36498260498046875, 0.3767051696777344, 0.388427734375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 7.0, 3.0, 13.0, 9.0, 13.0, 26.0, 29.0, 48.0, 88.0, 168.0, 382.0, 828.0, 1148.0, 654.0, 289.0, 146.0, 86.0, 50.0, 33.0, 15.0, 17.0, 3.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171142578125, -0.16617202758789062, -0.16120147705078125, -0.15623092651367188, -0.1512603759765625, -0.14628982543945312, -0.14131927490234375, -0.13634872436523438, -0.131378173828125, -0.12640762329101562, -0.12143707275390625, -0.11646652221679688, -0.1114959716796875, -0.10652542114257812, -0.10155487060546875, -0.09658432006835938, -0.09161376953125, -0.08664321899414062, -0.08167266845703125, -0.07670211791992188, -0.0717315673828125, -0.06676101684570312, -0.06179046630859375, -0.056819915771484375, -0.051849365234375, -0.046878814697265625, -0.04190826416015625, -0.036937713623046875, -0.0319671630859375, -0.026996612548828125, -0.02202606201171875, -0.017055511474609375, -0.0120849609375, -0.007114410400390625, -0.00214385986328125, 0.002826690673828125, 0.0077972412109375, 0.012767791748046875, 0.01773834228515625, 0.022708892822265625, 0.027679443359375, 0.032649993896484375, 0.03762054443359375, 0.042591094970703125, 0.0475616455078125, 0.052532196044921875, 0.05750274658203125, 0.062473297119140625, 0.06744384765625, 0.07241439819335938, 0.07738494873046875, 0.08235549926757812, 0.0873260498046875, 0.09229660034179688, 0.09726715087890625, 0.10223770141601562, 0.107208251953125, 0.11217880249023438, 0.11714935302734375, 0.12211990356445312, 0.1270904541015625, 0.13206100463867188, 0.13703155517578125, 0.14200210571289062, 0.14697265625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 11.0, 10.0, 14.0, 22.0, 37.0, 65.0, 108.0, 154.0, 165.0, 128.0, 117.0, 61.0, 41.0, 13.0, 22.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2470269203186035, -1.198002815246582, -1.14897882938385, -1.0999547243118286, -1.0509306192398071, -1.0019066333770752, -0.9528825283050537, -0.903858482837677, -0.8548344373703003, -0.8058103919029236, -0.7567862868309021, -0.7077622413635254, -0.6587381958961487, -0.609714150428772, -0.5606900453567505, -0.5116659998893738, -0.4626418948173523, -0.4136178195476532, -0.3645937740802765, -0.3155696988105774, -0.2665456533432007, -0.2175215780735016, -0.1684975028038025, -0.11947345733642578, -0.07044938206672668, -0.021425317972898483, 0.027598746120929718, 0.07662281394004822, 0.12564687430858612, 0.17467093467712402, 0.22369500994682312, 0.27271905541419983, 0.3217431306838989, 0.370767205953598, 0.41979125142097473, 0.46881532669067383, 0.5178393721580505, 0.5668634176254272, 0.6158875226974487, 0.6649115681648254, 0.7139356136322021, 0.7629596590995789, 0.8119837641716003, 0.861007809638977, 0.9100318551063538, 0.9590559005737305, 1.008080005645752, 1.0571041107177734, 1.106128215789795, 1.1551523208618164, 1.2041763067245483, 1.2532004117965698, 1.3022245168685913, 1.3512485027313232, 1.4002726078033447, 1.4492967128753662, 1.4983206987380981, 1.5473448038101196, 1.5963687896728516, 1.645392894744873, 1.6944169998168945, 1.7434409856796265, 1.792465090751648, 1.8414890766143799, 1.8905131816864014]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 12.0, 10.0, 14.0, 15.0, 17.0, 12.0, 14.0, 24.0, 24.0, 24.0, 31.0, 27.0, 24.0, 35.0, 40.0, 36.0, 44.0, 45.0, 45.0, 29.0, 42.0, 44.0, 35.0, 30.0, 36.0, 27.0, 25.0, 31.0, 27.0, 31.0, 16.0, 22.0, 13.0, 21.0, 18.0, 7.0, 7.0, 6.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.5141165256500244, -0.4993908703327179, -0.48466524481773376, -0.46993958950042725, -0.4552139639854431, -0.4404883086681366, -0.4257626533508301, -0.41103702783584595, -0.39631137251853943, -0.3815857172012329, -0.3668600916862488, -0.35213443636894226, -0.33740881085395813, -0.3226831555366516, -0.3079575300216675, -0.29323187470436096, -0.27850621938705444, -0.2637805640697479, -0.2490549385547638, -0.23432928323745728, -0.21960364282131195, -0.20487800240516663, -0.1901523619890213, -0.17542672157287598, -0.16070109605789185, -0.14597545564174652, -0.1312498152256012, -0.11652416735887527, -0.10179851949214935, -0.08707287907600403, -0.0723472386598587, -0.05762159079313278, -0.04289594292640686, -0.028170298784971237, -0.013444656506180763, 0.0012809857726097107, 0.016006629914045334, 0.030732274055480957, 0.04545791447162628, 0.0601835623383522, 0.07490920275449753, 0.08963484317064285, 0.10436049103736877, 0.1190861314535141, 0.13381177186965942, 0.14853742718696594, 0.16326305270195007, 0.1779887080192566, 0.19271434843540192, 0.20743998885154724, 0.22216562926769257, 0.2368912696838379, 0.2516169250011444, 0.2663425803184509, 0.28106820583343506, 0.2957938611507416, 0.3105194866657257, 0.3252451419830322, 0.33997076749801636, 0.3546964228153229, 0.369422048330307, 0.3841477036476135, 0.39887332916259766, 0.4135989844799042, 0.4283246397972107]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 5.0, 12.0, 17.0, 18.0, 25.0, 37.0, 67.0, 121.0, 171.0, 286.0, 461.0, 789.0, 1407.0, 2526.0, 4538.0, 9006.0, 18636.0, 41012.0, 94236.0, 206941.0, 301211.0, 199353.0, 90990.0, 39721.0, 18238.0, 8570.0, 4474.0, 2358.0, 1363.0, 754.0, 470.0, 319.0, 154.0, 90.0, 65.0, 43.0, 26.0, 14.0, 11.0, 9.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0791015625, -0.07666587829589844, -0.07423019409179688, -0.07179450988769531, -0.06935882568359375, -0.06692314147949219, -0.06448745727539062, -0.06205177307128906, -0.0596160888671875, -0.05718040466308594, -0.054744720458984375, -0.05230903625488281, -0.04987335205078125, -0.04743766784667969, -0.045001983642578125, -0.04256629943847656, -0.040130615234375, -0.03769493103027344, -0.035259246826171875, -0.03282356262207031, -0.03038787841796875, -0.027952194213867188, -0.025516510009765625, -0.023080825805664062, -0.0206451416015625, -0.018209457397460938, -0.015773773193359375, -0.013338088989257812, -0.01090240478515625, -0.008466720581054688, -0.006031036376953125, -0.0035953521728515625, -0.00115966796875, 0.0012760162353515625, 0.003711700439453125, 0.0061473846435546875, 0.00858306884765625, 0.011018753051757812, 0.013454437255859375, 0.015890121459960938, 0.0183258056640625, 0.020761489868164062, 0.023197174072265625, 0.025632858276367188, 0.02806854248046875, 0.030504226684570312, 0.032939910888671875, 0.03537559509277344, 0.037811279296875, 0.04024696350097656, 0.042682647705078125, 0.04511833190917969, 0.04755401611328125, 0.04998970031738281, 0.052425384521484375, 0.05486106872558594, 0.0572967529296875, 0.05973243713378906, 0.062168121337890625, 0.06460380554199219, 0.06703948974609375, 0.06947517395019531, 0.07191085815429688, 0.07434654235839844, 0.0767822265625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 11.0, 14.0, 10.0, 30.0, 30.0, 29.0, 48.0, 49.0, 66.0, 53.0, 83.0, 79.0, 62.0, 79.0, 56.0, 60.0, 48.0, 38.0, 40.0, 40.0, 24.0, 11.0, 13.0, 11.0, 8.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.0646219253540039, -0.06247138977050781, -0.06032085418701172, -0.058170318603515625, -0.05601978302001953, -0.05386924743652344, -0.051718711853027344, -0.04956817626953125, -0.047417640686035156, -0.04526710510253906, -0.04311656951904297, -0.040966033935546875, -0.03881549835205078, -0.03666496276855469, -0.034514427185058594, -0.0323638916015625, -0.030213356018066406, -0.028062820434570312, -0.02591228485107422, -0.023761749267578125, -0.02161121368408203, -0.019460678100585938, -0.017310142517089844, -0.01515960693359375, -0.013009071350097656, -0.010858535766601562, -0.008708000183105469, -0.006557464599609375, -0.004406929016113281, -0.0022563934326171875, -0.00010585784912109375, 0.002044677734375, 0.004195213317871094, 0.0063457489013671875, 0.008496284484863281, 0.010646820068359375, 0.012797355651855469, 0.014947891235351562, 0.017098426818847656, 0.01924896240234375, 0.021399497985839844, 0.023550033569335938, 0.02570056915283203, 0.027851104736328125, 0.03000164031982422, 0.03215217590332031, 0.034302711486816406, 0.0364532470703125, 0.038603782653808594, 0.04075431823730469, 0.04290485382080078, 0.045055389404296875, 0.04720592498779297, 0.04935646057128906, 0.051506996154785156, 0.05365753173828125, 0.055808067321777344, 0.05795860290527344, 0.06010913848876953, 0.062259674072265625, 0.06441020965576172, 0.06656074523925781, 0.0687112808227539, 0.07086181640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 8.0, 13.0, 12.0, 18.0, 22.0, 37.0, 63.0, 106.0, 143.0, 238.0, 414.0, 643.0, 1226.0, 2431.0, 6082.0, 22004.0, 120942.0, 665288.0, 183789.0, 30848.0, 7946.0, 2981.0, 1439.0, 743.0, 420.0, 273.0, 139.0, 84.0, 81.0, 38.0, 31.0, 15.0, 10.0, 14.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.1500263214111328, -0.14416885375976562, -0.13831138610839844, -0.13245391845703125, -0.12659645080566406, -0.12073898315429688, -0.11488151550292969, -0.1090240478515625, -0.10316658020019531, -0.09730911254882812, -0.09145164489746094, -0.08559417724609375, -0.07973670959472656, -0.07387924194335938, -0.06802177429199219, -0.062164306640625, -0.05630683898925781, -0.050449371337890625, -0.04459190368652344, -0.03873443603515625, -0.03287696838378906, -0.027019500732421875, -0.021162033081054688, -0.0153045654296875, -0.009447097778320312, -0.003589630126953125, 0.0022678375244140625, 0.00812530517578125, 0.013982772827148438, 0.019840240478515625, 0.025697708129882812, 0.03155517578125, 0.03741264343261719, 0.043270111083984375, 0.04912757873535156, 0.05498504638671875, 0.06084251403808594, 0.06669998168945312, 0.07255744934082031, 0.0784149169921875, 0.08427238464355469, 0.09012985229492188, 0.09598731994628906, 0.10184478759765625, 0.10770225524902344, 0.11355972290039062, 0.11941719055175781, 0.125274658203125, 0.1311321258544922, 0.13698959350585938, 0.14284706115722656, 0.14870452880859375, 0.15456199645996094, 0.16041946411132812, 0.1662769317626953, 0.1721343994140625, 0.1779918670654297, 0.18384933471679688, 0.18970680236816406, 0.19556427001953125, 0.20142173767089844, 0.20727920532226562, 0.2131366729736328, 0.218994140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 8.0, 6.0, 2.0, 7.0, 6.0, 10.0, 6.0, 10.0, 12.0, 15.0, 16.0, 17.0, 28.0, 26.0, 29.0, 42.0, 53.0, 41.0, 61.0, 47.0, 55.0, 59.0, 43.0, 59.0, 37.0, 38.0, 35.0, 31.0, 37.0, 20.0, 22.0, 29.0, 20.0, 11.0, 19.0, 14.0, 10.0, 5.0, 6.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.1720256805419922, -0.16643905639648438, -0.16085243225097656, -0.15526580810546875, -0.14967918395996094, -0.14409255981445312, -0.1385059356689453, -0.1329193115234375, -0.1273326873779297, -0.12174606323242188, -0.11615943908691406, -0.11057281494140625, -0.10498619079589844, -0.09939956665039062, -0.09381294250488281, -0.088226318359375, -0.08263969421386719, -0.07705307006835938, -0.07146644592285156, -0.06587982177734375, -0.06029319763183594, -0.054706573486328125, -0.04911994934082031, -0.0435333251953125, -0.03794670104980469, -0.032360076904296875, -0.026773452758789062, -0.02118682861328125, -0.015600204467773438, -0.010013580322265625, -0.0044269561767578125, 0.00115966796875, 0.0067462921142578125, 0.012332916259765625, 0.017919540405273438, 0.02350616455078125, 0.029092788696289062, 0.034679412841796875, 0.04026603698730469, 0.0458526611328125, 0.05143928527832031, 0.057025909423828125, 0.06261253356933594, 0.06819915771484375, 0.07378578186035156, 0.07937240600585938, 0.08495903015136719, 0.090545654296875, 0.09613227844238281, 0.10171890258789062, 0.10730552673339844, 0.11289215087890625, 0.11847877502441406, 0.12406539916992188, 0.1296520233154297, 0.1352386474609375, 0.1408252716064453, 0.14641189575195312, 0.15199851989746094, 0.15758514404296875, 0.16317176818847656, 0.16875839233398438, 0.1743450164794922, 0.179931640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 11.0, 10.0, 17.0, 12.0, 21.0, 53.0, 53.0, 67.0, 99.0, 172.0, 263.0, 373.0, 619.0, 1050.0, 1916.0, 3761.0, 7689.0, 18586.0, 59474.0, 528296.0, 337695.0, 54933.0, 17690.0, 7552.0, 3511.0, 1827.0, 1095.0, 625.0, 345.0, 234.0, 132.0, 100.0, 62.0, 49.0, 45.0, 30.0, 22.0, 15.0, 10.0, 9.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1080322265625, -0.10465335845947266, -0.10127449035644531, -0.09789562225341797, -0.09451675415039062, -0.09113788604736328, -0.08775901794433594, -0.0843801498413086, -0.08100128173828125, -0.0776224136352539, -0.07424354553222656, -0.07086467742919922, -0.06748580932617188, -0.06410694122314453, -0.06072807312011719, -0.057349205017089844, -0.0539703369140625, -0.050591468811035156, -0.04721260070800781, -0.04383373260498047, -0.040454864501953125, -0.03707599639892578, -0.03369712829589844, -0.030318260192871094, -0.02693939208984375, -0.023560523986816406, -0.020181655883789062, -0.01680278778076172, -0.013423919677734375, -0.010045051574707031, -0.0066661834716796875, -0.0032873153686523438, 9.1552734375e-05, 0.0034704208374023438, 0.0068492889404296875, 0.010228157043457031, 0.013607025146484375, 0.01698589324951172, 0.020364761352539062, 0.023743629455566406, 0.02712249755859375, 0.030501365661621094, 0.03388023376464844, 0.03725910186767578, 0.040637969970703125, 0.04401683807373047, 0.04739570617675781, 0.050774574279785156, 0.0541534423828125, 0.057532310485839844, 0.06091117858886719, 0.06429004669189453, 0.06766891479492188, 0.07104778289794922, 0.07442665100097656, 0.0778055191040039, 0.08118438720703125, 0.0845632553100586, 0.08794212341308594, 0.09132099151611328, 0.09469985961914062, 0.09807872772216797, 0.10145759582519531, 0.10483646392822266, 0.10821533203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 6.0, 1.0, 12.0, 10.0, 9.0, 12.0, 30.0, 46.0, 121.0, 246.0, 237.0, 111.0, 44.0, 34.0, 20.0, 12.0, 7.0, 3.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.632638931274414e-05, -5.363300442695618e-05, -5.093961954116821e-05, -4.824623465538025e-05, -4.5552849769592285e-05, -4.285946488380432e-05, -4.016607999801636e-05, -3.7472695112228394e-05, -3.477931022644043e-05, -3.2085925340652466e-05, -2.9392540454864502e-05, -2.6699155569076538e-05, -2.4005770683288574e-05, -2.131238579750061e-05, -1.8619000911712646e-05, -1.5925616025924683e-05, -1.3232231140136719e-05, -1.0538846254348755e-05, -7.845461368560791e-06, -5.152076482772827e-06, -2.4586915969848633e-06, 2.3469328880310059e-07, 2.9280781745910645e-06, 5.621463060379028e-06, 8.314847946166992e-06, 1.1008232831954956e-05, 1.370161771774292e-05, 1.6395002603530884e-05, 1.9088387489318848e-05, 2.178177237510681e-05, 2.4475157260894775e-05, 2.716854214668274e-05, 2.9861927032470703e-05, 3.255531191825867e-05, 3.524869680404663e-05, 3.7942081689834595e-05, 4.063546657562256e-05, 4.332885146141052e-05, 4.6022236347198486e-05, 4.871562123298645e-05, 5.1409006118774414e-05, 5.410239100456238e-05, 5.679577589035034e-05, 5.9489160776138306e-05, 6.218254566192627e-05, 6.487593054771423e-05, 6.75693154335022e-05, 7.026270031929016e-05, 7.295608520507812e-05, 7.564947009086609e-05, 7.834285497665405e-05, 8.103623986244202e-05, 8.372962474822998e-05, 8.642300963401794e-05, 8.911639451980591e-05, 9.180977940559387e-05, 9.450316429138184e-05, 9.71965491771698e-05, 9.988993406295776e-05, 0.00010258331894874573, 0.00010527670383453369, 0.00010797008872032166, 0.00011066347360610962, 0.00011335685849189758, 0.00011605024337768555]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 7.0, 4.0, 10.0, 12.0, 26.0, 29.0, 52.0, 102.0, 172.0, 337.0, 753.0, 1527.0, 3616.0, 9565.0, 30340.0, 147542.0, 701484.0, 113653.0, 25204.0, 8085.0, 3211.0, 1420.0, 638.0, 308.0, 196.0, 103.0, 53.0, 39.0, 19.0, 16.0, 14.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10662841796875, -0.10300540924072266, -0.09938240051269531, -0.09575939178466797, -0.09213638305664062, -0.08851337432861328, -0.08489036560058594, -0.0812673568725586, -0.07764434814453125, -0.0740213394165039, -0.07039833068847656, -0.06677532196044922, -0.06315231323242188, -0.05952930450439453, -0.05590629577636719, -0.052283287048339844, -0.0486602783203125, -0.045037269592285156, -0.04141426086425781, -0.03779125213623047, -0.034168243408203125, -0.03054523468017578, -0.026922225952148438, -0.023299217224121094, -0.01967620849609375, -0.016053199768066406, -0.012430191040039062, -0.008807182312011719, -0.005184173583984375, -0.0015611648559570312, 0.0020618438720703125, 0.005684852600097656, 0.009307861328125, 0.012930870056152344, 0.016553878784179688, 0.02017688751220703, 0.023799896240234375, 0.02742290496826172, 0.031045913696289062, 0.034668922424316406, 0.03829193115234375, 0.041914939880371094, 0.04553794860839844, 0.04916095733642578, 0.052783966064453125, 0.05640697479248047, 0.06002998352050781, 0.06365299224853516, 0.0672760009765625, 0.07089900970458984, 0.07452201843261719, 0.07814502716064453, 0.08176803588867188, 0.08539104461669922, 0.08901405334472656, 0.0926370620727539, 0.09626007080078125, 0.0998830795288086, 0.10350608825683594, 0.10712909698486328, 0.11075210571289062, 0.11437511444091797, 0.11799812316894531, 0.12162113189697266, 0.125244140625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 2.0, 3.0, 8.0, 8.0, 10.0, 16.0, 15.0, 19.0, 26.0, 30.0, 43.0, 42.0, 59.0, 99.0, 114.0, 125.0, 94.0, 66.0, 65.0, 36.0, 23.0, 21.0, 11.0, 11.0, 11.0, 8.0, 5.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.102783203125, -0.09965229034423828, -0.09652137756347656, -0.09339046478271484, -0.09025955200195312, -0.0871286392211914, -0.08399772644042969, -0.08086681365966797, -0.07773590087890625, -0.07460498809814453, -0.07147407531738281, -0.0683431625366211, -0.06521224975585938, -0.062081336975097656, -0.05895042419433594, -0.05581951141357422, -0.0526885986328125, -0.04955768585205078, -0.04642677307128906, -0.043295860290527344, -0.040164947509765625, -0.037034034729003906, -0.03390312194824219, -0.03077220916748047, -0.02764129638671875, -0.02451038360595703, -0.021379470825195312, -0.018248558044433594, -0.015117645263671875, -0.011986732482910156, -0.008855819702148438, -0.005724906921386719, -0.002593994140625, 0.0005369186401367188, 0.0036678314208984375, 0.006798744201660156, 0.009929656982421875, 0.013060569763183594, 0.016191482543945312, 0.01932239532470703, 0.02245330810546875, 0.02558422088623047, 0.028715133666992188, 0.031846046447753906, 0.034976959228515625, 0.038107872009277344, 0.04123878479003906, 0.04436969757080078, 0.0475006103515625, 0.05063152313232422, 0.05376243591308594, 0.056893348693847656, 0.060024261474609375, 0.0631551742553711, 0.06628608703613281, 0.06941699981689453, 0.07254791259765625, 0.07567882537841797, 0.07880973815917969, 0.0819406509399414, 0.08507156372070312, 0.08820247650146484, 0.09133338928222656, 0.09446430206298828, 0.09759521484375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 9.0, 15.0, 38.0, 74.0, 142.0, 291.0, 174.0, 116.0, 48.0, 40.0, 30.0, 9.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.921916127204895, -0.8487141728401184, -0.7755122184753418, -0.70231032371521, -0.6291083097457886, -0.5559064149856567, -0.4827044606208801, -0.4095025062561035, -0.3363005518913269, -0.2630985975265503, -0.18989665806293488, -0.11669471859931946, -0.04349276423454285, 0.029709190130233765, 0.10291111469268799, 0.1761130690574646, 0.2493150234222412, 0.3225169777870178, 0.39571893215179443, 0.46892085671424866, 0.5421228408813477, 0.6153247356414795, 0.6885266900062561, 0.7617286443710327, 0.8349305987358093, 0.9081325531005859, 0.9813345074653625, 1.0545364618301392, 1.127738356590271, 1.2009403705596924, 1.2741422653198242, 1.347344160079956, 1.420546293258667, 1.4937481880187988, 1.5669502019882202, 1.640152096748352, 1.7133541107177734, 1.7865560054779053, 1.859757900238037, 1.9329599142074585, 2.00616192817688, 2.0793638229370117, 2.1525657176971436, 2.2257678508758545, 2.2989697456359863, 2.372171640396118, 2.44537353515625, 2.518575668334961, 2.5917773246765137, 2.6649792194366455, 2.7381811141967773, 2.8113832473754883, 2.88458514213562, 2.957787036895752, 3.030988931655884, 3.1041908264160156, 3.1773929595947266, 3.2505948543548584, 3.3237967491149902, 3.396998882293701, 3.470200777053833, 3.543402671813965, 3.6166045665740967, 3.6898064613342285, 3.7630085945129395]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 6.0, 8.0, 5.0, 7.0, 16.0, 12.0, 11.0, 19.0, 12.0, 27.0, 28.0, 22.0, 28.0, 21.0, 29.0, 35.0, 36.0, 63.0, 48.0, 56.0, 69.0, 61.0, 48.0, 45.0, 33.0, 17.0, 27.0, 20.0, 28.0, 10.0, 20.0, 14.0, 16.0, 11.0, 13.0, 15.0, 8.0, 11.0, 8.0, 3.0, 5.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5277829766273499, -0.5080547332763672, -0.4883265495300293, -0.468598335981369, -0.44887012243270874, -0.42914190888404846, -0.4094136953353882, -0.3896854817867279, -0.3699572682380676, -0.35022905468940735, -0.33050084114074707, -0.3107726275920868, -0.2910444140434265, -0.27131620049476624, -0.25158798694610596, -0.23185977339744568, -0.2121315598487854, -0.19240334630012512, -0.17267513275146484, -0.15294691920280457, -0.1332187056541443, -0.11349049210548401, -0.09376227855682373, -0.07403406500816345, -0.054305851459503174, -0.034577637910842896, -0.014849424362182617, 0.004878789186477661, 0.02460700273513794, 0.04433521628379822, 0.0640634298324585, 0.08379164338111877, 0.10351985692977905, 0.12324807047843933, 0.1429762840270996, 0.1627044975757599, 0.18243271112442017, 0.20216092467308044, 0.22188913822174072, 0.241617351770401, 0.2613455653190613, 0.28107377886772156, 0.30080199241638184, 0.3205302059650421, 0.3402584195137024, 0.35998663306236267, 0.37971484661102295, 0.3994430601596832, 0.4191712737083435, 0.4388994872570038, 0.45862770080566406, 0.47835591435432434, 0.4980841279029846, 0.5178123712539673, 0.5375405550003052, 0.5572687387466431, 0.5769969820976257, 0.5967252254486084, 0.6164534091949463, 0.6361815929412842, 0.6559098362922668, 0.6756380796432495, 0.6953662633895874, 0.7150944471359253, 0.734822690486908]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 11.0, 9.0, 16.0, 22.0, 36.0, 58.0, 120.0, 175.0, 307.0, 556.0, 1082.0, 2289.0, 5295.0, 13931.0, 50576.0, 519344.0, 3175678.0, 359415.0, 43759.0, 12481.0, 4781.0, 2145.0, 1026.0, 504.0, 273.0, 162.0, 84.0, 58.0, 23.0, 21.0, 14.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09942626953125, -0.09566593170166016, -0.09190559387207031, -0.08814525604248047, -0.08438491821289062, -0.08062458038330078, -0.07686424255371094, -0.0731039047241211, -0.06934356689453125, -0.0655832290649414, -0.06182289123535156, -0.05806255340576172, -0.054302215576171875, -0.05054187774658203, -0.04678153991699219, -0.043021202087402344, -0.0392608642578125, -0.035500526428222656, -0.03174018859863281, -0.02797985076904297, -0.024219512939453125, -0.02045917510986328, -0.016698837280273438, -0.012938499450683594, -0.00917816162109375, -0.005417823791503906, -0.0016574859619140625, 0.0021028518676757812, 0.005863189697265625, 0.009623527526855469, 0.013383865356445312, 0.017144203186035156, 0.020904541015625, 0.024664878845214844, 0.028425216674804688, 0.03218555450439453, 0.035945892333984375, 0.03970623016357422, 0.04346656799316406, 0.047226905822753906, 0.05098724365234375, 0.054747581481933594, 0.05850791931152344, 0.06226825714111328, 0.06602859497070312, 0.06978893280029297, 0.07354927062988281, 0.07730960845947266, 0.0810699462890625, 0.08483028411865234, 0.08859062194824219, 0.09235095977783203, 0.09611129760742188, 0.09987163543701172, 0.10363197326660156, 0.1073923110961914, 0.11115264892578125, 0.1149129867553711, 0.11867332458496094, 0.12243366241455078, 0.12619400024414062, 0.12995433807373047, 0.1337146759033203, 0.13747501373291016, 0.1412353515625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 13.0, 8.0, 10.0, 16.0, 34.0, 23.0, 27.0, 39.0, 48.0, 49.0, 43.0, 57.0, 73.0, 64.0, 66.0, 45.0, 65.0, 58.0, 50.0, 51.0, 32.0, 33.0, 20.0, 25.0, 18.0, 10.0, 6.0, 8.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058502197265625, -0.05660295486450195, -0.054703712463378906, -0.05280447006225586, -0.05090522766113281, -0.049005985260009766, -0.04710674285888672, -0.04520750045776367, -0.043308258056640625, -0.04140901565551758, -0.03950977325439453, -0.037610530853271484, -0.03571128845214844, -0.03381204605102539, -0.031912803649902344, -0.030013561248779297, -0.02811431884765625, -0.026215076446533203, -0.024315834045410156, -0.02241659164428711, -0.020517349243164062, -0.018618106842041016, -0.01671886444091797, -0.014819622039794922, -0.012920379638671875, -0.011021137237548828, -0.009121894836425781, -0.007222652435302734, -0.0053234100341796875, -0.0034241676330566406, -0.0015249252319335938, 0.0003743171691894531, 0.0022735595703125, 0.004172801971435547, 0.006072044372558594, 0.00797128677368164, 0.009870529174804688, 0.011769771575927734, 0.013669013977050781, 0.015568256378173828, 0.017467498779296875, 0.019366741180419922, 0.02126598358154297, 0.023165225982666016, 0.025064468383789062, 0.02696371078491211, 0.028862953186035156, 0.030762195587158203, 0.03266143798828125, 0.0345606803894043, 0.036459922790527344, 0.03835916519165039, 0.04025840759277344, 0.042157649993896484, 0.04405689239501953, 0.04595613479614258, 0.047855377197265625, 0.04975461959838867, 0.05165386199951172, 0.053553104400634766, 0.05545234680175781, 0.05735158920288086, 0.059250831604003906, 0.06115007400512695, 0.06304931640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 13.0, 8.0, 23.0, 35.0, 48.0, 79.0, 107.0, 228.0, 465.0, 1492.0, 7988.0, 436368.0, 3727803.0, 16342.0, 1968.0, 618.0, 285.0, 158.0, 75.0, 64.0, 48.0, 26.0, 14.0, 5.0, 8.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6552734375, -0.638946533203125, -0.62261962890625, -0.606292724609375, -0.5899658203125, -0.573638916015625, -0.55731201171875, -0.540985107421875, -0.524658203125, -0.508331298828125, -0.49200439453125, -0.475677490234375, -0.4593505859375, -0.443023681640625, -0.42669677734375, -0.410369873046875, -0.39404296875, -0.377716064453125, -0.36138916015625, -0.345062255859375, -0.3287353515625, -0.312408447265625, -0.29608154296875, -0.279754638671875, -0.263427734375, -0.247100830078125, -0.23077392578125, -0.214447021484375, -0.1981201171875, -0.181793212890625, -0.16546630859375, -0.149139404296875, -0.1328125, -0.116485595703125, -0.10015869140625, -0.083831787109375, -0.0675048828125, -0.051177978515625, -0.03485107421875, -0.018524169921875, -0.002197265625, 0.014129638671875, 0.03045654296875, 0.046783447265625, 0.0631103515625, 0.079437255859375, 0.09576416015625, 0.112091064453125, 0.12841796875, 0.144744873046875, 0.16107177734375, 0.177398681640625, 0.1937255859375, 0.210052490234375, 0.22637939453125, 0.242706298828125, 0.259033203125, 0.275360107421875, 0.29168701171875, 0.308013916015625, 0.3243408203125, 0.340667724609375, 0.35699462890625, 0.373321533203125, 0.3896484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 8.0, 8.0, 23.0, 22.0, 42.0, 104.0, 222.0, 807.0, 1819.0, 648.0, 186.0, 98.0, 28.0, 18.0, 13.0, 10.0, 7.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.27841949462890625, -0.2670440673828125, -0.25566864013671875, -0.244293212890625, -0.23291778564453125, -0.2215423583984375, -0.21016693115234375, -0.19879150390625, -0.18741607666015625, -0.1760406494140625, -0.16466522216796875, -0.153289794921875, -0.14191436767578125, -0.1305389404296875, -0.11916351318359375, -0.1077880859375, -0.09641265869140625, -0.0850372314453125, -0.07366180419921875, -0.062286376953125, -0.05091094970703125, -0.0395355224609375, -0.02816009521484375, -0.01678466796875, -0.00540924072265625, 0.0059661865234375, 0.01734161376953125, 0.028717041015625, 0.04009246826171875, 0.0514678955078125, 0.06284332275390625, 0.07421875, 0.08559417724609375, 0.0969696044921875, 0.10834503173828125, 0.119720458984375, 0.13109588623046875, 0.1424713134765625, 0.15384674072265625, 0.16522216796875, 0.17659759521484375, 0.1879730224609375, 0.19934844970703125, 0.210723876953125, 0.22209930419921875, 0.2334747314453125, 0.24485015869140625, 0.2562255859375, 0.26760101318359375, 0.2789764404296875, 0.29035186767578125, 0.301727294921875, 0.31310272216796875, 0.3244781494140625, 0.33585357666015625, 0.34722900390625, 0.35860443115234375, 0.3699798583984375, 0.38135528564453125, 0.392730712890625, 0.40410614013671875, 0.4154815673828125, 0.42685699462890625, 0.438232421875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 3.0, 11.0, 17.0, 26.0, 67.0, 75.0, 132.0, 162.0, 177.0, 132.0, 88.0, 46.0, 24.0, 11.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1492176055908203, -2.08962345123291, -2.030029058456421, -1.9704347848892212, -1.9108405113220215, -1.8512463569641113, -1.7916520833969116, -1.732057809829712, -1.6724635362625122, -1.6128692626953125, -1.5532749891281128, -1.493680715560913, -1.434086561203003, -1.3744921684265137, -1.3148980140686035, -1.2553037405014038, -1.195709466934204, -1.1361151933670044, -1.0765209197998047, -1.016926646232605, -0.95733243227005, -0.8977381587028503, -0.8381439447402954, -0.7785496711730957, -0.718955397605896, -0.6593611240386963, -0.5997668504714966, -0.5401726365089417, -0.48057836294174194, -0.42098408937454224, -0.3613898456096649, -0.3017956018447876, -0.2422013282775879, -0.18260706961154938, -0.12301281094551086, -0.06341855227947235, -0.003824293613433838, 0.05576997995376587, 0.11536422371864319, 0.1749584674835205, 0.23455274105072021, 0.2941470146179199, 0.35374125838279724, 0.41333550214767456, 0.47292977571487427, 0.532524049282074, 0.5921182632446289, 0.6517125368118286, 0.7113068103790283, 0.770901083946228, 0.8304953575134277, 0.8900895714759827, 0.9496838450431824, 1.0092780590057373, 1.068872332572937, 1.1284666061401367, 1.1880608797073364, 1.2476551532745361, 1.3072494268417358, 1.3668437004089355, 1.4264378547668457, 1.486032247543335, 1.5456264019012451, 1.6052206754684448, 1.6648149490356445]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 1.0, 3.0, 6.0, 7.0, 8.0, 6.0, 7.0, 21.0, 13.0, 21.0, 21.0, 36.0, 37.0, 40.0, 48.0, 45.0, 58.0, 51.0, 50.0, 86.0, 55.0, 46.0, 56.0, 46.0, 45.0, 39.0, 35.0, 21.0, 23.0, 19.0, 15.0, 11.0, 5.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-1.2590217590332031, -1.2276915311813354, -1.1963613033294678, -1.1650310754776, -1.1337008476257324, -1.1023706197738647, -1.071040391921997, -1.0397100448608398, -1.0083799362182617, -0.977049708366394, -0.9457194805145264, -0.9143892526626587, -0.883059024810791, -0.8517287969589233, -0.8203985095024109, -0.7890682816505432, -0.7577379941940308, -0.7264077663421631, -0.6950775384902954, -0.6637473106384277, -0.6324170827865601, -0.6010868549346924, -0.5697565674781799, -0.5384263396263123, -0.5070961117744446, -0.4757658839225769, -0.44443565607070923, -0.41310539841651917, -0.3817751705646515, -0.3504449427127838, -0.31911468505859375, -0.2877844572067261, -0.25645434856414795, -0.22512412071228027, -0.1937938779592514, -0.16246363520622253, -0.13113340735435486, -0.09980317950248718, -0.06847293674945831, -0.03714269399642944, -0.005812466144561768, 0.025517769157886505, 0.05684800446033478, 0.08817823976278305, 0.11950847506523132, 0.150838702917099, 0.18216894567012787, 0.21349918842315674, 0.24482941627502441, 0.2761596441268921, 0.30748987197875977, 0.33882012963294983, 0.3701503574848175, 0.4014805853366852, 0.43281084299087524, 0.4641410708427429, 0.4954712986946106, 0.5268015265464783, 0.558131754398346, 0.5894619822502136, 0.6207922697067261, 0.6521224975585938, 0.6834527254104614, 0.7147829532623291, 0.7461131811141968]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 10.0, 11.0, 15.0, 25.0, 42.0, 66.0, 91.0, 155.0, 292.0, 478.0, 935.0, 1874.0, 3767.0, 8351.0, 19776.0, 49096.0, 132324.0, 325008.0, 306566.0, 121025.0, 45058.0, 18388.0, 7847.0, 3581.0, 1798.0, 851.0, 461.0, 265.0, 132.0, 85.0, 62.0, 38.0, 17.0, 16.0, 12.0, 8.0, 6.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0970458984375, -0.09380626678466797, -0.09056663513183594, -0.0873270034790039, -0.08408737182617188, -0.08084774017333984, -0.07760810852050781, -0.07436847686767578, -0.07112884521484375, -0.06788921356201172, -0.06464958190917969, -0.061409950256347656, -0.058170318603515625, -0.054930686950683594, -0.05169105529785156, -0.04845142364501953, -0.0452117919921875, -0.04197216033935547, -0.03873252868652344, -0.035492897033691406, -0.032253265380859375, -0.029013633728027344, -0.025774002075195312, -0.02253437042236328, -0.01929473876953125, -0.01605510711669922, -0.012815475463867188, -0.009575843811035156, -0.006336212158203125, -0.0030965805053710938, 0.0001430511474609375, 0.0033826828002929688, 0.006622314453125, 0.009861946105957031, 0.013101577758789062, 0.016341209411621094, 0.019580841064453125, 0.022820472717285156, 0.026060104370117188, 0.02929973602294922, 0.03253936767578125, 0.03577899932861328, 0.03901863098144531, 0.042258262634277344, 0.045497894287109375, 0.048737525939941406, 0.05197715759277344, 0.05521678924560547, 0.0584564208984375, 0.06169605255126953, 0.06493568420410156, 0.0681753158569336, 0.07141494750976562, 0.07465457916259766, 0.07789421081542969, 0.08113384246826172, 0.08437347412109375, 0.08761310577392578, 0.09085273742675781, 0.09409236907958984, 0.09733200073242188, 0.1005716323852539, 0.10381126403808594, 0.10705089569091797, 0.11029052734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 7.0, 11.0, 17.0, 20.0, 26.0, 45.0, 63.0, 67.0, 81.0, 79.0, 84.0, 104.0, 63.0, 79.0, 70.0, 50.0, 37.0, 27.0, 21.0, 24.0, 13.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.11124992370605469, -0.10775375366210938, -0.10425758361816406, -0.10076141357421875, -0.09726524353027344, -0.09376907348632812, -0.09027290344238281, -0.0867767333984375, -0.08328056335449219, -0.07978439331054688, -0.07628822326660156, -0.07279205322265625, -0.06929588317871094, -0.06579971313476562, -0.06230354309082031, -0.058807373046875, -0.05531120300292969, -0.051815032958984375, -0.04831886291503906, -0.04482269287109375, -0.04132652282714844, -0.037830352783203125, -0.03433418273925781, -0.0308380126953125, -0.027341842651367188, -0.023845672607421875, -0.020349502563476562, -0.01685333251953125, -0.013357162475585938, -0.009860992431640625, -0.0063648223876953125, -0.00286865234375, 0.0006275177001953125, 0.004123687744140625, 0.0076198577880859375, 0.01111602783203125, 0.014612197875976562, 0.018108367919921875, 0.021604537963867188, 0.0251007080078125, 0.028596878051757812, 0.032093048095703125, 0.03558921813964844, 0.03908538818359375, 0.04258155822753906, 0.046077728271484375, 0.04957389831542969, 0.053070068359375, 0.05656623840332031, 0.060062408447265625, 0.06355857849121094, 0.06705474853515625, 0.07055091857910156, 0.07404708862304688, 0.07754325866699219, 0.0810394287109375, 0.08453559875488281, 0.08803176879882812, 0.09152793884277344, 0.09502410888671875, 0.09852027893066406, 0.10201644897460938, 0.10551261901855469, 0.1090087890625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 0.0, 5.0, 4.0, 5.0, 9.0, 18.0, 13.0, 18.0, 27.0, 38.0, 44.0, 48.0, 63.0, 101.0, 99.0, 148.0, 198.0, 346.0, 495.0, 959.0, 1987.0, 5122.0, 16516.0, 71382.0, 594630.0, 284675.0, 50793.0, 12739.0, 4057.0, 1650.0, 828.0, 438.0, 275.0, 200.0, 137.0, 133.0, 77.0, 47.0, 44.0, 43.0, 37.0, 21.0, 24.0, 9.0, 12.0, 8.0, 6.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.19970703125, -0.19344520568847656, -0.18718338012695312, -0.1809215545654297, -0.17465972900390625, -0.1683979034423828, -0.16213607788085938, -0.15587425231933594, -0.1496124267578125, -0.14335060119628906, -0.13708877563476562, -0.1308269500732422, -0.12456512451171875, -0.11830329895019531, -0.11204147338867188, -0.10577964782714844, -0.099517822265625, -0.09325599670410156, -0.08699417114257812, -0.08073234558105469, -0.07447052001953125, -0.06820869445800781, -0.061946868896484375, -0.05568504333496094, -0.0494232177734375, -0.04316139221191406, -0.036899566650390625, -0.030637741088867188, -0.02437591552734375, -0.018114089965820312, -0.011852264404296875, -0.0055904388427734375, 0.00067138671875, 0.0069332122802734375, 0.013195037841796875, 0.019456863403320312, 0.02571868896484375, 0.03198051452636719, 0.038242340087890625, 0.04450416564941406, 0.0507659912109375, 0.05702781677246094, 0.06328964233398438, 0.06955146789550781, 0.07581329345703125, 0.08207511901855469, 0.08833694458007812, 0.09459877014160156, 0.100860595703125, 0.10712242126464844, 0.11338424682617188, 0.11964607238769531, 0.12590789794921875, 0.1321697235107422, 0.13843154907226562, 0.14469337463378906, 0.1509552001953125, 0.15721702575683594, 0.16347885131835938, 0.1697406768798828, 0.17600250244140625, 0.1822643280029297, 0.18852615356445312, 0.19478797912597656, 0.2010498046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 1.0, 3.0, 7.0, 11.0, 6.0, 7.0, 8.0, 8.0, 18.0, 20.0, 26.0, 25.0, 28.0, 43.0, 31.0, 54.0, 66.0, 58.0, 66.0, 60.0, 61.0, 68.0, 65.0, 47.0, 50.0, 26.0, 28.0, 20.0, 23.0, 10.0, 14.0, 8.0, 12.0, 7.0, 4.0, 2.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3291015625, -0.31844329833984375, -0.3077850341796875, -0.29712677001953125, -0.286468505859375, -0.27581024169921875, -0.2651519775390625, -0.25449371337890625, -0.24383544921875, -0.23317718505859375, -0.2225189208984375, -0.21186065673828125, -0.201202392578125, -0.19054412841796875, -0.1798858642578125, -0.16922760009765625, -0.1585693359375, -0.14791107177734375, -0.1372528076171875, -0.12659454345703125, -0.115936279296875, -0.10527801513671875, -0.0946197509765625, -0.08396148681640625, -0.07330322265625, -0.06264495849609375, -0.0519866943359375, -0.04132843017578125, -0.030670166015625, -0.02001190185546875, -0.0093536376953125, 0.00130462646484375, 0.011962890625, 0.02262115478515625, 0.0332794189453125, 0.04393768310546875, 0.054595947265625, 0.06525421142578125, 0.0759124755859375, 0.08657073974609375, 0.09722900390625, 0.10788726806640625, 0.1185455322265625, 0.12920379638671875, 0.139862060546875, 0.15052032470703125, 0.1611785888671875, 0.17183685302734375, 0.1824951171875, 0.19315338134765625, 0.2038116455078125, 0.21446990966796875, 0.225128173828125, 0.23578643798828125, 0.2464447021484375, 0.25710296630859375, 0.26776123046875, 0.27841949462890625, 0.2890777587890625, 0.29973602294921875, 0.310394287109375, 0.32105255126953125, 0.3317108154296875, 0.34236907958984375, 0.35302734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 12.0, 12.0, 18.0, 14.0, 34.0, 54.0, 78.0, 106.0, 152.0, 217.0, 310.0, 544.0, 884.0, 1669.0, 3331.0, 6897.0, 16744.0, 47835.0, 181686.0, 641542.0, 95207.0, 29360.0, 11084.0, 5016.0, 2416.0, 1337.0, 749.0, 430.0, 265.0, 167.0, 106.0, 79.0, 57.0, 48.0, 26.0, 18.0, 12.0, 9.0, 11.0, 5.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.07965087890625, -0.07710456848144531, -0.07455825805664062, -0.07201194763183594, -0.06946563720703125, -0.06691932678222656, -0.06437301635742188, -0.06182670593261719, -0.0592803955078125, -0.05673408508300781, -0.054187774658203125, -0.05164146423339844, -0.04909515380859375, -0.04654884338378906, -0.044002532958984375, -0.04145622253417969, -0.038909912109375, -0.03636360168457031, -0.033817291259765625, -0.03127098083496094, -0.02872467041015625, -0.026178359985351562, -0.023632049560546875, -0.021085739135742188, -0.0185394287109375, -0.015993118286132812, -0.013446807861328125, -0.010900497436523438, -0.00835418701171875, -0.0058078765869140625, -0.003261566162109375, -0.0007152557373046875, 0.0018310546875, 0.0043773651123046875, 0.006923675537109375, 0.009469985961914062, 0.01201629638671875, 0.014562606811523438, 0.017108917236328125, 0.019655227661132812, 0.0222015380859375, 0.024747848510742188, 0.027294158935546875, 0.029840469360351562, 0.03238677978515625, 0.03493309020996094, 0.037479400634765625, 0.04002571105957031, 0.042572021484375, 0.04511833190917969, 0.047664642333984375, 0.05021095275878906, 0.05275726318359375, 0.05530357360839844, 0.057849884033203125, 0.06039619445800781, 0.0629425048828125, 0.06548881530761719, 0.06803512573242188, 0.07058143615722656, 0.07312774658203125, 0.07567405700683594, 0.07822036743164062, 0.08076667785644531, 0.08331298828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 23.0, 23.0, 20.0, 37.0, 64.0, 93.0, 158.0, 216.0, 107.0, 67.0, 54.0, 33.0, 19.0, 18.0, 13.0, 14.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26173210144043e-05, -4.105735570192337e-05, -3.9497390389442444e-05, -3.793742507696152e-05, -3.637745976448059e-05, -3.4817494451999664e-05, -3.325752913951874e-05, -3.169756382703781e-05, -3.0137598514556885e-05, -2.8577633202075958e-05, -2.7017667889595032e-05, -2.5457702577114105e-05, -2.389773726463318e-05, -2.2337771952152252e-05, -2.0777806639671326e-05, -1.92178413271904e-05, -1.7657876014709473e-05, -1.6097910702228546e-05, -1.453794538974762e-05, -1.2977980077266693e-05, -1.1418014764785767e-05, -9.85804945230484e-06, -8.298084139823914e-06, -6.738118827342987e-06, -5.1781535148620605e-06, -3.618188202381134e-06, -2.0582228899002075e-06, -4.98257577419281e-07, 1.0617077350616455e-06, 2.621673047542572e-06, 4.1816383600234985e-06, 5.741603672504425e-06, 7.3015689849853516e-06, 8.861534297466278e-06, 1.0421499609947205e-05, 1.1981464922428131e-05, 1.3541430234909058e-05, 1.5101395547389984e-05, 1.666136085987091e-05, 1.8221326172351837e-05, 1.9781291484832764e-05, 2.134125679731369e-05, 2.2901222109794617e-05, 2.4461187422275543e-05, 2.602115273475647e-05, 2.7581118047237396e-05, 2.9141083359718323e-05, 3.070104867219925e-05, 3.2261013984680176e-05, 3.38209792971611e-05, 3.538094460964203e-05, 3.6940909922122955e-05, 3.850087523460388e-05, 4.006084054708481e-05, 4.1620805859565735e-05, 4.318077117204666e-05, 4.474073648452759e-05, 4.6300701797008514e-05, 4.786066710948944e-05, 4.942063242197037e-05, 5.0980597734451294e-05, 5.254056304693222e-05, 5.410052835941315e-05, 5.5660493671894073e-05, 5.7220458984375e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 6.0, 12.0, 19.0, 17.0, 22.0, 48.0, 46.0, 85.0, 142.0, 237.0, 423.0, 754.0, 1530.0, 3734.0, 11035.0, 41468.0, 248678.0, 651641.0, 64090.0, 15686.0, 4883.0, 1882.0, 959.0, 446.0, 252.0, 146.0, 99.0, 74.0, 39.0, 29.0, 22.0, 12.0, 10.0, 8.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11883544921875, -0.11535453796386719, -0.11187362670898438, -0.10839271545410156, -0.10491180419921875, -0.10143089294433594, -0.09794998168945312, -0.09446907043457031, -0.0909881591796875, -0.08750724792480469, -0.08402633666992188, -0.08054542541503906, -0.07706451416015625, -0.07358360290527344, -0.07010269165039062, -0.06662178039550781, -0.063140869140625, -0.05965995788574219, -0.056179046630859375, -0.05269813537597656, -0.04921722412109375, -0.04573631286621094, -0.042255401611328125, -0.03877449035644531, -0.0352935791015625, -0.03181266784667969, -0.028331756591796875, -0.024850845336914062, -0.02136993408203125, -0.017889022827148438, -0.014408111572265625, -0.010927200317382812, -0.0074462890625, -0.0039653778076171875, -0.000484466552734375, 0.0029964447021484375, 0.00647735595703125, 0.009958267211914062, 0.013439178466796875, 0.016920089721679688, 0.0204010009765625, 0.023881912231445312, 0.027362823486328125, 0.030843734741210938, 0.03432464599609375, 0.03780555725097656, 0.041286468505859375, 0.04476737976074219, 0.048248291015625, 0.05172920227050781, 0.055210113525390625, 0.05869102478027344, 0.06217193603515625, 0.06565284729003906, 0.06913375854492188, 0.07261466979980469, 0.0760955810546875, 0.07957649230957031, 0.08305740356445312, 0.08653831481933594, 0.09001922607421875, 0.09350013732910156, 0.09698104858398438, 0.10046195983886719, 0.10394287109375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 12.0, 21.0, 13.0, 10.0, 24.0, 28.0, 38.0, 39.0, 62.0, 96.0, 104.0, 117.0, 110.0, 74.0, 58.0, 43.0, 39.0, 24.0, 17.0, 12.0, 10.0, 7.0, 7.0, 8.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.098388671875, -0.09525871276855469, -0.09212875366210938, -0.08899879455566406, -0.08586883544921875, -0.08273887634277344, -0.07960891723632812, -0.07647895812988281, -0.0733489990234375, -0.07021903991699219, -0.06708908081054688, -0.06395912170410156, -0.06082916259765625, -0.05769920349121094, -0.054569244384765625, -0.05143928527832031, -0.048309326171875, -0.04517936706542969, -0.042049407958984375, -0.03891944885253906, -0.03578948974609375, -0.03265953063964844, -0.029529571533203125, -0.026399612426757812, -0.0232696533203125, -0.020139694213867188, -0.017009735107421875, -0.013879776000976562, -0.01074981689453125, -0.0076198577880859375, -0.004489898681640625, -0.0013599395751953125, 0.00177001953125, 0.0048999786376953125, 0.008029937744140625, 0.011159896850585938, 0.01428985595703125, 0.017419815063476562, 0.020549774169921875, 0.023679733276367188, 0.0268096923828125, 0.029939651489257812, 0.033069610595703125, 0.03619956970214844, 0.03932952880859375, 0.04245948791503906, 0.045589447021484375, 0.04871940612792969, 0.051849365234375, 0.05497932434082031, 0.058109283447265625, 0.06123924255371094, 0.06436920166015625, 0.06749916076660156, 0.07062911987304688, 0.07375907897949219, 0.0768890380859375, 0.08001899719238281, 0.08314895629882812, 0.08627891540527344, 0.08940887451171875, 0.09253883361816406, 0.09566879272460938, 0.09879875183105469, 0.1019287109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 11.0, 9.0, 17.0, 26.0, 42.0, 92.0, 200.0, 279.0, 141.0, 90.0, 40.0, 19.0, 14.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3500641584396362, -1.283121109008789, -1.2161781787872314, -1.1492351293563843, -1.082292079925537, -1.01534903049469, -0.9484060406684875, -0.8814630508422852, -0.814520001411438, -0.7475769519805908, -0.6806339621543884, -0.613690972328186, -0.5467479228973389, -0.4798049032688141, -0.4128618836402893, -0.3459188640117645, -0.27897584438323975, -0.21203282475471497, -0.14508980512619019, -0.0781467854976654, -0.011203765869140625, 0.055739253759384155, 0.12268227338790894, 0.18962529301643372, 0.2565683126449585, 0.3235113322734833, 0.39045435190200806, 0.45739737153053284, 0.5243403911590576, 0.5912834405899048, 0.6582264304161072, 0.7251694202423096, 0.7921123504638672, 0.8590553998947144, 0.9259983897209167, 0.9929413795471191, 1.0598844289779663, 1.1268274784088135, 1.193770408630371, 1.2607134580612183, 1.3276565074920654, 1.3945995569229126, 1.4615426063537598, 1.5284855365753174, 1.5954285860061646, 1.6623716354370117, 1.7293145656585693, 1.7962576150894165, 1.8632006645202637, 1.9301437139511108, 1.997086763381958, 2.0640296936035156, 2.1309728622436523, 2.19791579246521, 2.2648587226867676, 2.3318018913269043, 2.398744821548462, 2.4656877517700195, 2.5326309204101562, 2.599573850631714, 2.6665167808532715, 2.733459949493408, 2.800402879714966, 2.8673460483551025, 2.93428897857666]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 7.0, 7.0, 11.0, 15.0, 12.0, 19.0, 14.0, 13.0, 18.0, 21.0, 41.0, 34.0, 35.0, 45.0, 69.0, 125.0, 123.0, 72.0, 51.0, 34.0, 26.0, 42.0, 36.0, 24.0, 21.0, 15.0, 14.0, 13.0, 12.0, 5.0, 8.0, 8.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4415346384048462, -1.391816258430481, -1.3420979976654053, -1.29237961769104, -1.2426612377166748, -1.1929428577423096, -1.1432244777679443, -1.0935062170028687, -1.0437878370285034, -0.9940694570541382, -0.9443511366844177, -0.8946328163146973, -0.844914436340332, -0.7951960563659668, -0.7454777359962463, -0.6957594156265259, -0.6460410356521606, -0.5963226556777954, -0.546604335308075, -0.4968859851360321, -0.44716763496398926, -0.3974492847919464, -0.34773093461990356, -0.2980125844478607, -0.24829423427581787, -0.19857588410377502, -0.14885753393173218, -0.09913918375968933, -0.049420833587646484, 0.0002975165843963623, 0.05001586675643921, 0.09973421692848206, 0.14945244789123535, 0.1991707980632782, 0.24888914823532104, 0.2986074984073639, 0.34832584857940674, 0.3980441987514496, 0.44776254892349243, 0.4974808990955353, 0.5471992492675781, 0.5969176292419434, 0.6466359496116638, 0.6963542699813843, 0.7460726499557495, 0.7957910299301147, 0.8455093502998352, 0.8952276706695557, 0.9449460506439209, 0.9946644306182861, 1.0443828105926514, 1.094101071357727, 1.1438194513320923, 1.1935378313064575, 1.2432560920715332, 1.2929744720458984, 1.3426928520202637, 1.392411231994629, 1.4421296119689941, 1.4918478727340698, 1.541566252708435, 1.5912846326828003, 1.641002893447876, 1.6907212734222412, 1.7404396533966064]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 3.0, 4.0, 6.0, 18.0, 20.0, 13.0, 29.0, 38.0, 58.0, 66.0, 101.0, 160.0, 226.0, 335.0, 583.0, 937.0, 1772.0, 3460.0, 7569.0, 21318.0, 87077.0, 753221.0, 2771771.0, 453153.0, 62343.0, 16984.0, 6350.0, 2928.0, 1469.0, 781.0, 485.0, 337.0, 204.0, 134.0, 94.0, 70.0, 54.0, 39.0, 24.0, 21.0, 6.0, 7.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1102294921875, -0.10647964477539062, -0.10272979736328125, -0.09897994995117188, -0.0952301025390625, -0.09148025512695312, -0.08773040771484375, -0.08398056030273438, -0.080230712890625, -0.07648086547851562, -0.07273101806640625, -0.06898117065429688, -0.0652313232421875, -0.061481475830078125, -0.05773162841796875, -0.053981781005859375, -0.05023193359375, -0.046482086181640625, -0.04273223876953125, -0.038982391357421875, -0.0352325439453125, -0.031482696533203125, -0.02773284912109375, -0.023983001708984375, -0.020233154296875, -0.016483306884765625, -0.01273345947265625, -0.008983612060546875, -0.0052337646484375, -0.001483917236328125, 0.00226593017578125, 0.006015777587890625, 0.009765625, 0.013515472412109375, 0.01726531982421875, 0.021015167236328125, 0.0247650146484375, 0.028514862060546875, 0.03226470947265625, 0.036014556884765625, 0.039764404296875, 0.043514251708984375, 0.04726409912109375, 0.051013946533203125, 0.0547637939453125, 0.058513641357421875, 0.06226348876953125, 0.06601333618164062, 0.06976318359375, 0.07351303100585938, 0.07726287841796875, 0.08101272583007812, 0.0847625732421875, 0.08851242065429688, 0.09226226806640625, 0.09601211547851562, 0.099761962890625, 0.10351181030273438, 0.10726165771484375, 0.11101150512695312, 0.1147613525390625, 0.11851119995117188, 0.12226104736328125, 0.12601089477539062, 0.1297607421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 8.0, 6.0, 13.0, 11.0, 14.0, 27.0, 24.0, 47.0, 36.0, 52.0, 47.0, 69.0, 67.0, 50.0, 61.0, 55.0, 51.0, 62.0, 53.0, 38.0, 34.0, 31.0, 22.0, 19.0, 19.0, 19.0, 13.0, 16.0, 2.0, 7.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0731201171875, -0.07063007354736328, -0.06814002990722656, -0.06564998626708984, -0.06315994262695312, -0.060669898986816406, -0.05817985534667969, -0.05568981170654297, -0.05319976806640625, -0.05070972442626953, -0.04821968078613281, -0.045729637145996094, -0.043239593505859375, -0.040749549865722656, -0.03825950622558594, -0.03576946258544922, -0.0332794189453125, -0.03078937530517578, -0.028299331665039062, -0.025809288024902344, -0.023319244384765625, -0.020829200744628906, -0.018339157104492188, -0.01584911346435547, -0.01335906982421875, -0.010869026184082031, -0.008378982543945312, -0.005888938903808594, -0.003398895263671875, -0.0009088516235351562, 0.0015811920166015625, 0.004071235656738281, 0.006561279296875, 0.009051322937011719, 0.011541366577148438, 0.014031410217285156, 0.016521453857421875, 0.019011497497558594, 0.021501541137695312, 0.02399158477783203, 0.02648162841796875, 0.02897167205810547, 0.03146171569824219, 0.033951759338378906, 0.036441802978515625, 0.038931846618652344, 0.04142189025878906, 0.04391193389892578, 0.0464019775390625, 0.04889202117919922, 0.05138206481933594, 0.053872108459472656, 0.056362152099609375, 0.058852195739746094, 0.06134223937988281, 0.06383228302001953, 0.06632232666015625, 0.06881237030029297, 0.07130241394042969, 0.0737924575805664, 0.07628250122070312, 0.07877254486083984, 0.08126258850097656, 0.08375263214111328, 0.08624267578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 3.0, 13.0, 8.0, 12.0, 17.0, 20.0, 23.0, 23.0, 40.0, 61.0, 92.0, 124.0, 231.0, 418.0, 885.0, 2782.0, 11186.0, 118319.0, 3923930.0, 119940.0, 11372.0, 2741.0, 936.0, 402.0, 212.0, 116.0, 107.0, 72.0, 42.0, 27.0, 31.0, 21.0, 12.0, 13.0, 10.0, 9.0, 8.0, 3.0, 5.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37548828125, -0.3631782531738281, -0.35086822509765625, -0.3385581970214844, -0.3262481689453125, -0.3139381408691406, -0.30162811279296875, -0.2893180847167969, -0.277008056640625, -0.2646980285644531, -0.25238800048828125, -0.24007797241210938, -0.2277679443359375, -0.21545791625976562, -0.20314788818359375, -0.19083786010742188, -0.17852783203125, -0.16621780395507812, -0.15390777587890625, -0.14159774780273438, -0.1292877197265625, -0.11697769165039062, -0.10466766357421875, -0.09235763549804688, -0.080047607421875, -0.06773757934570312, -0.05542755126953125, -0.043117523193359375, -0.0308074951171875, -0.018497467041015625, -0.00618743896484375, 0.006122589111328125, 0.0184326171875, 0.030742645263671875, 0.04305267333984375, 0.055362701416015625, 0.0676727294921875, 0.07998275756835938, 0.09229278564453125, 0.10460281372070312, 0.116912841796875, 0.12922286987304688, 0.14153289794921875, 0.15384292602539062, 0.1661529541015625, 0.17846298217773438, 0.19077301025390625, 0.20308303833007812, 0.21539306640625, 0.22770309448242188, 0.24001312255859375, 0.2523231506347656, 0.2646331787109375, 0.2769432067871094, 0.28925323486328125, 0.3015632629394531, 0.313873291015625, 0.3261833190917969, 0.33849334716796875, 0.3508033752441406, 0.3631134033203125, 0.3754234313964844, 0.38773345947265625, 0.4000434875488281, 0.412353515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 9.0, 10.0, 18.0, 25.0, 19.0, 35.0, 48.0, 81.0, 153.0, 327.0, 684.0, 1072.0, 819.0, 364.0, 123.0, 85.0, 58.0, 31.0, 30.0, 22.0, 6.0, 15.0, 6.0, 2.0, 5.0, 2.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2759552001953125, -0.267486572265625, -0.2590179443359375, -0.25054931640625, -0.2420806884765625, -0.233612060546875, -0.2251434326171875, -0.2166748046875, -0.2082061767578125, -0.199737548828125, -0.1912689208984375, -0.18280029296875, -0.1743316650390625, -0.165863037109375, -0.1573944091796875, -0.14892578125, -0.1404571533203125, -0.131988525390625, -0.1235198974609375, -0.11505126953125, -0.1065826416015625, -0.098114013671875, -0.0896453857421875, -0.0811767578125, -0.0727081298828125, -0.064239501953125, -0.0557708740234375, -0.04730224609375, -0.0388336181640625, -0.030364990234375, -0.0218963623046875, -0.013427734375, -0.0049591064453125, 0.003509521484375, 0.0119781494140625, 0.02044677734375, 0.0289154052734375, 0.037384033203125, 0.0458526611328125, 0.0543212890625, 0.0627899169921875, 0.071258544921875, 0.0797271728515625, 0.08819580078125, 0.0966644287109375, 0.105133056640625, 0.1136016845703125, 0.1220703125, 0.1305389404296875, 0.139007568359375, 0.1474761962890625, 0.15594482421875, 0.1644134521484375, 0.172882080078125, 0.1813507080078125, 0.1898193359375, 0.1982879638671875, 0.206756591796875, 0.2152252197265625, 0.22369384765625, 0.2321624755859375, 0.240631103515625, 0.2490997314453125, 0.257568359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 13.0, 11.0, 24.0, 18.0, 32.0, 54.0, 88.0, 120.0, 139.0, 122.0, 109.0, 85.0, 58.0, 30.0, 22.0, 17.0, 10.0, 8.0, 11.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.3009722232818604, -2.2464120388031006, -2.19185209274292, -2.13729190826416, -2.0827317237854004, -2.0281715393066406, -1.97361159324646, -1.9190514087677002, -1.86449134349823, -1.8099312782287598, -1.75537109375, -1.7008110284805298, -1.6462509632110596, -1.5916907787322998, -1.5371307134628296, -1.4825706481933594, -1.4280104637145996, -1.3734503984451294, -1.3188902139663696, -1.2643301486968994, -1.2097699642181396, -1.1552098989486694, -1.1006498336791992, -1.0460896492004395, -0.9915295839309692, -0.9369694590568542, -0.8824093341827393, -0.827849268913269, -0.773289144039154, -0.7187290191650391, -0.6641689538955688, -0.6096088290214539, -0.5550485849380493, -0.5004884600639343, -0.4459283649921417, -0.3913682699203491, -0.33680814504623413, -0.28224802017211914, -0.22768792510032654, -0.17312783002853394, -0.11856770515441895, -0.06400759518146515, -0.009447485208511353, 0.045112624764442444, 0.09967273473739624, 0.15423285961151123, 0.20879295468330383, 0.26335304975509644, 0.3179131746292114, 0.3724732995033264, 0.427033394575119, 0.4815934896469116, 0.5361536145210266, 0.5907137393951416, 0.6452738046646118, 0.6998339295387268, 0.7543940544128418, 0.8089541792869568, 0.8635143041610718, 0.918074369430542, 0.972634494304657, 1.027194619178772, 1.0817546844482422, 1.136314868927002, 1.1908749341964722]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 4.0, 8.0, 8.0, 8.0, 11.0, 17.0, 13.0, 25.0, 27.0, 21.0, 27.0, 20.0, 36.0, 55.0, 45.0, 40.0, 43.0, 51.0, 33.0, 55.0, 47.0, 64.0, 36.0, 36.0, 36.0, 33.0, 25.0, 20.0, 17.0, 23.0, 17.0, 21.0, 15.0, 10.0, 8.0, 4.0, 8.0, 6.0, 4.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8975585103034973, -0.8654941320419312, -0.8334298133850098, -0.8013654351234436, -0.7693010568618774, -0.737236738204956, -0.7051723599433899, -0.6731079816818237, -0.6410436630249023, -0.6089792847633362, -0.5769149661064148, -0.5448505878448486, -0.5127862095832825, -0.4807218611240387, -0.4486575126647949, -0.41659313440322876, -0.3845287561416626, -0.3524644076824188, -0.32040002942085266, -0.2883356809616089, -0.2562713027000427, -0.22420695424079895, -0.19214260578155518, -0.1600782424211502, -0.12801387906074524, -0.09594951570034027, -0.0638851597905159, -0.03182080388069153, 0.00024355947971343994, 0.03230792284011841, 0.06437227129936218, 0.09643663465976715, 0.1285010576248169, 0.16056542098522186, 0.19262978434562683, 0.2246941328048706, 0.25675851106643677, 0.28882285952568054, 0.3208872079849243, 0.3529515862464905, 0.38501593470573425, 0.417080283164978, 0.4491446614265442, 0.48120900988578796, 0.5132733583450317, 0.5453377366065979, 0.5774021148681641, 0.6094664335250854, 0.6415308117866516, 0.6735951900482178, 0.7056595087051392, 0.7377238869667053, 0.7697882652282715, 0.8018525838851929, 0.833916962146759, 0.8659813404083252, 0.8980456590652466, 0.9301100373268127, 0.9621743559837341, 0.9942387342453003, 1.0263030529022217, 1.0583674907684326, 1.090431809425354, 1.1224961280822754, 1.1545605659484863]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 12.0, 15.0, 17.0, 39.0, 37.0, 56.0, 72.0, 99.0, 174.0, 225.0, 322.0, 490.0, 694.0, 979.0, 1605.0, 2425.0, 3772.0, 5986.0, 9937.0, 16910.0, 30614.0, 57933.0, 113342.0, 211565.0, 254755.0, 156972.0, 80670.0, 41698.0, 22810.0, 12978.0, 7671.0, 4888.0, 2968.0, 1817.0, 1295.0, 816.0, 593.0, 392.0, 271.0, 204.0, 144.0, 104.0, 54.0, 42.0, 29.0, 24.0, 8.0, 14.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0902099609375, -0.08749675750732422, -0.08478355407714844, -0.08207035064697266, -0.07935714721679688, -0.0766439437866211, -0.07393074035644531, -0.07121753692626953, -0.06850433349609375, -0.06579113006591797, -0.06307792663574219, -0.060364723205566406, -0.057651519775390625, -0.054938316345214844, -0.05222511291503906, -0.04951190948486328, -0.0467987060546875, -0.04408550262451172, -0.04137229919433594, -0.038659095764160156, -0.035945892333984375, -0.033232688903808594, -0.030519485473632812, -0.02780628204345703, -0.02509307861328125, -0.02237987518310547, -0.019666671752929688, -0.016953468322753906, -0.014240264892578125, -0.011527061462402344, -0.008813858032226562, -0.006100654602050781, -0.003387451171875, -0.0006742477416992188, 0.0020389556884765625, 0.004752159118652344, 0.007465362548828125, 0.010178565979003906, 0.012891769409179688, 0.015604972839355469, 0.01831817626953125, 0.02103137969970703, 0.023744583129882812, 0.026457786560058594, 0.029170989990234375, 0.031884193420410156, 0.03459739685058594, 0.03731060028076172, 0.0400238037109375, 0.04273700714111328, 0.04545021057128906, 0.048163414001464844, 0.050876617431640625, 0.053589820861816406, 0.05630302429199219, 0.05901622772216797, 0.06172943115234375, 0.06444263458251953, 0.06715583801269531, 0.0698690414428711, 0.07258224487304688, 0.07529544830322266, 0.07800865173339844, 0.08072185516357422, 0.08343505859375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 8.0, 5.0, 15.0, 5.0, 12.0, 16.0, 26.0, 26.0, 27.0, 44.0, 38.0, 48.0, 34.0, 43.0, 47.0, 55.0, 43.0, 55.0, 48.0, 44.0, 40.0, 52.0, 39.0, 29.0, 38.0, 20.0, 17.0, 18.0, 14.0, 15.0, 13.0, 17.0, 9.0, 9.0, 6.0, 9.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08453369140625, -0.08198738098144531, -0.07944107055664062, -0.07689476013183594, -0.07434844970703125, -0.07180213928222656, -0.06925582885742188, -0.06670951843261719, -0.0641632080078125, -0.06161689758300781, -0.059070587158203125, -0.05652427673339844, -0.05397796630859375, -0.05143165588378906, -0.048885345458984375, -0.04633903503417969, -0.043792724609375, -0.04124641418457031, -0.038700103759765625, -0.03615379333496094, -0.03360748291015625, -0.031061172485351562, -0.028514862060546875, -0.025968551635742188, -0.0234222412109375, -0.020875930786132812, -0.018329620361328125, -0.015783309936523438, -0.01323699951171875, -0.010690689086914062, -0.008144378662109375, -0.0055980682373046875, -0.0030517578125, -0.0005054473876953125, 0.002040863037109375, 0.0045871734619140625, 0.00713348388671875, 0.009679794311523438, 0.012226104736328125, 0.014772415161132812, 0.0173187255859375, 0.019865036010742188, 0.022411346435546875, 0.024957656860351562, 0.02750396728515625, 0.030050277709960938, 0.032596588134765625, 0.03514289855957031, 0.037689208984375, 0.04023551940917969, 0.042781829833984375, 0.04532814025878906, 0.04787445068359375, 0.05042076110839844, 0.052967071533203125, 0.05551338195800781, 0.0580596923828125, 0.06060600280761719, 0.06315231323242188, 0.06569862365722656, 0.06824493408203125, 0.07079124450683594, 0.07333755493164062, 0.07588386535644531, 0.07843017578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 4.0, 6.0, 5.0, 3.0, 9.0, 12.0, 21.0, 27.0, 31.0, 39.0, 66.0, 92.0, 102.0, 139.0, 229.0, 337.0, 544.0, 832.0, 1464.0, 3211.0, 9598.0, 52700.0, 706125.0, 233028.0, 27849.0, 6420.0, 2364.0, 1233.0, 674.0, 405.0, 285.0, 180.0, 153.0, 95.0, 62.0, 58.0, 33.0, 33.0, 19.0, 19.0, 12.0, 10.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.26708984375, -0.2581367492675781, -0.24918365478515625, -0.24023056030273438, -0.2312774658203125, -0.22232437133789062, -0.21337127685546875, -0.20441818237304688, -0.195465087890625, -0.18651199340820312, -0.17755889892578125, -0.16860580444335938, -0.1596527099609375, -0.15069961547851562, -0.14174652099609375, -0.13279342651367188, -0.12384033203125, -0.11488723754882812, -0.10593414306640625, -0.09698104858398438, -0.0880279541015625, -0.07907485961914062, -0.07012176513671875, -0.061168670654296875, -0.052215576171875, -0.043262481689453125, -0.03430938720703125, -0.025356292724609375, -0.0164031982421875, -0.007450103759765625, 0.00150299072265625, 0.010456085205078125, 0.0194091796875, 0.028362274169921875, 0.03731536865234375, 0.046268463134765625, 0.0552215576171875, 0.06417465209960938, 0.07312774658203125, 0.08208084106445312, 0.091033935546875, 0.09998703002929688, 0.10894012451171875, 0.11789321899414062, 0.1268463134765625, 0.13579940795898438, 0.14475250244140625, 0.15370559692382812, 0.16265869140625, 0.17161178588867188, 0.18056488037109375, 0.18951797485351562, 0.1984710693359375, 0.20742416381835938, 0.21637725830078125, 0.22533035278320312, 0.234283447265625, 0.24323654174804688, 0.25218963623046875, 0.2611427307128906, 0.2700958251953125, 0.2790489196777344, 0.28800201416015625, 0.2969551086425781, 0.305908203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 7.0, 8.0, 19.0, 19.0, 22.0, 26.0, 26.0, 38.0, 40.0, 64.0, 53.0, 52.0, 76.0, 64.0, 43.0, 64.0, 48.0, 39.0, 44.0, 46.0, 32.0, 41.0, 18.0, 22.0, 16.0, 13.0, 9.0, 8.0, 9.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.379150390625, -0.3677101135253906, -0.35626983642578125, -0.3448295593261719, -0.3333892822265625, -0.3219490051269531, -0.31050872802734375, -0.2990684509277344, -0.287628173828125, -0.2761878967285156, -0.26474761962890625, -0.2533073425292969, -0.2418670654296875, -0.23042678833007812, -0.21898651123046875, -0.20754623413085938, -0.19610595703125, -0.18466567993164062, -0.17322540283203125, -0.16178512573242188, -0.1503448486328125, -0.13890457153320312, -0.12746429443359375, -0.11602401733398438, -0.104583740234375, -0.09314346313476562, -0.08170318603515625, -0.07026290893554688, -0.0588226318359375, -0.047382354736328125, -0.03594207763671875, -0.024501800537109375, -0.0130615234375, -0.001621246337890625, 0.00981903076171875, 0.021259307861328125, 0.0326995849609375, 0.044139862060546875, 0.05558013916015625, 0.06702041625976562, 0.078460693359375, 0.08990097045898438, 0.10134124755859375, 0.11278152465820312, 0.1242218017578125, 0.13566207885742188, 0.14710235595703125, 0.15854263305664062, 0.16998291015625, 0.18142318725585938, 0.19286346435546875, 0.20430374145507812, 0.2157440185546875, 0.22718429565429688, 0.23862457275390625, 0.2500648498535156, 0.261505126953125, 0.2729454040527344, 0.28438568115234375, 0.2958259582519531, 0.3072662353515625, 0.3187065124511719, 0.33014678955078125, 0.3415870666503906, 0.35302734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 5.0, 11.0, 26.0, 36.0, 47.0, 114.0, 195.0, 364.0, 813.0, 1869.0, 5121.0, 18912.0, 107361.0, 787274.0, 99978.0, 18007.0, 5061.0, 1773.0, 769.0, 388.0, 146.0, 91.0, 59.0, 39.0, 30.0, 13.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10211181640625, -0.09886837005615234, -0.09562492370605469, -0.09238147735595703, -0.08913803100585938, -0.08589458465576172, -0.08265113830566406, -0.0794076919555664, -0.07616424560546875, -0.0729207992553711, -0.06967735290527344, -0.06643390655517578, -0.06319046020507812, -0.05994701385498047, -0.05670356750488281, -0.053460121154785156, -0.0502166748046875, -0.046973228454589844, -0.04372978210449219, -0.04048633575439453, -0.037242889404296875, -0.03399944305419922, -0.030755996704101562, -0.027512550354003906, -0.02426910400390625, -0.021025657653808594, -0.017782211303710938, -0.014538764953613281, -0.011295318603515625, -0.008051872253417969, -0.0048084259033203125, -0.0015649795532226562, 0.001678466796875, 0.004921913146972656, 0.008165359497070312, 0.011408805847167969, 0.014652252197265625, 0.01789569854736328, 0.021139144897460938, 0.024382591247558594, 0.02762603759765625, 0.030869483947753906, 0.03411293029785156, 0.03735637664794922, 0.040599822998046875, 0.04384326934814453, 0.04708671569824219, 0.050330162048339844, 0.0535736083984375, 0.056817054748535156, 0.06006050109863281, 0.06330394744873047, 0.06654739379882812, 0.06979084014892578, 0.07303428649902344, 0.0762777328491211, 0.07952117919921875, 0.0827646255493164, 0.08600807189941406, 0.08925151824951172, 0.09249496459960938, 0.09573841094970703, 0.09898185729980469, 0.10222530364990234, 0.10546875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 13.0, 12.0, 8.0, 14.0, 21.0, 36.0, 46.0, 63.0, 123.0, 168.0, 164.0, 100.0, 79.0, 38.0, 27.0, 25.0, 23.0, 6.0, 10.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.568431854248047e-05, -6.36884942650795e-05, -6.169266998767853e-05, -5.969684571027756e-05, -5.770102143287659e-05, -5.5705197155475616e-05, -5.3709372878074646e-05, -5.1713548600673676e-05, -4.9717724323272705e-05, -4.7721900045871735e-05, -4.5726075768470764e-05, -4.3730251491069794e-05, -4.173442721366882e-05, -3.973860293626785e-05, -3.774277865886688e-05, -3.574695438146591e-05, -3.375113010406494e-05, -3.175530582666397e-05, -2.9759481549263e-05, -2.776365727186203e-05, -2.576783299446106e-05, -2.377200871706009e-05, -2.177618443965912e-05, -1.9780360162258148e-05, -1.7784535884857178e-05, -1.5788711607456207e-05, -1.3792887330055237e-05, -1.1797063052654266e-05, -9.801238775253296e-06, -7.805414497852325e-06, -5.809590220451355e-06, -3.8137659430503845e-06, -1.817941665649414e-06, 1.778826117515564e-07, 2.173706889152527e-06, 4.169531166553497e-06, 6.165355443954468e-06, 8.161179721355438e-06, 1.0157003998756409e-05, 1.2152828276157379e-05, 1.414865255355835e-05, 1.614447683095932e-05, 1.814030110836029e-05, 2.013612538576126e-05, 2.213194966316223e-05, 2.4127773940563202e-05, 2.6123598217964172e-05, 2.8119422495365143e-05, 3.0115246772766113e-05, 3.2111071050167084e-05, 3.4106895327568054e-05, 3.6102719604969025e-05, 3.8098543882369995e-05, 4.0094368159770966e-05, 4.2090192437171936e-05, 4.4086016714572906e-05, 4.608184099197388e-05, 4.807766526937485e-05, 5.007348954677582e-05, 5.206931382417679e-05, 5.406513810157776e-05, 5.606096237897873e-05, 5.80567866563797e-05, 6.005261093378067e-05, 6.204843521118164e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 12.0, 15.0, 20.0, 34.0, 45.0, 53.0, 84.0, 130.0, 187.0, 310.0, 531.0, 978.0, 2078.0, 4736.0, 14105.0, 56923.0, 532869.0, 357634.0, 54650.0, 13876.0, 4829.0, 2075.0, 957.0, 542.0, 316.0, 168.0, 107.0, 77.0, 62.0, 39.0, 36.0, 17.0, 16.0, 14.0, 5.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.07916259765625, -0.07676315307617188, -0.07436370849609375, -0.07196426391601562, -0.0695648193359375, -0.06716537475585938, -0.06476593017578125, -0.062366485595703125, -0.059967041015625, -0.057567596435546875, -0.05516815185546875, -0.052768707275390625, -0.0503692626953125, -0.047969818115234375, -0.04557037353515625, -0.043170928955078125, -0.040771484375, -0.038372039794921875, -0.03597259521484375, -0.033573150634765625, -0.0311737060546875, -0.028774261474609375, -0.02637481689453125, -0.023975372314453125, -0.021575927734375, -0.019176483154296875, -0.01677703857421875, -0.014377593994140625, -0.0119781494140625, -0.009578704833984375, -0.00717926025390625, -0.004779815673828125, -0.00238037109375, 1.9073486328125e-05, 0.00241851806640625, 0.004817962646484375, 0.0072174072265625, 0.009616851806640625, 0.01201629638671875, 0.014415740966796875, 0.016815185546875, 0.019214630126953125, 0.02161407470703125, 0.024013519287109375, 0.0264129638671875, 0.028812408447265625, 0.03121185302734375, 0.033611297607421875, 0.0360107421875, 0.038410186767578125, 0.04080963134765625, 0.043209075927734375, 0.0456085205078125, 0.048007965087890625, 0.05040740966796875, 0.052806854248046875, 0.055206298828125, 0.057605743408203125, 0.06000518798828125, 0.062404632568359375, 0.0648040771484375, 0.06720352172851562, 0.06960296630859375, 0.07200241088867188, 0.07440185546875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 6.0, 4.0, 3.0, 7.0, 13.0, 19.0, 13.0, 23.0, 23.0, 25.0, 43.0, 35.0, 47.0, 64.0, 74.0, 81.0, 84.0, 61.0, 66.0, 52.0, 49.0, 31.0, 36.0, 15.0, 20.0, 18.0, 18.0, 11.0, 8.0, 5.0, 9.0, 4.0, 4.0, 6.0, 3.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05523681640625, -0.05351734161376953, -0.05179786682128906, -0.050078392028808594, -0.048358917236328125, -0.046639442443847656, -0.04491996765136719, -0.04320049285888672, -0.04148101806640625, -0.03976154327392578, -0.03804206848144531, -0.036322593688964844, -0.034603118896484375, -0.032883644104003906, -0.031164169311523438, -0.02944469451904297, -0.0277252197265625, -0.02600574493408203, -0.024286270141601562, -0.022566795349121094, -0.020847320556640625, -0.019127845764160156, -0.017408370971679688, -0.01568889617919922, -0.01396942138671875, -0.012249946594238281, -0.010530471801757812, -0.008810997009277344, -0.007091522216796875, -0.005372047424316406, -0.0036525726318359375, -0.0019330978393554688, -0.000213623046875, 0.0015058517456054688, 0.0032253265380859375, 0.004944801330566406, 0.006664276123046875, 0.008383750915527344, 0.010103225708007812, 0.011822700500488281, 0.01354217529296875, 0.015261650085449219, 0.016981124877929688, 0.018700599670410156, 0.020420074462890625, 0.022139549255371094, 0.023859024047851562, 0.02557849884033203, 0.0272979736328125, 0.02901744842529297, 0.030736923217773438, 0.032456398010253906, 0.034175872802734375, 0.035895347595214844, 0.03761482238769531, 0.03933429718017578, 0.04105377197265625, 0.04277324676513672, 0.04449272155761719, 0.046212196350097656, 0.047931671142578125, 0.049651145935058594, 0.05137062072753906, 0.05309009552001953, 0.0548095703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 11.0, 31.0, 44.0, 98.0, 174.0, 441.0, 118.0, 43.0, 15.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.390264511108398, -4.29127836227417, -4.192292213439941, -4.093306064605713, -3.9943201541900635, -3.895334005355835, -3.7963478565216064, -3.697361707687378, -3.5983755588531494, -3.499389410018921, -3.4004032611846924, -3.301417350769043, -3.2024312019348145, -3.103445053100586, -3.0044589042663574, -2.905472755432129, -2.8064866065979004, -2.707500457763672, -2.6085143089294434, -2.509528160095215, -2.4105422496795654, -2.311556100845337, -2.2125699520111084, -2.11358380317688, -2.0145978927612305, -1.915611743927002, -1.816625714302063, -1.7176395654678345, -1.618653416633606, -1.519667387008667, -1.4206812381744385, -1.32169508934021, -1.2227089405059814, -1.123722791671753, -1.024736762046814, -0.9257506132125854, -0.8267644643783569, -0.7277783751487732, -0.6287922859191895, -0.5298061370849609, -0.4308200478553772, -0.33183392882347107, -0.23284782469272614, -0.1338617205619812, -0.03487560153007507, 0.06411051750183105, 0.1630966067314148, 0.2620827555656433, 0.36106884479522705, 0.4600549638271332, 0.5590410828590393, 0.658027172088623, 0.7570133209228516, 0.8559994101524353, 0.954985499382019, 1.0539716482162476, 1.1529576778411865, 1.251943826675415, 1.350929856300354, 1.4499160051345825, 1.548902153968811, 1.64788818359375, 1.7468743324279785, 1.845860481262207, 1.9448466300964355]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 2.0, 8.0, 8.0, 12.0, 10.0, 7.0, 14.0, 22.0, 16.0, 14.0, 18.0, 32.0, 24.0, 26.0, 32.0, 34.0, 68.0, 134.0, 144.0, 56.0, 27.0, 29.0, 26.0, 26.0, 25.0, 25.0, 30.0, 14.0, 16.0, 18.0, 16.0, 9.0, 4.0, 9.0, 3.0, 10.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.2851760387420654, -1.2472974061965942, -1.209418773651123, -1.1715400218963623, -1.1336613893508911, -1.09578275680542, -1.0579041242599487, -1.0200254917144775, -0.9821467995643616, -0.9442681670188904, -0.9063894748687744, -0.8685108423233032, -0.830632209777832, -0.7927535176277161, -0.7548748850822449, -0.7169961929321289, -0.6791175603866577, -0.6412389278411865, -0.6033602356910706, -0.5654816031455994, -0.5276029109954834, -0.4897242784500122, -0.451845645904541, -0.41396698355674744, -0.37608832120895386, -0.3382096588611603, -0.3003309965133667, -0.2624523639678955, -0.22457370162010193, -0.18669503927230835, -0.14881639182567596, -0.11093774437904358, -0.07305920124053955, -0.03518054634332657, 0.0026981085538864136, 0.040576763451099396, 0.07845541834831238, 0.11633408069610596, 0.15421272814273834, 0.19209137558937073, 0.2299700379371643, 0.2678487002849579, 0.30572736263275146, 0.34360599517822266, 0.38148465752601624, 0.4193633198738098, 0.457241952419281, 0.4951206147670746, 0.5329992771148682, 0.5708779096603394, 0.6087566018104553, 0.6466352343559265, 0.6845139265060425, 0.7223925590515137, 0.7602711915969849, 0.798149824142456, 0.836028516292572, 0.8739071488380432, 0.9117858409881592, 0.9496644735336304, 0.9875431060791016, 1.0254218578338623, 1.0633004903793335, 1.1011791229248047, 1.1390577554702759]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 11.0, 6.0, 14.0, 16.0, 19.0, 40.0, 37.0, 62.0, 66.0, 134.0, 177.0, 323.0, 484.0, 889.0, 1599.0, 3223.0, 6657.0, 16197.0, 48869.0, 229510.0, 1439975.0, 2022303.0, 325743.0, 61789.0, 19702.0, 8020.0, 3826.0, 1876.0, 1040.0, 592.0, 344.0, 205.0, 176.0, 104.0, 73.0, 62.0, 29.0, 23.0, 19.0, 11.0, 11.0, 7.0, 5.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1588134765625, -0.15401649475097656, -0.14921951293945312, -0.1444225311279297, -0.13962554931640625, -0.1348285675048828, -0.13003158569335938, -0.12523460388183594, -0.1204376220703125, -0.11564064025878906, -0.11084365844726562, -0.10604667663574219, -0.10124969482421875, -0.09645271301269531, -0.09165573120117188, -0.08685874938964844, -0.082061767578125, -0.07726478576660156, -0.07246780395507812, -0.06767082214355469, -0.06287384033203125, -0.05807685852050781, -0.053279876708984375, -0.04848289489746094, -0.0436859130859375, -0.03888893127441406, -0.034091949462890625, -0.029294967651367188, -0.02449798583984375, -0.019701004028320312, -0.014904022216796875, -0.010107040405273438, -0.00531005859375, -0.0005130767822265625, 0.004283905029296875, 0.009080886840820312, 0.01387786865234375, 0.018674850463867188, 0.023471832275390625, 0.028268814086914062, 0.0330657958984375, 0.03786277770996094, 0.042659759521484375, 0.04745674133300781, 0.05225372314453125, 0.05705070495605469, 0.061847686767578125, 0.06664466857910156, 0.071441650390625, 0.07623863220214844, 0.08103561401367188, 0.08583259582519531, 0.09062957763671875, 0.09542655944824219, 0.10022354125976562, 0.10502052307128906, 0.1098175048828125, 0.11461448669433594, 0.11941146850585938, 0.12420845031738281, 0.12900543212890625, 0.1338024139404297, 0.13859939575195312, 0.14339637756347656, 0.148193359375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 6.0, 9.0, 12.0, 13.0, 9.0, 14.0, 22.0, 40.0, 29.0, 29.0, 42.0, 29.0, 43.0, 30.0, 48.0, 52.0, 50.0, 44.0, 51.0, 35.0, 47.0, 46.0, 31.0, 41.0, 25.0, 28.0, 18.0, 30.0, 16.0, 24.0, 13.0, 10.0, 14.0, 9.0, 7.0, 8.0, 4.0, 5.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05841064453125, -0.056298255920410156, -0.05418586730957031, -0.05207347869873047, -0.049961090087890625, -0.04784870147705078, -0.04573631286621094, -0.043623924255371094, -0.04151153564453125, -0.039399147033691406, -0.03728675842285156, -0.03517436981201172, -0.033061981201171875, -0.03094959259033203, -0.028837203979492188, -0.026724815368652344, -0.0246124267578125, -0.022500038146972656, -0.020387649536132812, -0.01827526092529297, -0.016162872314453125, -0.014050483703613281, -0.011938095092773438, -0.009825706481933594, -0.00771331787109375, -0.005600929260253906, -0.0034885406494140625, -0.0013761520385742188, 0.000736236572265625, 0.0028486251831054688, 0.0049610137939453125, 0.007073402404785156, 0.009185791015625, 0.011298179626464844, 0.013410568237304688, 0.015522956848144531, 0.017635345458984375, 0.01974773406982422, 0.021860122680664062, 0.023972511291503906, 0.02608489990234375, 0.028197288513183594, 0.030309677124023438, 0.03242206573486328, 0.034534454345703125, 0.03664684295654297, 0.03875923156738281, 0.040871620178222656, 0.0429840087890625, 0.045096397399902344, 0.04720878601074219, 0.04932117462158203, 0.051433563232421875, 0.05354595184326172, 0.05565834045410156, 0.057770729064941406, 0.05988311767578125, 0.061995506286621094, 0.06410789489746094, 0.06622028350830078, 0.06833267211914062, 0.07044506072998047, 0.07255744934082031, 0.07466983795166016, 0.0767822265625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 12.0, 16.0, 13.0, 33.0, 30.0, 54.0, 109.0, 156.0, 369.0, 780.0, 2334.0, 18238.0, 3986887.0, 177566.0, 5163.0, 1351.0, 529.0, 269.0, 131.0, 79.0, 54.0, 36.0, 22.0, 12.0, 13.0, 9.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.0927734375, -1.0645751953125, -1.036376953125, -1.0081787109375, -0.97998046875, -0.9517822265625, -0.923583984375, -0.8953857421875, -0.8671875, -0.8389892578125, -0.810791015625, -0.7825927734375, -0.75439453125, -0.7261962890625, -0.697998046875, -0.6697998046875, -0.6416015625, -0.6134033203125, -0.585205078125, -0.5570068359375, -0.52880859375, -0.5006103515625, -0.472412109375, -0.4442138671875, -0.416015625, -0.3878173828125, -0.359619140625, -0.3314208984375, -0.30322265625, -0.2750244140625, -0.246826171875, -0.2186279296875, -0.1904296875, -0.1622314453125, -0.134033203125, -0.1058349609375, -0.07763671875, -0.0494384765625, -0.021240234375, 0.0069580078125, 0.03515625, 0.0633544921875, 0.091552734375, 0.1197509765625, 0.14794921875, 0.1761474609375, 0.204345703125, 0.2325439453125, 0.2607421875, 0.2889404296875, 0.317138671875, 0.3453369140625, 0.37353515625, 0.4017333984375, 0.429931640625, 0.4581298828125, 0.486328125, 0.5145263671875, 0.542724609375, 0.5709228515625, 0.59912109375, 0.6273193359375, 0.655517578125, 0.6837158203125, 0.7119140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 7.0, 17.0, 27.0, 45.0, 90.0, 155.0, 304.0, 619.0, 1162.0, 852.0, 408.0, 170.0, 90.0, 41.0, 26.0, 21.0, 19.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378662109375, -0.3612556457519531, -0.34384918212890625, -0.3264427185058594, -0.3090362548828125, -0.2916297912597656, -0.27422332763671875, -0.2568168640136719, -0.239410400390625, -0.22200393676757812, -0.20459747314453125, -0.18719100952148438, -0.1697845458984375, -0.15237808227539062, -0.13497161865234375, -0.11756515502929688, -0.10015869140625, -0.08275222778320312, -0.06534576416015625, -0.047939300537109375, -0.0305328369140625, -0.013126373291015625, 0.00428009033203125, 0.021686553955078125, 0.039093017578125, 0.056499481201171875, 0.07390594482421875, 0.09131240844726562, 0.1087188720703125, 0.12612533569335938, 0.14353179931640625, 0.16093826293945312, 0.1783447265625, 0.19575119018554688, 0.21315765380859375, 0.23056411743164062, 0.2479705810546875, 0.2653770446777344, 0.28278350830078125, 0.3001899719238281, 0.317596435546875, 0.3350028991699219, 0.35240936279296875, 0.3698158264160156, 0.3872222900390625, 0.4046287536621094, 0.42203521728515625, 0.4394416809082031, 0.45684814453125, 0.4742546081542969, 0.49166107177734375, 0.5090675354003906, 0.5264739990234375, 0.5438804626464844, 0.5612869262695312, 0.5786933898925781, 0.596099853515625, 0.6135063171386719, 0.6309127807617188, 0.6483192443847656, 0.6657257080078125, 0.6831321716308594, 0.7005386352539062, 0.7179450988769531, 0.7353515625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 7.0, 10.0, 17.0, 37.0, 37.0, 58.0, 105.0, 178.0, 203.0, 152.0, 94.0, 38.0, 18.0, 13.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.293644905090332, -3.1518611907958984, -3.010077476501465, -2.8682937622070312, -2.7265100479125977, -2.584726333618164, -2.4429428577423096, -2.301159143447876, -2.1593754291534424, -2.017591714859009, -1.8758080005645752, -1.7340244054794312, -1.5922406911849976, -1.450456976890564, -1.30867338180542, -1.1668896675109863, -1.0251059532165527, -0.8833222389221191, -0.7415385842323303, -0.5997549295425415, -0.4579712152481079, -0.3161875009536743, -0.1744038462638855, -0.03262019157409668, 0.10916352272033691, 0.2509472072124481, 0.3927308917045593, 0.5345145463943481, 0.6762982606887817, 0.8180819749832153, 0.9598656296730042, 1.101649284362793, 1.2434329986572266, 1.3852167129516602, 1.5270004272460938, 1.6687840223312378, 1.8105677366256714, 1.952351450920105, 2.094135046005249, 2.2359187602996826, 2.377702474594116, 2.51948618888855, 2.6612699031829834, 2.803053617477417, 2.9448370933532715, 3.086620807647705, 3.2284045219421387, 3.3701882362365723, 3.511971950531006, 3.6537556648254395, 3.795539379119873, 3.9373230934143066, 4.07910680770874, 4.220890522003174, 4.362674236297607, 4.504457473754883, 4.646241188049316, 4.78802490234375, 4.929808616638184, 5.071592330932617, 5.213376045227051, 5.355159759521484, 5.496943473815918, 5.638727188110352, 5.780510902404785]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 6.0, 4.0, 6.0, 8.0, 11.0, 14.0, 18.0, 27.0, 32.0, 38.0, 33.0, 32.0, 38.0, 48.0, 57.0, 56.0, 54.0, 63.0, 59.0, 56.0, 45.0, 44.0, 34.0, 32.0, 34.0, 26.0, 18.0, 23.0, 18.0, 9.0, 7.0, 12.0, 3.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.071805953979492, -2.0084590911865234, -1.9451121091842651, -1.8817652463912964, -1.818418264389038, -1.7550714015960693, -1.6917245388031006, -1.6283775568008423, -1.565030574798584, -1.5016837120056152, -1.438336730003357, -1.3749898672103882, -1.3116428852081299, -1.2482960224151611, -1.1849491596221924, -1.121602177619934, -1.0582553148269653, -0.9949083924293518, -0.9315614700317383, -0.8682146072387695, -0.8048676252365112, -0.7415207624435425, -0.678173840045929, -0.6148269176483154, -0.5514799952507019, -0.4881330728530884, -0.42478615045547485, -0.3614392578601837, -0.2980923354625702, -0.23474541306495667, -0.17139852046966553, -0.108051598072052, -0.044704556465148926, 0.018642358481884003, 0.08198927342891693, 0.14533618092536926, 0.2086831033229828, 0.2720300257205963, 0.33537691831588745, 0.398723840713501, 0.4620707631111145, 0.525417685508728, 0.5887646079063416, 0.6521115303039551, 0.7154583930969238, 0.7788053750991821, 0.8421522378921509, 0.9054991602897644, 0.9688460826873779, 1.0321929454803467, 1.095539927482605, 1.1588867902755737, 1.222233772277832, 1.2855806350708008, 1.3489274978637695, 1.4122744798660278, 1.4756214618682861, 1.5389683246612549, 1.6023153066635132, 1.665662169456482, 1.7290091514587402, 1.792356014251709, 1.8557028770446777, 1.919049859046936, 1.9823967218399048]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 10.0, 8.0, 14.0, 18.0, 60.0, 97.0, 208.0, 467.0, 1229.0, 3474.0, 12007.0, 54297.0, 482215.0, 427340.0, 50366.0, 11297.0, 3405.0, 1175.0, 450.0, 209.0, 97.0, 55.0, 33.0, 10.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.194091796875, -0.18526077270507812, -0.17642974853515625, -0.16759872436523438, -0.1587677001953125, -0.14993667602539062, -0.14110565185546875, -0.13227462768554688, -0.123443603515625, -0.11461257934570312, -0.10578155517578125, -0.09695053100585938, -0.0881195068359375, -0.07928848266601562, -0.07045745849609375, -0.061626434326171875, -0.05279541015625, -0.043964385986328125, -0.03513336181640625, -0.026302337646484375, -0.0174713134765625, -0.008640289306640625, 0.00019073486328125, 0.009021759033203125, 0.017852783203125, 0.026683807373046875, 0.03551483154296875, 0.044345855712890625, 0.0531768798828125, 0.062007904052734375, 0.07083892822265625, 0.07966995239257812, 0.0885009765625, 0.09733200073242188, 0.10616302490234375, 0.11499404907226562, 0.1238250732421875, 0.13265609741210938, 0.14148712158203125, 0.15031814575195312, 0.159149169921875, 0.16798019409179688, 0.17681121826171875, 0.18564224243164062, 0.1944732666015625, 0.20330429077148438, 0.21213531494140625, 0.22096633911132812, 0.22979736328125, 0.23862838745117188, 0.24745941162109375, 0.2562904357910156, 0.2651214599609375, 0.2739524841308594, 0.28278350830078125, 0.2916145324707031, 0.300445556640625, 0.3092765808105469, 0.31810760498046875, 0.3269386291503906, 0.3357696533203125, 0.3446006774902344, 0.35343170166015625, 0.3622627258300781, 0.37109375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 6.0, 5.0, 11.0, 10.0, 9.0, 9.0, 24.0, 19.0, 17.0, 32.0, 25.0, 37.0, 48.0, 44.0, 50.0, 73.0, 60.0, 57.0, 55.0, 58.0, 62.0, 48.0, 49.0, 40.0, 24.0, 28.0, 19.0, 13.0, 18.0, 11.0, 12.0, 9.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.138671875, -0.13471317291259766, -0.1307544708251953, -0.12679576873779297, -0.12283706665039062, -0.11887836456298828, -0.11491966247558594, -0.1109609603881836, -0.10700225830078125, -0.1030435562133789, -0.09908485412597656, -0.09512615203857422, -0.09116744995117188, -0.08720874786376953, -0.08325004577636719, -0.07929134368896484, -0.0753326416015625, -0.07137393951416016, -0.06741523742675781, -0.06345653533935547, -0.059497833251953125, -0.05553913116455078, -0.05158042907714844, -0.047621726989746094, -0.04366302490234375, -0.039704322814941406, -0.03574562072753906, -0.03178691864013672, -0.027828216552734375, -0.02386951446533203, -0.019910812377929688, -0.015952110290527344, -0.011993408203125, -0.008034706115722656, -0.0040760040283203125, -0.00011730194091796875, 0.003841400146484375, 0.007800102233886719, 0.011758804321289062, 0.015717506408691406, 0.01967620849609375, 0.023634910583496094, 0.027593612670898438, 0.03155231475830078, 0.035511016845703125, 0.03946971893310547, 0.04342842102050781, 0.047387123107910156, 0.0513458251953125, 0.055304527282714844, 0.05926322937011719, 0.06322193145751953, 0.06718063354492188, 0.07113933563232422, 0.07509803771972656, 0.0790567398071289, 0.08301544189453125, 0.0869741439819336, 0.09093284606933594, 0.09489154815673828, 0.09885025024414062, 0.10280895233154297, 0.10676765441894531, 0.11072635650634766, 0.11468505859375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 6.0, 10.0, 14.0, 11.0, 17.0, 30.0, 51.0, 82.0, 119.0, 219.0, 474.0, 1044.0, 3848.0, 35274.0, 953024.0, 47601.0, 4531.0, 1190.0, 463.0, 214.0, 129.0, 66.0, 47.0, 24.0, 22.0, 13.0, 7.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44921875, -0.43582916259765625, -0.4224395751953125, -0.40904998779296875, -0.395660400390625, -0.38227081298828125, -0.3688812255859375, -0.35549163818359375, -0.34210205078125, -0.32871246337890625, -0.3153228759765625, -0.30193328857421875, -0.288543701171875, -0.27515411376953125, -0.2617645263671875, -0.24837493896484375, -0.2349853515625, -0.22159576416015625, -0.2082061767578125, -0.19481658935546875, -0.181427001953125, -0.16803741455078125, -0.1546478271484375, -0.14125823974609375, -0.12786865234375, -0.11447906494140625, -0.1010894775390625, -0.08769989013671875, -0.074310302734375, -0.06092071533203125, -0.0475311279296875, -0.03414154052734375, -0.020751953125, -0.00736236572265625, 0.0060272216796875, 0.01941680908203125, 0.032806396484375, 0.04619598388671875, 0.0595855712890625, 0.07297515869140625, 0.08636474609375, 0.09975433349609375, 0.1131439208984375, 0.12653350830078125, 0.139923095703125, 0.15331268310546875, 0.1667022705078125, 0.18009185791015625, 0.1934814453125, 0.20687103271484375, 0.2202606201171875, 0.23365020751953125, 0.247039794921875, 0.26042938232421875, 0.2738189697265625, 0.28720855712890625, 0.30059814453125, 0.31398773193359375, 0.3273773193359375, 0.34076690673828125, 0.354156494140625, 0.36754608154296875, 0.3809356689453125, 0.39432525634765625, 0.40771484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 2.0, 8.0, 9.0, 6.0, 19.0, 13.0, 16.0, 23.0, 15.0, 25.0, 28.0, 34.0, 29.0, 50.0, 58.0, 65.0, 85.0, 99.0, 80.0, 54.0, 49.0, 33.0, 34.0, 33.0, 21.0, 15.0, 21.0, 14.0, 10.0, 8.0, 4.0, 2.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41845703125, -0.4044647216796875, -0.390472412109375, -0.3764801025390625, -0.36248779296875, -0.3484954833984375, -0.334503173828125, -0.3205108642578125, -0.3065185546875, -0.2925262451171875, -0.278533935546875, -0.2645416259765625, -0.25054931640625, -0.2365570068359375, -0.222564697265625, -0.2085723876953125, -0.194580078125, -0.1805877685546875, -0.166595458984375, -0.1526031494140625, -0.13861083984375, -0.1246185302734375, -0.110626220703125, -0.0966339111328125, -0.0826416015625, -0.0686492919921875, -0.054656982421875, -0.0406646728515625, -0.02667236328125, -0.0126800537109375, 0.001312255859375, 0.0153045654296875, 0.029296875, 0.0432891845703125, 0.057281494140625, 0.0712738037109375, 0.08526611328125, 0.0992584228515625, 0.113250732421875, 0.1272430419921875, 0.1412353515625, 0.1552276611328125, 0.169219970703125, 0.1832122802734375, 0.19720458984375, 0.2111968994140625, 0.225189208984375, 0.2391815185546875, 0.253173828125, 0.2671661376953125, 0.281158447265625, 0.2951507568359375, 0.30914306640625, 0.3231353759765625, 0.337127685546875, 0.3511199951171875, 0.3651123046875, 0.3791046142578125, 0.393096923828125, 0.4070892333984375, 0.42108154296875, 0.4350738525390625, 0.449066162109375, 0.4630584716796875, 0.47705078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 8.0, 10.0, 9.0, 11.0, 12.0, 15.0, 15.0, 25.0, 29.0, 27.0, 45.0, 51.0, 100.0, 122.0, 241.0, 398.0, 687.0, 1312.0, 2983.0, 7724.0, 24868.0, 162906.0, 791121.0, 37810.0, 10414.0, 3790.0, 1715.0, 839.0, 449.0, 236.0, 182.0, 106.0, 69.0, 45.0, 35.0, 42.0, 22.0, 17.0, 16.0, 11.0, 6.0, 7.0, 3.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0521240234375, -0.05039501190185547, -0.04866600036621094, -0.046936988830566406, -0.045207977294921875, -0.043478965759277344, -0.04174995422363281, -0.04002094268798828, -0.03829193115234375, -0.03656291961669922, -0.03483390808105469, -0.033104896545410156, -0.031375885009765625, -0.029646873474121094, -0.027917861938476562, -0.02618885040283203, -0.0244598388671875, -0.02273082733154297, -0.021001815795898438, -0.019272804260253906, -0.017543792724609375, -0.015814781188964844, -0.014085769653320312, -0.012356758117675781, -0.01062774658203125, -0.008898735046386719, -0.0071697235107421875, -0.005440711975097656, -0.003711700439453125, -0.0019826889038085938, -0.0002536773681640625, 0.0014753341674804688, 0.003204345703125, 0.004933357238769531, 0.0066623687744140625, 0.008391380310058594, 0.010120391845703125, 0.011849403381347656, 0.013578414916992188, 0.015307426452636719, 0.01703643798828125, 0.01876544952392578, 0.020494461059570312, 0.022223472595214844, 0.023952484130859375, 0.025681495666503906, 0.027410507202148438, 0.02913951873779297, 0.0308685302734375, 0.03259754180908203, 0.03432655334472656, 0.036055564880371094, 0.037784576416015625, 0.039513587951660156, 0.04124259948730469, 0.04297161102294922, 0.04470062255859375, 0.04642963409423828, 0.04815864562988281, 0.049887657165527344, 0.051616668701171875, 0.053345680236816406, 0.05507469177246094, 0.05680370330810547, 0.05853271484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 7.0, 10.0, 5.0, 10.0, 13.0, 14.0, 20.0, 14.0, 30.0, 30.0, 52.0, 72.0, 94.0, 96.0, 123.0, 93.0, 71.0, 46.0, 36.0, 33.0, 27.0, 20.0, 14.0, 15.0, 7.0, 7.0, 4.0, 6.0, 6.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6226043701171875e-05, -2.5474466383457184e-05, -2.4722889065742493e-05, -2.39713117480278e-05, -2.321973443031311e-05, -2.246815711259842e-05, -2.1716579794883728e-05, -2.0965002477169037e-05, -2.0213425159454346e-05, -1.9461847841739655e-05, -1.8710270524024963e-05, -1.7958693206310272e-05, -1.720711588859558e-05, -1.645553857088089e-05, -1.57039612531662e-05, -1.4952383935451508e-05, -1.4200806617736816e-05, -1.3449229300022125e-05, -1.2697651982307434e-05, -1.1946074664592743e-05, -1.1194497346878052e-05, -1.044292002916336e-05, -9.69134271144867e-06, -8.939765393733978e-06, -8.188188076019287e-06, -7.436610758304596e-06, -6.685033440589905e-06, -5.933456122875214e-06, -5.1818788051605225e-06, -4.430301487445831e-06, -3.67872416973114e-06, -2.927146852016449e-06, -2.175569534301758e-06, -1.4239922165870667e-06, -6.724148988723755e-07, 7.916241884231567e-08, 8.307397365570068e-07, 1.582317054271698e-06, 2.333894371986389e-06, 3.0854716897010803e-06, 3.8370490074157715e-06, 4.588626325130463e-06, 5.340203642845154e-06, 6.091780960559845e-06, 6.843358278274536e-06, 7.594935595989227e-06, 8.346512913703918e-06, 9.09809023141861e-06, 9.8496675491333e-06, 1.0601244866847992e-05, 1.1352822184562683e-05, 1.2104399502277374e-05, 1.2855976819992065e-05, 1.3607554137706757e-05, 1.4359131455421448e-05, 1.5110708773136139e-05, 1.586228609085083e-05, 1.661386340856552e-05, 1.7365440726280212e-05, 1.8117018043994904e-05, 1.8868595361709595e-05, 1.9620172679424286e-05, 2.0371749997138977e-05, 2.1123327314853668e-05, 2.187490463256836e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 14.0, 17.0, 24.0, 29.0, 47.0, 72.0, 82.0, 134.0, 206.0, 306.0, 472.0, 813.0, 1475.0, 2582.0, 5250.0, 11153.0, 29972.0, 133417.0, 768507.0, 59452.0, 18226.0, 7743.0, 3697.0, 1964.0, 1043.0, 651.0, 401.0, 251.0, 180.0, 103.0, 70.0, 53.0, 36.0, 30.0, 15.0, 16.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.04241943359375, -0.04118156433105469, -0.039943695068359375, -0.03870582580566406, -0.03746795654296875, -0.03623008728027344, -0.034992218017578125, -0.03375434875488281, -0.0325164794921875, -0.03127861022949219, -0.030040740966796875, -0.028802871704101562, -0.02756500244140625, -0.026327133178710938, -0.025089263916015625, -0.023851394653320312, -0.022613525390625, -0.021375656127929688, -0.020137786865234375, -0.018899917602539062, -0.01766204833984375, -0.016424179077148438, -0.015186309814453125, -0.013948440551757812, -0.0127105712890625, -0.011472702026367188, -0.010234832763671875, -0.008996963500976562, -0.00775909423828125, -0.0065212249755859375, -0.005283355712890625, -0.0040454864501953125, -0.0028076171875, -0.0015697479248046875, -0.000331878662109375, 0.0009059906005859375, 0.00214385986328125, 0.0033817291259765625, 0.004619598388671875, 0.0058574676513671875, 0.0070953369140625, 0.008333206176757812, 0.009571075439453125, 0.010808944702148438, 0.01204681396484375, 0.013284683227539062, 0.014522552490234375, 0.015760421752929688, 0.016998291015625, 0.018236160278320312, 0.019474029541015625, 0.020711898803710938, 0.02194976806640625, 0.023187637329101562, 0.024425506591796875, 0.025663375854492188, 0.0269012451171875, 0.028139114379882812, 0.029376983642578125, 0.030614852905273438, 0.03185272216796875, 0.03309059143066406, 0.034328460693359375, 0.03556632995605469, 0.03680419921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 5.0, 4.0, 5.0, 13.0, 8.0, 21.0, 18.0, 20.0, 18.0, 22.0, 29.0, 38.0, 64.0, 102.0, 104.0, 93.0, 91.0, 70.0, 65.0, 32.0, 21.0, 23.0, 20.0, 18.0, 12.0, 15.0, 14.0, 10.0, 7.0, 2.0, 5.0, 3.0, 3.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0435791015625, -0.04209184646606445, -0.040604591369628906, -0.03911733627319336, -0.03763008117675781, -0.036142826080322266, -0.03465557098388672, -0.03316831588745117, -0.031681060791015625, -0.030193805694580078, -0.02870655059814453, -0.027219295501708984, -0.025732040405273438, -0.02424478530883789, -0.022757530212402344, -0.021270275115966797, -0.01978302001953125, -0.018295764923095703, -0.016808509826660156, -0.01532125473022461, -0.013833999633789062, -0.012346744537353516, -0.010859489440917969, -0.009372234344482422, -0.007884979248046875, -0.006397724151611328, -0.004910469055175781, -0.0034232139587402344, -0.0019359588623046875, -0.0004487037658691406, 0.0010385513305664062, 0.002525806427001953, 0.0040130615234375, 0.005500316619873047, 0.006987571716308594, 0.00847482681274414, 0.009962081909179688, 0.011449337005615234, 0.012936592102050781, 0.014423847198486328, 0.015911102294921875, 0.017398357391357422, 0.01888561248779297, 0.020372867584228516, 0.021860122680664062, 0.02334737777709961, 0.024834632873535156, 0.026321887969970703, 0.02780914306640625, 0.029296398162841797, 0.030783653259277344, 0.03227090835571289, 0.03375816345214844, 0.035245418548583984, 0.03673267364501953, 0.03821992874145508, 0.039707183837890625, 0.04119443893432617, 0.04268169403076172, 0.044168949127197266, 0.04565620422363281, 0.04714345932006836, 0.048630714416503906, 0.05011796951293945, 0.051605224609375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 14.0, 12.0, 49.0, 92.0, 569.0, 147.0, 63.0, 25.0, 14.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7520177364349365, -1.6530243158340454, -1.5540308952331543, -1.4550375938415527, -1.3560441732406616, -1.2570507526397705, -1.158057451248169, -1.0590640306472778, -0.9600706100463867, -0.8610771894454956, -0.7620838284492493, -0.6630904674530029, -0.5640970468521118, -0.4651036560535431, -0.36611026525497437, -0.267116904258728, -0.16812348365783691, -0.06913009285926819, 0.029863297939300537, 0.12885668873786926, 0.227850079536438, 0.3268434703350067, 0.42583686113357544, 0.5248302221298218, 0.6238236427307129, 0.722817063331604, 0.8218104243278503, 0.9208037853240967, 1.0197972059249878, 1.118790626525879, 1.2177839279174805, 1.3167773485183716, 1.4157705307006836, 1.5147639513015747, 1.6137573719024658, 1.7127506732940674, 1.8117440938949585, 1.9107375144958496, 2.009730815887451, 2.1087241172790527, 2.2077176570892334, 2.306710958480835, 2.4057044982910156, 2.504697799682617, 2.6036911010742188, 2.7026846408843994, 2.801677942276001, 2.9006714820861816, 2.999664783477783, 3.0986580848693848, 3.1976516246795654, 3.296644926071167, 3.3956384658813477, 3.494631767272949, 3.593625068664551, 3.6926183700561523, 3.791611909866333, 3.8906052112579346, 3.9895987510681152, 4.088592052459717, 4.187585353851318, 4.28657865524292, 4.38557243347168, 4.484565734863281, 4.583559036254883]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 3.0, 7.0, 6.0, 7.0, 7.0, 12.0, 13.0, 14.0, 25.0, 21.0, 24.0, 31.0, 30.0, 35.0, 80.0, 343.0, 94.0, 34.0, 22.0, 29.0, 18.0, 22.0, 22.0, 16.0, 9.0, 13.0, 14.0, 13.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2773396968841553, -1.2341338396072388, -1.1909279823303223, -1.1477221250534058, -1.1045162677764893, -1.0613105297088623, -1.0181045532226562, -0.9748988151550293, -0.9316929578781128, -0.8884871006011963, -0.8452812433242798, -0.8020753860473633, -0.7588695883750916, -0.715663731098175, -0.6724578738212585, -0.6292520761489868, -0.5860461592674255, -0.542840301990509, -0.4996344745159149, -0.4564286172389984, -0.4132227897644043, -0.3700169324874878, -0.3268110752105713, -0.2836052477359772, -0.24039939045906067, -0.19719354808330536, -0.15398770570755005, -0.11078184843063354, -0.06757600605487823, -0.024370163679122925, 0.01883569359779358, 0.062041521072387695, 0.1052473783493042, 0.1484532207250595, 0.19165906310081482, 0.23486492037773132, 0.27807074785232544, 0.32127660512924194, 0.36448246240615845, 0.40768828988075256, 0.45089414715766907, 0.49410000443458557, 0.5373058319091797, 0.5805116891860962, 0.6237175464630127, 0.6669234037399292, 0.7101292610168457, 0.7533350586891174, 0.7965409159660339, 0.8397467732429504, 0.8829526305198669, 0.9261584281921387, 0.9693642854690552, 1.0125701427459717, 1.0557760000228882, 1.0989818572998047, 1.1421877145767212, 1.1853935718536377, 1.2285994291305542, 1.2718052864074707, 1.3150111436843872, 1.3582170009613037, 1.4014227390289307, 1.4446285963058472, 1.4878344535827637]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 6.0, 11.0, 18.0, 17.0, 40.0, 54.0, 86.0, 198.0, 337.0, 98.0, 66.0, 27.0, 23.0, 11.0, 4.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3984375, -0.38939666748046875, -0.3803558349609375, -0.37131500244140625, -0.362274169921875, -0.35323333740234375, -0.3441925048828125, -0.33515167236328125, -0.32611083984375, -0.31707000732421875, -0.3080291748046875, -0.29898834228515625, -0.289947509765625, -0.28090667724609375, -0.2718658447265625, -0.26282501220703125, -0.2537841796875, -0.24474334716796875, -0.2357025146484375, -0.22666168212890625, -0.217620849609375, -0.20858001708984375, -0.1995391845703125, -0.19049835205078125, -0.18145751953125, -0.17241668701171875, -0.1633758544921875, -0.15433502197265625, -0.145294189453125, -0.13625335693359375, -0.1272125244140625, -0.11817169189453125, -0.109130859375, -0.10009002685546875, -0.0910491943359375, -0.08200836181640625, -0.072967529296875, -0.06392669677734375, -0.0548858642578125, -0.04584503173828125, -0.03680419921875, -0.02776336669921875, -0.0187225341796875, -0.00968170166015625, -0.000640869140625, 0.00839996337890625, 0.0174407958984375, 0.02648162841796875, 0.0355224609375, 0.04456329345703125, 0.0536041259765625, 0.06264495849609375, 0.071685791015625, 0.08072662353515625, 0.0897674560546875, 0.09880828857421875, 0.10784912109375, 0.11688995361328125, 0.1259307861328125, 0.13497161865234375, 0.144012451171875, 0.15305328369140625, 0.1620941162109375, 0.17113494873046875, 0.18017578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 15.0, 6.0, 14.0, 32.0, 43.0, 42.0, 92.0, 170.0, 315.0, 833.0, 3182.0, 29290.0, 8342812.0, 8935.0, 1740.0, 528.0, 223.0, 125.0, 62.0, 34.0, 30.0, 19.0, 9.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3299070596694946, -1.2845041751861572, -1.2391014099121094, -1.193698525428772, -1.1482956409454346, -1.1028928756713867, -1.0574899911880493, -1.012087106704712, -0.9666843414306641, -0.9212815165519714, -0.8758786916732788, -0.8304758071899414, -0.7850729823112488, -0.7396701574325562, -0.6942672729492188, -0.6488644480705261, -0.6034616231918335, -0.5580587983131409, -0.5126559734344482, -0.46725308895111084, -0.4218502640724182, -0.3764474391937256, -0.33104458451271057, -0.28564172983169556, -0.24023890495300293, -0.1948360651731491, -0.1494332253932953, -0.10403038561344147, -0.058627545833587646, -0.013224706053733826, 0.032178133726119995, 0.07758098840713501, 0.12298381328582764, 0.16838665306568146, 0.21378949284553528, 0.2591923475265503, 0.3045951724052429, 0.34999799728393555, 0.39540085196495056, 0.4408037066459656, 0.4862065315246582, 0.5316093564033508, 0.5770121812820435, 0.6224150657653809, 0.6678178906440735, 0.7132207155227661, 0.7586236000061035, 0.8040264248847961, 0.8494292497634888, 0.8948320746421814, 0.940234899520874, 0.9856377840042114, 1.0310406684875488, 1.0764434337615967, 1.121846318244934, 1.1672492027282715, 1.2126519680023193, 1.2580548524856567, 1.3034576177597046, 1.348860502243042, 1.3942632675170898, 1.4396661520004272, 1.4850690364837646, 1.5304718017578125, 1.57587468624115]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 3.0, 7.0, 3.0, 7.0, 5.0, 5.0, 5.0, 9.0, 4.0, 10.0, 2.0, 4.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7810184359550476, -0.7465682029724121, -0.7121180295944214, -0.6776677966117859, -0.6432175636291504, -0.6087673902511597, -0.5743171572685242, -0.5398669242858887, -0.505416750907898, -0.47096654772758484, -0.43651631474494934, -0.40206611156463623, -0.36761587858200073, -0.3331656754016876, -0.2987154722213745, -0.264265239238739, -0.22981500625610352, -0.1953647881746292, -0.1609145700931549, -0.1264643669128418, -0.09201414883136749, -0.05756393074989319, -0.023113727569580078, 0.011336490511894226, 0.04578670859336853, 0.08023692667484283, 0.11468713730573654, 0.14913734793663025, 0.18358756601810455, 0.21803778409957886, 0.25248798727989197, 0.2869381904602051, 0.3213883638381958, 0.3558385670185089, 0.3902888000011444, 0.4247390031814575, 0.459189236164093, 0.49363943934440613, 0.5280896425247192, 0.5625398755073547, 0.5969901084899902, 0.6314403414726257, 0.6658905148506165, 0.700340747833252, 0.7347909808158875, 0.769241213798523, 0.8036913871765137, 0.8381416201591492, 0.8725917935371399, 0.9070420265197754, 0.9414921998977661, 0.9759424328804016, 1.010392665863037, 1.0448428392410278, 1.0792930126190186, 1.1137433052062988, 1.1481934785842896, 1.1826436519622803, 1.2170939445495605, 1.2515441179275513, 1.285994291305542, 1.3204445838928223, 1.354894757270813, 1.3893449306488037, 1.423795223236084]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 13.0, 15.0, 25.0, 26.0, 58.0, 115.0, 167.0, 307.0, 714.0, 1517.0, 3644.0, 10535.0, 37985.0, 169094.0, 222047.0, 55403.0, 14364.0, 4683.0, 1777.0, 824.0, 365.0, 206.0, 128.0, 74.0, 49.0, 37.0, 26.0, 13.0, 9.0, 15.0, 12.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.982421875, -0.9433135986328125, -0.904205322265625, -0.8650970458984375, -0.82598876953125, -0.7868804931640625, -0.747772216796875, -0.7086639404296875, -0.6695556640625, -0.6304473876953125, -0.591339111328125, -0.5522308349609375, -0.51312255859375, -0.4740142822265625, -0.434906005859375, -0.3957977294921875, -0.356689453125, -0.3175811767578125, -0.278472900390625, -0.2393646240234375, -0.20025634765625, -0.1611480712890625, -0.122039794921875, -0.0829315185546875, -0.0438232421875, -0.0047149658203125, 0.034393310546875, 0.0735015869140625, 0.11260986328125, 0.1517181396484375, 0.190826416015625, 0.2299346923828125, 0.26904296875, 0.3081512451171875, 0.347259521484375, 0.3863677978515625, 0.42547607421875, 0.4645843505859375, 0.503692626953125, 0.5428009033203125, 0.5819091796875, 0.6210174560546875, 0.660125732421875, 0.6992340087890625, 0.73834228515625, 0.7774505615234375, 0.816558837890625, 0.8556671142578125, 0.894775390625, 0.9338836669921875, 0.972991943359375, 1.0121002197265625, 1.05120849609375, 1.0903167724609375, 1.129425048828125, 1.1685333251953125, 1.2076416015625, 1.2467498779296875, 1.285858154296875, 1.3249664306640625, 1.36407470703125, 1.4031829833984375, 1.442291259765625, 1.4813995361328125, 1.5205078125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 11.0, 14.0, 17.0, 27.0, 22.0, 55.0, 56.0, 68.0, 97.0, 88.0, 112.0, 87.0, 75.0, 77.0, 53.0, 38.0, 31.0, 21.0, 13.0, 13.0, 9.0, 7.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1446533203125, -0.1388835906982422, -0.13311386108398438, -0.12734413146972656, -0.12157440185546875, -0.11580467224121094, -0.11003494262695312, -0.10426521301269531, -0.0984954833984375, -0.09272575378417969, -0.08695602416992188, -0.08118629455566406, -0.07541656494140625, -0.06964683532714844, -0.06387710571289062, -0.05810737609863281, -0.052337646484375, -0.04656791687011719, -0.040798187255859375, -0.03502845764160156, -0.02925872802734375, -0.023488998413085938, -0.017719268798828125, -0.011949539184570312, -0.0061798095703125, -0.0004100799560546875, 0.005359649658203125, 0.011129379272460938, 0.01689910888671875, 0.022668838500976562, 0.028438568115234375, 0.03420829772949219, 0.03997802734375, 0.04574775695800781, 0.051517486572265625, 0.05728721618652344, 0.06305694580078125, 0.06882667541503906, 0.07459640502929688, 0.08036613464355469, 0.0861358642578125, 0.09190559387207031, 0.09767532348632812, 0.10344505310058594, 0.10921478271484375, 0.11498451232910156, 0.12075424194335938, 0.1265239715576172, 0.132293701171875, 0.1380634307861328, 0.14383316040039062, 0.14960289001464844, 0.15537261962890625, 0.16114234924316406, 0.16691207885742188, 0.1726818084716797, 0.1784515380859375, 0.1842212677001953, 0.18999099731445312, 0.19576072692871094, 0.20153045654296875, 0.20730018615722656, 0.21306991577148438, 0.2188396453857422, 0.224609375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 10.0, 21.0, 22.0, 67.0, 109.0, 90.0, 68.0, 41.0, 20.0, 8.0, 7.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0866007804870605, -2.0396270751953125, -1.992653489112854, -1.9456799030303955, -1.8987061977386475, -1.851732611656189, -1.8047590255737305, -1.7577853202819824, -1.710811734199524, -1.6638381481170654, -1.6168644428253174, -1.5698908567428589, -1.5229171514511108, -1.4759435653686523, -1.4289698600769043, -1.3819962739944458, -1.3350226879119873, -1.2880491018295288, -1.2410753965377808, -1.1941018104553223, -1.1471281051635742, -1.1001545190811157, -1.0531809329986572, -1.0062072277069092, -0.9592335224151611, -0.9122598767280579, -0.8652862310409546, -0.8183126449584961, -0.7713389992713928, -0.7243653535842896, -0.6773917078971863, -0.630418062210083, -0.5834444761276245, -0.5364708304405212, -0.48949721455574036, -0.4425235688686371, -0.3955499529838562, -0.34857630729675293, -0.30160266160964966, -0.2546290457248688, -0.2076554000377655, -0.16068176925182343, -0.11370813101530075, -0.06673449277877808, -0.019760861992836, 0.02721276879310608, 0.07418641448020935, 0.12116003036499023, 0.1681336760520935, 0.21510730683803558, 0.26208093762397766, 0.30905458331108093, 0.3560281991958618, 0.4030018448829651, 0.44997549057006836, 0.49694910645484924, 0.5439227819442749, 0.5908964276313782, 0.6378700733184814, 0.6848436594009399, 0.7318173050880432, 0.7787909507751465, 0.8257645964622498, 0.872738242149353, 0.9197118282318115]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 11.0, 14.0, 26.0, 58.0, 81.0, 66.0, 62.0, 43.0, 18.0, 25.0, 10.0, 7.0, 4.0, 4.0, 3.0, 7.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5446126461029053, -0.5249119400978088, -0.5052112340927124, -0.4855104684829712, -0.46580976247787476, -0.4461090564727783, -0.4264083206653595, -0.4067075848579407, -0.38700687885284424, -0.3673061728477478, -0.347605437040329, -0.32790470123291016, -0.3082039952278137, -0.2885032892227173, -0.26880255341529846, -0.24910183250904083, -0.2294011116027832, -0.20970039069652557, -0.18999966979026794, -0.17029894888401031, -0.15059822797775269, -0.13089750707149506, -0.11119678616523743, -0.0914960652589798, -0.07179534435272217, -0.05209462344646454, -0.03239390254020691, -0.01269318163394928, 0.00700753927230835, 0.02670826017856598, 0.04640898108482361, 0.06610970199108124, 0.08581042289733887, 0.1055111438035965, 0.12521186470985413, 0.14491258561611176, 0.16461330652236938, 0.18431402742862701, 0.20401474833488464, 0.22371546924114227, 0.2434161901473999, 0.26311689615249634, 0.28281763195991516, 0.302518367767334, 0.3222190737724304, 0.34191977977752686, 0.3616205155849457, 0.3813212513923645, 0.40102195739746094, 0.4207226634025574, 0.4404233992099762, 0.460124135017395, 0.47982484102249146, 0.4995255470275879, 0.5192263126373291, 0.5389270186424255, 0.558627724647522, 0.5783284306526184, 0.5980291366577148, 0.617729902267456, 0.6374306082725525, 0.6571313142776489, 0.6768320798873901, 0.6965327858924866, 0.716233491897583]}, "eval/loss": 4.256221294403076, "eval/wer": 1.9558111860372869, "eval/runtime": 979.265, "eval/samples_per_second": 2.698, "eval/steps_per_second": 0.338} \ No newline at end of file